1 /*-*- Mode: C; c-basic-offset: 8; indent-tabs-mode: nil -*-*/
4 This file is part of systemd.
6 Copyright 2010 Lennart Poettering
8 systemd is free software; you can redistribute it and/or modify it
9 under the terms of the GNU Lesser General Public License as published by
10 the Free Software Foundation; either version 2.1 of the License, or
11 (at your option) any later version.
13 systemd is distributed in the hope that it will be useful, but
14 WITHOUT ANY WARRANTY; without even the implied warranty of
15 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
16 Lesser General Public License for more details.
18 You should have received a copy of the GNU Lesser General Public License
19 along with systemd; If not, see <http://www.gnu.org/licenses/>.
26 #include <sys/types.h>
32 #include <sys/prctl.h>
33 #include <sys/mount.h>
35 #ifdef HAVE_VALGRIND_VALGRIND_H
36 #include <valgrind/valgrind.h>
39 #include "sd-daemon.h"
40 #include "sd-messages.h"
44 #include "load-fragment.h"
47 #include "conf-parser.h"
55 #include "path-util.h"
56 #include "switch-root.h"
57 #include "capability.h"
62 #include "dbus-manager.h"
63 #include "bus-error.h"
66 #include "mount-setup.h"
67 #include "loopback-setup.h"
68 #include "hostname-setup.h"
69 #include "machine-id-setup.h"
70 #include "selinux-setup.h"
71 #include "ima-setup.h"
72 #include "smack-setup.h"
74 #include "kmod-setup.h"
82 ACTION_DUMP_CONFIGURATION_ITEMS,
84 } arg_action = ACTION_RUN;
/* Manager-wide settings. Within this file they are filled in from the
 * "Manager" section of the configuration file (parse_config_file()),
 * from kernel command line switches (parse_proc_cmdline_word()) and
 * from command line options (parse_argv()); a few are also adjusted by
 * main(), initialize_join_controllers() and bump_rlimit_nofile(). The
 * initializers below are the values in effect when nothing overrides
 * them. */
85 static char *arg_default_unit = NULL;
86 static SystemdRunningAs arg_running_as = _SYSTEMD_RUNNING_AS_INVALID;
87 static bool arg_dump_core = true;
88 static bool arg_crash_shell = false;
89 static int arg_crash_chvt = -1;
90 static bool arg_confirm_spawn = false;
91 static ShowStatus arg_show_status = SHOW_STATUS_UNSET;
92 static bool arg_switched_root = false;
93 static char ***arg_join_controllers = NULL;
94 static ExecOutput arg_default_std_output = EXEC_OUTPUT_JOURNAL;
95 static ExecOutput arg_default_std_error = EXEC_OUTPUT_INHERIT;
96 static usec_t arg_default_restart_usec = DEFAULT_RESTART_USEC;
97 static usec_t arg_default_timeout_start_usec = DEFAULT_TIMEOUT_USEC;
98 static usec_t arg_default_timeout_stop_usec = DEFAULT_TIMEOUT_USEC;
99 static usec_t arg_default_start_limit_interval = DEFAULT_START_LIMIT_INTERVAL;
100 static unsigned arg_default_start_limit_burst = DEFAULT_START_LIMIT_BURST;
101 static usec_t arg_runtime_watchdog = 0;
102 static usec_t arg_shutdown_watchdog = 10 * USEC_PER_MINUTE;
103 static char **arg_default_environment = NULL;
104 static struct rlimit *arg_default_rlimit[RLIMIT_NLIMITS] = {};
105 static uint64_t arg_capability_bounding_set_drop = 0;
106 static nsec_t arg_timer_slack_nsec = (nsec_t) -1;
107 static Set* arg_syscall_archs = NULL;
/* Stream set by parse_argv() when --deserialize is given. */
108 static FILE* arg_serialization = NULL;
/* Signal handler that deliberately does nothing. crash() installs it
 * for SIGCHLD so that it can wait for the core-dumping child. */
110 static void nop_handler(int sig) {}
/* Handler for fatal signals; declared noreturn.
 *
 * Visible behaviour: when arg_dump_core is off the signal is only
 * logged. Otherwise SIGCHLD gets a no-op handler so that the core
 * process can be waited for; the default disposition for sig is
 * restored, RLIMIT_CORE is lifted to RLIM_INFINITY and the signal is
 * raised again, and the outcome of wait_for_terminate() decides which
 * of the "core dump" messages is logged (CLD_DUMPED means success).
 * Afterwards chvt(arg_crash_chvt) switches the VT, a /bin/sh crash
 * shell is spawned when arg_crash_shell is set, and "Freezing
 * execution." is logged.
 *
 * NOTE(review): the fork() calls, the guards around chvt() and the
 * final freeze are not among the lines visible here; the split between
 * child and parent is inferred from the log messages and the existing
 * comments -- confirm against the full function. */
112 noreturn static void crash(int sig) {
115 /* Pass this on immediately, if this is not PID 1 */
117 else if (!arg_dump_core)
118 log_error("Caught <%s>, not dumping core.", signal_to_string(sig));
120 struct sigaction sa = {
121 .sa_handler = nop_handler,
122 .sa_flags = SA_NOCLDSTOP|SA_RESTART,
126 /* We want to wait for the core process, hence let's enable SIGCHLD */
127 sigaction(SIGCHLD, &sa, NULL);
131 log_error("Caught <%s>, cannot fork for core dump: %m", signal_to_string(sig));
134 struct rlimit rl = {};
136 /* Enable default signal handler for core dump */
138 sa.sa_handler = SIG_DFL;
139 sigaction(sig, &sa, NULL);
141 /* Don't limit the core dump size */
142 rl.rlim_cur = RLIM_INFINITY;
143 rl.rlim_max = RLIM_INFINITY;
144 setrlimit(RLIMIT_CORE, &rl);
146 /* Just to be sure... */
149 /* Raise the signal again */
152 assert_not_reached("We shouldn't be here...");
159 /* Order things nicely. */
160 r = wait_for_terminate(pid, &status);
162 log_error("Caught <%s>, waitpid() failed: %s", signal_to_string(sig), strerror(-r));
163 else if (status.si_code != CLD_DUMPED)
164 log_error("Caught <%s>, core dump failed.", signal_to_string(sig));
166 log_error("Caught <%s>, dumped core as pid "PID_FMT".", signal_to_string(sig), pid);
171 chvt(arg_crash_chvt);
173 if (arg_crash_shell) {
/* This sa shadows the one declared for the core dump path above. */
174 struct sigaction sa = {
175 .sa_handler = SIG_IGN,
176 .sa_flags = SA_NOCLDSTOP|SA_NOCLDWAIT|SA_RESTART,
180 log_info("Executing crash shell in 10s...");
183 /* Let the kernel reap children for us */
184 assert_se(sigaction(SIGCHLD, &sa, NULL) == 0);
188 log_error("Failed to fork off crash shell: %m");
190 make_console_stdio();
191 execl("/bin/sh", "/bin/sh", NULL);
193 log_error("execl() failed: %m");
197 log_info("Successfully spawned crash shell as pid "PID_FMT".", pid);
200 log_info("Freezing execution.");
/* Installs one struct sigaction, flagged SA_NODEFER, for every signal
 * listed in SIGNALS_CRASH_HANDLER by means of sigaction_many(). With
 * SA_NODEFER the signal is not blocked while its own handler runs.
 * NOTE(review): the .sa_handler initializer is not visible here;
 * presumably it is crash() -- confirm. */
204 static void install_crash_handler(void) {
205 struct sigaction sa = {
207 .sa_flags = SA_NODEFER,
210 sigaction_many(&sa, SIGNALS_CRASH_HANDLER, -1);
/* Opens /dev/console write-only (O_NOCTTY, so it does not become the
 * controlling terminal; O_CLOEXEC), resets it with
 * reset_terminal_fd(tty_fd, false) and closes the descriptor again.
 * Failures of open_terminal() and reset_terminal_fd() are logged; both
 * report errors as negative errno-style values, which are negated for
 * strerror().
 * NOTE(review): how do_reset gates this work is not visible in these
 * lines. */
213 static int console_setup(bool do_reset) {
216 /* If we are init, we connect stdin/stdout/stderr to /dev/null
217 * and make sure we don't have a controlling tty. */
224 tty_fd = open_terminal("/dev/console", O_WRONLY|O_NOCTTY|O_CLOEXEC);
226 log_error("Failed to open /dev/console: %s", strerror(-tty_fd));
230 /* We don't want to force text mode.
231 * plymouth may be showing pictures already from initrd. */
232 r = reset_terminal_fd(tty_fd, false);
234 log_error("Failed to reset /dev/console: %s", strerror(-r));
236 close_nointr_nofail(tty_fd);
/* Makes arg_default_unit point at c, releasing the previously stored
 * string first. Callers in this file treat a negative return value as
 * failure.
 * NOTE(review): the lines deriving c from u are not visible here;
 * presumably c is a heap-allocated copy of u -- confirm. */
240 static int set_default_unit(const char *u) {
249 free(arg_default_unit);
250 arg_default_unit = c;
/* Interprets a single word of the kernel command line (parse_argv()
 * also feeds argv[] entries through here when running in a container).
 *
 * Recognized words update the logging setup or one of the arg_*
 * settings. systemd.unit=, rd.systemd.unit= and the SysV compatibility
 * words from rlmap return the result of set_default_unit(). For the
 * other switches a value that fails to parse is reported with
 * log_warning() and otherwise ignored.
 *
 * The numeric offsets added to word (word + 13, word + 16, ...) equal
 * the length of the prefix matched by the startswith() call of the same
 * branch, i.e. they skip to the value after the '='.
 *
 * Unknown "systemd."-prefixed switches trigger a warning plus the list
 * of supported switches, unless a '.' occurs before any '=' in the
 * remainder, which is how names such as systemd.journald.xyz are
 * left alone. */
255 static int parse_proc_cmdline_word(const char *word) {
/* Flat list of pairs: even indexes hold the SysV-style word, the
 * following odd index the unit it maps to (see the loop at the end). */
257 static const char * const rlmap[] = {
258 "emergency", SPECIAL_EMERGENCY_TARGET,
259 "-b", SPECIAL_EMERGENCY_TARGET,
260 "single", SPECIAL_RESCUE_TARGET,
261 "-s", SPECIAL_RESCUE_TARGET,
262 "s", SPECIAL_RESCUE_TARGET,
263 "S", SPECIAL_RESCUE_TARGET,
264 "1", SPECIAL_RESCUE_TARGET,
265 "2", SPECIAL_RUNLEVEL2_TARGET,
266 "3", SPECIAL_RUNLEVEL3_TARGET,
267 "4", SPECIAL_RUNLEVEL4_TARGET,
268 "5", SPECIAL_RUNLEVEL5_TARGET,
273 if (startswith(word, "systemd.unit=")) {
276 return set_default_unit(word + 13);
278 } else if (startswith(word, "rd.systemd.unit=")) {
281 return set_default_unit(word + 16);
283 } else if (startswith(word, "systemd.log_target=")) {
285 if (log_set_target_from_string(word + 19) < 0)
286 log_warning("Failed to parse log target %s. Ignoring.", word + 19);
288 } else if (startswith(word, "systemd.log_level=")) {
290 if (log_set_max_level_from_string(word + 18) < 0)
291 log_warning("Failed to parse log level %s. Ignoring.", word + 18);
293 } else if (startswith(word, "systemd.log_color=")) {
295 if (log_show_color_from_string(word + 18) < 0)
296 log_warning("Failed to parse log color setting %s. Ignoring.", word + 18);
298 } else if (startswith(word, "systemd.log_location=")) {
300 if (log_show_location_from_string(word + 21) < 0)
301 log_warning("Failed to parse log location setting %s. Ignoring.", word + 21);
303 } else if (startswith(word, "systemd.dump_core=")) {
306 if ((r = parse_boolean(word + 18)) < 0)
307 log_warning("Failed to parse dump core switch %s. Ignoring.", word + 18);
311 } else if (startswith(word, "systemd.crash_shell=")) {
314 if ((r = parse_boolean(word + 20)) < 0)
315 log_warning("Failed to parse crash shell switch %s. Ignoring.", word + 20);
319 } else if (startswith(word, "systemd.confirm_spawn=")) {
322 if ((r = parse_boolean(word + 22)) < 0)
323 log_warning("Failed to parse confirm spawn switch %s. Ignoring.", word + 22);
325 arg_confirm_spawn = r;
327 } else if (startswith(word, "systemd.crash_chvt=")) {
330 if (safe_atoi(word + 19, &k) < 0)
331 log_warning("Failed to parse crash chvt switch %s. Ignoring.", word + 19);
335 } else if (startswith(word, "systemd.show_status=")) {
338 r = parse_show_status(word + 20, &arg_show_status);
340 log_warning("Failed to parse show status switch %s. Ignoring.", word + 20);
341 } else if (startswith(word, "systemd.default_standard_output=")) {
344 if ((r = exec_output_from_string(word + 32)) < 0)
345 log_warning("Failed to parse default standard output switch %s. Ignoring.", word + 32);
347 arg_default_std_output = r;
348 } else if (startswith(word, "systemd.default_standard_error=")) {
351 if ((r = exec_output_from_string(word + 31)) < 0)
352 log_warning("Failed to parse default standard error switch %s. Ignoring.", word + 31);
354 arg_default_std_error = r;
355 } else if (startswith(word, "systemd.setenv=")) {
356 _cleanup_free_ char *cenv = NULL;
358 cenv = strdup(word + 15);
362 if (env_assignment_is_valid(cenv)) {
365 env = strv_env_set(arg_default_environment, cenv);
367 arg_default_environment = env;
369 log_warning("Setting environment variable '%s' failed, ignoring: %m", cenv);
371 log_warning("Environment variable name '%s' is not valid. Ignoring.", cenv);
373 } else if (startswith(word, "systemd.") ||
374 (in_initrd() && startswith(word, "rd.systemd."))) {
378 /* Ignore systemd.journald.xyz and friends */
380 if (startswith(c, "rd."))
382 if (startswith(c, "systemd."))
384 if (c[strcspn(c, ".=")] != '.') {
386 log_warning("Unknown kernel switch %s. Ignoring.", word);
388 log_info("Supported kernel switches:\n"
389 "systemd.unit=UNIT Default unit to start\n"
390 "rd.systemd.unit=UNIT Default unit to start when run in initrd\n"
391 "systemd.dump_core=0|1 Dump core on crash\n"
392 "systemd.crash_shell=0|1 Run shell on crash\n"
393 "systemd.crash_chvt=N Change to VT #N on crash\n"
394 "systemd.confirm_spawn=0|1 Confirm every process spawn\n"
395 "systemd.show_status=0|1|auto Show status updates on the console during bootup\n"
396 "systemd.log_target=console|kmsg|journal|journal-or-kmsg|syslog|syslog-or-kmsg|null\n"
398 "systemd.log_level=LEVEL Log level\n"
399 "systemd.log_color=0|1 Highlight important log messages\n"
400 "systemd.log_location=0|1 Include code location in log messages\n"
401 "systemd.default_standard_output=null|tty|syslog|syslog+console|kmsg|kmsg+console|journal|journal+console\n"
402 " Set default log output for services\n"
403 "systemd.default_standard_error=null|tty|syslog|syslog+console|kmsg|kmsg+console|journal|journal+console\n"
404 " Set default log error output for services\n"
405 "systemd.setenv=ASSIGNMENT Set an environment variable for all spawned processes\n");
408 } else if (streq(word, "quiet")) {
409 if (arg_show_status == SHOW_STATUS_UNSET)
410 arg_show_status = SHOW_STATUS_AUTO;
411 } else if (streq(word, "debug")) {
412 /* Log to kmsg, the journal socket will fill up before the
413 * journal is started and tools running during that time
414 * will block with every log message for 60 seconds,
415 * before they give up. */
416 log_set_max_level(LOG_DEBUG);
417 log_set_target(detect_container(NULL) > 0 ? LOG_TARGET_CONSOLE : LOG_TARGET_KMSG);
418 } else if (!in_initrd()) {
421 /* SysV compatibility */
422 for (i = 0; i < ELEMENTSOF(rlmap); i += 2)
423 if (streq(word, rlmap[i]))
424 return set_default_unit(rlmap[i+1]);
/* DEFINE_SETTER(name, func, descr) expands to a configuration parser
 * callback called name. On failure the callback reports the rejected
 * right-hand side through log_syntax(), using descr to say which kind
 * of value it was; r holds a negative errno-style code at that point.
 * NOTE(review): the line invoking func is not visible in this excerpt;
 * presumably it is r = func(rvalue) -- confirm.
 *
 * The format string puts a space between descr and the quoted value, so
 * the message reads e.g. "Invalid log level 'foo': ..." (none of the
 * descr strings used below ends in a space). */
430 #define DEFINE_SETTER(name, func, descr) \
431 static int name(const char *unit, \
432 const char *filename, \
434 const char *section, \
435 unsigned section_line, \
436 const char *lvalue, \
438 const char *rvalue, \
450 log_syntax(unit, LOG_ERR, filename, line, -r, \
451 "Invalid " descr " '%s': %s", \
452 rvalue, strerror(-r)); \
457 DEFINE_SETTER(config_parse_level2, log_set_max_level_from_string, "log level")
458 DEFINE_SETTER(config_parse_target, log_set_target_from_string, "target")
459 DEFINE_SETTER(config_parse_color, log_show_color_from_string, "color" )
460 DEFINE_SETTER(config_parse_location, log_show_location_from_string, "location")
/* Configuration parser for the "CPUAffinity" setting (see the items
 * table in parse_config_file()).
 *
 * Each quoted word of rvalue is parsed as an unsigned CPU index with
 * safe_atou(). A CPU set is obtained from cpu_set_malloc(), which also
 * yields ncpus; an index that does not parse or is >= ncpus is reported
 * through log_syntax(). Valid indexes are added with CPU_SET_S(), and
 * the resulting mask is applied to the calling process with
 * sched_setaffinity(0, ...); a failure there is only logged as a
 * warning.
 *
 * NOTE(review): when the index parses but is >= ncpus, r is not
 * negative, so the -r handed to log_syntax() does not carry a real
 * error code -- confirm whether that is intended. */
462 static int config_parse_cpu_affinity2(const char *unit,
463 const char *filename,
466 unsigned section_line,
483 FOREACH_WORD_QUOTED(w, l, rvalue, state) {
488 if (!(t = strndup(w, l)))
491 r = safe_atou(t, &cpu);
495 if (!(c = cpu_set_malloc(&ncpus)))
498 if (r < 0 || cpu >= ncpus) {
499 log_syntax(unit, LOG_ERR, filename, line, -r,
500 "Failed to parse CPU affinity '%s'", rvalue);
505 CPU_SET_S(cpu, CPU_ALLOC_SIZE(ncpus), c);
509 if (sched_setaffinity(0, CPU_ALLOC_SIZE(ncpus), c) < 0)
510 log_warning_unit(unit, "Failed to set CPU affinity: %m");
/* Releases a char*** value; in this file it is only ever applied to
 * arg_join_controllers.
 * NOTE(review): the body is not visible in this excerpt; presumably it
 * frees every string vector in l and then l itself -- confirm. */
518 static void strv_free_free(char ***l) {
/* Releases arg_join_controllers through strv_free_free() and resets it
 * to NULL, so that later code (e.g. the !arg_join_controllers check in
 * config_parse_join_controllers()) sees it as unset. */
530 static void free_join_controllers(void) {
531 strv_free_free(arg_join_controllers);
532 arg_join_controllers = NULL;
/* Configuration parser for the "JoinControllers" setting.
 *
 * Any previous value is dropped first (free_join_controllers()), so the
 * setting replaces rather than extends what was there. Every quoted
 * word of rvalue is split on ',' into a group l. The first group
 * becomes a fresh two-slot, NULL-terminated arg_join_controllers. For
 * later groups a new array t is built: existing groups that overlap l
 * (strv_overlap()) are merged into l with strv_extend_strv(), l is
 * stored de-duplicated (strv_uniq()), and t then replaces the old
 * array, which is released with strv_free_free().
 *
 * NOTE(review): the handling of groups with at most one entry
 * (strv_length(l) <= 1) and of allocation failures is not visible in
 * these lines. */
535 static int config_parse_join_controllers(const char *unit,
536 const char *filename,
539 unsigned section_line,
554 free_join_controllers();
556 FOREACH_WORD_QUOTED(w, length, rvalue, state) {
559 s = strndup(w, length);
563 l = strv_split(s, ",");
568 if (strv_length(l) <= 1) {
573 if (!arg_join_controllers) {
574 arg_join_controllers = new(char**, 2);
575 if (!arg_join_controllers) {
580 arg_join_controllers[0] = l;
581 arg_join_controllers[1] = NULL;
588 t = new0(char**, n+2);
596 for (a = arg_join_controllers; *a; a++) {
598 if (strv_overlap(*a, l)) {
599 if (strv_extend_strv(&l, *a) < 0) {
619 t[n++] = strv_uniq(l);
621 strv_free_free(arg_join_controllers);
622 arg_join_controllers = t;
/* Reads the manager configuration file and stores the settings of its
 * "Manager" section.
 *
 * Each items[] entry names a section and key, the parser callback to
 * run, and the variable the callback writes to. The four logging
 * entries and CPUAffinity pass NULL because their callbacks apply the
 * value directly instead of storing it.
 *
 * The file is PKGSYSCONFDIR "/system.conf" for a system instance and
 * PKGSYSCONFDIR "/user.conf" otherwise. Problems opening or parsing it
 * are logged as warnings. */
629 static int parse_config_file(void) {
631 const ConfigTableItem items[] = {
632 { "Manager", "LogLevel", config_parse_level2, 0, NULL },
633 { "Manager", "LogTarget", config_parse_target, 0, NULL },
634 { "Manager", "LogColor", config_parse_color, 0, NULL },
635 { "Manager", "LogLocation", config_parse_location, 0, NULL },
636 { "Manager", "DumpCore", config_parse_bool, 0, &arg_dump_core },
637 { "Manager", "CrashShell", config_parse_bool, 0, &arg_crash_shell },
638 { "Manager", "ShowStatus", config_parse_show_status, 0, &arg_show_status },
639 { "Manager", "CrashChVT", config_parse_int, 0, &arg_crash_chvt },
640 { "Manager", "CPUAffinity", config_parse_cpu_affinity2, 0, NULL },
641 { "Manager", "JoinControllers", config_parse_join_controllers, 0, &arg_join_controllers },
642 { "Manager", "RuntimeWatchdogSec", config_parse_sec, 0, &arg_runtime_watchdog },
643 { "Manager", "ShutdownWatchdogSec", config_parse_sec, 0, &arg_shutdown_watchdog },
644 { "Manager", "CapabilityBoundingSet", config_parse_bounding_set, 0, &arg_capability_bounding_set_drop },
646 { "Manager", "SystemCallArchitectures", config_parse_syscall_archs, 0, &arg_syscall_archs },
648 { "Manager", "TimerSlackNSec", config_parse_nsec, 0, &arg_timer_slack_nsec },
649 { "Manager", "DefaultStandardOutput", config_parse_output, 0, &arg_default_std_output },
650 { "Manager", "DefaultStandardError", config_parse_output, 0, &arg_default_std_error },
651 { "Manager", "DefaultTimeoutStartSec", config_parse_sec, 0, &arg_default_timeout_start_usec },
652 { "Manager", "DefaultTimeoutStopSec", config_parse_sec, 0, &arg_default_timeout_stop_usec },
653 { "Manager", "DefaultRestartSec", config_parse_sec, 0, &arg_default_restart_usec },
654 { "Manager", "DefaultStartLimitInterval", config_parse_sec, 0, &arg_default_start_limit_interval },
655 { "Manager", "DefaultStartLimitBurst", config_parse_unsigned, 0, &arg_default_start_limit_burst },
656 { "Manager", "DefaultEnvironment", config_parse_environ, 0, &arg_default_environment },
657 { "Manager", "DefaultLimitCPU", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_CPU] },
658 { "Manager", "DefaultLimitFSIZE", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_FSIZE] },
659 { "Manager", "DefaultLimitDATA", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_DATA] },
660 { "Manager", "DefaultLimitSTACK", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_STACK] },
661 { "Manager", "DefaultLimitCORE", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_CORE] },
662 { "Manager", "DefaultLimitRSS", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_RSS] },
663 { "Manager", "DefaultLimitNOFILE", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_NOFILE] },
664 { "Manager", "DefaultLimitAS", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_AS] },
665 { "Manager", "DefaultLimitNPROC", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_NPROC] },
666 { "Manager", "DefaultLimitMEMLOCK", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_MEMLOCK] },
667 { "Manager", "DefaultLimitLOCKS", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_LOCKS] },
668 { "Manager", "DefaultLimitSIGPENDING", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_SIGPENDING] },
669 { "Manager", "DefaultLimitMSGQUEUE", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_MSGQUEUE] },
670 { "Manager", "DefaultLimitNICE", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_NICE] },
671 { "Manager", "DefaultLimitRTPRIO", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_RTPRIO] },
672 { "Manager", "DefaultLimitRTTIME", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_RTTIME] },
676 _cleanup_fclose_ FILE *f;
680 fn = arg_running_as == SYSTEMD_SYSTEM ? PKGSYSCONFDIR "/system.conf" : PKGSYSCONFDIR "/user.conf";
686 log_warning("Failed to open configuration file '%s': %m", fn);
/* "Manager\0" is the list of sections handed to config_parse(). */
690 r = config_parse(NULL, fn, f, "Manager\0", config_item_table_lookup, (void*) items, false, false, NULL);
692 log_warning("Failed to parse configuration file: %s", strerror(-r));
/* Fetches the kernel command line with proc_cmdline() and hands every
 * quoted word, copied into its own buffer, to
 * parse_proc_cmdline_word().
 *
 * Failing to read the command line is logged as a warning ("ignoring");
 * a word that parse_proc_cmdline_word() rejects is logged as an
 * error. Both line and word are released automatically
 * (_cleanup_free_). */
697 static int parse_proc_cmdline(void) {
698 _cleanup_free_ char *line = NULL;
703 r = proc_cmdline(&line);
705 log_warning("Failed to read /proc/cmdline, ignoring: %s", strerror(-r));
709 FOREACH_WORD_QUOTED(w, l, line, state) {
710 _cleanup_free_ char *word;
712 word = strndup(w, l);
716 r = parse_proc_cmdline_word(word);
718 log_error("Failed on cmdline argument %s: %s", word, strerror(-r));
/* Parses the command line with getopt_long().
 *
 * Long options carry codes starting at ARG_LOG_LEVEL = 0x100, which
 * keeps them apart from the single-character options accepted through
 * "hDbsz:". Options update the logging setup, arg_action,
 * arg_running_as and the other arg_* settings; a value that fails to
 * parse is reported with log_error().
 *
 * Options declared with optional_argument (--log-color, --dump-core,
 * ...) may arrive with optarg == NULL; the boolean ones then default to
 * true ("optarg ? parse_boolean(optarg) : 1").
 *
 * --deserialize expects a non-negative file descriptor number; the
 * stream opened for it replaces, and closes, any earlier
 * arg_serialization.
 *
 * Left-over arguments are an error unless we run as PID 1. When running
 * in a container every argv[] entry is additionally passed to
 * parse_proc_cmdline_word(). */
726 static int parse_argv(int argc, char *argv[]) {
729 ARG_LOG_LEVEL = 0x100,
738 ARG_DUMP_CONFIGURATION_ITEMS,
745 ARG_DEFAULT_STD_OUTPUT,
746 ARG_DEFAULT_STD_ERROR
749 static const struct option options[] = {
750 { "log-level", required_argument, NULL, ARG_LOG_LEVEL },
751 { "log-target", required_argument, NULL, ARG_LOG_TARGET },
752 { "log-color", optional_argument, NULL, ARG_LOG_COLOR },
753 { "log-location", optional_argument, NULL, ARG_LOG_LOCATION },
754 { "unit", required_argument, NULL, ARG_UNIT },
755 { "system", no_argument, NULL, ARG_SYSTEM },
756 { "user", no_argument, NULL, ARG_USER },
757 { "test", no_argument, NULL, ARG_TEST },
758 { "help", no_argument, NULL, 'h' },
759 { "version", no_argument, NULL, ARG_VERSION },
760 { "dump-configuration-items", no_argument, NULL, ARG_DUMP_CONFIGURATION_ITEMS },
761 { "dump-core", optional_argument, NULL, ARG_DUMP_CORE },
762 { "crash-shell", optional_argument, NULL, ARG_CRASH_SHELL },
763 { "confirm-spawn", optional_argument, NULL, ARG_CONFIRM_SPAWN },
764 { "show-status", optional_argument, NULL, ARG_SHOW_STATUS },
765 { "deserialize", required_argument, NULL, ARG_DESERIALIZE },
766 { "switched-root", no_argument, NULL, ARG_SWITCHED_ROOT },
767 { "default-standard-output", required_argument, NULL, ARG_DEFAULT_STD_OUTPUT, },
768 { "default-standard-error", required_argument, NULL, ARG_DEFAULT_STD_ERROR, },
780 while ((c = getopt_long(argc, argv, "hDbsz:", options, NULL)) >= 0)
785 if ((r = log_set_max_level_from_string(optarg)) < 0) {
786 log_error("Failed to parse log level %s.", optarg);
794 if ((r = log_set_target_from_string(optarg)) < 0) {
795 log_error("Failed to parse log target %s.", optarg);
804 if ((r = log_show_color_from_string(optarg)) < 0) {
805 log_error("Failed to parse log color setting %s.", optarg);
809 log_show_color(true);
813 case ARG_LOG_LOCATION:
816 if ((r = log_show_location_from_string(optarg)) < 0) {
817 log_error("Failed to parse log location setting %s.", optarg);
821 log_show_location(true);
825 case ARG_DEFAULT_STD_OUTPUT:
827 if ((r = exec_output_from_string(optarg)) < 0) {
828 log_error("Failed to parse default standard output setting %s.", optarg);
831 arg_default_std_output = r;
834 case ARG_DEFAULT_STD_ERROR:
836 if ((r = exec_output_from_string(optarg)) < 0) {
837 log_error("Failed to parse default standard error output setting %s.", optarg);
840 arg_default_std_error = r;
845 if ((r = set_default_unit(optarg)) < 0) {
846 log_error("Failed to set default unit %s: %s", optarg, strerror(-r));
853 arg_running_as = SYSTEMD_SYSTEM;
857 arg_running_as = SYSTEMD_USER;
861 arg_action = ACTION_TEST;
865 arg_action = ACTION_VERSION;
868 case ARG_DUMP_CONFIGURATION_ITEMS:
869 arg_action = ACTION_DUMP_CONFIGURATION_ITEMS;
873 r = optarg ? parse_boolean(optarg) : 1;
875 log_error("Failed to parse dump core boolean %s.", optarg);
881 case ARG_CRASH_SHELL:
882 r = optarg ? parse_boolean(optarg) : 1;
884 log_error("Failed to parse crash shell boolean %s.", optarg);
890 case ARG_CONFIRM_SPAWN:
891 r = optarg ? parse_boolean(optarg) : 1;
893 log_error("Failed to parse confirm spawn boolean %s.", optarg);
896 arg_confirm_spawn = r;
899 case ARG_SHOW_STATUS:
901 r = parse_show_status(optarg, &arg_show_status);
903 log_error("Failed to parse show status boolean %s.", optarg);
907 arg_show_status = SHOW_STATUS_YES;
910 case ARG_DESERIALIZE: {
914 r = safe_atoi(optarg, &fd);
915 if (r < 0 || fd < 0) {
916 log_error("Failed to parse deserialize option %s.", optarg);
917 return r < 0 ? r : -EINVAL;
920 fd_cloexec(fd, true);
924 log_error("Failed to open serialization fd: %m");
928 if (arg_serialization)
929 fclose(arg_serialization);
931 arg_serialization = f;
936 case ARG_SWITCHED_ROOT:
937 arg_switched_root = true;
941 arg_action = ACTION_HELP;
945 log_set_max_level(LOG_DEBUG);
951 /* Just to eat away the sysvinit kernel
952 * cmdline args without getopt() error
953 * messages that we'll parse in
954 * parse_proc_cmdline_word() or ignore. */
959 log_error("Unknown option code %c", c);
966 if (optind < argc && getpid() != 1) {
967 /* Hmm, when we aren't run as init system
968 * let's complain about excess arguments */
970 log_error("Excess arguments.");
974 if (detect_container(NULL) > 0) {
977 /* All /proc/cmdline arguments the kernel didn't
978 * understand it passed to us. We're not really
979 * interested in that usually since /proc/cmdline is
980 * more interesting and complete. With one exception:
981 * if we are run in a container /proc/cmdline is not
982 * relevant for the container, hence we rely on argv[]
985 for (a = argv; a < argv + argc; a++) {
986 r = parse_proc_cmdline_word(*a);
988 log_error("Failed on cmdline argument %s: %s", *a, strerror(-r));
/* Prints the command line usage text to stdout; the leading %s is
 * filled in with program_invocation_short_name.
 * NOTE(review): the kernel switch list in parse_proc_cmdline_word()
 * documents systemd.show_status=0|1|auto, while --show-status is shown
 * here as [=0|1] only; both values go through parse_show_status() --
 * confirm whether "auto" should be listed here as well. */
997 static int help(void) {
999 printf("%s [OPTIONS...]\n\n"
1000 "Starts up and maintains the system or user services.\n\n"
1001 " -h --help Show this help\n"
1002 " --test Determine startup sequence, dump it and exit\n"
1003 " --dump-configuration-items Dump understood unit configuration items\n"
1004 " --unit=UNIT Set default unit\n"
1005 " --system Run a system instance, even if PID != 1\n"
1006 " --user Run a user instance\n"
1007 " --dump-core[=0|1] Dump core on crash\n"
1008 " --crash-shell[=0|1] Run shell on crash\n"
1009 " --confirm-spawn[=0|1] Ask for confirmation when spawning processes\n"
1010 " --show-status[=0|1] Show status updates on the console during bootup\n"
1011 " --log-target=TARGET Set log target (console, journal, syslog, kmsg, journal-or-kmsg, syslog-or-kmsg, null)\n"
1012 " --log-level=LEVEL Set log level (debug, info, notice, warning, err, crit, alert, emerg)\n"
1013 " --log-color[=0|1] Highlight important log messages\n"
1014 " --log-location[=0|1] Include code location in log messages\n"
1015 " --default-standard-output= Set default standard output for services\n"
1016 " --default-standard-error= Set default standard error output for services\n",
1017 program_invocation_short_name);
/* Prints PACKAGE_STRING and SYSTEMD_FEATURES to stdout, one per line. */
1022 static int version(void) {
1023 puts(PACKAGE_STRING);
1024 puts(SYSTEMD_FEATURES);
/* Prepares the state that is handed over when the manager re-executes
 * (switching_root is forwarded to manager_serialize()).
 *
 * Steps visible here: open a serialization file with
 * manager_open_serialization(), announce the reload on the bus,
 * serialize m together with the fd set fds, rewind the file so that it
 * can be read from the start, and finally clear O_CLOEXEC on both the
 * file and the fd set so that they stay open across exec. Every
 * failure is logged with log_error().
 *
 * NOTE(review): how f and fds are returned through _f and _fds, and the
 * cleanup on failure, are not visible in these lines. */
1029 static int prepare_reexecute(Manager *m, FILE **_f, FDSet **_fds, bool switching_root) {
1038 r = manager_open_serialization(m, &f);
1040 log_error("Failed to create serialization file: %s", strerror(-r));
1044 /* Make sure nothing is really destructed when we shut down */
1046 bus_manager_send_reloading(m, true);
1051 log_error("Failed to allocate fd set: %s", strerror(-r));
1055 r = manager_serialize(m, f, fds, switching_root);
1057 log_error("Failed to serialize state: %s", strerror(-r));
1061 if (fseeko(f, 0, SEEK_SET) < 0) {
1062 log_error("Failed to rewind serialization fd: %m");
1066 r = fd_cloexec(fileno(f), false);
1068 log_error("Failed to disable O_CLOEXEC for serialization: %s", strerror(-r));
1072 r = fdset_cloexec(fds, false);
1074 log_error("Failed to disable O_CLOEXEC for serialization fds: %s", strerror(-r));
/* Raises our own RLIMIT_NOFILE while remembering the original value.
 *
 * saved_rlimit (must not be NULL) receives the limit in effect on
 * entry. Unless a default for RLIMIT_NOFILE was configured already, a
 * copy of that original limit is stored in
 * arg_default_rlimit[RLIMIT_NOFILE]. Afterwards both the soft and the
 * hard limit of this process are requested as 64*1024 through
 * setrlimit_closest(). Failures are logged with log_error(). */
1092 static int bump_rlimit_nofile(struct rlimit *saved_rlimit) {
1096 assert(saved_rlimit);
1098 /* Save the original RLIMIT_NOFILE so that we can reset it
1099 * later when transitioning from the initrd to the main
1100 * systemd or suchlike. */
1101 if (getrlimit(RLIMIT_NOFILE, saved_rlimit) < 0) {
1102 log_error("Reading RLIMIT_NOFILE failed: %m");
1106 /* Make sure forked processes get the default kernel setting */
1107 if (!arg_default_rlimit[RLIMIT_NOFILE]) {
1110 rl = newdup(struct rlimit, saved_rlimit, 1);
1114 arg_default_rlimit[RLIMIT_NOFILE] = rl;
1117 /* Bump up the resource limit for ourselves substantially */
1118 nl.rlim_cur = nl.rlim_max = 64*1024;
1119 r = setrlimit_closest(RLIMIT_NOFILE, &nl);
1121 log_error("Setting RLIMIT_NOFILE failed: %s", strerror(-r));
/* Sanity check for /etc/mtab: it is read as a symlink and its target
 * compared against "/proc/self/mounts" and "/proc/mounts". The warning
 * below is meant for the case where it is not such a symlink.
 * NOTE(review): the lines that skip the warning when the check
 * succeeds are not visible in this excerpt. */
1128 static void test_mtab(void) {
1131 /* Check that /etc/mtab is a symlink */
1133 if (readlink_malloc("/etc/mtab", &p) >= 0) {
1136 b = streq(p, "/proc/self/mounts") || streq(p, "/proc/mounts");
1143 log_warning("/etc/mtab is not a symlink or not pointing to /proc/self/mounts. "
1144 "This is not supported anymore. "
1145 "Please make sure to replace this file by a symlink to avoid incorrect or misleading mount(8) output.");
/* Sanity check for /usr: the check is based on dir_is_empty("/usr"),
 * and the warning below is meant for the case where /usr turns out to
 * be empty, i.e. looks like a separate file system that has not been
 * mounted yet.
 * NOTE(review): the early-out taken when dir_is_empty() returns <= 0
 * is not visible in this excerpt.
 *
 * The user-facing warning spells "filesystem" correctly. */
1148 static void test_usr(void) {
1150 /* Check that /usr is not a separate fs */
1152 if (dir_is_empty("/usr") <= 0)
1155 log_warning("/usr appears to be on its own filesystem and is not already mounted. This is not a supported setup. "
1156 "Some things will probably break (sometimes even silently) in mysterious ways. "
1157 "Consult http://freedesktop.org/wiki/Software/systemd/separate-usr-is-broken for more information.");
/* Sanity check for control group support: the existence of
 * /proc/cgroups is probed with access(F_OK); the warning below is meant
 * for kernels where it is missing.
 * NOTE(review): the early-out for the success case and the 10s sleep
 * announced in the message are not visible in this excerpt. */
1160 static void test_cgroups(void) {
1162 if (access("/proc/cgroups", F_OK) >= 0)
1165 log_warning("CONFIG_CGROUPS was not set when your kernel was compiled. "
1166 "Systems without control groups are not supported. "
1167 "We will now sleep for 10s, and then continue boot-up. "
1168 "Expect breakage and please do not file bugs. "
1169 "Instead fix your kernel and enable CONFIG_CGROUPS. "
1170 "Consult http://0pointer.de/blog/projects/cgroups-vs-cgroups.html for more information.");
/* Installs the built-in default for arg_join_controllers: a
 * NULL-terminated array holding the two groups ("cpu", "cpuacct") and
 * ("net_cls", "net_prio"). If either strv_new() call fails, whatever
 * was allocated is released again through free_join_controllers(). */
1175 static int initialize_join_controllers(void) {
1176 /* By default, mount "cpu" + "cpuacct" together, and "net_cls"
1177 * + "net_prio". We'd like to add "cpuset" to the mix, but
1178 * "cpuset" does't really work for groups with no initialized
1181 arg_join_controllers = new(char**, 3);
1182 if (!arg_join_controllers)
1185 arg_join_controllers[0] = strv_new("cpu", "cpuacct", NULL);
1186 arg_join_controllers[1] = strv_new("net_cls", "net_prio", NULL);
1187 arg_join_controllers[2] = NULL;
1189 if (!arg_join_controllers[0] || !arg_join_controllers[1]) {
1190 free_join_controllers();
/* Restricts the process to the system call architectures contained in
 * archs: a seccomp filter with default action SCMP_ACT_ALLOW is
 * created, every architecture of the set is added to it, and the
 * filter is loaded. The set entries are decoded with
 * PTR_TO_UINT32(id) - 1, i.e. they appear to store the architecture id
 * plus one. Failures are logged with log_error(); the filter context is
 * released with seccomp_release().
 *
 * The loop walks the archs parameter rather than the global
 * arg_syscall_archs, so the function enforces exactly the set its
 * caller passed in. */
1197 static int enforce_syscall_archs(Set *archs) {
1199 scmp_filter_ctx *seccomp;
1204 seccomp = seccomp_init(SCMP_ACT_ALLOW);
1208 SET_FOREACH(id, archs, i) {
1209 r = seccomp_arch_add(seccomp, PTR_TO_UINT32(id) - 1);
1213 log_error("Failed to add architecture to seccomp: %s", strerror(-r));
1218 r = seccomp_load(seccomp);
1220 log_error("Failed to add install architecture seccomp: %s", strerror(-r));
1223 seccomp_release(seccomp);
1230 int main(int argc, char *argv[]) {
1232 int r, retval = EXIT_FAILURE;
1233 usec_t before_startup, after_startup;
1234 char timespan[FORMAT_TIMESPAN_MAX];
1236 bool reexecute = false;
1237 const char *shutdown_verb = NULL;
1238 dual_timestamp initrd_timestamp = { 0ULL, 0ULL };
1239 dual_timestamp userspace_timestamp = { 0ULL, 0ULL };
1240 dual_timestamp kernel_timestamp = { 0ULL, 0ULL };
1241 dual_timestamp security_start_timestamp = { 0ULL, 0ULL };
1242 dual_timestamp security_finish_timestamp = { 0ULL, 0ULL };
1243 static char systemd[] = "systemd";
1244 bool skip_setup = false;
1246 bool loaded_policy = false;
1247 bool arm_reboot_watchdog = false;
1248 bool queue_default_job = false;
1249 char *switch_root_dir = NULL, *switch_root_init = NULL;
1250 static struct rlimit saved_rlimit_nofile = { 0, 0 };
1252 #ifdef HAVE_SYSV_COMPAT
1253 if (getpid() != 1 && strstr(program_invocation_short_name, "init")) {
1254 /* This is compatibility support for SysV, where
1255 * calling init as a user is identical to telinit. */
1258 execv(SYSTEMCTL_BINARY_PATH, argv);
1259 log_error("Failed to exec " SYSTEMCTL_BINARY_PATH ": %m");
1264 dual_timestamp_from_monotonic(&kernel_timestamp, 0);
1265 dual_timestamp_get(&userspace_timestamp);
1267 /* Determine if this is a reexecution or normal bootup. We do
1268 * the full command line parsing much later, so let's just
1269 * have a quick peek here. */
1270 if (strv_find(argv+1, "--deserialize"))
1273 /* If we have switched root, do all the special setup
1275 if (strv_find(argv+1, "--switched-root"))
1278 /* If we get started via the /sbin/init symlink then we are
1279 called 'init'. After a subsequent reexecution we are then
1280 called 'systemd'. That is confusing, hence let's call us
1281 systemd right-away. */
1282 program_invocation_short_name = systemd;
1283 prctl(PR_SET_NAME, systemd);
1288 log_show_color(isatty(STDERR_FILENO) > 0);
1290 /* Disable the umask logic */
1294 if (getpid() == 1 && detect_container(NULL) <= 0) {
1296 /* Running outside of a container as PID 1 */
1297 arg_running_as = SYSTEMD_SYSTEM;
1299 log_set_target(LOG_TARGET_KMSG);
1303 initrd_timestamp = userspace_timestamp;
1306 mount_setup_early();
1307 dual_timestamp_get(&security_start_timestamp);
1308 if (selinux_setup(&loaded_policy) < 0)
1310 if (ima_setup() < 0)
1312 if (smack_setup() < 0)
1314 dual_timestamp_get(&security_finish_timestamp);
1317 if (label_init(NULL) < 0)
1321 if (hwclock_is_localtime() > 0) {
1324 /* The first-time call to settimeofday() does a time warp in the kernel */
1325 r = hwclock_set_timezone(&min);
1327 log_error("Failed to apply local time delta, ignoring: %s", strerror(-r));
1329 log_info("RTC configured in localtime, applying delta of %i minutes to system time.", min);
1330 } else if (!in_initrd()) {
1332 * Do dummy first-time call to seal the kernel's time warp magic
1334 * Do not call this from inside the initrd. The initrd might not
1335 * carry /etc/adjtime with LOCAL, but the real system could be set up
1336 * that way. In such case, we need to delay the time-warp or the sealing
1337 * until we reach the real system.
1339 hwclock_reset_timezone();
1341 /* Tell the kernel our timezone */
1342 r = hwclock_set_timezone(NULL);
1344 log_error("Failed to set the kernel's timezone, ignoring: %s", strerror(-r));
1348 /* Set the default for later on, but don't actually
1349 * open the logs like this for now. Note that if we
1350 * are transitioning from the initrd there might still
1351 * be journal fd open, and we shouldn't attempt
1352 * opening that before we parsed /proc/cmdline which
1353 * might redirect output elsewhere. */
1354 log_set_target(LOG_TARGET_JOURNAL_OR_KMSG);
1356 } else if (getpid() == 1) {
1357 /* Running inside a container, as PID 1 */
1358 arg_running_as = SYSTEMD_SYSTEM;
1359 log_set_target(LOG_TARGET_CONSOLE);
1360 log_close_console(); /* force reopen of /dev/console */
1363 /* For the later on, see above... */
1364 log_set_target(LOG_TARGET_JOURNAL);
1366 /* clear the kernel timestamp,
1367 * because we are in a container */
1368 kernel_timestamp.monotonic = 0ULL;
1369 kernel_timestamp.realtime = 0ULL;
1372 /* Running as user instance */
1373 arg_running_as = SYSTEMD_USER;
1374 log_set_target(LOG_TARGET_AUTO);
1377 /* clear the kernel timestamp,
1378 * because we are not PID 1 */
1379 kernel_timestamp.monotonic = 0ULL;
1380 kernel_timestamp.realtime = 0ULL;
1383 /* Initialize default unit */
1384 r = set_default_unit(SPECIAL_DEFAULT_TARGET);
1386 log_error("Failed to set default unit %s: %s", SPECIAL_DEFAULT_TARGET, strerror(-r));
1390 r = initialize_join_controllers();
1394 /* Mount /proc, /sys and friends, so that /proc/cmdline and
1395 * /proc/$PID/fd is available. */
1396 if (getpid() == 1) {
1397 r = mount_setup(loaded_policy);
1402 /* Reset all signal handlers. */
1403 assert_se(reset_all_signal_handlers() == 0);
1405 ignore_signals(SIGNALS_IGNORE, -1);
1407 if (parse_config_file() < 0)
1410 if (arg_running_as == SYSTEMD_SYSTEM)
1411 if (parse_proc_cmdline() < 0)
1414 log_parse_environment();
1416 if (parse_argv(argc, argv) < 0)
1419 if (arg_action == ACTION_TEST &&
1421 log_error("Don't run test mode as root.");
1425 if (arg_running_as == SYSTEMD_USER &&
1426 arg_action == ACTION_RUN &&
1428 log_error("Trying to run as user instance, but the system has not been booted with systemd.");
1432 if (arg_running_as == SYSTEMD_SYSTEM &&
1433 arg_action == ACTION_RUN &&
1434 running_in_chroot() > 0) {
1435 log_error("Cannot be run in a chroot() environment.");
1439 if (arg_action == ACTION_HELP) {
1442 } else if (arg_action == ACTION_VERSION) {
1445 } else if (arg_action == ACTION_DUMP_CONFIGURATION_ITEMS) {
1446 unit_dump_config_items(stdout);
1447 retval = EXIT_SUCCESS;
1449 } else if (arg_action == ACTION_DONE) {
1450 retval = EXIT_SUCCESS;
1454 if (arg_running_as == SYSTEMD_USER &&
1455 !getenv("XDG_RUNTIME_DIR")) {
1456 log_error("Trying to run as user instance, but $XDG_RUNTIME_DIR is not set.");
1460 assert_se(arg_action == ACTION_RUN || arg_action == ACTION_TEST);
1462 /* Close logging fds, in order not to confuse fdset below */
1465 /* Remember open file descriptors for later deserialization */
1466 r = fdset_new_fill(&fds);
1468 log_error("Failed to allocate fd set: %s", strerror(-r));
1471 fdset_cloexec(fds, true);
1473 if (arg_serialization)
1474 assert_se(fdset_remove(fds, fileno(arg_serialization)) >= 0);
1476 if (arg_running_as == SYSTEMD_SYSTEM)
1477 /* Become a session leader if we aren't one yet. */
1480 /* Move out of the way, so that we won't block unmounts */
1481 assert_se(chdir("/") == 0);
1483 /* Reset the console, but only if this is really init and we
1484 * are freshly booted */
1485 if (arg_running_as == SYSTEMD_SYSTEM && arg_action == ACTION_RUN)
1486 console_setup(getpid() == 1 && !skip_setup);
1488 /* Open the logging devices, if possible and necessary */
1491 /* Make sure we leave a core dump without panicking the
1493 if (getpid() == 1) {
1494 install_crash_handler();
1496 r = mount_cgroup_controllers(arg_join_controllers);
1501 if (arg_running_as == SYSTEMD_SYSTEM) {
1502 const char *virtualization = NULL;
1504 log_info(PACKAGE_STRING " running in system mode. (" SYSTEMD_FEATURES ")");
1506 detect_virtualization(&virtualization);
1508 log_info("Detected virtualization '%s'.", virtualization);
1511 log_info("Running in initial RAM disk.");
1514 _cleanup_free_ char *t = uid_to_name(getuid());
1515 log_debug(PACKAGE_STRING " running in user mode for user "PID_FMT"/%s. (" SYSTEMD_FEATURES ")",
1519 if (arg_running_as == SYSTEMD_SYSTEM && !skip_setup) {
1520 if (arg_show_status > 0 || plymouth_running())
1524 if (detect_container(NULL) <= 0)
1536 if (arg_running_as == SYSTEMD_SYSTEM && arg_runtime_watchdog > 0)
1537 watchdog_set_timeout(&arg_runtime_watchdog);
1539 if (arg_timer_slack_nsec != (nsec_t) -1)
1540 if (prctl(PR_SET_TIMERSLACK, arg_timer_slack_nsec) < 0)
1541 log_error("Failed to adjust timer slack: %m");
1543 if (arg_capability_bounding_set_drop) {
1544 r = capability_bounding_set_drop_usermode(arg_capability_bounding_set_drop);
1546 log_error("Failed to drop capability bounding set of usermode helpers: %s", strerror(-r));
1549 r = capability_bounding_set_drop(arg_capability_bounding_set_drop, true);
1551 log_error("Failed to drop capability bounding set: %s", strerror(-r));
1556 if (arg_syscall_archs) {
1557 r = enforce_syscall_archs(arg_syscall_archs);
1562 if (arg_running_as == SYSTEMD_USER) {
1563 /* Become reaper of our children */
1564 if (prctl(PR_SET_CHILD_SUBREAPER, 1) < 0) {
1565 log_warning("Failed to make us a subreaper: %m");
1566 if (errno == EINVAL)
1567 log_info("Perhaps the kernel version is too old (< 3.4?)");
1571 if (arg_running_as == SYSTEMD_SYSTEM)
1572 bump_rlimit_nofile(&saved_rlimit_nofile);
1574 r = manager_new(arg_running_as, &m);
1576 log_error("Failed to allocate manager object: %s", strerror(-r));
1580 m->confirm_spawn = arg_confirm_spawn;
1581 m->default_std_output = arg_default_std_output;
1582 m->default_std_error = arg_default_std_error;
1583 m->default_restart_usec = arg_default_restart_usec;
1584 m->default_timeout_start_usec = arg_default_timeout_start_usec;
1585 m->default_timeout_stop_usec = arg_default_timeout_stop_usec;
1586 m->default_start_limit_interval = arg_default_start_limit_interval;
1587 m->default_start_limit_burst = arg_default_start_limit_burst;
1588 m->runtime_watchdog = arg_runtime_watchdog;
1589 m->shutdown_watchdog = arg_shutdown_watchdog;
1590 m->userspace_timestamp = userspace_timestamp;
1591 m->kernel_timestamp = kernel_timestamp;
1592 m->initrd_timestamp = initrd_timestamp;
1593 m->security_start_timestamp = security_start_timestamp;
1594 m->security_finish_timestamp = security_finish_timestamp;
1596 manager_set_default_rlimits(m, arg_default_rlimit);
1598 if (arg_default_environment)
1599 manager_environment_add(m, NULL, arg_default_environment);
1601 if (arg_show_status == SHOW_STATUS_UNSET)
1602 arg_show_status = SHOW_STATUS_YES;
1603 manager_set_show_status(m, arg_show_status);
1605 /* Remember whether we should queue the default job */
1606 queue_default_job = !arg_serialization || arg_switched_root;
1608 before_startup = now(CLOCK_MONOTONIC);
1610 r = manager_startup(m, arg_serialization, fds);
1612 log_error("Failed to fully start up daemon: %s", strerror(-r));
1614 /* This will close all file descriptors that were opened, but
1615 * not claimed by any unit. */
1619 if (arg_serialization) {
1620 fclose(arg_serialization);
1621 arg_serialization = NULL;
1624 if (queue_default_job) {
1625 _cleanup_bus_error_free_ sd_bus_error error = SD_BUS_ERROR_NULL;
1626 Unit *target = NULL;
1627 Job *default_unit_job;
1629 log_debug("Activating default unit: %s", arg_default_unit);
1631 r = manager_load_unit(m, arg_default_unit, NULL, &error, &target);
1633 log_error("Failed to load default target: %s", bus_error_message(&error, r));
1634 else if (target->load_state == UNIT_ERROR || target->load_state == UNIT_NOT_FOUND)
1635 log_error("Failed to load default target: %s", strerror(-target->load_error));
1636 else if (target->load_state == UNIT_MASKED)
1637 log_error("Default target masked.");
1639 if (!target || target->load_state != UNIT_LOADED) {
1640 log_info("Trying to load rescue target...");
1642 r = manager_load_unit(m, SPECIAL_RESCUE_TARGET, NULL, &error, &target);
1644 log_error("Failed to load rescue target: %s", bus_error_message(&error, r));
1646 } else if (target->load_state == UNIT_ERROR || target->load_state == UNIT_NOT_FOUND) {
1647 log_error("Failed to load rescue target: %s", strerror(-target->load_error));
1649 } else if (target->load_state == UNIT_MASKED) {
1650 log_error("Rescue target masked.");
1655 assert(target->load_state == UNIT_LOADED);
1657 if (arg_action == ACTION_TEST) {
1658 printf("-> By units:\n");
1659 manager_dump_units(m, stdout, "\t");
1662 r = manager_add_job(m, JOB_START, target, JOB_ISOLATE, false, &error, &default_unit_job);
1664 log_debug("Default target could not be isolated, starting instead: %s", bus_error_message(&error, r));
1666 r = manager_add_job(m, JOB_START, target, JOB_REPLACE, false, &error, &default_unit_job);
1668 log_error("Failed to start default target: %s", bus_error_message(&error, r));
1672 log_error("Failed to isolate default target: %s", bus_error_message(&error, r));
1676 m->default_unit_job_id = default_unit_job->id;
1678 after_startup = now(CLOCK_MONOTONIC);
1679 log_full(arg_action == ACTION_TEST ? LOG_INFO : LOG_DEBUG,
1680 "Loaded units and determined initial transaction in %s.",
1681 format_timespan(timespan, sizeof(timespan), after_startup - before_startup, 0));
1683 if (arg_action == ACTION_TEST) {
1684 printf("-> By jobs:\n");
1685 manager_dump_jobs(m, stdout, "\t");
1686 retval = EXIT_SUCCESS;
1692 r = manager_loop(m);
1694 log_error("Failed to run mainloop: %s", strerror(-r));
1698 switch (m->exit_code) {
1701 retval = EXIT_SUCCESS;
1705 case MANAGER_RELOAD:
1706 log_info("Reloading.");
1707 r = manager_reload(m);
1709 log_error("Failed to reload: %s", strerror(-r));
1712 case MANAGER_REEXECUTE:
1714 if (prepare_reexecute(m, &arg_serialization, &fds, false) < 0)
1718 log_notice("Reexecuting.");
1721 case MANAGER_SWITCH_ROOT:
1722 /* Steal the switch root parameters */
1723 switch_root_dir = m->switch_root;
1724 switch_root_init = m->switch_root_init;
1725 m->switch_root = m->switch_root_init = NULL;
1727 if (!switch_root_init)
1728 if (prepare_reexecute(m, &arg_serialization, &fds, true) < 0)
1732 log_notice("Switching root.");
1735 case MANAGER_REBOOT:
1736 case MANAGER_POWEROFF:
1738 case MANAGER_KEXEC: {
1739 static const char * const table[_MANAGER_EXIT_CODE_MAX] = {
1740 [MANAGER_REBOOT] = "reboot",
1741 [MANAGER_POWEROFF] = "poweroff",
1742 [MANAGER_HALT] = "halt",
1743 [MANAGER_KEXEC] = "kexec"
1746 assert_se(shutdown_verb = table[m->exit_code]);
1747 arm_reboot_watchdog = m->exit_code == MANAGER_REBOOT;
1749 log_notice("Shutting down.");
1754 assert_not_reached("Unknown exit code.");
1764 for (j = 0; j < ELEMENTSOF(arg_default_rlimit); j++) {
1765 free(arg_default_rlimit[j]);
1766 arg_default_rlimit[j] = NULL;
1769 free(arg_default_unit);
1770 arg_default_unit = NULL;
1772 free_join_controllers();
1774 strv_free(arg_default_environment);
1775 arg_default_environment = NULL;
1777 set_free(arg_syscall_archs);
1778 arg_syscall_archs = NULL;
1784 unsigned i, args_size;
1786 /* Close and disarm the watchdog, so that the new
1787 * instance can reinitialize it, but doesn't get
1788 * rebooted while we do that */
1789 watchdog_close(true);
1791 /* Reset the RLIMIT_NOFILE to the kernel default, so
1792 * that the new systemd can pass the kernel default to
1793 * its child processes */
1794 if (saved_rlimit_nofile.rlim_cur > 0)
1795 setrlimit(RLIMIT_NOFILE, &saved_rlimit_nofile);
1797 if (switch_root_dir) {
1798 /* Kill all remaining processes from the
1799 * initrd, but don't wait for them, so that we
1800 * can handle the SIGCHLD for them after
1802 broadcast_signal(SIGTERM, false, true);
1804 /* And switch root */
1805 r = switch_root(switch_root_dir);
1807 log_error("Failed to switch root, ignoring: %s", strerror(-r));
1810 args_size = MAX(6, argc+1);
1811 args = newa(const char*, args_size);
1813 if (!switch_root_init) {
1816 /* First try to spawn ourselves with the right
1817 * path, and with full serialization. We do
1818 * this only if the user didn't specify an
1819 * explicit init to spawn. */
1821 assert(arg_serialization);
1824 snprintf(sfd, sizeof(sfd), "%i", fileno(arg_serialization));
1828 args[i++] = SYSTEMD_BINARY_PATH;
1829 if (switch_root_dir)
1830 args[i++] = "--switched-root";
1831 args[i++] = arg_running_as == SYSTEMD_SYSTEM ? "--system" : "--user";
1832 args[i++] = "--deserialize";
1836 /* do not pass along the environment we inherit from the kernel or initrd */
1837 if (switch_root_dir)
1840 assert(i <= args_size);
1841 execv(args[0], (char* const*) args);
1844 /* Try the fallback, if there is any, without any
1845 * serialization. We pass the original argv[] and
1846 * envp[]. (Well, modulo the ordering changes due to
1847 * getopt() in argv[], and some cleanups in envp[],
1848 * but let's hope that doesn't matter.) */
1850 if (arg_serialization) {
1851 fclose(arg_serialization);
1852 arg_serialization = NULL;
1860 /* Reopen the console */
1861 make_console_stdio();
1863 for (j = 1, i = 1; j < (unsigned) argc; j++)
1864 args[i++] = argv[j];
1866 assert(i <= args_size);
1868 if (switch_root_init) {
1869 args[0] = switch_root_init;
1870 execv(args[0], (char* const*) args);
1871 log_warning("Failed to execute configured init, trying fallback: %m");
1874 args[0] = "/sbin/init";
1875 execv(args[0], (char* const*) args);
1877 if (errno == ENOENT) {
1878 log_warning("No /sbin/init, trying fallback");
1880 args[0] = "/bin/sh";
1882 execv(args[0], (char* const*) args);
1883 log_error("Failed to execute /bin/sh, giving up: %m");
1885 log_warning("Failed to execute /sbin/init, giving up: %m");
1888 if (arg_serialization) {
1889 fclose(arg_serialization);
1890 arg_serialization = NULL;
1898 #ifdef HAVE_VALGRIND_VALGRIND_H
1899 /* If we are PID 1 and running under valgrind, then let's exit
1900 * here explicitly. valgrind will only generate nice output on
1901 * exit(), not on exec(), hence let's do the former not the
1903 if (getpid() == 1 && RUNNING_ON_VALGRIND)
1907 if (shutdown_verb) {
1908 const char * command_line[] = {
1909 SYSTEMD_SHUTDOWN_BINARY_PATH,
1913 _cleanup_strv_free_ char **env_block = NULL;
1914 env_block = strv_copy(environ);
1916 if (arm_reboot_watchdog && arg_shutdown_watchdog > 0) {
1919 /* If we reboot let's set the shutdown
1920 * watchdog and tell the shutdown binary to
1921 * repeatedly ping it */
1922 watchdog_set_timeout(&arg_shutdown_watchdog);
1923 watchdog_close(false);
1925 /* Tell the binary how often to ping, ignore failure */
1926 if (asprintf(&e, "WATCHDOG_USEC="USEC_FMT, arg_shutdown_watchdog) > 0)
1927 strv_push(&env_block, e);
1929 watchdog_close(true);
1931 /* Avoid the creation of new processes forked by the
1932 * kernel; at this point, we will not listen to the
1934 if (detect_container(NULL) <= 0)
1935 cg_uninstall_release_agent(SYSTEMD_CGROUP_CONTROLLER);
1937 execve(SYSTEMD_SHUTDOWN_BINARY_PATH, (char **) command_line, env_block);
1938 log_error("Failed to execute shutdown binary, freezing: %m");