1 /*-*- Mode: C; c-basic-offset: 8; indent-tabs-mode: nil -*-*/
4 This file is part of systemd.
6 Copyright 2010 Lennart Poettering
8 systemd is free software; you can redistribute it and/or modify it
9 under the terms of the GNU Lesser General Public License as published by
10 the Free Software Foundation; either version 2.1 of the License, or
11 (at your option) any later version.
13 systemd is distributed in the hope that it will be useful, but
14 WITHOUT ANY WARRANTY; without even the implied warranty of
15 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
16 Lesser General Public License for more details.
18 You should have received a copy of the GNU Lesser General Public License
19 along with systemd; If not, see <http://www.gnu.org/licenses/>.
26 #include <sys/types.h>
32 #include <sys/prctl.h>
33 #include <sys/mount.h>
35 #ifdef HAVE_VALGRIND_VALGRIND_H
36 #include <valgrind/valgrind.h>
42 #include "sd-daemon.h"
43 #include "sd-messages.h"
47 #include "load-fragment.h"
50 #include "conf-parser.h"
58 #include "architecture.h"
60 #include "path-util.h"
61 #include "switch-root.h"
62 #include "capability.h"
65 #include "clock-util.h"
67 #include "dbus-manager.h"
68 #include "bus-error.h"
71 #include "mount-setup.h"
72 #include "loopback-setup.h"
73 #include "hostname-setup.h"
74 #include "machine-id-setup.h"
75 #include "selinux-setup.h"
76 #include "ima-setup.h"
77 #include "smack-setup.h"
79 #include "kmod-setup.h"
87 ACTION_DUMP_CONFIGURATION_ITEMS,
89 } arg_action = ACTION_RUN;
/* File-scope manager settings. The initializers below are the built-in
 * defaults; individual entries are overwritten later by the parsers in
 * this file: parse_config_file() (via its ConfigTableItem table),
 * parse_proc_cmdline_item() (kernel command line) and parse_argv()
 * (command-line options). */
90 static char *arg_default_unit = NULL;
91 static SystemdRunningAs arg_running_as = _SYSTEMD_RUNNING_AS_INVALID;
92 static bool arg_dump_core = true;
93 static bool arg_crash_shell = false;
94 static int arg_crash_chvt = -1;
95 static bool arg_confirm_spawn = false;
96 static ShowStatus arg_show_status = _SHOW_STATUS_UNSET;
97 static bool arg_switched_root = false;
98 static int arg_no_pager = -1;
99 static char ***arg_join_controllers = NULL;
100 static ExecOutput arg_default_std_output = EXEC_OUTPUT_JOURNAL;
101 static ExecOutput arg_default_std_error = EXEC_OUTPUT_INHERIT;
102 static usec_t arg_default_restart_usec = DEFAULT_RESTART_USEC;
103 static usec_t arg_default_timeout_start_usec = DEFAULT_TIMEOUT_USEC;
104 static usec_t arg_default_timeout_stop_usec = DEFAULT_TIMEOUT_USEC;
105 static usec_t arg_default_start_limit_interval = DEFAULT_START_LIMIT_INTERVAL;
106 static unsigned arg_default_start_limit_burst = DEFAULT_START_LIMIT_BURST;
107 static usec_t arg_runtime_watchdog = 0;
108 static usec_t arg_shutdown_watchdog = 10 * USEC_PER_MINUTE;
109 static char **arg_default_environment = NULL;
110 static struct rlimit *arg_default_rlimit[_RLIMIT_MAX] = {};
111 static uint64_t arg_capability_bounding_set_drop = 0;
112 static nsec_t arg_timer_slack_nsec = NSEC_INFINITY;
113 static usec_t arg_default_timer_accuracy_usec = 1 * USEC_PER_MINUTE;
114 static Set* arg_syscall_archs = NULL;
115 static FILE* arg_serialization = NULL;
116 static bool arg_default_cpu_accounting = false;
117 static bool arg_default_blockio_accounting = false;
118 static bool arg_default_memory_accounting = false;
/* Signal handler that intentionally does nothing. crash() installs it as
 * the SIGCHLD handler before it forks the core-dump child and waits for
 * that child to terminate. */
120 static void nop_handler(int sig) {}
122 static void pager_open_if_enabled(void) {
124 if (arg_no_pager <= 0)
130 noreturn static void crash(int sig) {
133 /* Pass this on immediately, if this is not PID 1 */
135 else if (!arg_dump_core)
136 log_error("Caught <%s>, not dumping core.", signal_to_string(sig));
138 struct sigaction sa = {
139 .sa_handler = nop_handler,
140 .sa_flags = SA_NOCLDSTOP|SA_RESTART,
144 /* We want to wait for the core process, hence let's enable SIGCHLD */
145 sigaction(SIGCHLD, &sa, NULL);
149 log_error("Caught <%s>, cannot fork for core dump: %m", signal_to_string(sig));
152 struct rlimit rl = {};
154 /* Enable default signal handler for core dump */
156 sa.sa_handler = SIG_DFL;
157 sigaction(sig, &sa, NULL);
159 /* Don't limit the core dump size */
160 rl.rlim_cur = RLIM_INFINITY;
161 rl.rlim_max = RLIM_INFINITY;
162 setrlimit(RLIMIT_CORE, &rl);
164 /* Just to be sure... */
167 /* Raise the signal again */
170 assert_not_reached("We shouldn't be here...");
177 /* Order things nicely. */
178 r = wait_for_terminate(pid, &status);
180 log_error("Caught <%s>, waitpid() failed: %s", signal_to_string(sig), strerror(-r));
181 else if (status.si_code != CLD_DUMPED)
182 log_error("Caught <%s>, core dump failed.", signal_to_string(sig));
184 log_error("Caught <%s>, dumped core as pid "PID_FMT".", signal_to_string(sig), pid);
189 chvt(arg_crash_chvt);
191 if (arg_crash_shell) {
192 struct sigaction sa = {
193 .sa_handler = SIG_IGN,
194 .sa_flags = SA_NOCLDSTOP|SA_NOCLDWAIT|SA_RESTART,
198 log_info("Executing crash shell in 10s...");
201 /* Let the kernel reap children for us */
202 assert_se(sigaction(SIGCHLD, &sa, NULL) == 0);
206 log_error("Failed to fork off crash shell: %m");
208 make_console_stdio();
209 execl("/bin/sh", "/bin/sh", NULL);
211 log_error("execl() failed: %m");
215 log_info("Successfully spawned crash shell as pid "PID_FMT".", pid);
218 log_info("Freezing execution.");
222 static void install_crash_handler(void) {
223 struct sigaction sa = {
225 .sa_flags = SA_NODEFER,
228 sigaction_many(&sa, SIGNALS_CRASH_HANDLER, -1);
231 static int console_setup(bool do_reset) {
234 /* If we are init, we connect stdin/stdout/stderr to /dev/null
235 * and make sure we don't have a controlling tty. */
242 tty_fd = open_terminal("/dev/console", O_WRONLY|O_NOCTTY|O_CLOEXEC);
244 log_error("Failed to open /dev/console: %s", strerror(-tty_fd));
248 /* We don't want to force text mode.
249 * plymouth may be showing pictures already from initrd. */
250 r = reset_terminal_fd(tty_fd, false);
252 log_error("Failed to reset /dev/console: %s", strerror(-r));
258 static int set_default_unit(const char *u) {
267 free(arg_default_unit);
268 arg_default_unit = c;
273 static int parse_proc_cmdline_item(const char *key, const char *value) {
275 static const char * const rlmap[] = {
276 "emergency", SPECIAL_EMERGENCY_TARGET,
277 "-b", SPECIAL_EMERGENCY_TARGET,
278 "single", SPECIAL_RESCUE_TARGET,
279 "-s", SPECIAL_RESCUE_TARGET,
280 "s", SPECIAL_RESCUE_TARGET,
281 "S", SPECIAL_RESCUE_TARGET,
282 "1", SPECIAL_RESCUE_TARGET,
283 "2", SPECIAL_RUNLEVEL2_TARGET,
284 "3", SPECIAL_RUNLEVEL3_TARGET,
285 "4", SPECIAL_RUNLEVEL4_TARGET,
286 "5", SPECIAL_RUNLEVEL5_TARGET,
292 if (streq(key, "systemd.unit") && value) {
295 return set_default_unit(value);
297 } else if (streq(key, "rd.systemd.unit") && value) {
300 return set_default_unit(value);
302 } else if (streq(key, "systemd.log_target") && value) {
304 if (log_set_target_from_string(value) < 0)
305 log_warning("Failed to parse log target %s. Ignoring.", value);
307 } else if (streq(key, "systemd.log_level") && value) {
309 if (log_set_max_level_from_string(value) < 0)
310 log_warning("Failed to parse log level %s. Ignoring.", value);
312 } else if (streq(key, "systemd.log_color") && value) {
314 if (log_show_color_from_string(value) < 0)
315 log_warning("Failed to parse log color setting %s. Ignoring.", value);
317 } else if (streq(key, "systemd.log_location") && value) {
319 if (log_show_location_from_string(value) < 0)
320 log_warning("Failed to parse log location setting %s. Ignoring.", value);
322 } else if (streq(key, "systemd.dump_core") && value) {
324 r = parse_boolean(value);
326 log_warning("Failed to parse dump core switch %s. Ignoring.", value);
330 } else if (streq(key, "systemd.crash_shell") && value) {
332 r = parse_boolean(value);
334 log_warning("Failed to parse crash shell switch %s. Ignoring.", value);
338 } else if (streq(key, "systemd.crash_chvt") && value) {
340 if (safe_atoi(value, &r) < 0)
341 log_warning("Failed to parse crash chvt switch %s. Ignoring.", value);
345 } else if (streq(key, "systemd.confirm_spawn") && value) {
347 r = parse_boolean(value);
349 log_warning("Failed to parse confirm spawn switch %s. Ignoring.", value);
351 arg_confirm_spawn = r;
353 } else if (streq(key, "systemd.show_status") && value) {
355 r = parse_show_status(value, &arg_show_status);
357 log_warning("Failed to parse show status switch %s. Ignoring.", value);
359 } else if (streq(key, "systemd.default_standard_output") && value) {
361 r = exec_output_from_string(value);
363 log_warning("Failed to parse default standard output switch %s. Ignoring.", value);
365 arg_default_std_output = r;
367 } else if (streq(key, "systemd.default_standard_error") && value) {
369 r = exec_output_from_string(value);
371 log_warning("Failed to parse default standard error switch %s. Ignoring.", value);
373 arg_default_std_error = r;
375 } else if (streq(key, "systemd.setenv") && value) {
377 if (env_assignment_is_valid(value)) {
380 env = strv_env_set(arg_default_environment, value);
382 arg_default_environment = env;
384 log_warning("Setting environment variable '%s' failed, ignoring: %s", value, strerror(ENOMEM));
386 log_warning("Environment variable name '%s' is not valid. Ignoring.", value);
388 } else if (streq(key, "quiet") && !value) {
390 log_set_max_level(LOG_NOTICE);
392 if (arg_show_status == _SHOW_STATUS_UNSET)
393 arg_show_status = SHOW_STATUS_AUTO;
395 } else if (streq(key, "debug") && !value) {
397 log_set_max_level(LOG_DEBUG);
399 if (detect_container(NULL) > 0)
400 log_set_target(LOG_TARGET_CONSOLE);
402 } else if (!in_initrd() && !value) {
405 /* SysV compatibility */
406 for (i = 0; i < ELEMENTSOF(rlmap); i += 2)
407 if (streq(key, rlmap[i]))
408 return set_default_unit(rlmap[i+1]);
414 #define DEFINE_SETTER(name, func, descr) \
415 static int name(const char *unit, \
416 const char *filename, \
418 const char *section, \
419 unsigned section_line, \
420 const char *lvalue, \
422 const char *rvalue, \
434 log_syntax(unit, LOG_ERR, filename, line, -r, \
435 "Invalid " descr "'%s': %s", \
436 rvalue, strerror(-r)); \
441 DEFINE_SETTER(config_parse_level2, log_set_max_level_from_string, "log level")
442 DEFINE_SETTER(config_parse_target, log_set_target_from_string, "target")
443 DEFINE_SETTER(config_parse_color, log_show_color_from_string, "color" )
444 DEFINE_SETTER(config_parse_location, log_show_location_from_string, "location")
446 static int config_parse_cpu_affinity2(
448 const char *filename,
451 unsigned section_line,
458 const char *word, *state;
467 FOREACH_WORD_QUOTED(word, l, rvalue, state) {
472 if (!(t = strndup(word, l)))
475 r = safe_atou(t, &cpu);
479 if (!(c = cpu_set_malloc(&ncpus)))
482 if (r < 0 || cpu >= ncpus) {
483 log_syntax(unit, LOG_ERR, filename, line, -r,
484 "Failed to parse CPU affinity '%s'", rvalue);
489 CPU_SET_S(cpu, CPU_ALLOC_SIZE(ncpus), c);
492 log_syntax(unit, LOG_ERR, filename, line, EINVAL,
493 "Trailing garbage, ignoring.");
496 if (sched_setaffinity(0, CPU_ALLOC_SIZE(ncpus), c) < 0)
497 log_warning_unit(unit, "Failed to set CPU affinity: %m");
505 static int config_parse_show_status(
507 const char *filename,
510 unsigned section_line,
518 ShowStatus *b = data;
525 k = parse_show_status(rvalue, b);
527 log_syntax(unit, LOG_ERR, filename, line, -k,
528 "Failed to parse show status setting, ignoring: %s", rvalue);
535 static void strv_free_free(char ***l) {
547 static void free_join_controllers(void) {
548 strv_free_free(arg_join_controllers);
549 arg_join_controllers = NULL;
552 static int config_parse_join_controllers(const char *unit,
553 const char *filename,
556 unsigned section_line,
564 const char *word, *state;
571 free_join_controllers();
573 FOREACH_WORD_QUOTED(word, length, rvalue, state) {
576 s = strndup(word, length);
580 l = strv_split(s, ",");
585 if (strv_length(l) <= 1) {
590 if (!arg_join_controllers) {
591 arg_join_controllers = new(char**, 2);
592 if (!arg_join_controllers) {
597 arg_join_controllers[0] = l;
598 arg_join_controllers[1] = NULL;
605 t = new0(char**, n+2);
613 for (a = arg_join_controllers; *a; a++) {
615 if (strv_overlap(*a, l)) {
616 if (strv_extend_strv(&l, *a) < 0) {
636 t[n++] = strv_uniq(l);
638 strv_free_free(arg_join_controllers);
639 arg_join_controllers = t;
643 log_syntax(unit, LOG_ERR, filename, line, EINVAL,
644 "Trailing garbage, ignoring.");
649 static int parse_config_file(void) {
651 const ConfigTableItem items[] = {
652 { "Manager", "LogLevel", config_parse_level2, 0, NULL },
653 { "Manager", "LogTarget", config_parse_target, 0, NULL },
654 { "Manager", "LogColor", config_parse_color, 0, NULL },
655 { "Manager", "LogLocation", config_parse_location, 0, NULL },
656 { "Manager", "DumpCore", config_parse_bool, 0, &arg_dump_core },
657 { "Manager", "CrashShell", config_parse_bool, 0, &arg_crash_shell },
658 { "Manager", "ShowStatus", config_parse_show_status, 0, &arg_show_status },
659 { "Manager", "CrashChVT", config_parse_int, 0, &arg_crash_chvt },
660 { "Manager", "CPUAffinity", config_parse_cpu_affinity2, 0, NULL },
661 { "Manager", "JoinControllers", config_parse_join_controllers, 0, &arg_join_controllers },
662 { "Manager", "RuntimeWatchdogSec", config_parse_sec, 0, &arg_runtime_watchdog },
663 { "Manager", "ShutdownWatchdogSec", config_parse_sec, 0, &arg_shutdown_watchdog },
664 { "Manager", "CapabilityBoundingSet", config_parse_bounding_set, 0, &arg_capability_bounding_set_drop },
666 { "Manager", "SystemCallArchitectures", config_parse_syscall_archs, 0, &arg_syscall_archs },
668 { "Manager", "TimerSlackNSec", config_parse_nsec, 0, &arg_timer_slack_nsec },
669 { "Manager", "DefaultTimerAccuracySec", config_parse_sec, 0, &arg_default_timer_accuracy_usec },
670 { "Manager", "DefaultStandardOutput", config_parse_output, 0, &arg_default_std_output },
671 { "Manager", "DefaultStandardError", config_parse_output, 0, &arg_default_std_error },
672 { "Manager", "DefaultTimeoutStartSec", config_parse_sec, 0, &arg_default_timeout_start_usec },
673 { "Manager", "DefaultTimeoutStopSec", config_parse_sec, 0, &arg_default_timeout_stop_usec },
674 { "Manager", "DefaultRestartSec", config_parse_sec, 0, &arg_default_restart_usec },
675 { "Manager", "DefaultStartLimitInterval", config_parse_sec, 0, &arg_default_start_limit_interval },
676 { "Manager", "DefaultStartLimitBurst", config_parse_unsigned, 0, &arg_default_start_limit_burst },
677 { "Manager", "DefaultEnvironment", config_parse_environ, 0, &arg_default_environment },
678 { "Manager", "DefaultLimitCPU", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_CPU] },
679 { "Manager", "DefaultLimitFSIZE", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_FSIZE] },
680 { "Manager", "DefaultLimitDATA", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_DATA] },
681 { "Manager", "DefaultLimitSTACK", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_STACK] },
682 { "Manager", "DefaultLimitCORE", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_CORE] },
683 { "Manager", "DefaultLimitRSS", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_RSS] },
684 { "Manager", "DefaultLimitNOFILE", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_NOFILE] },
685 { "Manager", "DefaultLimitAS", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_AS] },
686 { "Manager", "DefaultLimitNPROC", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_NPROC] },
687 { "Manager", "DefaultLimitMEMLOCK", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_MEMLOCK] },
688 { "Manager", "DefaultLimitLOCKS", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_LOCKS] },
689 { "Manager", "DefaultLimitSIGPENDING", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_SIGPENDING] },
690 { "Manager", "DefaultLimitMSGQUEUE", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_MSGQUEUE] },
691 { "Manager", "DefaultLimitNICE", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_NICE] },
692 { "Manager", "DefaultLimitRTPRIO", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_RTPRIO] },
693 { "Manager", "DefaultLimitRTTIME", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_RTTIME] },
694 { "Manager", "DefaultCPUAccounting", config_parse_bool, 0, &arg_default_cpu_accounting },
695 { "Manager", "DefaultBlockIOAccounting", config_parse_bool, 0, &arg_default_blockio_accounting },
696 { "Manager", "DefaultMemoryAccounting", config_parse_bool, 0, &arg_default_memory_accounting },
702 fn = arg_running_as == SYSTEMD_SYSTEM ? PKGSYSCONFDIR "/system.conf" : PKGSYSCONFDIR "/user.conf";
703 config_parse(NULL, fn, NULL,
705 config_item_table_lookup, items,
706 false, false, true, NULL);
711 static int parse_argv(int argc, char *argv[]) {
714 ARG_LOG_LEVEL = 0x100,
724 ARG_DUMP_CONFIGURATION_ITEMS,
731 ARG_DEFAULT_STD_OUTPUT,
732 ARG_DEFAULT_STD_ERROR
735 static const struct option options[] = {
736 { "log-level", required_argument, NULL, ARG_LOG_LEVEL },
737 { "log-target", required_argument, NULL, ARG_LOG_TARGET },
738 { "log-color", optional_argument, NULL, ARG_LOG_COLOR },
739 { "log-location", optional_argument, NULL, ARG_LOG_LOCATION },
740 { "unit", required_argument, NULL, ARG_UNIT },
741 { "system", no_argument, NULL, ARG_SYSTEM },
742 { "user", no_argument, NULL, ARG_USER },
743 { "test", no_argument, NULL, ARG_TEST },
744 { "no-pager", no_argument, NULL, ARG_NO_PAGER },
745 { "help", no_argument, NULL, 'h' },
746 { "version", no_argument, NULL, ARG_VERSION },
747 { "dump-configuration-items", no_argument, NULL, ARG_DUMP_CONFIGURATION_ITEMS },
748 { "dump-core", optional_argument, NULL, ARG_DUMP_CORE },
749 { "crash-shell", optional_argument, NULL, ARG_CRASH_SHELL },
750 { "confirm-spawn", optional_argument, NULL, ARG_CONFIRM_SPAWN },
751 { "show-status", optional_argument, NULL, ARG_SHOW_STATUS },
752 { "deserialize", required_argument, NULL, ARG_DESERIALIZE },
753 { "switched-root", no_argument, NULL, ARG_SWITCHED_ROOT },
754 { "default-standard-output", required_argument, NULL, ARG_DEFAULT_STD_OUTPUT, },
755 { "default-standard-error", required_argument, NULL, ARG_DEFAULT_STD_ERROR, },
767 while ((c = getopt_long(argc, argv, "hDbsz:", options, NULL)) >= 0)
772 r = log_set_max_level_from_string(optarg);
774 log_error("Failed to parse log level %s.", optarg);
781 r = log_set_target_from_string(optarg);
783 log_error("Failed to parse log target %s.", optarg);
792 r = log_show_color_from_string(optarg);
794 log_error("Failed to parse log color setting %s.", optarg);
798 log_show_color(true);
802 case ARG_LOG_LOCATION:
804 r = log_show_location_from_string(optarg);
806 log_error("Failed to parse log location setting %s.", optarg);
810 log_show_location(true);
814 case ARG_DEFAULT_STD_OUTPUT:
815 r = exec_output_from_string(optarg);
817 log_error("Failed to parse default standard output setting %s.", optarg);
820 arg_default_std_output = r;
823 case ARG_DEFAULT_STD_ERROR:
824 r = exec_output_from_string(optarg);
826 log_error("Failed to parse default standard error output setting %s.", optarg);
829 arg_default_std_error = r;
834 r = set_default_unit(optarg);
836 log_error("Failed to set default unit %s: %s", optarg, strerror(-r));
843 arg_running_as = SYSTEMD_SYSTEM;
847 arg_running_as = SYSTEMD_USER;
851 arg_action = ACTION_TEST;
852 if (arg_no_pager < 0)
861 arg_action = ACTION_VERSION;
864 case ARG_DUMP_CONFIGURATION_ITEMS:
865 arg_action = ACTION_DUMP_CONFIGURATION_ITEMS;
869 r = optarg ? parse_boolean(optarg) : 1;
871 log_error("Failed to parse dump core boolean %s.", optarg);
877 case ARG_CRASH_SHELL:
878 r = optarg ? parse_boolean(optarg) : 1;
880 log_error("Failed to parse crash shell boolean %s.", optarg);
886 case ARG_CONFIRM_SPAWN:
887 r = optarg ? parse_boolean(optarg) : 1;
889 log_error("Failed to parse confirm spawn boolean %s.", optarg);
892 arg_confirm_spawn = r;
895 case ARG_SHOW_STATUS:
897 r = parse_show_status(optarg, &arg_show_status);
899 log_error("Failed to parse show status boolean %s.", optarg);
903 arg_show_status = SHOW_STATUS_YES;
906 case ARG_DESERIALIZE: {
910 r = safe_atoi(optarg, &fd);
911 if (r < 0 || fd < 0) {
912 log_error("Failed to parse deserialize option %s.", optarg);
913 return r < 0 ? r : -EINVAL;
916 fd_cloexec(fd, true);
920 log_error("Failed to open serialization fd: %m");
924 if (arg_serialization)
925 fclose(arg_serialization);
927 arg_serialization = f;
932 case ARG_SWITCHED_ROOT:
933 arg_switched_root = true;
937 arg_action = ACTION_HELP;
938 if (arg_no_pager < 0)
943 log_set_max_level(LOG_DEBUG);
949 /* Just to eat away the sysvinit kernel
950 * cmdline args without getopt() error
951 * messages that we'll parse in
952 * parse_proc_cmdline_item() or ignore. */
961 assert_not_reached("Unhandled option code.");
964 if (optind < argc && getpid() != 1) {
965 /* Hmm, when we aren't run as init system
966 * let's complain about excess arguments */
968 log_error("Excess arguments.");
972 if (detect_container(NULL) > 0) {
975 /* All /proc/cmdline arguments the kernel didn't
976 * understand it passed to us. We're not really
977 * interested in that usually since /proc/cmdline is
978 * more interesting and complete. With one exception:
979 * if we are run in a container /proc/cmdline is not
980 * relevant for the container, hence we rely on argv[]
983 for (a = argv; a < argv + argc; a++) {
984 _cleanup_free_ char *w;
991 value = strchr(w, '=');
995 r = parse_proc_cmdline_item(w, value);
997 log_error("Failed on cmdline argument %s: %s", *a, strerror(-r));
1006 static int help(void) {
1008 printf("%s [OPTIONS...]\n\n"
1009 "Starts up and maintains the system or user services.\n\n"
1010 " -h --help Show this help\n"
1011 " --test Determine startup sequence, dump it and exit\n"
1012 " --no-pager Do not pipe output into a pager\n"
1013 " --dump-configuration-items Dump understood unit configuration items\n"
1014 " --unit=UNIT Set default unit\n"
1015 " --system Run a system instance, even if PID != 1\n"
1016 " --user Run a user instance\n"
1017 " --dump-core[=0|1] Dump core on crash\n"
1018 " --crash-shell[=0|1] Run shell on crash\n"
1019 " --confirm-spawn[=0|1] Ask for confirmation when spawning processes\n"
1020 " --show-status[=0|1] Show status updates on the console during bootup\n"
1021 " --log-target=TARGET Set log target (console, journal, kmsg, journal-or-kmsg, null)\n"
1022 " --log-level=LEVEL Set log level (debug, info, notice, warning, err, crit, alert, emerg)\n"
1023 " --log-color[=0|1] Highlight important log messages\n"
1024 " --log-location[=0|1] Include code location in log messages\n"
1025 " --default-standard-output= Set default standard output for services\n"
1026 " --default-standard-error= Set default standard error output for services\n",
1027 program_invocation_short_name);
1032 static int version(void) {
1033 puts(PACKAGE_STRING);
1034 puts(SYSTEMD_FEATURES);
1039 static int prepare_reexecute(Manager *m, FILE **_f, FDSet **_fds, bool switching_root) {
1048 r = manager_open_serialization(m, &f);
1050 log_error("Failed to create serialization file: %s", strerror(-r));
1054 /* Make sure nothing is really destructed when we shut down */
1056 bus_manager_send_reloading(m, true);
1061 log_error("Failed to allocate fd set: %s", strerror(-r));
1065 r = manager_serialize(m, f, fds, switching_root);
1067 log_error("Failed to serialize state: %s", strerror(-r));
1071 if (fseeko(f, 0, SEEK_SET) < 0) {
1072 log_error("Failed to rewind serialization fd: %m");
1076 r = fd_cloexec(fileno(f), false);
1078 log_error("Failed to disable O_CLOEXEC for serialization: %s", strerror(-r));
1082 r = fdset_cloexec(fds, false);
1084 log_error("Failed to disable O_CLOEXEC for serialization fds: %s", strerror(-r));
1102 static int bump_rlimit_nofile(struct rlimit *saved_rlimit) {
1106 assert(saved_rlimit);
1108 /* Save the original RLIMIT_NOFILE so that we can reset it
1109 * later when transitioning from the initrd to the main
1110 * systemd or suchlike. */
1111 if (getrlimit(RLIMIT_NOFILE, saved_rlimit) < 0) {
1112 log_error("Reading RLIMIT_NOFILE failed: %m");
1116 /* Make sure forked processes get the default kernel setting */
1117 if (!arg_default_rlimit[RLIMIT_NOFILE]) {
1120 rl = newdup(struct rlimit, saved_rlimit, 1);
1124 arg_default_rlimit[RLIMIT_NOFILE] = rl;
1127 /* Bump up the resource limit for ourselves substantially */
1128 nl.rlim_cur = nl.rlim_max = 64*1024;
1129 r = setrlimit_closest(RLIMIT_NOFILE, &nl);
1131 log_error("Setting RLIMIT_NOFILE failed: %s", strerror(-r));
1138 static void test_mtab(void) {
1140 static const char ok[] =
1141 "/proc/self/mounts\0"
1143 "../proc/self/mounts\0"
1146 _cleanup_free_ char *p = NULL;
1149 /* Check that /etc/mtab is a symlink to the right place or
1150 * non-existing. But certainly not a file, or a symlink to
1151 * some weird place... */
1153 r = readlink_malloc("/etc/mtab", &p);
1156 if (r >= 0 && nulstr_contains(ok, p))
1159 log_warning("/etc/mtab is not a symlink or not pointing to /proc/self/mounts. "
1160 "This is not supported anymore. "
1161 "Please make sure to replace this file by a symlink to avoid incorrect or misleading mount(8) output.");
1164 static void test_usr(void) {
1166 /* Check that /usr is not a separate fs */
1168 if (dir_is_empty("/usr") <= 0)
1171 log_warning("/usr appears to be on its own filesytem and is not already mounted. This is not a supported setup. "
1172 "Some things will probably break (sometimes even silently) in mysterious ways. "
1173 "Consult http://freedesktop.org/wiki/Software/systemd/separate-usr-is-broken for more information.");
1176 static int initialize_join_controllers(void) {
1177 /* By default, mount "cpu" + "cpuacct" together, and "net_cls"
1178 * + "net_prio". We'd like to add "cpuset" to the mix, but
1179 * "cpuset" doesn't really work for groups with no initialized
1182 arg_join_controllers = new(char**, 3);
1183 if (!arg_join_controllers)
1186 arg_join_controllers[0] = strv_new("cpu", "cpuacct", NULL);
1187 arg_join_controllers[1] = strv_new("net_cls", "net_prio", NULL);
1188 arg_join_controllers[2] = NULL;
1190 if (!arg_join_controllers[0] || !arg_join_controllers[1]) {
1191 free_join_controllers();
1198 static int enforce_syscall_archs(Set *archs) {
1200 scmp_filter_ctx *seccomp;
1205 seccomp = seccomp_init(SCMP_ACT_ALLOW);
1209 SET_FOREACH(id, arg_syscall_archs, i) {
1210 r = seccomp_arch_add(seccomp, PTR_TO_UINT32(id) - 1);
1214 log_error("Failed to add architecture to seccomp: %s", strerror(-r));
1219 r = seccomp_attr_set(seccomp, SCMP_FLTATR_CTL_NNP, 0);
1221 log_error("Failed to unset NO_NEW_PRIVS: %s", strerror(-r));
1225 r = seccomp_load(seccomp);
1227 log_error("Failed to add install architecture seccomp: %s", strerror(-r));
1230 seccomp_release(seccomp);
1237 static int status_welcome(void) {
1238 _cleanup_free_ char *pretty_name = NULL, *ansi_color = NULL;
1241 r = parse_env_file("/etc/os-release", NEWLINE,
1242 "PRETTY_NAME", &pretty_name,
1243 "ANSI_COLOR", &ansi_color,
1246 r = parse_env_file("/usr/lib/os-release", NEWLINE,
1247 "PRETTY_NAME", &pretty_name,
1248 "ANSI_COLOR", &ansi_color,
1252 if (r < 0 && r != -ENOENT)
1253 log_warning("Failed to read os-release file: %s", strerror(-r));
1255 return status_printf(NULL, false, false,
1256 "\nWelcome to \x1B[%sm%s\x1B[0m!\n",
1257 isempty(ansi_color) ? "1" : ansi_color,
1258 isempty(pretty_name) ? "Linux" : pretty_name);
1261 static int write_container_id(void) {
1264 c = getenv("container");
1268 return write_string_file("/run/systemd/container", c);
1271 int main(int argc, char *argv[]) {
1273 int r, retval = EXIT_FAILURE;
1274 usec_t before_startup, after_startup;
1275 char timespan[FORMAT_TIMESPAN_MAX];
1277 bool reexecute = false;
1278 const char *shutdown_verb = NULL;
1279 dual_timestamp initrd_timestamp = { 0ULL, 0ULL };
1280 dual_timestamp userspace_timestamp = { 0ULL, 0ULL };
1281 dual_timestamp kernel_timestamp = { 0ULL, 0ULL };
1282 dual_timestamp security_start_timestamp = { 0ULL, 0ULL };
1283 dual_timestamp security_finish_timestamp = { 0ULL, 0ULL };
1284 static char systemd[] = "systemd";
1285 bool skip_setup = false;
1287 bool loaded_policy = false;
1288 bool arm_reboot_watchdog = false;
1289 bool queue_default_job = false;
1290 bool empty_etc = false;
1291 char *switch_root_dir = NULL, *switch_root_init = NULL;
1292 static struct rlimit saved_rlimit_nofile = { 0, 0 };
1294 #ifdef HAVE_SYSV_COMPAT
1295 if (getpid() != 1 && strstr(program_invocation_short_name, "init")) {
1296 /* This is compatibility support for SysV, where
1297 * calling init as a user is identical to telinit. */
1300 execv(SYSTEMCTL_BINARY_PATH, argv);
1301 log_error("Failed to exec " SYSTEMCTL_BINARY_PATH ": %m");
1306 dual_timestamp_from_monotonic(&kernel_timestamp, 0);
1307 dual_timestamp_get(&userspace_timestamp);
1309 /* Determine if this is a reexecution or normal bootup. We do
1310 * the full command line parsing much later, so let's just
1311 * have a quick peek here. */
1312 if (strv_find(argv+1, "--deserialize"))
1315 /* If we have switched root, do all the special setup
1317 if (strv_find(argv+1, "--switched-root"))
1320 /* If we get started via the /sbin/init symlink then we are
1321 called 'init'. After a subsequent reexecution we are then
1322 called 'systemd'. That is confusing, hence let's call us
1323 systemd right-away. */
1324 program_invocation_short_name = systemd;
1325 prctl(PR_SET_NAME, systemd);
1330 log_show_color(isatty(STDERR_FILENO) > 0);
1331 log_set_upgrade_syslog_to_journal(true);
1333 /* Disable the umask logic */
1337 if (getpid() == 1 && detect_container(NULL) <= 0) {
1339 /* Running outside of a container as PID 1 */
1340 arg_running_as = SYSTEMD_SYSTEM;
1342 log_set_target(LOG_TARGET_KMSG);
1346 initrd_timestamp = userspace_timestamp;
1349 mount_setup_early();
1350 dual_timestamp_get(&security_start_timestamp);
1351 if (selinux_setup(&loaded_policy) < 0)
1353 if (ima_setup() < 0)
1355 if (smack_setup(&loaded_policy) < 0)
1357 dual_timestamp_get(&security_finish_timestamp);
1360 if (label_init(NULL) < 0)
1364 if (clock_is_localtime() > 0) {
1368 * The very first call of settimeofday() also does a time warp in the kernel.
1370 * In the rtc-in-local time mode, we set the kernel's timezone, and rely on
1371 * external tools to take care of maintaining the RTC and do all adjustments.
1372 * This matches the behavior of Windows, which leaves the RTC alone if the
1373 * registry tells that the RTC runs in UTC.
1375 r = clock_set_timezone(&min);
1377 log_error("Failed to apply local time delta, ignoring: %s", strerror(-r));
1379 log_info("RTC configured in localtime, applying delta of %i minutes to system time.", min);
1380 } else if (!in_initrd()) {
1382 * Do a dummy very first call to seal the kernel's time warp magic.
1384 * Do not call this from inside the initrd. The initrd might not
1385 * carry /etc/adjtime with LOCAL, but the real system could be set up
1386 * that way. In such case, we need to delay the time-warp or the sealing
1387 * until we reach the real system.
1389 * Do not set the kernel's timezone. The concept of local time cannot
1390 * be supported reliably, the time will jump or be incorrect at every daylight
1391 * saving time change. All kernel local time concepts will be treated
1394 clock_reset_timewarp();
1398 /* Set the default for later on, but don't actually
1399 * open the logs like this for now. Note that if we
1400 * are transitioning from the initrd there might still
1401 * be journal fd open, and we shouldn't attempt
1402 * opening that before we parsed /proc/cmdline which
1403 * might redirect output elsewhere. */
1404 log_set_target(LOG_TARGET_JOURNAL_OR_KMSG);
1406 } else if (getpid() == 1) {
1407 /* Running inside a container, as PID 1 */
1408 arg_running_as = SYSTEMD_SYSTEM;
1409 log_set_target(LOG_TARGET_CONSOLE);
1410 log_close_console(); /* force reopen of /dev/console */
1413 /* For later on, see above... */
1414 log_set_target(LOG_TARGET_JOURNAL);
1416 /* clear the kernel timestamp,
1417 * because we are in a container */
1418 kernel_timestamp.monotonic = 0ULL;
1419 kernel_timestamp.realtime = 0ULL;
1422 /* Running as user instance */
1423 arg_running_as = SYSTEMD_USER;
1424 log_set_target(LOG_TARGET_AUTO);
1427 /* clear the kernel timestamp,
1428 * because we are not PID 1 */
1429 kernel_timestamp.monotonic = 0ULL;
1430 kernel_timestamp.realtime = 0ULL;
1433 /* Initialize default unit */
1434 r = set_default_unit(SPECIAL_DEFAULT_TARGET);
1436 log_error("Failed to set default unit %s: %s", SPECIAL_DEFAULT_TARGET, strerror(-r));
1440 r = initialize_join_controllers();
1444 /* Mount /proc, /sys and friends, so that /proc/cmdline and
1445 * /proc/$PID/fd is available. */
1446 if (getpid() == 1) {
1447 r = mount_setup(loaded_policy);
1452 /* Reset all signal handlers. */
1453 assert_se(reset_all_signal_handlers() == 0);
1455 ignore_signals(SIGNALS_IGNORE, -1);
1457 if (parse_config_file() < 0)
1460 if (arg_running_as == SYSTEMD_SYSTEM)
1461 if (parse_proc_cmdline(parse_proc_cmdline_item) < 0)
1464 log_parse_environment();
1466 if (parse_argv(argc, argv) < 0)
1469 if (arg_action == ACTION_TEST &&
1471 log_error("Don't run test mode as root.");
1475 if (arg_running_as == SYSTEMD_USER &&
1476 arg_action == ACTION_RUN &&
1478 log_error("Trying to run as user instance, but the system has not been booted with systemd.");
1482 if (arg_running_as == SYSTEMD_SYSTEM &&
1483 arg_action == ACTION_RUN &&
1484 running_in_chroot() > 0) {
1485 log_error("Cannot be run in a chroot() environment.");
1489 if (arg_action == ACTION_TEST)
1492 pager_open_if_enabled();
1494 if (arg_action == ACTION_HELP) {
1497 } else if (arg_action == ACTION_VERSION) {
1500 } else if (arg_action == ACTION_DUMP_CONFIGURATION_ITEMS) {
1501 unit_dump_config_items(stdout);
1502 retval = EXIT_SUCCESS;
1504 } else if (arg_action == ACTION_DONE) {
1505 retval = EXIT_SUCCESS;
1509 if (arg_running_as == SYSTEMD_USER &&
1510 !getenv("XDG_RUNTIME_DIR")) {
1511 log_error("Trying to run as user instance, but $XDG_RUNTIME_DIR is not set.");
1515 assert_se(arg_action == ACTION_RUN || arg_action == ACTION_TEST);
1517 /* Close logging fds, in order not to confuse fdset below */
1520 /* Remember open file descriptors for later deserialization */
1521 r = fdset_new_fill(&fds);
1523 log_error("Failed to allocate fd set: %s", strerror(-r));
1526 fdset_cloexec(fds, true);
1528 if (arg_serialization)
1529 assert_se(fdset_remove(fds, fileno(arg_serialization)) >= 0);
1531 if (arg_running_as == SYSTEMD_SYSTEM)
1532 /* Become a session leader if we aren't one yet. */
1535 /* Move out of the way, so that we won't block unmounts */
1536 assert_se(chdir("/") == 0);
1538 /* Reset the console, but only if this is really init and we
1539 * are freshly booted */
1540 if (arg_running_as == SYSTEMD_SYSTEM && arg_action == ACTION_RUN)
1541 console_setup(getpid() == 1 && !skip_setup);
1543 /* Open the logging devices, if possible and necessary */
1546 if (arg_show_status == _SHOW_STATUS_UNSET)
1547 arg_show_status = SHOW_STATUS_YES;
1549 /* Make sure we leave a core dump without panicking the
1551 if (getpid() == 1) {
1552 install_crash_handler();
1554 r = mount_cgroup_controllers(arg_join_controllers);
1559 if (arg_running_as == SYSTEMD_SYSTEM) {
1560 const char *virtualization = NULL;
1562 log_info(PACKAGE_STRING " running in %ssystem mode. (" SYSTEMD_FEATURES ")",
1563 arg_action == ACTION_TEST ? "test " : "" );
1565 detect_virtualization(&virtualization);
1567 log_info("Detected virtualization '%s'.", virtualization);
1569 write_container_id();
1571 log_info("Detected architecture '%s'.", architecture_to_string(uname_architecture()));
1574 log_info("Running in initial RAM disk.");
1576 /* Let's check whether /etc is already populated. We
1577 * don't actually really check for that, but use
1578 * /etc/machine-id as flag file. This allows container
1579 * managers and installers to provision a couple of
1580 * files already. If the container manager wants to
1581 * provision the machine ID itself it should pass
1582 * $container_uuid to PID 1.*/
1584 empty_etc = access("/etc/machine-id", F_OK) < 0;
1586 log_info("Running with unpopulated /etc.");
1588 _cleanup_free_ char *t;
1590 t = uid_to_name(getuid());
1591 log_debug(PACKAGE_STRING " running in %suser mode for user "UID_FMT"/%s. (" SYSTEMD_FEATURES ")",
1592 arg_action == ACTION_TEST ? " test" : "", getuid(), t);
1595 if (arg_running_as == SYSTEMD_SYSTEM && !skip_setup) {
1596 if (arg_show_status > 0 || plymouth_running())
1603 machine_id_setup(NULL);
1610 if (arg_running_as == SYSTEMD_SYSTEM && arg_runtime_watchdog > 0)
1611 watchdog_set_timeout(&arg_runtime_watchdog);
1613 if (arg_timer_slack_nsec != NSEC_INFINITY)
1614 if (prctl(PR_SET_TIMERSLACK, arg_timer_slack_nsec) < 0)
1615 log_error("Failed to adjust timer slack: %m");
1617 if (arg_capability_bounding_set_drop) {
1618 r = capability_bounding_set_drop_usermode(arg_capability_bounding_set_drop);
1620 log_error("Failed to drop capability bounding set of usermode helpers: %s", strerror(-r));
1623 r = capability_bounding_set_drop(arg_capability_bounding_set_drop, true);
1625 log_error("Failed to drop capability bounding set: %s", strerror(-r));
1630 if (arg_syscall_archs) {
1631 r = enforce_syscall_archs(arg_syscall_archs);
1636 if (arg_running_as == SYSTEMD_USER) {
1637 /* Become reaper of our children */
1638 if (prctl(PR_SET_CHILD_SUBREAPER, 1) < 0) {
1639 log_warning("Failed to make us a subreaper: %m");
1640 if (errno == EINVAL)
1641 log_info("Perhaps the kernel version is too old (< 3.4?)");
1645 if (arg_running_as == SYSTEMD_SYSTEM) {
1646 bump_rlimit_nofile(&saved_rlimit_nofile);
1649 r = unit_file_preset_all(UNIT_FILE_SYSTEM, false, NULL, UNIT_FILE_PRESET_FULL, false, NULL, 0);
1651 log_warning("Failed to populate /etc with preset unit settings, ignoring: %s", strerror(-r));
1653 log_info("Populated /etc with preset unit settings.");
1657 r = manager_new(arg_running_as, arg_action == ACTION_TEST, &m);
1659 log_error("Failed to allocate manager object: %s", strerror(-r));
1663 m->confirm_spawn = arg_confirm_spawn;
1664 m->default_timer_accuracy_usec = arg_default_timer_accuracy_usec;
1665 m->default_std_output = arg_default_std_output;
1666 m->default_std_error = arg_default_std_error;
1667 m->default_restart_usec = arg_default_restart_usec;
1668 m->default_timeout_start_usec = arg_default_timeout_start_usec;
1669 m->default_timeout_stop_usec = arg_default_timeout_stop_usec;
1670 m->default_start_limit_interval = arg_default_start_limit_interval;
1671 m->default_start_limit_burst = arg_default_start_limit_burst;
1672 m->default_cpu_accounting = arg_default_cpu_accounting;
1673 m->default_blockio_accounting = arg_default_blockio_accounting;
1674 m->default_memory_accounting = arg_default_memory_accounting;
1675 m->runtime_watchdog = arg_runtime_watchdog;
1676 m->shutdown_watchdog = arg_shutdown_watchdog;
1677 m->userspace_timestamp = userspace_timestamp;
1678 m->kernel_timestamp = kernel_timestamp;
1679 m->initrd_timestamp = initrd_timestamp;
1680 m->security_start_timestamp = security_start_timestamp;
1681 m->security_finish_timestamp = security_finish_timestamp;
1683 manager_set_default_rlimits(m, arg_default_rlimit);
1684 manager_environment_add(m, NULL, arg_default_environment);
1685 manager_set_show_status(m, arg_show_status);
1686 manager_set_first_boot(m, empty_etc);
1688 /* Remember whether we should queue the default job */
1689 queue_default_job = !arg_serialization || arg_switched_root;
1691 before_startup = now(CLOCK_MONOTONIC);
1693 r = manager_startup(m, arg_serialization, fds);
1695 log_error("Failed to fully start up daemon: %s", strerror(-r));
1697 /* This will close all file descriptors that were opened, but
1698 * not claimed by any unit. */
1702 if (arg_serialization) {
1703 fclose(arg_serialization);
1704 arg_serialization = NULL;
1707 if (queue_default_job) {
1708 _cleanup_bus_error_free_ sd_bus_error error = SD_BUS_ERROR_NULL;
1709 Unit *target = NULL;
1710 Job *default_unit_job;
1712 log_debug("Activating default unit: %s", arg_default_unit);
1714 r = manager_load_unit(m, arg_default_unit, NULL, &error, &target);
1716 log_error("Failed to load default target: %s", bus_error_message(&error, r));
1717 else if (target->load_state == UNIT_ERROR || target->load_state == UNIT_NOT_FOUND)
1718 log_error("Failed to load default target: %s", strerror(-target->load_error));
1719 else if (target->load_state == UNIT_MASKED)
1720 log_error("Default target masked.");
1722 if (!target || target->load_state != UNIT_LOADED) {
1723 log_info("Trying to load rescue target...");
1725 r = manager_load_unit(m, SPECIAL_RESCUE_TARGET, NULL, &error, &target);
1727 log_error("Failed to load rescue target: %s", bus_error_message(&error, r));
1729 } else if (target->load_state == UNIT_ERROR || target->load_state == UNIT_NOT_FOUND) {
1730 log_error("Failed to load rescue target: %s", strerror(-target->load_error));
1732 } else if (target->load_state == UNIT_MASKED) {
1733 log_error("Rescue target masked.");
1738 assert(target->load_state == UNIT_LOADED);
1740 if (arg_action == ACTION_TEST) {
1741 printf("-> By units:\n");
1742 manager_dump_units(m, stdout, "\t");
1745 r = manager_add_job(m, JOB_START, target, JOB_ISOLATE, false, &error, &default_unit_job);
1747 log_debug("Default target could not be isolated, starting instead: %s", bus_error_message(&error, r));
1749 r = manager_add_job(m, JOB_START, target, JOB_REPLACE, false, &error, &default_unit_job);
1751 log_error("Failed to start default target: %s", bus_error_message(&error, r));
1755 log_error("Failed to isolate default target: %s", bus_error_message(&error, r));
1759 m->default_unit_job_id = default_unit_job->id;
1761 after_startup = now(CLOCK_MONOTONIC);
1762 log_full(arg_action == ACTION_TEST ? LOG_INFO : LOG_DEBUG,
1763 "Loaded units and determined initial transaction in %s.",
1764 format_timespan(timespan, sizeof(timespan), after_startup - before_startup, 0));
1766 if (arg_action == ACTION_TEST) {
1767 printf("-> By jobs:\n");
1768 manager_dump_jobs(m, stdout, "\t");
1769 retval = EXIT_SUCCESS;
1775 r = manager_loop(m);
1777 log_error("Failed to run mainloop: %s", strerror(-r));
1781 switch (m->exit_code) {
1784 retval = EXIT_SUCCESS;
1788 case MANAGER_RELOAD:
1789 log_info("Reloading.");
1790 r = manager_reload(m);
1792 log_error("Failed to reload: %s", strerror(-r));
1795 case MANAGER_REEXECUTE:
1797 if (prepare_reexecute(m, &arg_serialization, &fds, false) < 0)
1801 log_notice("Reexecuting.");
1804 case MANAGER_SWITCH_ROOT:
1805 /* Steal the switch root parameters */
1806 switch_root_dir = m->switch_root;
1807 switch_root_init = m->switch_root_init;
1808 m->switch_root = m->switch_root_init = NULL;
1810 if (!switch_root_init)
1811 if (prepare_reexecute(m, &arg_serialization, &fds, true) < 0)
1815 log_notice("Switching root.");
1818 case MANAGER_REBOOT:
1819 case MANAGER_POWEROFF:
1821 case MANAGER_KEXEC: {
1822 static const char * const table[_MANAGER_EXIT_CODE_MAX] = {
1823 [MANAGER_REBOOT] = "reboot",
1824 [MANAGER_POWEROFF] = "poweroff",
1825 [MANAGER_HALT] = "halt",
1826 [MANAGER_KEXEC] = "kexec"
1829 assert_se(shutdown_verb = table[m->exit_code]);
1830 arm_reboot_watchdog = m->exit_code == MANAGER_REBOOT;
1832 log_notice("Shutting down.");
1837 assert_not_reached("Unknown exit code.");
1849 for (j = 0; j < ELEMENTSOF(arg_default_rlimit); j++) {
1850 free(arg_default_rlimit[j]);
1851 arg_default_rlimit[j] = NULL;
1854 free(arg_default_unit);
1855 arg_default_unit = NULL;
1857 free_join_controllers();
1859 strv_free(arg_default_environment);
1860 arg_default_environment = NULL;
1862 set_free(arg_syscall_archs);
1863 arg_syscall_archs = NULL;
1869 unsigned i, args_size;
1872 /* Close and disarm the watchdog, so that the new
1873 * instance can reinitialize it, but doesn't get
1874 * rebooted while we do that */
1875 watchdog_close(true);
1877 /* Reset the RLIMIT_NOFILE to the kernel default, so
1878 * that the new systemd can pass the kernel default to
1879 * its child processes */
1880 if (saved_rlimit_nofile.rlim_cur > 0)
1881 setrlimit(RLIMIT_NOFILE, &saved_rlimit_nofile);
1883 if (switch_root_dir) {
1884 /* Kill all remaining processes from the
1885 * initrd, but don't wait for them, so that we
1886 * can handle the SIGCHLD for them after
1888 broadcast_signal(SIGTERM, false, true);
1890 /* And switch root */
1891 r = switch_root(switch_root_dir);
1893 log_error("Failed to switch root, ignoring: %s", strerror(-r));
1896 args_size = MAX(6, argc+1);
1897 args = newa(const char*, args_size);
1899 if (!switch_root_init) {
1902 /* First try to spawn ourselves with the right
1903 * path, and with full serialization. We do
1904 * this only if the user didn't specify an
1905 * explicit init to spawn. */
1907 assert(arg_serialization);
1910 snprintf(sfd, sizeof(sfd), "%i", fileno(arg_serialization));
1914 args[i++] = SYSTEMD_BINARY_PATH;
1915 if (switch_root_dir)
1916 args[i++] = "--switched-root";
1917 args[i++] = arg_running_as == SYSTEMD_SYSTEM ? "--system" : "--user";
1918 args[i++] = "--deserialize";
1922 /* do not pass along the environment we inherit from the kernel or initrd */
1923 if (switch_root_dir)
1926 assert(i <= args_size);
1927 execv(args[0], (char* const*) args);
1930 /* Try the fallback, if there is any, without any
1931 * serialization. We pass the original argv[] and
1932 * envp[]. (Well, modulo the ordering changes due to
1933 * getopt() in argv[], and some cleanups in envp[],
1934 * but let's hope that doesn't matter.) */
1936 if (arg_serialization) {
1937 fclose(arg_serialization);
1938 arg_serialization = NULL;
1946 /* Reopen the console */
1947 make_console_stdio();
1949 for (j = 1, i = 1; j < (unsigned) argc; j++)
1950 args[i++] = argv[j];
1952 assert(i <= args_size);
1954 /* reenable any blocked signals, especially important
1955 * if we switch from initial ramdisk to init=... */
1956 reset_all_signal_handlers();
1958 assert_se(sigemptyset(&ss) == 0);
1959 assert_se(sigprocmask(SIG_SETMASK, &ss, NULL) == 0);
1961 if (switch_root_init) {
1962 args[0] = switch_root_init;
1963 execv(args[0], (char* const*) args);
1964 log_warning("Failed to execute configured init, trying fallback: %m");
1967 args[0] = "/sbin/init";
1968 execv(args[0], (char* const*) args);
1970 if (errno == ENOENT) {
1971 log_warning("No /sbin/init, trying fallback");
1973 args[0] = "/bin/sh";
1975 execv(args[0], (char* const*) args);
1976 log_error("Failed to execute /bin/sh, giving up: %m");
1978 log_warning("Failed to execute /sbin/init, giving up: %m");
1981 if (arg_serialization) {
1982 fclose(arg_serialization);
1983 arg_serialization = NULL;
1991 #ifdef HAVE_VALGRIND_VALGRIND_H
1992 /* If we are PID 1 and running under valgrind, then let's exit
1993 * here explicitly. valgrind will only generate nice output on
1994 * exit(), not on exec(), hence let's do the former not the
1996 if (getpid() == 1 && RUNNING_ON_VALGRIND)
2000 if (shutdown_verb) {
2001 char log_level[DECIMAL_STR_MAX(int) + 1];
2002 const char* command_line[9] = {
2003 SYSTEMD_SHUTDOWN_BINARY_PATH,
2005 "--log-level", log_level,
2009 _cleanup_strv_free_ char **env_block = NULL;
2011 assert(command_line[pos] == NULL);
2012 env_block = strv_copy(environ);
2014 snprintf(log_level, sizeof(log_level), "%d", log_get_max_level());
2016 switch (log_get_target()) {
2017 case LOG_TARGET_KMSG:
2018 case LOG_TARGET_JOURNAL_OR_KMSG:
2019 case LOG_TARGET_SYSLOG_OR_KMSG:
2020 command_line[pos++] = "kmsg";
2023 case LOG_TARGET_CONSOLE:
2025 command_line[pos++] = "console";
2029 if (log_get_show_color())
2030 command_line[pos++] = "--log-color";
2032 if (log_get_show_location())
2033 command_line[pos++] = "--log-location";
2035 assert(pos < ELEMENTSOF(command_line));
2037 if (arm_reboot_watchdog && arg_shutdown_watchdog > 0) {
2040 /* If we reboot let's set the shutdown
2041 * watchdog and tell the shutdown binary to
2042 * repeatedly ping it */
2043 watchdog_set_timeout(&arg_shutdown_watchdog);
2044 watchdog_close(false);
2046 /* Tell the binary how often to ping, ignore failure */
2047 if (asprintf(&e, "WATCHDOG_USEC="USEC_FMT, arg_shutdown_watchdog) > 0)
2048 strv_push(&env_block, e);
2050 watchdog_close(true);
2052 /* Avoid the creation of new processes forked by the
2053 * kernel; at this point, we will not listen to the
2055 if (detect_container(NULL) <= 0)
2056 cg_uninstall_release_agent(SYSTEMD_CGROUP_CONTROLLER);
2058 execve(SYSTEMD_SHUTDOWN_BINARY_PATH, (char **) command_line, env_block);
2059 log_error("Failed to execute shutdown binary, %s: %m",
2060 getpid() == 1 ? "freezing" : "quitting");