1 /*-*- Mode: C; c-basic-offset: 8; indent-tabs-mode: nil -*-*/
4 This file is part of systemd.
6 Copyright 2010 Lennart Poettering
8 systemd is free software; you can redistribute it and/or modify it
9 under the terms of the GNU Lesser General Public License as published by
10 the Free Software Foundation; either version 2.1 of the License, or
11 (at your option) any later version.
13 systemd is distributed in the hope that it will be useful, but
14 WITHOUT ANY WARRANTY; without even the implied warranty of
15 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
16 Lesser General Public License for more details.
18 You should have received a copy of the GNU Lesser General Public License
19 along with systemd; If not, see <http://www.gnu.org/licenses/>.
26 #include <sys/types.h>
32 #include <sys/prctl.h>
33 #include <sys/mount.h>
35 #ifdef HAVE_VALGRIND_VALGRIND_H
36 #include <valgrind/valgrind.h>
42 #include "sd-daemon.h"
43 #include "sd-messages.h"
47 #include "load-fragment.h"
50 #include "conf-parser.h"
57 #include "architecture.h"
59 #include "path-util.h"
60 #include "switch-root.h"
61 #include "capability.h"
64 #include "clock-util.h"
66 #include "dbus-manager.h"
67 #include "bus-error.h"
70 #include "mount-setup.h"
71 #include "loopback-setup.h"
72 #include "hostname-setup.h"
73 #include "machine-id-setup.h"
74 #include "selinux-setup.h"
75 #include "ima-setup.h"
76 #include "smack-setup.h"
78 #include "kmod-setup.h"
86 ACTION_DUMP_CONFIGURATION_ITEMS,
88 } arg_action = ACTION_RUN;
/* Process-wide settings of the manager. They start out with the defaults
 * below and are overridden, as visible in this file, by the "Manager"
 * section of the configuration file (parse_config_file()), by kernel
 * command line switches (parse_proc_cmdline_item()) and by command line
 * options (parse_argv()). */

/* Name of the unit to start by default; replaced via set_default_unit(). */
89 static char *arg_default_unit = NULL;
/* Whether we run as system or user instance; assigned in main() and parse_argv(). */
90 static SystemdRunningAs arg_running_as = _SYSTEMD_RUNNING_AS_INVALID;
/* Crash handling knobs, consulted by crash(). */
91 static bool arg_dump_core = true;
92 static bool arg_crash_shell = false;
93 static int arg_crash_chvt = -1;
94 static bool arg_confirm_spawn = false;
/* Stays _SHOW_STATUS_UNSET until configured; "quiet" on the kernel command
 * line only switches it to SHOW_STATUS_AUTO while it is still unset. */
95 static ShowStatus arg_show_status = _SHOW_STATUS_UNSET;
/* Set when --switched-root is passed. */
96 static bool arg_switched_root = false;
/* NULL-terminated array of string vectors, see initialize_join_controllers()
 * and config_parse_join_controllers(). */
97 static char ***arg_join_controllers = NULL;
/* Defaults exposed as Default*= settings in the "Manager" section. */
98 static ExecOutput arg_default_std_output = EXEC_OUTPUT_JOURNAL;
99 static ExecOutput arg_default_std_error = EXEC_OUTPUT_INHERIT;
100 static usec_t arg_default_restart_usec = DEFAULT_RESTART_USEC;
101 static usec_t arg_default_timeout_start_usec = DEFAULT_TIMEOUT_USEC;
102 static usec_t arg_default_timeout_stop_usec = DEFAULT_TIMEOUT_USEC;
103 static usec_t arg_default_start_limit_interval = DEFAULT_START_LIMIT_INTERVAL;
104 static unsigned arg_default_start_limit_burst = DEFAULT_START_LIMIT_BURST;
/* RuntimeWatchdogSec= / ShutdownWatchdogSec= */
105 static usec_t arg_runtime_watchdog = 0;
106 static usec_t arg_shutdown_watchdog = 10 * USEC_PER_MINUTE;
/* DefaultEnvironment=, also extended by systemd.setenv= on the kernel command line. */
107 static char **arg_default_environment = NULL;
/* DefaultLimit*= settings, indexed by RLIMIT_* constant; NULL means not configured. */
108 static struct rlimit *arg_default_rlimit[_RLIMIT_MAX] = {};
/* CapabilityBoundingSet= */
109 static uint64_t arg_capability_bounding_set_drop = 0;
/* TimerSlackNSec= */
110 static nsec_t arg_timer_slack_nsec = (nsec_t) -1;
/* DefaultTimerAccuracySec= */
111 static usec_t arg_default_timer_accuracy_usec = 1 * USEC_PER_MINUTE;
/* SystemCallArchitectures=, iterated by enforce_syscall_archs(). */
112 static Set* arg_syscall_archs = NULL;
/* Stream opened for the fd passed with --deserialize. */
113 static FILE* arg_serialization = NULL;
/* Default*Accounting= settings. */
114 static bool arg_default_cpu_accounting = false;
115 static bool arg_default_blockio_accounting = false;
116 static bool arg_default_memory_accounting = false;
/* Signal handler that intentionally does nothing. crash() installs it for
 * SIGCHLD so that the signal is enabled while waiting for the core dump
 * child. */
118 static void nop_handler(int sig) {}
120 noreturn static void crash(int sig) {
123 /* Pass this on immediately, if this is not PID 1 */
125 else if (!arg_dump_core)
126 log_error("Caught <%s>, not dumping core.", signal_to_string(sig));
128 struct sigaction sa = {
129 .sa_handler = nop_handler,
130 .sa_flags = SA_NOCLDSTOP|SA_RESTART,
134 /* We want to wait for the core process, hence let's enable SIGCHLD */
135 sigaction(SIGCHLD, &sa, NULL);
139 log_error("Caught <%s>, cannot fork for core dump: %m", signal_to_string(sig));
142 struct rlimit rl = {};
144 /* Enable default signal handler for core dump */
146 sa.sa_handler = SIG_DFL;
147 sigaction(sig, &sa, NULL);
149 /* Don't limit the core dump size */
150 rl.rlim_cur = RLIM_INFINITY;
151 rl.rlim_max = RLIM_INFINITY;
152 setrlimit(RLIMIT_CORE, &rl);
154 /* Just to be sure... */
157 /* Raise the signal again */
160 assert_not_reached("We shouldn't be here...");
167 /* Order things nicely. */
168 r = wait_for_terminate(pid, &status);
170 log_error("Caught <%s>, waitpid() failed: %s", signal_to_string(sig), strerror(-r));
171 else if (status.si_code != CLD_DUMPED)
172 log_error("Caught <%s>, core dump failed.", signal_to_string(sig));
174 log_error("Caught <%s>, dumped core as pid "PID_FMT".", signal_to_string(sig), pid);
179 chvt(arg_crash_chvt);
181 if (arg_crash_shell) {
182 struct sigaction sa = {
183 .sa_handler = SIG_IGN,
184 .sa_flags = SA_NOCLDSTOP|SA_NOCLDWAIT|SA_RESTART,
188 log_info("Executing crash shell in 10s...");
191 /* Let the kernel reap children for us */
192 assert_se(sigaction(SIGCHLD, &sa, NULL) == 0);
196 log_error("Failed to fork off crash shell: %m");
198 make_console_stdio();
199 execl("/bin/sh", "/bin/sh", NULL);
201 log_error("execl() failed: %m");
205 log_info("Successfully spawned crash shell as pid "PID_FMT".", pid);
208 log_info("Freezing execution.");
212 static void install_crash_handler(void) {
213 struct sigaction sa = {
215 .sa_flags = SA_NODEFER,
218 sigaction_many(&sa, SIGNALS_CRASH_HANDLER, -1);
221 static int console_setup(bool do_reset) {
224 /* If we are init, we connect stdin/stdout/stderr to /dev/null
225 * and make sure we don't have a controlling tty. */
232 tty_fd = open_terminal("/dev/console", O_WRONLY|O_NOCTTY|O_CLOEXEC);
234 log_error("Failed to open /dev/console: %s", strerror(-tty_fd));
238 /* We don't want to force text mode.
239 * plymouth may be showing pictures already from initrd. */
240 r = reset_terminal_fd(tty_fd, false);
242 log_error("Failed to reset /dev/console: %s", strerror(-r));
248 static int set_default_unit(const char *u) {
257 free(arg_default_unit);
258 arg_default_unit = c;
263 static int parse_proc_cmdline_item(const char *key, const char *value) {
265 static const char * const rlmap[] = {
266 "emergency", SPECIAL_EMERGENCY_TARGET,
267 "-b", SPECIAL_EMERGENCY_TARGET,
268 "single", SPECIAL_RESCUE_TARGET,
269 "-s", SPECIAL_RESCUE_TARGET,
270 "s", SPECIAL_RESCUE_TARGET,
271 "S", SPECIAL_RESCUE_TARGET,
272 "1", SPECIAL_RESCUE_TARGET,
273 "2", SPECIAL_RUNLEVEL2_TARGET,
274 "3", SPECIAL_RUNLEVEL3_TARGET,
275 "4", SPECIAL_RUNLEVEL4_TARGET,
276 "5", SPECIAL_RUNLEVEL5_TARGET,
282 if (streq(key, "systemd.unit") && value) {
285 return set_default_unit(value);
287 } else if (streq(key, "rd.systemd.unit") && value) {
289 return set_default_unit(value);
291 } else if (streq(key, "systemd.log_target") && value) {
293 if (log_set_target_from_string(value) < 0)
294 log_warning("Failed to parse log target %s. Ignoring.", value);
296 } else if (streq(key, "systemd.log_level") && value) {
298 if (log_set_max_level_from_string(value) < 0)
299 log_warning("Failed to parse log level %s. Ignoring.", value);
301 } else if (streq(key, "systemd.log_color") && value) {
303 if (log_show_color_from_string(value) < 0)
304 log_warning("Failed to parse log color setting %s. Ignoring.", value);
306 } else if (streq(key, "systemd.log_location") && value) {
308 if (log_show_location_from_string(value) < 0)
309 log_warning("Failed to parse log location setting %s. Ignoring.", value);
311 } else if (streq(key, "systemd.dump_core") && value) {
313 r = parse_boolean(value);
315 log_warning("Failed to parse dump core switch %s. Ignoring.", value);
319 } else if (streq(key, "systemd.crash_shell") && value) {
321 r = parse_boolean(value);
323 log_warning("Failed to parse crash shell switch %s. Ignoring.", value);
327 } else if (streq(key, "systemd.crash_chvt") && value) {
329 if (safe_atoi(value, &r) < 0)
330 log_warning("Failed to parse crash chvt switch %s. Ignoring.", value);
334 } else if (streq(key, "systemd.confirm_spawn") && value) {
336 r = parse_boolean(value);
338 log_warning("Failed to parse confirm spawn switch %s. Ignoring.", value);
340 arg_confirm_spawn = r;
342 } else if (streq(key, "systemd.show_status") && value) {
344 r = parse_show_status(value, &arg_show_status);
346 log_warning("Failed to parse show status switch %s. Ignoring.", value);
348 } else if (streq(key, "systemd.default_standard_output") && value) {
350 r = exec_output_from_string(value);
352 log_warning("Failed to parse default standard output switch %s. Ignoring.", value);
354 arg_default_std_output = r;
356 } else if (streq(key, "systemd.default_standard_error") && value) {
358 r = exec_output_from_string(value);
360 log_warning("Failed to parse default standard error switch %s. Ignoring.", value);
362 arg_default_std_error = r;
364 } else if (streq(key, "systemd.setenv") && value) {
366 if (env_assignment_is_valid(value)) {
369 env = strv_env_set(arg_default_environment, value);
371 arg_default_environment = env;
373 log_warning("Setting environment variable '%s' failed, ignoring: %s", value, strerror(ENOMEM));
375 log_warning("Environment variable name '%s' is not valid. Ignoring.", value);
377 } else if (!streq(key, "systemd.restore_state") &&
378 !streq(key, "systemd.gpt_auto") &&
379 (startswith(key, "systemd.") || startswith(key, "rd.systemd."))) {
383 /* Ignore systemd.journald.xyz and friends */
385 if (startswith(c, "rd."))
387 if (startswith(c, "systemd."))
389 if (c[strcspn(c, ".=")] != '.') {
391 log_warning("Unknown kernel switch %s. Ignoring.", key);
393 log_info("Supported kernel switches:\n"
394 "systemd.unit=UNIT Default unit to start\n"
395 "rd.systemd.unit=UNIT Default unit to start when run in initrd\n"
396 "systemd.dump_core=0|1 Dump core on crash\n"
397 "systemd.crash_shell=0|1 Run shell on crash\n"
398 "systemd.crash_chvt=N Change to VT #N on crash\n"
399 "systemd.confirm_spawn=0|1 Confirm every process spawn\n"
400 "systemd.show_status=0|1|auto Show status updates on the console during bootup\n"
401 "systemd.log_target=console|kmsg|journal|journal-or-kmsg|syslog|syslog-or-kmsg|null\n"
403 "systemd.log_level=LEVEL Log level\n"
404 "systemd.log_color=0|1 Highlight important log messages\n"
405 "systemd.log_location=0|1 Include code location in log messages\n"
406 "systemd.default_standard_output=null|tty|syslog|syslog+console|kmsg|kmsg+console|journal|journal+console\n"
407 " Set default log output for services\n"
408 "systemd.default_standard_error=null|tty|syslog|syslog+console|kmsg|kmsg+console|journal|journal+console\n"
409 " Set default log error output for services\n"
410 "systemd.setenv=ASSIGNMENT Set an environment variable for all spawned processes\n"
411 "systemd.restore_state=0|1 Restore backlight/rfkill state at boot\n");
414 } else if (streq(key, "quiet") && !value) {
415 if (arg_show_status == _SHOW_STATUS_UNSET)
416 arg_show_status = SHOW_STATUS_AUTO;
418 } else if (streq(key, "debug") && !value) {
419 log_set_max_level(LOG_DEBUG);
420 if (detect_container(NULL) > 0)
421 log_set_target(LOG_TARGET_CONSOLE);
423 } else if (!in_initrd() && !value) {
426 /* SysV compatibility */
427 for (i = 0; i < ELEMENTSOF(rlmap); i += 2)
428 if (streq(key, rlmap[i]))
429 return set_default_unit(rlmap[i+1]);
435 #define DEFINE_SETTER(name, func, descr) \
436 static int name(const char *unit, \
437 const char *filename, \
439 const char *section, \
440 unsigned section_line, \
441 const char *lvalue, \
443 const char *rvalue, \
455 log_syntax(unit, LOG_ERR, filename, line, -r, \
456 "Invalid " descr "'%s': %s", \
457 rvalue, strerror(-r)); \
/* Instantiate the configuration parser callbacks for the logging settings.
 * Each one wraps the named log_*_from_string() function; they are hooked up
 * to LogLevel=, LogTarget=, LogColor= and LogLocation= in the item table of
 * parse_config_file(). The third argument is the description used in the
 * "Invalid ..." syntax error message. */
462 DEFINE_SETTER(config_parse_level2, log_set_max_level_from_string, "log level")
463 DEFINE_SETTER(config_parse_target, log_set_target_from_string, "target")
464 DEFINE_SETTER(config_parse_color, log_show_color_from_string, "color" )
465 DEFINE_SETTER(config_parse_location, log_show_location_from_string, "location")
467 static int config_parse_cpu_affinity2(
469 const char *filename,
472 unsigned section_line,
489 FOREACH_WORD_QUOTED(w, l, rvalue, state) {
494 if (!(t = strndup(w, l)))
497 r = safe_atou(t, &cpu);
501 if (!(c = cpu_set_malloc(&ncpus)))
504 if (r < 0 || cpu >= ncpus) {
505 log_syntax(unit, LOG_ERR, filename, line, -r,
506 "Failed to parse CPU affinity '%s'", rvalue);
511 CPU_SET_S(cpu, CPU_ALLOC_SIZE(ncpus), c);
515 if (sched_setaffinity(0, CPU_ALLOC_SIZE(ncpus), c) < 0)
516 log_warning_unit(unit, "Failed to set CPU affinity: %m");
524 static int config_parse_show_status(
526 const char *filename,
529 unsigned section_line,
537 ShowStatus *b = data;
544 k = parse_show_status(rvalue, b);
546 log_syntax(unit, LOG_ERR, filename, line, -k,
547 "Failed to parse show status setting, ignoring: %s", rvalue);
554 static void strv_free_free(char ***l) {
566 static void free_join_controllers(void) {
567 strv_free_free(arg_join_controllers);
568 arg_join_controllers = NULL;
571 static int config_parse_join_controllers(const char *unit,
572 const char *filename,
575 unsigned section_line,
590 free_join_controllers();
592 FOREACH_WORD_QUOTED(w, length, rvalue, state) {
595 s = strndup(w, length);
599 l = strv_split(s, ",");
604 if (strv_length(l) <= 1) {
609 if (!arg_join_controllers) {
610 arg_join_controllers = new(char**, 2);
611 if (!arg_join_controllers) {
616 arg_join_controllers[0] = l;
617 arg_join_controllers[1] = NULL;
624 t = new0(char**, n+2);
632 for (a = arg_join_controllers; *a; a++) {
634 if (strv_overlap(*a, l)) {
635 if (strv_extend_strv(&l, *a) < 0) {
655 t[n++] = strv_uniq(l);
657 strv_free_free(arg_join_controllers);
658 arg_join_controllers = t;
665 static int parse_config_file(void) {
667 const ConfigTableItem items[] = {
668 { "Manager", "LogLevel", config_parse_level2, 0, NULL },
669 { "Manager", "LogTarget", config_parse_target, 0, NULL },
670 { "Manager", "LogColor", config_parse_color, 0, NULL },
671 { "Manager", "LogLocation", config_parse_location, 0, NULL },
672 { "Manager", "DumpCore", config_parse_bool, 0, &arg_dump_core },
673 { "Manager", "CrashShell", config_parse_bool, 0, &arg_crash_shell },
674 { "Manager", "ShowStatus", config_parse_show_status, 0, &arg_show_status },
675 { "Manager", "CrashChVT", config_parse_int, 0, &arg_crash_chvt },
676 { "Manager", "CPUAffinity", config_parse_cpu_affinity2, 0, NULL },
677 { "Manager", "JoinControllers", config_parse_join_controllers, 0, &arg_join_controllers },
678 { "Manager", "RuntimeWatchdogSec", config_parse_sec, 0, &arg_runtime_watchdog },
679 { "Manager", "ShutdownWatchdogSec", config_parse_sec, 0, &arg_shutdown_watchdog },
680 { "Manager", "CapabilityBoundingSet", config_parse_bounding_set, 0, &arg_capability_bounding_set_drop },
682 { "Manager", "SystemCallArchitectures", config_parse_syscall_archs, 0, &arg_syscall_archs },
684 { "Manager", "TimerSlackNSec", config_parse_nsec, 0, &arg_timer_slack_nsec },
685 { "Manager", "DefaultTimerAccuracySec", config_parse_sec, 0, &arg_default_timer_accuracy_usec },
686 { "Manager", "DefaultStandardOutput", config_parse_output, 0, &arg_default_std_output },
687 { "Manager", "DefaultStandardError", config_parse_output, 0, &arg_default_std_error },
688 { "Manager", "DefaultTimeoutStartSec", config_parse_sec, 0, &arg_default_timeout_start_usec },
689 { "Manager", "DefaultTimeoutStopSec", config_parse_sec, 0, &arg_default_timeout_stop_usec },
690 { "Manager", "DefaultRestartSec", config_parse_sec, 0, &arg_default_restart_usec },
691 { "Manager", "DefaultStartLimitInterval", config_parse_sec, 0, &arg_default_start_limit_interval },
692 { "Manager", "DefaultStartLimitBurst", config_parse_unsigned, 0, &arg_default_start_limit_burst },
693 { "Manager", "DefaultEnvironment", config_parse_environ, 0, &arg_default_environment },
694 { "Manager", "DefaultLimitCPU", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_CPU] },
695 { "Manager", "DefaultLimitFSIZE", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_FSIZE] },
696 { "Manager", "DefaultLimitDATA", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_DATA] },
697 { "Manager", "DefaultLimitSTACK", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_STACK] },
698 { "Manager", "DefaultLimitCORE", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_CORE] },
699 { "Manager", "DefaultLimitRSS", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_RSS] },
700 { "Manager", "DefaultLimitNOFILE", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_NOFILE] },
701 { "Manager", "DefaultLimitAS", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_AS] },
702 { "Manager", "DefaultLimitNPROC", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_NPROC] },
703 { "Manager", "DefaultLimitMEMLOCK", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_MEMLOCK] },
704 { "Manager", "DefaultLimitLOCKS", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_LOCKS] },
705 { "Manager", "DefaultLimitSIGPENDING", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_SIGPENDING] },
706 { "Manager", "DefaultLimitMSGQUEUE", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_MSGQUEUE] },
707 { "Manager", "DefaultLimitNICE", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_NICE] },
708 { "Manager", "DefaultLimitRTPRIO", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_RTPRIO] },
709 { "Manager", "DefaultLimitRTTIME", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_RTTIME] },
710 { "Manager", "DefaultCPUAccounting", config_parse_bool, 0, &arg_default_cpu_accounting },
711 { "Manager", "DefaultBlockIOAccounting", config_parse_bool, 0, &arg_default_blockio_accounting },
712 { "Manager", "DefaultMemoryAccounting", config_parse_bool, 0, &arg_default_memory_accounting },
716 _cleanup_fclose_ FILE *f;
720 fn = arg_running_as == SYSTEMD_SYSTEM ? PKGSYSCONFDIR "/system.conf" : PKGSYSCONFDIR "/user.conf";
726 log_warning("Failed to open configuration file '%s': %m", fn);
730 r = config_parse(NULL, fn, f, "Manager\0", config_item_table_lookup, (void*) items, false, false, NULL);
732 log_warning("Failed to parse configuration file: %s", strerror(-r));
737 static int parse_argv(int argc, char *argv[]) {
740 ARG_LOG_LEVEL = 0x100,
749 ARG_DUMP_CONFIGURATION_ITEMS,
756 ARG_DEFAULT_STD_OUTPUT,
757 ARG_DEFAULT_STD_ERROR
760 static const struct option options[] = {
761 { "log-level", required_argument, NULL, ARG_LOG_LEVEL },
762 { "log-target", required_argument, NULL, ARG_LOG_TARGET },
763 { "log-color", optional_argument, NULL, ARG_LOG_COLOR },
764 { "log-location", optional_argument, NULL, ARG_LOG_LOCATION },
765 { "unit", required_argument, NULL, ARG_UNIT },
766 { "system", no_argument, NULL, ARG_SYSTEM },
767 { "user", no_argument, NULL, ARG_USER },
768 { "test", no_argument, NULL, ARG_TEST },
769 { "help", no_argument, NULL, 'h' },
770 { "version", no_argument, NULL, ARG_VERSION },
771 { "dump-configuration-items", no_argument, NULL, ARG_DUMP_CONFIGURATION_ITEMS },
772 { "dump-core", optional_argument, NULL, ARG_DUMP_CORE },
773 { "crash-shell", optional_argument, NULL, ARG_CRASH_SHELL },
774 { "confirm-spawn", optional_argument, NULL, ARG_CONFIRM_SPAWN },
775 { "show-status", optional_argument, NULL, ARG_SHOW_STATUS },
776 { "deserialize", required_argument, NULL, ARG_DESERIALIZE },
777 { "switched-root", no_argument, NULL, ARG_SWITCHED_ROOT },
778 { "default-standard-output", required_argument, NULL, ARG_DEFAULT_STD_OUTPUT, },
779 { "default-standard-error", required_argument, NULL, ARG_DEFAULT_STD_ERROR, },
791 while ((c = getopt_long(argc, argv, "hDbsz:", options, NULL)) >= 0)
796 r = log_set_max_level_from_string(optarg);
798 log_error("Failed to parse log level %s.", optarg);
805 r = log_set_target_from_string(optarg);
807 log_error("Failed to parse log target %s.", optarg);
816 r = log_show_color_from_string(optarg);
818 log_error("Failed to parse log color setting %s.", optarg);
822 log_show_color(true);
826 case ARG_LOG_LOCATION:
828 r = log_show_location_from_string(optarg);
830 log_error("Failed to parse log location setting %s.", optarg);
834 log_show_location(true);
838 case ARG_DEFAULT_STD_OUTPUT:
839 r = exec_output_from_string(optarg);
841 log_error("Failed to parse default standard output setting %s.", optarg);
844 arg_default_std_output = r;
847 case ARG_DEFAULT_STD_ERROR:
848 r = exec_output_from_string(optarg);
850 log_error("Failed to parse default standard error output setting %s.", optarg);
853 arg_default_std_error = r;
858 r = set_default_unit(optarg);
860 log_error("Failed to set default unit %s: %s", optarg, strerror(-r));
867 arg_running_as = SYSTEMD_SYSTEM;
871 arg_running_as = SYSTEMD_USER;
875 arg_action = ACTION_TEST;
879 arg_action = ACTION_VERSION;
882 case ARG_DUMP_CONFIGURATION_ITEMS:
883 arg_action = ACTION_DUMP_CONFIGURATION_ITEMS;
887 r = optarg ? parse_boolean(optarg) : 1;
889 log_error("Failed to parse dump core boolean %s.", optarg);
895 case ARG_CRASH_SHELL:
896 r = optarg ? parse_boolean(optarg) : 1;
898 log_error("Failed to parse crash shell boolean %s.", optarg);
904 case ARG_CONFIRM_SPAWN:
905 r = optarg ? parse_boolean(optarg) : 1;
907 log_error("Failed to parse confirm spawn boolean %s.", optarg);
910 arg_confirm_spawn = r;
913 case ARG_SHOW_STATUS:
915 r = parse_show_status(optarg, &arg_show_status);
917 log_error("Failed to parse show status boolean %s.", optarg);
921 arg_show_status = SHOW_STATUS_YES;
924 case ARG_DESERIALIZE: {
928 r = safe_atoi(optarg, &fd);
929 if (r < 0 || fd < 0) {
930 log_error("Failed to parse deserialize option %s.", optarg);
931 return r < 0 ? r : -EINVAL;
934 fd_cloexec(fd, true);
938 log_error("Failed to open serialization fd: %m");
942 if (arg_serialization)
943 fclose(arg_serialization);
945 arg_serialization = f;
950 case ARG_SWITCHED_ROOT:
951 arg_switched_root = true;
955 arg_action = ACTION_HELP;
959 log_set_max_level(LOG_DEBUG);
965 /* Just to eat away the sysvinit kernel
966 * cmdline args without getopt() error
967 * messages that we'll parse in
968 * parse_proc_cmdline_item() or ignore. */
973 log_error("Unknown option code %c", c);
980 if (optind < argc && getpid() != 1) {
981 /* Hmm, when we aren't run as init system
982 * let's complain about excess arguments */
984 log_error("Excess arguments.");
988 if (detect_container(NULL) > 0) {
991 /* All /proc/cmdline arguments the kernel didn't
992 * understand it passed to us. We're not really
993 * interested in that usually since /proc/cmdline is
994 * more interesting and complete. With one exception:
995 * if we are run in a container /proc/cmdline is not
996 * relevant for the container, hence we rely on argv[]
999 for (a = argv; a < argv + argc; a++) {
1000 _cleanup_free_ char *w;
1007 value = strchr(w, '=');
1011 r = parse_proc_cmdline_item(w, value);
1013 log_error("Failed on cmdline argument %s: %s", *a, strerror(-r));
1022 static int help(void) {
1024 printf("%s [OPTIONS...]\n\n"
1025 "Starts up and maintains the system or user services.\n\n"
1026 " -h --help Show this help\n"
1027 " --test Determine startup sequence, dump it and exit\n"
1028 " --dump-configuration-items Dump understood unit configuration items\n"
1029 " --unit=UNIT Set default unit\n"
1030 " --system Run a system instance, even if PID != 1\n"
1031 " --user Run a user instance\n"
1032 " --dump-core[=0|1] Dump core on crash\n"
1033 " --crash-shell[=0|1] Run shell on crash\n"
1034 " --confirm-spawn[=0|1] Ask for confirmation when spawning processes\n"
1035 " --show-status[=0|1] Show status updates on the console during bootup\n"
1036 " --log-target=TARGET Set log target (console, journal, syslog, kmsg, journal-or-kmsg, syslog-or-kmsg, null)\n"
1037 " --log-level=LEVEL Set log level (debug, info, notice, warning, err, crit, alert, emerg)\n"
1038 " --log-color[=0|1] Highlight important log messages\n"
1039 " --log-location[=0|1] Include code location in log messages\n"
1040 " --default-standard-output= Set default standard output for services\n"
1041 " --default-standard-error= Set default standard error output for services\n",
1042 program_invocation_short_name);
1047 static int version(void) {
1048 puts(PACKAGE_STRING);
1049 puts(SYSTEMD_FEATURES);
1054 static int prepare_reexecute(Manager *m, FILE **_f, FDSet **_fds, bool switching_root) {
1063 r = manager_open_serialization(m, &f);
1065 log_error("Failed to create serialization file: %s", strerror(-r));
1069 /* Make sure nothing is really destructed when we shut down */
1071 bus_manager_send_reloading(m, true);
1076 log_error("Failed to allocate fd set: %s", strerror(-r));
1080 r = manager_serialize(m, f, fds, switching_root);
1082 log_error("Failed to serialize state: %s", strerror(-r));
1086 if (fseeko(f, 0, SEEK_SET) < 0) {
1087 log_error("Failed to rewind serialization fd: %m");
1091 r = fd_cloexec(fileno(f), false);
1093 log_error("Failed to disable O_CLOEXEC for serialization: %s", strerror(-r));
1097 r = fdset_cloexec(fds, false);
1099 log_error("Failed to disable O_CLOEXEC for serialization fds: %s", strerror(-r));
1117 static int bump_rlimit_nofile(struct rlimit *saved_rlimit) {
1121 assert(saved_rlimit);
1123 /* Save the original RLIMIT_NOFILE so that we can reset it
1124 * later when transitioning from the initrd to the main
1125 * systemd or suchlike. */
1126 if (getrlimit(RLIMIT_NOFILE, saved_rlimit) < 0) {
1127 log_error("Reading RLIMIT_NOFILE failed: %m");
1131 /* Make sure forked processes get the default kernel setting */
1132 if (!arg_default_rlimit[RLIMIT_NOFILE]) {
1135 rl = newdup(struct rlimit, saved_rlimit, 1);
1139 arg_default_rlimit[RLIMIT_NOFILE] = rl;
1142 /* Bump up the resource limit for ourselves substantially */
1143 nl.rlim_cur = nl.rlim_max = 64*1024;
1144 r = setrlimit_closest(RLIMIT_NOFILE, &nl);
1146 log_error("Setting RLIMIT_NOFILE failed: %s", strerror(-r));
1153 static void test_mtab(void) {
1155 static const char ok[] =
1156 "/proc/self/mounts\0"
1158 "../proc/self/mounts\0"
1161 _cleanup_free_ char *p = NULL;
1164 /* Check that /etc/mtab is a symlink to the right place or
1165 * non-existing. But certainly not a file, or a symlink to
1166 * some weird place... */
1168 r = readlink_malloc("/etc/mtab", &p);
1171 if (r >= 0 && nulstr_contains(ok, p))
1174 log_warning("/etc/mtab is not a symlink or not pointing to /proc/self/mounts. "
1175 "This is not supported anymore. "
1176 "Please make sure to replace this file by a symlink to avoid incorrect or misleading mount(8) output.");
1179 static void test_usr(void) {
1181 /* Check that /usr is not a separate fs */
1183 if (dir_is_empty("/usr") <= 0)
1186 log_warning("/usr appears to be on its own filesytem and is not already mounted. This is not a supported setup. "
1187 "Some things will probably break (sometimes even silently) in mysterious ways. "
1188 "Consult http://freedesktop.org/wiki/Software/systemd/separate-usr-is-broken for more information.");
1191 static int initialize_join_controllers(void) {
1192 /* By default, mount "cpu" + "cpuacct" together, and "net_cls"
1193 * + "net_prio". We'd like to add "cpuset" to the mix, but
1194 * "cpuset" doesn't really work for groups with no initialized
1197 arg_join_controllers = new(char**, 3);
1198 if (!arg_join_controllers)
1201 arg_join_controllers[0] = strv_new("cpu", "cpuacct", NULL);
1202 arg_join_controllers[1] = strv_new("net_cls", "net_prio", NULL);
1203 arg_join_controllers[2] = NULL;
1205 if (!arg_join_controllers[0] || !arg_join_controllers[1]) {
1206 free_join_controllers();
1213 static int enforce_syscall_archs(Set *archs) {
1215 scmp_filter_ctx *seccomp;
1220 seccomp = seccomp_init(SCMP_ACT_ALLOW);
1224 SET_FOREACH(id, arg_syscall_archs, i) {
1225 r = seccomp_arch_add(seccomp, PTR_TO_UINT32(id) - 1);
1229 log_error("Failed to add architecture to seccomp: %s", strerror(-r));
1234 r = seccomp_attr_set(seccomp, SCMP_FLTATR_CTL_NNP, 0);
1236 log_error("Failed to unset NO_NEW_PRIVS: %s", strerror(-r));
1240 r = seccomp_load(seccomp);
1242 log_error("Failed to add install architecture seccomp: %s", strerror(-r));
1245 seccomp_release(seccomp);
1252 static int status_welcome(void) {
1253 _cleanup_free_ char *pretty_name = NULL, *ansi_color = NULL;
1256 r = parse_env_file("/etc/os-release", NEWLINE,
1257 "PRETTY_NAME", &pretty_name,
1258 "ANSI_COLOR", &ansi_color,
1261 r = parse_env_file("/usr/lib/os-release", NEWLINE,
1262 "PRETTY_NAME", &pretty_name,
1263 "ANSI_COLOR", &ansi_color,
1267 if (r < 0 && r != -ENOENT)
1268 log_warning("Failed to read os-release file: %s", strerror(-r));
1270 return status_printf(NULL, false, false,
1271 "\nWelcome to \x1B[%sm%s\x1B[0m!\n",
1272 isempty(ansi_color) ? "1" : ansi_color,
1273 isempty(pretty_name) ? "Linux" : pretty_name);
1276 static int write_container_id(void) {
1279 c = getenv("container");
1283 return write_string_file("/run/systemd/container", c);
1286 int main(int argc, char *argv[]) {
1288 int r, retval = EXIT_FAILURE;
1289 usec_t before_startup, after_startup;
1290 char timespan[FORMAT_TIMESPAN_MAX];
1292 bool reexecute = false;
1293 const char *shutdown_verb = NULL;
1294 dual_timestamp initrd_timestamp = { 0ULL, 0ULL };
1295 dual_timestamp userspace_timestamp = { 0ULL, 0ULL };
1296 dual_timestamp kernel_timestamp = { 0ULL, 0ULL };
1297 dual_timestamp security_start_timestamp = { 0ULL, 0ULL };
1298 dual_timestamp security_finish_timestamp = { 0ULL, 0ULL };
1299 static char systemd[] = "systemd";
1300 bool skip_setup = false;
1302 bool loaded_policy = false;
1303 bool arm_reboot_watchdog = false;
1304 bool queue_default_job = false;
1305 char *switch_root_dir = NULL, *switch_root_init = NULL;
1306 static struct rlimit saved_rlimit_nofile = { 0, 0 };
1308 #ifdef HAVE_SYSV_COMPAT
1309 if (getpid() != 1 && strstr(program_invocation_short_name, "init")) {
1310 /* This is compatibility support for SysV, where
1311 * calling init as a user is identical to telinit. */
1314 execv(SYSTEMCTL_BINARY_PATH, argv);
1315 log_error("Failed to exec " SYSTEMCTL_BINARY_PATH ": %m");
1320 dual_timestamp_from_monotonic(&kernel_timestamp, 0);
1321 dual_timestamp_get(&userspace_timestamp);
1323 /* Determine if this is a reexecution or normal bootup. We do
1324 * the full command line parsing much later, so let's just
1325 * have a quick peek here. */
1326 if (strv_find(argv+1, "--deserialize"))
1329 /* If we have switched root, do all the special setup
1331 if (strv_find(argv+1, "--switched-root"))
1334 /* If we get started via the /sbin/init symlink then we are
1335 called 'init'. After a subsequent reexecution we are then
1336 called 'systemd'. That is confusing, hence let's call us
1337 systemd right-away. */
1338 program_invocation_short_name = systemd;
1339 prctl(PR_SET_NAME, systemd);
1344 log_show_color(isatty(STDERR_FILENO) > 0);
1346 /* Disable the umask logic */
1350 if (getpid() == 1 && detect_container(NULL) <= 0) {
1352 /* Running outside of a container as PID 1 */
1353 arg_running_as = SYSTEMD_SYSTEM;
1355 log_set_target(LOG_TARGET_KMSG);
1359 initrd_timestamp = userspace_timestamp;
1362 mount_setup_early();
1363 dual_timestamp_get(&security_start_timestamp);
1364 if (selinux_setup(&loaded_policy) < 0)
1366 if (ima_setup() < 0)
1368 if (smack_setup(&loaded_policy) < 0)
1370 dual_timestamp_get(&security_finish_timestamp);
1373 if (label_init(NULL) < 0)
1377 if (clock_is_localtime() > 0) {
1380 /* The first-time call to settimeofday() does a time warp in the kernel */
1381 r = clock_set_timezone(&min);
1383 log_error("Failed to apply local time delta, ignoring: %s", strerror(-r));
1385 log_info("RTC configured in localtime, applying delta of %i minutes to system time.", min);
1386 } else if (!in_initrd()) {
1388 * Do dummy first-time call to seal the kernel's time warp magic
1390 * Do not call this from inside the initrd. The initrd might not
1391 * carry /etc/adjtime with LOCAL, but the real system could be set up
1392 * that way. In such case, we need to delay the time-warp or the sealing
1393 * until we reach the real system.
1395 clock_reset_timezone();
1397 /* Tell the kernel our timezone */
1398 r = clock_set_timezone(NULL);
1400 log_error("Failed to set the kernel's timezone, ignoring: %s", strerror(-r));
1404 /* Set the default for later on, but don't actually
1405 * open the logs like this for now. Note that if we
1406 * are transitioning from the initrd there might still
1407 * be journal fd open, and we shouldn't attempt
1408 * opening that before we parsed /proc/cmdline which
1409 * might redirect output elsewhere. */
1410 log_set_target(LOG_TARGET_JOURNAL_OR_KMSG);
1412 } else if (getpid() == 1) {
1413 /* Running inside a container, as PID 1 */
1414 arg_running_as = SYSTEMD_SYSTEM;
1415 log_set_target(LOG_TARGET_CONSOLE);
1416 log_close_console(); /* force reopen of /dev/console */
1419 /* For later on, see above... */
1420 log_set_target(LOG_TARGET_JOURNAL);
1422 /* clear the kernel timestamp,
1423 * because we are in a container */
1424 kernel_timestamp.monotonic = 0ULL;
1425 kernel_timestamp.realtime = 0ULL;
1428 /* Running as user instance */
1429 arg_running_as = SYSTEMD_USER;
1430 log_set_target(LOG_TARGET_AUTO);
1433 /* clear the kernel timestamp,
1434 * because we are not PID 1 */
1435 kernel_timestamp.monotonic = 0ULL;
1436 kernel_timestamp.realtime = 0ULL;
1439 /* Initialize default unit */
1440 r = set_default_unit(SPECIAL_DEFAULT_TARGET);
1442 log_error("Failed to set default unit %s: %s", SPECIAL_DEFAULT_TARGET, strerror(-r));
1446 r = initialize_join_controllers();
1450 /* Mount /proc, /sys and friends, so that /proc/cmdline and
1451 * /proc/$PID/fd is available. */
1452 if (getpid() == 1) {
1453 r = mount_setup(loaded_policy);
1458 /* Reset all signal handlers. */
1459 assert_se(reset_all_signal_handlers() == 0);
1461 ignore_signals(SIGNALS_IGNORE, -1);
1463 if (parse_config_file() < 0)
1466 if (arg_running_as == SYSTEMD_SYSTEM)
1467 if (parse_proc_cmdline(parse_proc_cmdline_item) < 0)
1470 log_parse_environment();
1472 if (parse_argv(argc, argv) < 0)
1475 if (arg_action == ACTION_TEST &&
1477 log_error("Don't run test mode as root.");
1481 if (arg_running_as == SYSTEMD_USER &&
1482 arg_action == ACTION_RUN &&
1484 log_error("Trying to run as user instance, but the system has not been booted with systemd.");
1488 if (arg_running_as == SYSTEMD_SYSTEM &&
1489 arg_action == ACTION_RUN &&
1490 running_in_chroot() > 0) {
1491 log_error("Cannot be run in a chroot() environment.");
1495 if (arg_action == ACTION_HELP) {
1498 } else if (arg_action == ACTION_VERSION) {
1501 } else if (arg_action == ACTION_DUMP_CONFIGURATION_ITEMS) {
1502 unit_dump_config_items(stdout);
1503 retval = EXIT_SUCCESS;
1505 } else if (arg_action == ACTION_DONE) {
1506 retval = EXIT_SUCCESS;
1510 if (arg_running_as == SYSTEMD_USER &&
1511 !getenv("XDG_RUNTIME_DIR")) {
1512 log_error("Trying to run as user instance, but $XDG_RUNTIME_DIR is not set.");
1516 assert_se(arg_action == ACTION_RUN || arg_action == ACTION_TEST);
1518 /* Close logging fds, in order not to confuse fdset below */
1521 /* Remember open file descriptors for later deserialization */
1522 r = fdset_new_fill(&fds);
1524 log_error("Failed to allocate fd set: %s", strerror(-r));
1527 fdset_cloexec(fds, true);
1529 if (arg_serialization)
1530 assert_se(fdset_remove(fds, fileno(arg_serialization)) >= 0);
1532 if (arg_running_as == SYSTEMD_SYSTEM)
1533 /* Become a session leader if we aren't one yet. */
1536 /* Move out of the way, so that we won't block unmounts */
1537 assert_se(chdir("/") == 0);
1539 /* Reset the console, but only if this is really init and we
1540 * are freshly booted */
1541 if (arg_running_as == SYSTEMD_SYSTEM && arg_action == ACTION_RUN)
1542 console_setup(getpid() == 1 && !skip_setup);
1544 /* Open the logging devices, if possible and necessary */
1547 if (arg_show_status == _SHOW_STATUS_UNSET)
1548 arg_show_status = SHOW_STATUS_YES;
1550 /* Make sure we leave a core dump without panicking the
1552 if (getpid() == 1) {
1553 install_crash_handler();
1555 r = mount_cgroup_controllers(arg_join_controllers);
1560 if (arg_running_as == SYSTEMD_SYSTEM) {
1561 const char *virtualization = NULL;
1563 log_info(PACKAGE_STRING " running in system mode. (" SYSTEMD_FEATURES ")");
1565 detect_virtualization(&virtualization);
1567 log_info("Detected virtualization '%s'.", virtualization);
1569 write_container_id();
1571 log_info("Detected architecture '%s'.", architecture_to_string(uname_architecture()));
1574 log_info("Running in initial RAM disk.");
1577 _cleanup_free_ char *t = uid_to_name(getuid());
1578 log_debug(PACKAGE_STRING " running in user mode for user "PID_FMT"/%s. (" SYSTEMD_FEATURES ")",
1582 if (arg_running_as == SYSTEMD_SYSTEM && !skip_setup) {
1583 if (arg_show_status > 0 || plymouth_running())
1587 if (detect_container(NULL) <= 0)
1591 machine_id_setup("");
1598 if (arg_running_as == SYSTEMD_SYSTEM && arg_runtime_watchdog > 0)
1599 watchdog_set_timeout(&arg_runtime_watchdog);
1601 if (arg_timer_slack_nsec != (nsec_t) -1)
1602 if (prctl(PR_SET_TIMERSLACK, arg_timer_slack_nsec) < 0)
1603 log_error("Failed to adjust timer slack: %m");
1605 if (arg_capability_bounding_set_drop) {
1606 r = capability_bounding_set_drop_usermode(arg_capability_bounding_set_drop);
1608 log_error("Failed to drop capability bounding set of usermode helpers: %s", strerror(-r));
1611 r = capability_bounding_set_drop(arg_capability_bounding_set_drop, true);
1613 log_error("Failed to drop capability bounding set: %s", strerror(-r));
1618 if (arg_syscall_archs) {
1619 r = enforce_syscall_archs(arg_syscall_archs);
1624 if (arg_running_as == SYSTEMD_USER) {
1625 /* Become reaper of our children */
1626 if (prctl(PR_SET_CHILD_SUBREAPER, 1) < 0) {
1627 log_warning("Failed to make us a subreaper: %m");
1628 if (errno == EINVAL)
1629 log_info("Perhaps the kernel version is too old (< 3.4?)");
1633 if (arg_running_as == SYSTEMD_SYSTEM)
1634 bump_rlimit_nofile(&saved_rlimit_nofile);
1636 r = manager_new(arg_running_as, &m);
1638 log_error("Failed to allocate manager object: %s", strerror(-r));
1642 m->confirm_spawn = arg_confirm_spawn;
1643 m->default_timer_accuracy_usec = arg_default_timer_accuracy_usec;
1644 m->default_std_output = arg_default_std_output;
1645 m->default_std_error = arg_default_std_error;
1646 m->default_restart_usec = arg_default_restart_usec;
1647 m->default_timeout_start_usec = arg_default_timeout_start_usec;
1648 m->default_timeout_stop_usec = arg_default_timeout_stop_usec;
1649 m->default_start_limit_interval = arg_default_start_limit_interval;
1650 m->default_start_limit_burst = arg_default_start_limit_burst;
1651 m->default_cpu_accounting = arg_default_cpu_accounting;
1652 m->default_blockio_accounting = arg_default_blockio_accounting;
1653 m->default_memory_accounting = arg_default_memory_accounting;
1654 m->runtime_watchdog = arg_runtime_watchdog;
1655 m->shutdown_watchdog = arg_shutdown_watchdog;
1656 m->userspace_timestamp = userspace_timestamp;
1657 m->kernel_timestamp = kernel_timestamp;
1658 m->initrd_timestamp = initrd_timestamp;
1659 m->security_start_timestamp = security_start_timestamp;
1660 m->security_finish_timestamp = security_finish_timestamp;
1662 manager_set_default_rlimits(m, arg_default_rlimit);
1663 manager_environment_add(m, NULL, arg_default_environment);
1664 manager_set_show_status(m, arg_show_status);
1666 /* Remember whether we should queue the default job */
1667 queue_default_job = !arg_serialization || arg_switched_root;
1669 before_startup = now(CLOCK_MONOTONIC);
1671 r = manager_startup(m, arg_serialization, fds);
1673 log_error("Failed to fully start up daemon: %s", strerror(-r));
1675 /* This will close all file descriptors that were opened, but
1676 * not claimed by any unit. */
1680 if (arg_serialization) {
1681 fclose(arg_serialization);
1682 arg_serialization = NULL;
1685 if (queue_default_job) {
1686 _cleanup_bus_error_free_ sd_bus_error error = SD_BUS_ERROR_NULL;
1687 Unit *target = NULL;
1688 Job *default_unit_job;
1690 log_debug("Activating default unit: %s", arg_default_unit);
1692 r = manager_load_unit(m, arg_default_unit, NULL, &error, &target);
1694 log_error("Failed to load default target: %s", bus_error_message(&error, r));
1695 else if (target->load_state == UNIT_ERROR || target->load_state == UNIT_NOT_FOUND)
1696 log_error("Failed to load default target: %s", strerror(-target->load_error));
1697 else if (target->load_state == UNIT_MASKED)
1698 log_error("Default target masked.");
1700 if (!target || target->load_state != UNIT_LOADED) {
1701 log_info("Trying to load rescue target...");
1703 r = manager_load_unit(m, SPECIAL_RESCUE_TARGET, NULL, &error, &target);
1705 log_error("Failed to load rescue target: %s", bus_error_message(&error, r));
1707 } else if (target->load_state == UNIT_ERROR || target->load_state == UNIT_NOT_FOUND) {
1708 log_error("Failed to load rescue target: %s", strerror(-target->load_error));
1710 } else if (target->load_state == UNIT_MASKED) {
1711 log_error("Rescue target masked.");
1716 assert(target->load_state == UNIT_LOADED);
1718 if (arg_action == ACTION_TEST) {
1719 printf("-> By units:\n");
1720 manager_dump_units(m, stdout, "\t");
1723 r = manager_add_job(m, JOB_START, target, JOB_ISOLATE, false, &error, &default_unit_job);
1725 log_debug("Default target could not be isolated, starting instead: %s", bus_error_message(&error, r));
1727 r = manager_add_job(m, JOB_START, target, JOB_REPLACE, false, &error, &default_unit_job);
1729 log_error("Failed to start default target: %s", bus_error_message(&error, r));
1733 log_error("Failed to isolate default target: %s", bus_error_message(&error, r));
1737 m->default_unit_job_id = default_unit_job->id;
1739 after_startup = now(CLOCK_MONOTONIC);
1740 log_full(arg_action == ACTION_TEST ? LOG_INFO : LOG_DEBUG,
1741 "Loaded units and determined initial transaction in %s.",
1742 format_timespan(timespan, sizeof(timespan), after_startup - before_startup, 0));
1744 if (arg_action == ACTION_TEST) {
1745 printf("-> By jobs:\n");
1746 manager_dump_jobs(m, stdout, "\t");
1747 retval = EXIT_SUCCESS;
1753 r = manager_loop(m);
1755 log_error("Failed to run mainloop: %s", strerror(-r));
1759 switch (m->exit_code) {
1762 retval = EXIT_SUCCESS;
1766 case MANAGER_RELOAD:
1767 log_info("Reloading.");
1768 r = manager_reload(m);
1770 log_error("Failed to reload: %s", strerror(-r));
1773 case MANAGER_REEXECUTE:
1775 if (prepare_reexecute(m, &arg_serialization, &fds, false) < 0)
1779 log_notice("Reexecuting.");
1782 case MANAGER_SWITCH_ROOT:
1783 /* Steal the switch root parameters */
1784 switch_root_dir = m->switch_root;
1785 switch_root_init = m->switch_root_init;
1786 m->switch_root = m->switch_root_init = NULL;
1788 if (!switch_root_init)
1789 if (prepare_reexecute(m, &arg_serialization, &fds, true) < 0)
1793 log_notice("Switching root.");
1796 case MANAGER_REBOOT:
1797 case MANAGER_POWEROFF:
1799 case MANAGER_KEXEC: {
1800 static const char * const table[_MANAGER_EXIT_CODE_MAX] = {
1801 [MANAGER_REBOOT] = "reboot",
1802 [MANAGER_POWEROFF] = "poweroff",
1803 [MANAGER_HALT] = "halt",
1804 [MANAGER_KEXEC] = "kexec"
1807 assert_se(shutdown_verb = table[m->exit_code]);
1808 arm_reboot_watchdog = m->exit_code == MANAGER_REBOOT;
1810 log_notice("Shutting down.");
1815 assert_not_reached("Unknown exit code.");
1825 for (j = 0; j < ELEMENTSOF(arg_default_rlimit); j++) {
1826 free(arg_default_rlimit[j]);
1827 arg_default_rlimit[j] = NULL;
1830 free(arg_default_unit);
1831 arg_default_unit = NULL;
1833 free_join_controllers();
1835 strv_free(arg_default_environment);
1836 arg_default_environment = NULL;
1838 set_free(arg_syscall_archs);
1839 arg_syscall_archs = NULL;
1845 unsigned i, args_size;
1847 /* Close and disarm the watchdog, so that the new
1848 * instance can reinitialize it, but doesn't get
1849 * rebooted while we do that */
1850 watchdog_close(true);
1852 /* Reset the RLIMIT_NOFILE to the kernel default, so
1853 * that the new systemd can pass the kernel default to
1854 * its child processes */
1855 if (saved_rlimit_nofile.rlim_cur > 0)
1856 setrlimit(RLIMIT_NOFILE, &saved_rlimit_nofile);
1858 if (switch_root_dir) {
1859 /* Kill all remaining processes from the
1860 * initrd, but don't wait for them, so that we
1861 * can handle the SIGCHLD for them after
1863 broadcast_signal(SIGTERM, false, true);
1865 /* And switch root */
1866 r = switch_root(switch_root_dir);
1868 log_error("Failed to switch root, ignoring: %s", strerror(-r));
1871 args_size = MAX(6, argc+1);
1872 args = newa(const char*, args_size);
1874 if (!switch_root_init) {
1877 /* First try to spawn ourselves with the right
1878 * path, and with full serialization. We do
1879 * this only if the user didn't specify an
1880 * explicit init to spawn. */
1882 assert(arg_serialization);
1885 snprintf(sfd, sizeof(sfd), "%i", fileno(arg_serialization));
1889 args[i++] = SYSTEMD_BINARY_PATH;
1890 if (switch_root_dir)
1891 args[i++] = "--switched-root";
1892 args[i++] = arg_running_as == SYSTEMD_SYSTEM ? "--system" : "--user";
1893 args[i++] = "--deserialize";
1897 /* do not pass along the environment we inherit from the kernel or initrd */
1898 if (switch_root_dir)
1901 assert(i <= args_size);
1902 execv(args[0], (char* const*) args);
1905 /* Try the fallback, if there is any, without any
1906 * serialization. We pass the original argv[] and
1907 * envp[]. (Well, modulo the ordering changes due to
1908 * getopt() in argv[], and some cleanups in envp[],
1909 * but let's hope that doesn't matter.) */
1911 if (arg_serialization) {
1912 fclose(arg_serialization);
1913 arg_serialization = NULL;
1921 /* Reopen the console */
1922 make_console_stdio();
1924 for (j = 1, i = 1; j < (unsigned) argc; j++)
1925 args[i++] = argv[j];
1927 assert(i <= args_size);
1929 if (switch_root_init) {
1930 args[0] = switch_root_init;
1931 execv(args[0], (char* const*) args);
1932 log_warning("Failed to execute configured init, trying fallback: %m");
1935 args[0] = "/sbin/init";
1936 execv(args[0], (char* const*) args);
1938 if (errno == ENOENT) {
1939 log_warning("No /sbin/init, trying fallback");
1941 args[0] = "/bin/sh";
1943 execv(args[0], (char* const*) args);
1944 log_error("Failed to execute /bin/sh, giving up: %m");
1946 log_warning("Failed to execute /sbin/init, giving up: %m");
1949 if (arg_serialization) {
1950 fclose(arg_serialization);
1951 arg_serialization = NULL;
1959 #ifdef HAVE_VALGRIND_VALGRIND_H
1960 /* If we are PID 1 and running under valgrind, then let's exit
1961 * here explicitly. valgrind will only generate nice output on
1962 * exit(), not on exec(), hence let's do the former not the
1964 if (getpid() == 1 && RUNNING_ON_VALGRIND)
1968 if (shutdown_verb) {
1969 char log_level[DECIMAL_STR_MAX(int) + 1];
1970 const char* command_line[9] = {
1971 SYSTEMD_SHUTDOWN_BINARY_PATH,
1973 "--log-level", log_level,
1977 _cleanup_strv_free_ char **env_block = NULL;
1979 assert(command_line[pos] == NULL);
1980 env_block = strv_copy(environ);
1982 snprintf(log_level, sizeof(log_level), "%d", log_get_max_level());
1984 switch (log_get_target()) {
1985 case LOG_TARGET_KMSG:
1986 case LOG_TARGET_JOURNAL_OR_KMSG:
1987 case LOG_TARGET_SYSLOG_OR_KMSG:
1988 command_line[pos++] = "kmsg";
1991 case LOG_TARGET_CONSOLE:
1993 command_line[pos++] = "console";
1997 if (log_get_show_color())
1998 command_line[pos++] = "--log-color";
2000 if (log_get_show_location())
2001 command_line[pos++] = "--log-location";
2003 assert(pos < ELEMENTSOF(command_line));
2005 if (arm_reboot_watchdog && arg_shutdown_watchdog > 0) {
2008 /* If we reboot let's set the shutdown
2009 * watchdog and tell the shutdown binary to
2010 * repeatedly ping it */
2011 watchdog_set_timeout(&arg_shutdown_watchdog);
2012 watchdog_close(false);
2014 /* Tell the binary how often to ping, ignore failure */
2015 if (asprintf(&e, "WATCHDOG_USEC="USEC_FMT, arg_shutdown_watchdog) > 0)
2016 strv_push(&env_block, e);
2018 watchdog_close(true);
2020 /* Avoid the creation of new processes forked by the
2021 * kernel; at this point, we will not listen to the
2023 if (detect_container(NULL) <= 0)
2024 cg_uninstall_release_agent(SYSTEMD_CGROUP_CONTROLLER);
2026 execve(SYSTEMD_SHUTDOWN_BINARY_PATH, (char **) command_line, env_block);
2027 log_error("Failed to execute shutdown binary, %s: %m",
2028 getpid() == 1 ? "freezing" : "quitting");