1 /*-*- Mode: C; c-basic-offset: 8; indent-tabs-mode: nil -*-*/
4 This file is part of systemd.
6 Copyright 2010 Lennart Poettering
8 systemd is free software; you can redistribute it and/or modify it
9 under the terms of the GNU Lesser General Public License as published by
10 the Free Software Foundation; either version 2.1 of the License, or
11 (at your option) any later version.
13 systemd is distributed in the hope that it will be useful, but
14 WITHOUT ANY WARRANTY; without even the implied warranty of
15 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
16 Lesser General Public License for more details.
18 You should have received a copy of the GNU Lesser General Public License
19 along with systemd; If not, see <http://www.gnu.org/licenses/>.
26 #include <sys/types.h>
32 #include <sys/prctl.h>
33 #include <sys/mount.h>
35 #ifdef HAVE_VALGRIND_VALGRIND_H
36 #include <valgrind/valgrind.h>
42 #include "sd-daemon.h"
43 #include "sd-messages.h"
48 #include "conf-parser.h"
56 #include "architecture.h"
58 #include "path-util.h"
59 #include "switch-root.h"
60 #include "capability.h"
63 #include "clock-util.h"
65 #include "bus-error.h"
67 #include "selinux-util.h"
69 #include "dbus-manager.h"
70 #include "load-fragment.h"
72 #include "mount-setup.h"
73 #include "loopback-setup.h"
74 #include "hostname-setup.h"
75 #include "machine-id-setup.h"
76 #include "selinux-setup.h"
77 #include "ima-setup.h"
78 #include "smack-setup.h"
79 #include "kmod-setup.h"
86 ACTION_DUMP_CONFIGURATION_ITEMS,
88 } arg_action = ACTION_RUN;
/* Process-wide manager settings with their built-in defaults. Many of these
 * are overridden later in this file by parse_config_file() (the "Manager"
 * section table), parse_proc_cmdline_item() and parse_argv(). */
89 static char *arg_default_unit = NULL;
90 static SystemdRunningAs arg_running_as = _SYSTEMD_RUNNING_AS_INVALID;
91 static bool arg_dump_core = true;
92 static bool arg_crash_shell = false;
93 static int arg_crash_chvt = -1;
94 static bool arg_confirm_spawn = false;
95 static ShowStatus arg_show_status = _SHOW_STATUS_UNSET;
96 static bool arg_switched_root = false;
97 static int arg_no_pager = -1;
98 static char ***arg_join_controllers = NULL;
99 static ExecOutput arg_default_std_output = EXEC_OUTPUT_JOURNAL;
100 static ExecOutput arg_default_std_error = EXEC_OUTPUT_INHERIT;
101 static usec_t arg_default_restart_usec = DEFAULT_RESTART_USEC;
102 static usec_t arg_default_timeout_start_usec = DEFAULT_TIMEOUT_USEC;
103 static usec_t arg_default_timeout_stop_usec = DEFAULT_TIMEOUT_USEC;
104 static usec_t arg_default_start_limit_interval = DEFAULT_START_LIMIT_INTERVAL;
105 static unsigned arg_default_start_limit_burst = DEFAULT_START_LIMIT_BURST;
106 static usec_t arg_runtime_watchdog = 0;
107 static usec_t arg_shutdown_watchdog = 10 * USEC_PER_MINUTE;
108 static char **arg_default_environment = NULL;
109 static struct rlimit *arg_default_rlimit[_RLIMIT_MAX] = {};
110 static uint64_t arg_capability_bounding_set_drop = 0;
111 static nsec_t arg_timer_slack_nsec = NSEC_INFINITY;
112 static usec_t arg_default_timer_accuracy_usec = 1 * USEC_PER_MINUTE;
113 static Set* arg_syscall_archs = NULL;
114 static FILE* arg_serialization = NULL;
115 static bool arg_default_cpu_accounting = false;
116 static bool arg_default_blockio_accounting = false;
117 static bool arg_default_memory_accounting = false;
/* Deliberately empty signal handler; crash() installs it for SIGCHLD so that
 * it can wait for the core-dumping child process. */
119 static void nop_handler(int sig) {}
121 static void pager_open_if_enabled(void) {
123 if (arg_no_pager <= 0)
129 noreturn static void crash(int sig) {
132 /* Pass this on immediately, if this is not PID 1 */
134 else if (!arg_dump_core)
135 log_emergency("Caught <%s>, not dumping core.", signal_to_string(sig));
137 struct sigaction sa = {
138 .sa_handler = nop_handler,
139 .sa_flags = SA_NOCLDSTOP|SA_RESTART,
143 /* We want to wait for the core process, hence let's enable SIGCHLD */
144 sigaction(SIGCHLD, &sa, NULL);
146 pid = raw_clone(SIGCHLD, NULL);
148 log_emergency_errno(errno, "Caught <%s>, cannot fork for core dump: %m", signal_to_string(sig));
151 struct rlimit rl = {};
153 /* Enable default signal handler for core dump */
155 sa.sa_handler = SIG_DFL;
156 sigaction(sig, &sa, NULL);
158 /* Don't limit the core dump size */
159 rl.rlim_cur = RLIM_INFINITY;
160 rl.rlim_max = RLIM_INFINITY;
161 setrlimit(RLIMIT_CORE, &rl);
163 /* Just to be sure... */
166 /* Raise the signal again */
168 kill(pid, sig); /* raise() would kill the parent */
170 assert_not_reached("We shouldn't be here...");
176 /* Order things nicely. */
177 r = wait_for_terminate(pid, &status);
179 log_emergency_errno(r, "Caught <%s>, waitpid() failed: %m", signal_to_string(sig));
180 else if (status.si_code != CLD_DUMPED)
181 log_emergency("Caught <%s>, core dump failed (child "PID_FMT", code=%s, status=%i/%s).",
182 signal_to_string(sig),
183 pid, sigchld_code_to_string(status.si_code),
185 strna(status.si_code == CLD_EXITED
186 ? exit_status_to_string(status.si_status, EXIT_STATUS_FULL)
187 : signal_to_string(status.si_status)));
189 log_emergency("Caught <%s>, dumped core as pid "PID_FMT".", signal_to_string(sig), pid);
194 chvt(arg_crash_chvt);
196 if (arg_crash_shell) {
197 struct sigaction sa = {
198 .sa_handler = SIG_IGN,
199 .sa_flags = SA_NOCLDSTOP|SA_NOCLDWAIT|SA_RESTART,
203 log_info("Executing crash shell in 10s...");
206 /* Let the kernel reap children for us */
207 assert_se(sigaction(SIGCHLD, &sa, NULL) == 0);
209 pid = raw_clone(SIGCHLD, NULL);
211 log_emergency_errno(errno, "Failed to fork off crash shell: %m");
213 make_console_stdio();
214 execle("/bin/sh", "/bin/sh", NULL, environ);
216 log_emergency_errno(errno, "execle() failed: %m");
219 log_info("Successfully spawned crash shell as PID "PID_FMT".", pid);
222 log_emergency("Freezing execution.");
226 static void install_crash_handler(void) {
227 static const struct sigaction sa = {
229 .sa_flags = SA_NODEFER, /* So that we can raise the signal again from the signal handler */
233 /* We ignore the return value here, since we don't mind if we
234 * cannot set up a crash handler */
235 r = sigaction_many(&sa, SIGNALS_CRASH_HANDLER, -1);
237 log_debug_errno(r, "I had trouble setting up the crash handler, ignoring: %m");
240 static int console_setup(void) {
241 _cleanup_close_ int tty_fd = -1;
244 tty_fd = open_terminal("/dev/console", O_WRONLY|O_NOCTTY|O_CLOEXEC);
246 return log_error_errno(tty_fd, "Failed to open /dev/console: %m");
248 /* We don't want to force text mode. plymouth may be showing
249 * pictures already from initrd. */
250 r = reset_terminal_fd(tty_fd, false);
252 return log_error_errno(r, "Failed to reset /dev/console: %m");
257 static int set_default_unit(const char *u) {
266 free(arg_default_unit);
267 arg_default_unit = c;
272 static int parse_proc_cmdline_item(const char *key, const char *value) {
274 static const char * const rlmap[] = {
275 "emergency", SPECIAL_EMERGENCY_TARGET,
276 "-b", SPECIAL_EMERGENCY_TARGET,
277 "rescue", SPECIAL_RESCUE_TARGET,
278 "single", SPECIAL_RESCUE_TARGET,
279 "-s", SPECIAL_RESCUE_TARGET,
280 "s", SPECIAL_RESCUE_TARGET,
281 "S", SPECIAL_RESCUE_TARGET,
282 "1", SPECIAL_RESCUE_TARGET,
283 "2", SPECIAL_RUNLEVEL2_TARGET,
284 "3", SPECIAL_RUNLEVEL3_TARGET,
285 "4", SPECIAL_RUNLEVEL4_TARGET,
286 "5", SPECIAL_RUNLEVEL5_TARGET,
292 if (streq(key, "systemd.unit") && value) {
295 return set_default_unit(value);
297 } else if (streq(key, "rd.systemd.unit") && value) {
300 return set_default_unit(value);
302 } else if (streq(key, "systemd.dump_core") && value) {
304 r = parse_boolean(value);
306 log_warning("Failed to parse dump core switch %s. Ignoring.", value);
310 } else if (streq(key, "systemd.crash_shell") && value) {
312 r = parse_boolean(value);
314 log_warning("Failed to parse crash shell switch %s. Ignoring.", value);
318 } else if (streq(key, "systemd.crash_chvt") && value) {
320 if (safe_atoi(value, &r) < 0)
321 log_warning("Failed to parse crash chvt switch %s. Ignoring.", value);
325 } else if (streq(key, "systemd.confirm_spawn") && value) {
327 r = parse_boolean(value);
329 log_warning("Failed to parse confirm spawn switch %s. Ignoring.", value);
331 arg_confirm_spawn = r;
333 } else if (streq(key, "systemd.show_status") && value) {
335 r = parse_show_status(value, &arg_show_status);
337 log_warning("Failed to parse show status switch %s. Ignoring.", value);
339 } else if (streq(key, "systemd.default_standard_output") && value) {
341 r = exec_output_from_string(value);
343 log_warning("Failed to parse default standard output switch %s. Ignoring.", value);
345 arg_default_std_output = r;
347 } else if (streq(key, "systemd.default_standard_error") && value) {
349 r = exec_output_from_string(value);
351 log_warning("Failed to parse default standard error switch %s. Ignoring.", value);
353 arg_default_std_error = r;
355 } else if (streq(key, "systemd.setenv") && value) {
357 if (env_assignment_is_valid(value)) {
360 env = strv_env_set(arg_default_environment, value);
362 arg_default_environment = env;
364 log_warning_errno(ENOMEM, "Setting environment variable '%s' failed, ignoring: %m", value);
366 log_warning("Environment variable name '%s' is not valid. Ignoring.", value);
368 } else if (streq(key, "quiet") && !value) {
370 log_set_max_level(LOG_NOTICE);
372 if (arg_show_status == _SHOW_STATUS_UNSET)
373 arg_show_status = SHOW_STATUS_AUTO;
375 } else if (streq(key, "debug") && !value) {
377 /* Note that log_parse_environment() handles 'debug'
378 * too, and sets the log level to LOG_DEBUG. */
380 if (detect_container(NULL) > 0)
381 log_set_target(LOG_TARGET_CONSOLE);
383 } else if (!in_initrd() && !value) {
386 /* SysV compatibility */
387 for (i = 0; i < ELEMENTSOF(rlmap); i += 2)
388 if (streq(key, rlmap[i]))
389 return set_default_unit(rlmap[i+1]);
395 #define DEFINE_SETTER(name, func, descr) \
396 static int name(const char *unit, \
397 const char *filename, \
399 const char *section, \
400 unsigned section_line, \
401 const char *lvalue, \
403 const char *rvalue, \
415 log_syntax(unit, LOG_ERR, filename, line, -r, \
416 "Invalid " descr "'%s': %s", \
417 rvalue, strerror(-r)); \
/* Instantiate the config-file callbacks for the logging options via
 * DEFINE_SETTER(name, func, descr). parse_config_file() registers them for
 * LogLevel=, LogTarget=, LogColor= and LogLocation=; descr is the label used
 * in the "Invalid ..." syntax error message. */
422 DEFINE_SETTER(config_parse_level2, log_set_max_level_from_string, "log level")
423 DEFINE_SETTER(config_parse_target, log_set_target_from_string, "target")
424 DEFINE_SETTER(config_parse_color, log_show_color_from_string, "color" )
425 DEFINE_SETTER(config_parse_location, log_show_location_from_string, "location")
427 static int config_parse_cpu_affinity2(
429 const char *filename,
432 unsigned section_line,
439 const char *word, *state;
448 FOREACH_WORD_QUOTED(word, l, rvalue, state) {
453 if (!(t = strndup(word, l)))
456 r = safe_atou(t, &cpu);
460 if (!(c = cpu_set_malloc(&ncpus)))
463 if (r < 0 || cpu >= ncpus) {
464 log_syntax(unit, LOG_ERR, filename, line, -r,
465 "Failed to parse CPU affinity '%s'", rvalue);
470 CPU_SET_S(cpu, CPU_ALLOC_SIZE(ncpus), c);
473 log_syntax(unit, LOG_ERR, filename, line, EINVAL,
474 "Trailing garbage, ignoring.");
477 if (sched_setaffinity(0, CPU_ALLOC_SIZE(ncpus), c) < 0)
478 log_unit_warning(unit, "Failed to set CPU affinity: %m");
486 static int config_parse_show_status(
488 const char *filename,
491 unsigned section_line,
499 ShowStatus *b = data;
506 k = parse_show_status(rvalue, b);
508 log_syntax(unit, LOG_ERR, filename, line, -k,
509 "Failed to parse show status setting, ignoring: %s", rvalue);
516 static void strv_free_free(char ***l) {
528 static void free_join_controllers(void) {
529 strv_free_free(arg_join_controllers);
530 arg_join_controllers = NULL;
533 static int config_parse_join_controllers(const char *unit,
534 const char *filename,
537 unsigned section_line,
545 const char *word, *state;
552 free_join_controllers();
554 FOREACH_WORD_QUOTED(word, length, rvalue, state) {
557 s = strndup(word, length);
561 l = strv_split(s, ",");
566 if (strv_length(l) <= 1) {
571 if (!arg_join_controllers) {
572 arg_join_controllers = new(char**, 2);
573 if (!arg_join_controllers) {
578 arg_join_controllers[0] = l;
579 arg_join_controllers[1] = NULL;
586 t = new0(char**, n+2);
594 for (a = arg_join_controllers; *a; a++) {
596 if (strv_overlap(*a, l)) {
597 if (strv_extend_strv(&l, *a) < 0) {
617 t[n++] = strv_uniq(l);
619 strv_free_free(arg_join_controllers);
620 arg_join_controllers = t;
624 log_syntax(unit, LOG_ERR, filename, line, EINVAL,
625 "Trailing garbage, ignoring.");
630 static int parse_config_file(void) {
632 const ConfigTableItem items[] = {
633 { "Manager", "LogLevel", config_parse_level2, 0, NULL },
634 { "Manager", "LogTarget", config_parse_target, 0, NULL },
635 { "Manager", "LogColor", config_parse_color, 0, NULL },
636 { "Manager", "LogLocation", config_parse_location, 0, NULL },
637 { "Manager", "DumpCore", config_parse_bool, 0, &arg_dump_core },
638 { "Manager", "CrashShell", config_parse_bool, 0, &arg_crash_shell },
639 { "Manager", "ShowStatus", config_parse_show_status, 0, &arg_show_status },
640 { "Manager", "CrashChVT", config_parse_int, 0, &arg_crash_chvt },
641 { "Manager", "CPUAffinity", config_parse_cpu_affinity2, 0, NULL },
642 { "Manager", "JoinControllers", config_parse_join_controllers, 0, &arg_join_controllers },
643 { "Manager", "RuntimeWatchdogSec", config_parse_sec, 0, &arg_runtime_watchdog },
644 { "Manager", "ShutdownWatchdogSec", config_parse_sec, 0, &arg_shutdown_watchdog },
645 { "Manager", "CapabilityBoundingSet", config_parse_bounding_set, 0, &arg_capability_bounding_set_drop },
647 { "Manager", "SystemCallArchitectures", config_parse_syscall_archs, 0, &arg_syscall_archs },
649 { "Manager", "TimerSlackNSec", config_parse_nsec, 0, &arg_timer_slack_nsec },
650 { "Manager", "DefaultTimerAccuracySec", config_parse_sec, 0, &arg_default_timer_accuracy_usec },
651 { "Manager", "DefaultStandardOutput", config_parse_output, 0, &arg_default_std_output },
652 { "Manager", "DefaultStandardError", config_parse_output, 0, &arg_default_std_error },
653 { "Manager", "DefaultTimeoutStartSec", config_parse_sec, 0, &arg_default_timeout_start_usec },
654 { "Manager", "DefaultTimeoutStopSec", config_parse_sec, 0, &arg_default_timeout_stop_usec },
655 { "Manager", "DefaultRestartSec", config_parse_sec, 0, &arg_default_restart_usec },
656 { "Manager", "DefaultStartLimitInterval", config_parse_sec, 0, &arg_default_start_limit_interval },
657 { "Manager", "DefaultStartLimitBurst", config_parse_unsigned, 0, &arg_default_start_limit_burst },
658 { "Manager", "DefaultEnvironment", config_parse_environ, 0, &arg_default_environment },
659 { "Manager", "DefaultLimitCPU", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_CPU] },
660 { "Manager", "DefaultLimitFSIZE", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_FSIZE] },
661 { "Manager", "DefaultLimitDATA", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_DATA] },
662 { "Manager", "DefaultLimitSTACK", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_STACK] },
663 { "Manager", "DefaultLimitCORE", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_CORE] },
664 { "Manager", "DefaultLimitRSS", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_RSS] },
665 { "Manager", "DefaultLimitNOFILE", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_NOFILE] },
666 { "Manager", "DefaultLimitAS", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_AS] },
667 { "Manager", "DefaultLimitNPROC", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_NPROC] },
668 { "Manager", "DefaultLimitMEMLOCK", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_MEMLOCK] },
669 { "Manager", "DefaultLimitLOCKS", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_LOCKS] },
670 { "Manager", "DefaultLimitSIGPENDING", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_SIGPENDING] },
671 { "Manager", "DefaultLimitMSGQUEUE", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_MSGQUEUE] },
672 { "Manager", "DefaultLimitNICE", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_NICE] },
673 { "Manager", "DefaultLimitRTPRIO", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_RTPRIO] },
674 { "Manager", "DefaultLimitRTTIME", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_RTTIME] },
675 { "Manager", "DefaultCPUAccounting", config_parse_bool, 0, &arg_default_cpu_accounting },
676 { "Manager", "DefaultBlockIOAccounting", config_parse_bool, 0, &arg_default_blockio_accounting },
677 { "Manager", "DefaultMemoryAccounting", config_parse_bool, 0, &arg_default_memory_accounting },
681 const char *fn, *conf_dirs_nulstr;
683 fn = arg_running_as == SYSTEMD_SYSTEM ? PKGSYSCONFDIR "/system.conf" : PKGSYSCONFDIR "/user.conf";
684 conf_dirs_nulstr = arg_running_as == SYSTEMD_SYSTEM ? CONF_DIRS_NULSTR("systemd/system.conf") : CONF_DIRS_NULSTR("systemd/user.conf");
685 config_parse_many(fn, conf_dirs_nulstr, "Manager\0",
686 config_item_table_lookup, items, false, NULL);
691 static int parse_argv(int argc, char *argv[]) {
694 ARG_LOG_LEVEL = 0x100,
704 ARG_DUMP_CONFIGURATION_ITEMS,
711 ARG_DEFAULT_STD_OUTPUT,
712 ARG_DEFAULT_STD_ERROR
715 static const struct option options[] = {
716 { "log-level", required_argument, NULL, ARG_LOG_LEVEL },
717 { "log-target", required_argument, NULL, ARG_LOG_TARGET },
718 { "log-color", optional_argument, NULL, ARG_LOG_COLOR },
719 { "log-location", optional_argument, NULL, ARG_LOG_LOCATION },
720 { "unit", required_argument, NULL, ARG_UNIT },
721 { "system", no_argument, NULL, ARG_SYSTEM },
722 { "user", no_argument, NULL, ARG_USER },
723 { "test", no_argument, NULL, ARG_TEST },
724 { "no-pager", no_argument, NULL, ARG_NO_PAGER },
725 { "help", no_argument, NULL, 'h' },
726 { "version", no_argument, NULL, ARG_VERSION },
727 { "dump-configuration-items", no_argument, NULL, ARG_DUMP_CONFIGURATION_ITEMS },
728 { "dump-core", optional_argument, NULL, ARG_DUMP_CORE },
729 { "crash-shell", optional_argument, NULL, ARG_CRASH_SHELL },
730 { "confirm-spawn", optional_argument, NULL, ARG_CONFIRM_SPAWN },
731 { "show-status", optional_argument, NULL, ARG_SHOW_STATUS },
732 { "deserialize", required_argument, NULL, ARG_DESERIALIZE },
733 { "switched-root", no_argument, NULL, ARG_SWITCHED_ROOT },
734 { "default-standard-output", required_argument, NULL, ARG_DEFAULT_STD_OUTPUT, },
735 { "default-standard-error", required_argument, NULL, ARG_DEFAULT_STD_ERROR, },
747 while ((c = getopt_long(argc, argv, "hDbsz:", options, NULL)) >= 0)
752 r = log_set_max_level_from_string(optarg);
754 log_error("Failed to parse log level %s.", optarg);
761 r = log_set_target_from_string(optarg);
763 log_error("Failed to parse log target %s.", optarg);
772 r = log_show_color_from_string(optarg);
774 log_error("Failed to parse log color setting %s.", optarg);
778 log_show_color(true);
782 case ARG_LOG_LOCATION:
784 r = log_show_location_from_string(optarg);
786 log_error("Failed to parse log location setting %s.", optarg);
790 log_show_location(true);
794 case ARG_DEFAULT_STD_OUTPUT:
795 r = exec_output_from_string(optarg);
797 log_error("Failed to parse default standard output setting %s.", optarg);
800 arg_default_std_output = r;
803 case ARG_DEFAULT_STD_ERROR:
804 r = exec_output_from_string(optarg);
806 log_error("Failed to parse default standard error output setting %s.", optarg);
809 arg_default_std_error = r;
814 r = set_default_unit(optarg);
816 return log_error_errno(r, "Failed to set default unit %s: %m", optarg);
821 arg_running_as = SYSTEMD_SYSTEM;
825 arg_running_as = SYSTEMD_USER;
829 arg_action = ACTION_TEST;
830 if (arg_no_pager < 0)
839 arg_action = ACTION_VERSION;
842 case ARG_DUMP_CONFIGURATION_ITEMS:
843 arg_action = ACTION_DUMP_CONFIGURATION_ITEMS;
847 r = optarg ? parse_boolean(optarg) : 1;
849 log_error("Failed to parse dump core boolean %s.", optarg);
855 case ARG_CRASH_SHELL:
856 r = optarg ? parse_boolean(optarg) : 1;
858 log_error("Failed to parse crash shell boolean %s.", optarg);
864 case ARG_CONFIRM_SPAWN:
865 r = optarg ? parse_boolean(optarg) : 1;
867 log_error("Failed to parse confirm spawn boolean %s.", optarg);
870 arg_confirm_spawn = r;
873 case ARG_SHOW_STATUS:
875 r = parse_show_status(optarg, &arg_show_status);
877 log_error("Failed to parse show status boolean %s.", optarg);
881 arg_show_status = SHOW_STATUS_YES;
884 case ARG_DESERIALIZE: {
888 r = safe_atoi(optarg, &fd);
889 if (r < 0 || fd < 0) {
890 log_error("Failed to parse deserialize option %s.", optarg);
891 return r < 0 ? r : -EINVAL;
894 fd_cloexec(fd, true);
898 return log_error_errno(errno, "Failed to open serialization fd: %m");
900 if (arg_serialization)
901 fclose(arg_serialization);
903 arg_serialization = f;
908 case ARG_SWITCHED_ROOT:
909 arg_switched_root = true;
913 arg_action = ACTION_HELP;
914 if (arg_no_pager < 0)
919 log_set_max_level(LOG_DEBUG);
925 /* Just to eat away the sysvinit kernel
926 * cmdline args without getopt() error
927 * messages that we'll parse in
928 * parse_proc_cmdline_item() or ignore. */
937 assert_not_reached("Unhandled option code.");
940 if (optind < argc && getpid() != 1) {
941 /* Hmm, when we aren't run as init system
942 * let's complain about excess arguments */
944 log_error("Excess arguments.");
951 static int help(void) {
953 printf("%s [OPTIONS...]\n\n"
954 "Starts up and maintains the system or user services.\n\n"
955 " -h --help Show this help\n"
956 " --test Determine startup sequence, dump it and exit\n"
957 " --no-pager Do not pipe output into a pager\n"
958 " --dump-configuration-items Dump understood unit configuration items\n"
959 " --unit=UNIT Set default unit\n"
960 " --system Run a system instance, even if PID != 1\n"
961 " --user Run a user instance\n"
962 " --dump-core[=0|1] Dump core on crash\n"
963 " --crash-shell[=0|1] Run shell on crash\n"
964 " --confirm-spawn[=0|1] Ask for confirmation when spawning processes\n"
965 " --show-status[=0|1] Show status updates on the console during bootup\n"
966 " --log-target=TARGET Set log target (console, journal, kmsg, journal-or-kmsg, null)\n"
967 " --log-level=LEVEL Set log level (debug, info, notice, warning, err, crit, alert, emerg)\n"
968 " --log-color[=0|1] Highlight important log messages\n"
969 " --log-location[=0|1] Include code location in log messages\n"
970 " --default-standard-output= Set default standard output for services\n"
971 " --default-standard-error= Set default standard error output for services\n",
972 program_invocation_short_name);
977 static int version(void) {
978 puts(PACKAGE_STRING);
979 puts(SYSTEMD_FEATURES);
984 static int prepare_reexecute(Manager *m, FILE **_f, FDSet **_fds, bool switching_root) {
993 r = manager_open_serialization(m, &f);
995 log_error_errno(r, "Failed to create serialization file: %m");
999 /* Make sure nothing is really destructed when we shut down */
1001 bus_manager_send_reloading(m, true);
1006 log_error_errno(r, "Failed to allocate fd set: %m");
1010 r = manager_serialize(m, f, fds, switching_root);
1012 log_error_errno(r, "Failed to serialize state: %m");
1016 if (fseeko(f, 0, SEEK_SET) < 0) {
1017 log_error_errno(errno, "Failed to rewind serialization fd: %m");
1021 r = fd_cloexec(fileno(f), false);
1023 log_error_errno(r, "Failed to disable O_CLOEXEC for serialization: %m");
1027 r = fdset_cloexec(fds, false);
1029 log_error_errno(r, "Failed to disable O_CLOEXEC for serialization fds: %m");
1047 static int bump_rlimit_nofile(struct rlimit *saved_rlimit) {
1051 assert(saved_rlimit);
1053 /* Save the original RLIMIT_NOFILE so that we can reset it
1054 * later when transitioning from the initrd to the main
1055 * systemd or suchlike. */
1056 if (getrlimit(RLIMIT_NOFILE, saved_rlimit) < 0)
1057 return log_error_errno(errno, "Reading RLIMIT_NOFILE failed: %m");
1059 /* Make sure forked processes get the default kernel setting */
1060 if (!arg_default_rlimit[RLIMIT_NOFILE]) {
1063 rl = newdup(struct rlimit, saved_rlimit, 1);
1067 arg_default_rlimit[RLIMIT_NOFILE] = rl;
1070 /* Bump up the resource limit for ourselves substantially */
1071 nl.rlim_cur = nl.rlim_max = 64*1024;
1072 r = setrlimit_closest(RLIMIT_NOFILE, &nl);
1074 return log_error_errno(r, "Setting RLIMIT_NOFILE failed: %m");
1079 static void test_mtab(void) {
1081 static const char ok[] =
1082 "/proc/self/mounts\0"
1084 "../proc/self/mounts\0"
1087 _cleanup_free_ char *p = NULL;
1090 /* Check that /etc/mtab is a symlink to the right place or
1091 * non-existing. But certainly not a file, or a symlink to
1092 * some weird place... */
1094 r = readlink_malloc("/etc/mtab", &p);
1097 if (r >= 0 && nulstr_contains(ok, p))
1100 log_warning("/etc/mtab is not a symlink or not pointing to /proc/self/mounts. "
1101 "This is not supported anymore. "
1102 "Please make sure to replace this file by a symlink to avoid incorrect or misleading mount(8) output.");
1105 static void test_usr(void) {
1107 /* Check that /usr is not a separate fs */
1109 if (dir_is_empty("/usr") <= 0)
1112 log_warning("/usr appears to be on its own filesystem and is not already mounted. This is not a supported setup. "
1113 "Some things will probably break (sometimes even silently) in mysterious ways. "
1114 "Consult http://freedesktop.org/wiki/Software/systemd/separate-usr-is-broken for more information.");
1117 static int initialize_join_controllers(void) {
1118 /* By default, mount "cpu" + "cpuacct" together, and "net_cls"
1119 * + "net_prio". We'd like to add "cpuset" to the mix, but
1120 * "cpuset" doesn't really work for groups with no initialized
1123 arg_join_controllers = new(char**, 3);
1124 if (!arg_join_controllers)
1127 arg_join_controllers[0] = strv_new("cpu", "cpuacct", NULL);
1128 arg_join_controllers[1] = strv_new("net_cls", "net_prio", NULL);
1129 arg_join_controllers[2] = NULL;
1131 if (!arg_join_controllers[0] || !arg_join_controllers[1]) {
1132 free_join_controllers();
1139 static int enforce_syscall_archs(Set *archs) {
1141 scmp_filter_ctx *seccomp;
1146 seccomp = seccomp_init(SCMP_ACT_ALLOW);
1150 SET_FOREACH(id, arg_syscall_archs, i) {
1151 r = seccomp_arch_add(seccomp, PTR_TO_UINT32(id) - 1);
1155 log_error_errno(r, "Failed to add architecture to seccomp: %m");
1160 r = seccomp_attr_set(seccomp, SCMP_FLTATR_CTL_NNP, 0);
1162 log_error_errno(r, "Failed to unset NO_NEW_PRIVS: %m");
1166 r = seccomp_load(seccomp);
1168 log_error_errno(r, "Failed to add install architecture seccomp: %m");
1171 seccomp_release(seccomp);
1178 static int status_welcome(void) {
1179 _cleanup_free_ char *pretty_name = NULL, *ansi_color = NULL;
1182 r = parse_env_file("/etc/os-release", NEWLINE,
1183 "PRETTY_NAME", &pretty_name,
1184 "ANSI_COLOR", &ansi_color,
1187 r = parse_env_file("/usr/lib/os-release", NEWLINE,
1188 "PRETTY_NAME", &pretty_name,
1189 "ANSI_COLOR", &ansi_color,
1193 if (r < 0 && r != -ENOENT)
1194 log_warning_errno(r, "Failed to read os-release file: %m");
1196 return status_printf(NULL, false, false,
1197 "\nWelcome to \x1B[%sm%s\x1B[0m!\n",
1198 isempty(ansi_color) ? "1" : ansi_color,
1199 isempty(pretty_name) ? "Linux" : pretty_name);
1202 static int write_container_id(void) {
1205 c = getenv("container");
1209 return write_string_file("/run/systemd/container", c);
1212 int main(int argc, char *argv[]) {
1214 int r, retval = EXIT_FAILURE;
1215 usec_t before_startup, after_startup;
1216 char timespan[FORMAT_TIMESPAN_MAX];
1218 bool reexecute = false;
1219 const char *shutdown_verb = NULL;
1220 dual_timestamp initrd_timestamp = { 0ULL, 0ULL };
1221 dual_timestamp userspace_timestamp = { 0ULL, 0ULL };
1222 dual_timestamp kernel_timestamp = { 0ULL, 0ULL };
1223 dual_timestamp security_start_timestamp = { 0ULL, 0ULL };
1224 dual_timestamp security_finish_timestamp = { 0ULL, 0ULL };
1225 static char systemd[] = "systemd";
1226 bool skip_setup = false;
1228 bool loaded_policy = false;
1229 bool arm_reboot_watchdog = false;
1230 bool queue_default_job = false;
1231 bool empty_etc = false;
1232 char *switch_root_dir = NULL, *switch_root_init = NULL;
1233 static struct rlimit saved_rlimit_nofile = { 0, 0 };
1234 const char *error_message = NULL;
1236 #ifdef HAVE_SYSV_COMPAT
1237 if (getpid() != 1 && strstr(program_invocation_short_name, "init")) {
1238 /* This is compatibility support for SysV, where
1239 * calling init as a user is identical to telinit. */
1242 execv(SYSTEMCTL_BINARY_PATH, argv);
1243 log_error_errno(errno, "Failed to exec " SYSTEMCTL_BINARY_PATH ": %m");
1248 dual_timestamp_from_monotonic(&kernel_timestamp, 0);
1249 dual_timestamp_get(&userspace_timestamp);
1251 /* Determine if this is a reexecution or normal bootup. We do
1252 * the full command line parsing much later, so let's just
1253 * have a quick peek here. */
1254 if (strv_find(argv+1, "--deserialize"))
1257 /* If we have switched root, do all the special setup
1259 if (strv_find(argv+1, "--switched-root"))
1262 /* If we get started via the /sbin/init symlink then we are
1263 called 'init'. After a subsequent reexecution we are then
1264 called 'systemd'. That is confusing, hence let's call us
1265 systemd right away. */
1266 program_invocation_short_name = systemd;
1267 prctl(PR_SET_NAME, systemd);
1272 log_show_color(isatty(STDERR_FILENO) > 0);
1273 log_set_upgrade_syslog_to_journal(true);
1275 /* Disable the umask logic */
1279 if (getpid() == 1 && detect_container(NULL) <= 0) {
1281 /* Running outside of a container as PID 1 */
1282 arg_running_as = SYSTEMD_SYSTEM;
1284 log_set_target(LOG_TARGET_KMSG);
1288 initrd_timestamp = userspace_timestamp;
1291 mount_setup_early();
1292 dual_timestamp_get(&security_start_timestamp);
1293 if (mac_selinux_setup(&loaded_policy) < 0) {
1294 error_message = "Failed to load SELinux policy";
1296 } else if (ima_setup() < 0) {
1297 error_message = "Failed to load IMA policy";
1299 } else if (mac_smack_setup(&loaded_policy) < 0) {
1300 error_message = "Failed to load SMACK policy";
1303 dual_timestamp_get(&security_finish_timestamp);
1306 if (mac_selinux_init(NULL) < 0) {
1307 error_message = "Failed to initialize SELinux policy";
1312 if (clock_is_localtime() > 0) {
1316 * The very first call of settimeofday() also does a time warp in the kernel.
1318 * In the rtc-in-local time mode, we set the kernel's timezone, and rely on
1319 * external tools to take care of maintaining the RTC and do all adjustments.
1320 * This matches the behavior of Windows, which leaves the RTC alone if the
1321 * registry tells that the RTC runs in UTC.
1323 r = clock_set_timezone(&min);
1325 log_error_errno(r, "Failed to apply local time delta, ignoring: %m");
1327 log_info("RTC configured in localtime, applying delta of %i minutes to system time.", min);
1328 } else if (!in_initrd()) {
1330 * Do a dummy very first call to seal the kernel's time warp magic.
1332 * Do not call this from inside the initrd. The initrd might not
1333 * carry /etc/adjtime with LOCAL, but the real system could be set up
1334 * that way. In such case, we need to delay the time-warp or the sealing
1335 * until we reach the real system.
1337 * Do not set the kernel's timezone. The concept of local time cannot
1338 * be supported reliably, the time will jump or be incorrect at every daylight
1339 * saving time change. All kernel local time concepts will be treated
1342 clock_reset_timewarp();
1346 /* Set the default for later on, but don't actually
1347 * open the logs like this for now. Note that if we
1348 * are transitioning from the initrd there might still
1349 * be a journal fd open, and we shouldn't attempt
1350 * opening that before we parsed /proc/cmdline which
1351 * might redirect output elsewhere. */
1352 log_set_target(LOG_TARGET_JOURNAL_OR_KMSG);
1354 } else if (getpid() == 1) {
1355 /* Running inside a container, as PID 1 */
1356 arg_running_as = SYSTEMD_SYSTEM;
1357 log_set_target(LOG_TARGET_CONSOLE);
1358 log_close_console(); /* force reopen of /dev/console */
1361 /* For later on, see above... */
1362 log_set_target(LOG_TARGET_JOURNAL);
1364 /* clear the kernel timestamp,
1365 * because we are in a container */
1366 kernel_timestamp.monotonic = 0ULL;
1367 kernel_timestamp.realtime = 0ULL;
1370 /* Running as user instance */
1371 arg_running_as = SYSTEMD_USER;
1372 log_set_target(LOG_TARGET_AUTO);
1375 /* clear the kernel timestamp,
1376 * because we are not PID 1 */
1377 kernel_timestamp.monotonic = 0ULL;
1378 kernel_timestamp.realtime = 0ULL;
1381 /* Initialize default unit */
1382 r = set_default_unit(SPECIAL_DEFAULT_TARGET);
1384 log_emergency_errno(r, "Failed to set default unit %s: %m", SPECIAL_DEFAULT_TARGET);
1385 error_message = "Failed to set default unit";
1389 r = initialize_join_controllers();
1391 error_message = "Failed to initalize cgroup controllers";
1395 /* Mount /proc, /sys and friends, so that /proc/cmdline and
1396 * /proc/$PID/fd is available. */
1397 if (getpid() == 1) {
1399 /* Load the kernel modules early, so that kdbus.ko is loaded before kdbusfs shall be mounted */
1403 r = mount_setup(loaded_policy);
1405 error_message = "Failed to mount API filesystems";
1410 /* Reset all signal handlers. */
1411 assert_se(reset_all_signal_handlers() == 0);
1413 ignore_signals(SIGNALS_IGNORE, -1);
1415 if (parse_config_file() < 0) {
1416 error_message = "Failed to parse config file";
1420 if (arg_running_as == SYSTEMD_SYSTEM) {
1421 r = parse_proc_cmdline(parse_proc_cmdline_item);
1423 log_warning_errno(r, "Failed to parse kernel command line, ignoring: %m");
1426 /* Note that this also parses bits from the kernel command
1427 * line, including "debug". */
1428 log_parse_environment();
1430 if (parse_argv(argc, argv) < 0) {
1431 error_message = "Failed to parse commandline arguments";
1435 if (arg_action == ACTION_TEST &&
1437 log_error("Don't run test mode as root.");
1441 if (arg_running_as == SYSTEMD_USER &&
1442 arg_action == ACTION_RUN &&
1444 log_error("Trying to run as user instance, but the system has not been booted with systemd.");
1448 if (arg_running_as == SYSTEMD_SYSTEM &&
1449 arg_action == ACTION_RUN &&
1450 running_in_chroot() > 0) {
1451 log_error("Cannot be run in a chroot() environment.");
1455 if (arg_action == ACTION_TEST)
1458 pager_open_if_enabled();
1460 if (arg_action == ACTION_HELP) {
1463 } else if (arg_action == ACTION_VERSION) {
1466 } else if (arg_action == ACTION_DUMP_CONFIGURATION_ITEMS) {
1467 unit_dump_config_items(stdout);
1468 retval = EXIT_SUCCESS;
1470 } else if (arg_action == ACTION_DONE) {
1471 retval = EXIT_SUCCESS;
1475 if (arg_running_as == SYSTEMD_USER &&
1476 !getenv("XDG_RUNTIME_DIR")) {
1477 log_error("Trying to run as user instance, but $XDG_RUNTIME_DIR is not set.");
1481 assert_se(arg_action == ACTION_RUN || arg_action == ACTION_TEST);
1483 /* Close logging fds, in order not to confuse fdset below */
1486 /* Remember open file descriptors for later deserialization */
1487 r = fdset_new_fill(&fds);
1489 log_emergency_errno(r, "Failed to allocate fd set: %m");
1490 error_message = "Failed to allocate fd set";
1493 fdset_cloexec(fds, true);
1495 if (arg_serialization)
1496 assert_se(fdset_remove(fds, fileno(arg_serialization)) >= 0);
1498 if (arg_running_as == SYSTEMD_SYSTEM)
1499 /* Become a session leader if we aren't one yet. */
1502 /* Move out of the way, so that we won't block unmounts */
1503 assert_se(chdir("/") == 0);
1505 /* Reset the console, but only if this is really init and we
1506 * are freshly booted */
1507 if (arg_running_as == SYSTEMD_SYSTEM && arg_action == ACTION_RUN) {
1509 /* If we are init, we connect stdin/stdout/stderr to
1510 * /dev/null and make sure we don't have a controlling
1514 if (getpid() == 1 && !skip_setup)
1518 /* Open the logging devices, if possible and necessary */
1521 if (arg_show_status == _SHOW_STATUS_UNSET)
1522 arg_show_status = SHOW_STATUS_YES;
1524 /* Make sure we leave a core dump without panicking the
1526 if (getpid() == 1) {
1527 install_crash_handler();
1529 r = mount_cgroup_controllers(arg_join_controllers);
1534 if (arg_running_as == SYSTEMD_SYSTEM) {
1535 const char *virtualization = NULL;
1537 log_info(PACKAGE_STRING " running in %ssystem mode. (" SYSTEMD_FEATURES ")",
1538 arg_action == ACTION_TEST ? "test " : "" );
1540 detect_virtualization(&virtualization);
1542 log_info("Detected virtualization '%s'.", virtualization);
1544 write_container_id();
1546 log_info("Detected architecture '%s'.", architecture_to_string(uname_architecture()));
1549 log_info("Running in initial RAM disk.");
1551 /* Let's check whether /etc is already populated. We
1552 * don't actually really check for that, but use
1553 * /etc/machine-id as flag file. This allows container
1554 * managers and installers to provision a couple of
1555 * files already. If the container manager wants to
1556 * provision the machine ID itself it should pass
1557 * $container_uuid to PID 1. */
1559 empty_etc = access("/etc/machine-id", F_OK) < 0;
1561 log_info("Running with unpopulated /etc.");
1563 _cleanup_free_ char *t;
1565 t = uid_to_name(getuid());
1566 log_debug(PACKAGE_STRING " running in %suser mode for user "UID_FMT"/%s. (" SYSTEMD_FEATURES ")",
1567 arg_action == ACTION_TEST ? " test" : "", getuid(), t);
1570 if (arg_running_as == SYSTEMD_SYSTEM && !skip_setup) {
1571 if (arg_show_status > 0 || plymouth_running())
1575 machine_id_setup(NULL);
1582 if (arg_running_as == SYSTEMD_SYSTEM && arg_runtime_watchdog > 0)
1583 watchdog_set_timeout(&arg_runtime_watchdog);
1585 if (arg_timer_slack_nsec != NSEC_INFINITY)
1586 if (prctl(PR_SET_TIMERSLACK, arg_timer_slack_nsec) < 0)
1587 log_error_errno(errno, "Failed to adjust timer slack: %m");
1589 if (arg_capability_bounding_set_drop) {
1590 r = capability_bounding_set_drop_usermode(arg_capability_bounding_set_drop);
1592 log_emergency_errno(r, "Failed to drop capability bounding set of usermode helpers: %m");
1593 error_message = "Failed to drop capability bounding set of usermode helpers";
1596 r = capability_bounding_set_drop(arg_capability_bounding_set_drop, true);
1598 log_emergency_errno(r, "Failed to drop capability bounding set: %m");
1599 error_message = "Failed to drop capability bounding set";
1604 if (arg_syscall_archs) {
1605 r = enforce_syscall_archs(arg_syscall_archs);
1607 error_message = "Failed to set syscall architectures";
1612 if (arg_running_as == SYSTEMD_USER) {
1613 /* Become reaper of our children */
1614 if (prctl(PR_SET_CHILD_SUBREAPER, 1) < 0) {
1615 log_warning_errno(errno, "Failed to make us a subreaper: %m");
1616 if (errno == EINVAL)
1617 log_info("Perhaps the kernel version is too old (< 3.4?)");
1621 if (arg_running_as == SYSTEMD_SYSTEM) {
1622 bump_rlimit_nofile(&saved_rlimit_nofile);
1625 r = unit_file_preset_all(UNIT_FILE_SYSTEM, false, NULL, UNIT_FILE_PRESET_FULL, false, NULL, 0);
1627 log_warning_errno(r, "Failed to populate /etc with preset unit settings, ignoring: %m");
1629 log_info("Populated /etc with preset unit settings.");
1633 r = manager_new(arg_running_as, arg_action == ACTION_TEST, &m);
1635 log_emergency_errno(r, "Failed to allocate manager object: %m");
1636 error_message = "Failed to allocate manager object";
1640 m->confirm_spawn = arg_confirm_spawn;
1641 m->default_timer_accuracy_usec = arg_default_timer_accuracy_usec;
1642 m->default_std_output = arg_default_std_output;
1643 m->default_std_error = arg_default_std_error;
1644 m->default_restart_usec = arg_default_restart_usec;
1645 m->default_timeout_start_usec = arg_default_timeout_start_usec;
1646 m->default_timeout_stop_usec = arg_default_timeout_stop_usec;
1647 m->default_start_limit_interval = arg_default_start_limit_interval;
1648 m->default_start_limit_burst = arg_default_start_limit_burst;
1649 m->default_cpu_accounting = arg_default_cpu_accounting;
1650 m->default_blockio_accounting = arg_default_blockio_accounting;
1651 m->default_memory_accounting = arg_default_memory_accounting;
1652 m->runtime_watchdog = arg_runtime_watchdog;
1653 m->shutdown_watchdog = arg_shutdown_watchdog;
1655 m->userspace_timestamp = userspace_timestamp;
1656 m->kernel_timestamp = kernel_timestamp;
1657 m->initrd_timestamp = initrd_timestamp;
1658 m->security_start_timestamp = security_start_timestamp;
1659 m->security_finish_timestamp = security_finish_timestamp;
1661 manager_set_default_rlimits(m, arg_default_rlimit);
1662 manager_environment_add(m, NULL, arg_default_environment);
1663 manager_set_show_status(m, arg_show_status);
1664 manager_set_first_boot(m, empty_etc);
1666 /* Remember whether we should queue the default job */
1667 queue_default_job = !arg_serialization || arg_switched_root;
1669 before_startup = now(CLOCK_MONOTONIC);
1671 r = manager_startup(m, arg_serialization, fds);
1673 log_error_errno(r, "Failed to fully start up daemon: %m");
1675 /* This will close all file descriptors that were opened, but
1676 * not claimed by any unit. */
1680 if (arg_serialization) {
1681 fclose(arg_serialization);
1682 arg_serialization = NULL;
1685 if (queue_default_job) {
1686 _cleanup_bus_error_free_ sd_bus_error error = SD_BUS_ERROR_NULL;
1687 Unit *target = NULL;
1688 Job *default_unit_job;
1690 log_debug("Activating default unit: %s", arg_default_unit);
1692 r = manager_load_unit(m, arg_default_unit, NULL, &error, &target);
1694 log_error("Failed to load default target: %s", bus_error_message(&error, r));
1695 else if (target->load_state == UNIT_ERROR || target->load_state == UNIT_NOT_FOUND)
1696 log_error_errno(target->load_error, "Failed to load default target: %m");
1697 else if (target->load_state == UNIT_MASKED)
1698 log_error("Default target masked.");
1700 if (!target || target->load_state != UNIT_LOADED) {
1701 log_info("Trying to load rescue target...");
1703 r = manager_load_unit(m, SPECIAL_RESCUE_TARGET, NULL, &error, &target);
1705 log_emergency("Failed to load rescue target: %s", bus_error_message(&error, r));
1706 error_message = "Failed to load rescue target";
1708 } else if (target->load_state == UNIT_ERROR || target->load_state == UNIT_NOT_FOUND) {
1709 log_emergency_errno(target->load_error, "Failed to load rescue target: %m");
1710 error_message = "Failed to load rescue target";
1712 } else if (target->load_state == UNIT_MASKED) {
1713 log_emergency("Rescue target masked.");
1714 error_message = "Rescue target masked";
1719 assert(target->load_state == UNIT_LOADED);
1721 if (arg_action == ACTION_TEST) {
1722 printf("-> By units:\n");
1723 manager_dump_units(m, stdout, "\t");
1726 r = manager_add_job(m, JOB_START, target, JOB_ISOLATE, false, &error, &default_unit_job);
1728 log_debug("Default target could not be isolated, starting instead: %s", bus_error_message(&error, r));
1730 r = manager_add_job(m, JOB_START, target, JOB_REPLACE, false, &error, &default_unit_job);
1732 log_emergency("Failed to start default target: %s", bus_error_message(&error, r));
1733 error_message = "Failed to start default target";
1737 log_emergency("Failed to isolate default target: %s", bus_error_message(&error, r));
1738 error_message = "Failed to isolate default target";
1742 m->default_unit_job_id = default_unit_job->id;
1744 after_startup = now(CLOCK_MONOTONIC);
1745 log_full(arg_action == ACTION_TEST ? LOG_INFO : LOG_DEBUG,
1746 "Loaded units and determined initial transaction in %s.",
1747 format_timespan(timespan, sizeof(timespan), after_startup - before_startup, 100 * USEC_PER_MSEC));
1749 if (arg_action == ACTION_TEST) {
1750 printf("-> By jobs:\n");
1751 manager_dump_jobs(m, stdout, "\t");
1752 retval = EXIT_SUCCESS;
1758 r = manager_loop(m);
1760 log_emergency_errno(r, "Failed to run main loop: %m");
1761 error_message = "Failed to run main loop";
1765 switch (m->exit_code) {
1768 retval = EXIT_SUCCESS;
1772 case MANAGER_RELOAD:
1773 log_info("Reloading.");
1774 r = manager_reload(m);
1776 log_error_errno(r, "Failed to reload: %m");
1779 case MANAGER_REEXECUTE:
1781 if (prepare_reexecute(m, &arg_serialization, &fds, false) < 0) {
1782 error_message = "Failed to prepare for reexection";
1787 log_notice("Reexecuting.");
1790 case MANAGER_SWITCH_ROOT:
1791 /* Steal the switch root parameters */
1792 switch_root_dir = m->switch_root;
1793 switch_root_init = m->switch_root_init;
1794 m->switch_root = m->switch_root_init = NULL;
1796 if (!switch_root_init)
1797 if (prepare_reexecute(m, &arg_serialization, &fds, true) < 0) {
1798 error_message = "Failed to prepare for reexection";
1803 log_notice("Switching root.");
1806 case MANAGER_REBOOT:
1807 case MANAGER_POWEROFF:
1809 case MANAGER_KEXEC: {
1810 static const char * const table[_MANAGER_EXIT_CODE_MAX] = {
1811 [MANAGER_REBOOT] = "reboot",
1812 [MANAGER_POWEROFF] = "poweroff",
1813 [MANAGER_HALT] = "halt",
1814 [MANAGER_KEXEC] = "kexec"
1817 assert_se(shutdown_verb = table[m->exit_code]);
1818 arm_reboot_watchdog = m->exit_code == MANAGER_REBOOT;
1820 log_notice("Shutting down.");
1825 assert_not_reached("Unknown exit code.");
1833 arg_shutdown_watchdog = m->shutdown_watchdog;
1834 m = manager_free(m);
1836 for (j = 0; j < ELEMENTSOF(arg_default_rlimit); j++) {
1837 free(arg_default_rlimit[j]);
1838 arg_default_rlimit[j] = NULL;
1841 free(arg_default_unit);
1842 arg_default_unit = NULL;
1844 free_join_controllers();
1846 strv_free(arg_default_environment);
1847 arg_default_environment = NULL;
1849 set_free(arg_syscall_archs);
1850 arg_syscall_archs = NULL;
1852 mac_selinux_finish();
1856 unsigned i, args_size;
1858 /* Close and disarm the watchdog, so that the new
1859 * instance can reinitialize it, but doesn't get
1860 * rebooted while we do that */
1861 watchdog_close(true);
1863 /* Reset the RLIMIT_NOFILE to the kernel default, so
1864 * that the new systemd can pass the kernel default to
1865 * its child processes */
1866 if (saved_rlimit_nofile.rlim_cur > 0)
1867 setrlimit(RLIMIT_NOFILE, &saved_rlimit_nofile);
1869 if (switch_root_dir) {
1870 /* Kill all remaining processes from the
1871 * initrd, but don't wait for them, so that we
1872 * can handle the SIGCHLD for them after
1874 broadcast_signal(SIGTERM, false, true);
1876 /* And switch root with MS_MOVE, because we remove the old directory afterwards and detach it. */
1877 r = switch_root(switch_root_dir, "/mnt", true, MS_MOVE);
1879 log_error_errno(r, "Failed to switch root, trying to continue: %m");
1882 args_size = MAX(6, argc+1);
1883 args = newa(const char*, args_size);
1885 if (!switch_root_init) {
1888 /* First try to spawn ourselves with the right
1889 * path, and with full serialization. We do
1890 * this only if the user didn't specify an
1891 * explicit init to spawn. */
1893 assert(arg_serialization);
1896 snprintf(sfd, sizeof(sfd), "%i", fileno(arg_serialization));
1900 args[i++] = SYSTEMD_BINARY_PATH;
1901 if (switch_root_dir)
1902 args[i++] = "--switched-root";
1903 args[i++] = arg_running_as == SYSTEMD_SYSTEM ? "--system" : "--user";
1904 args[i++] = "--deserialize";
1908 /* do not pass along the environment we inherit from the kernel or initrd */
1909 if (switch_root_dir)
1912 assert(i <= args_size);
1913 execv(args[0], (char* const*) args);
1916 /* Try the fallback, if there is any, without any
1917 * serialization. We pass the original argv[] and
1918 * envp[]. (Well, modulo the ordering changes due to
1919 * getopt() in argv[], and some cleanups in envp[],
1920 * but let's hope that doesn't matter.) */
1922 if (arg_serialization) {
1923 fclose(arg_serialization);
1924 arg_serialization = NULL;
1932 /* Reopen the console */
1933 make_console_stdio();
1935 for (j = 1, i = 1; j < (unsigned) argc; j++)
1936 args[i++] = argv[j];
1938 assert(i <= args_size);
1940 /* Reenable any blocked signals, especially important
1941 * if we switch from initial ramdisk to init=... */
1942 reset_all_signal_handlers();
1943 reset_signal_mask();
1945 if (switch_root_init) {
1946 args[0] = switch_root_init;
1947 execv(args[0], (char* const*) args);
1948 log_warning_errno(errno, "Failed to execute configured init, trying fallback: %m");
1951 args[0] = "/sbin/init";
1952 execv(args[0], (char* const*) args);
1954 if (errno == ENOENT) {
1955 log_warning("No /sbin/init, trying fallback");
1957 args[0] = "/bin/sh";
1959 execv(args[0], (char* const*) args);
1960 log_error_errno(errno, "Failed to execute /bin/sh, giving up: %m");
1962 log_warning_errno(errno, "Failed to execute /sbin/init, giving up: %m");
1965 if (arg_serialization) {
1966 fclose(arg_serialization);
1967 arg_serialization = NULL;
1975 #ifdef HAVE_VALGRIND_VALGRIND_H
1976 /* If we are PID 1 and running under valgrind, then let's exit
1977 * here explicitly. valgrind will only generate nice output on
1978 * exit(), not on exec(), hence let's do the former not the
1980 if (getpid() == 1 && RUNNING_ON_VALGRIND)
1984 if (shutdown_verb) {
1985 char log_level[DECIMAL_STR_MAX(int) + 1];
1986 const char* command_line[9] = {
1987 SYSTEMD_SHUTDOWN_BINARY_PATH,
1989 "--log-level", log_level,
1993 _cleanup_strv_free_ char **env_block = NULL;
1995 assert(command_line[pos] == NULL);
1996 env_block = strv_copy(environ);
1998 snprintf(log_level, sizeof(log_level), "%d", log_get_max_level());
2000 switch (log_get_target()) {
2001 case LOG_TARGET_KMSG:
2002 case LOG_TARGET_JOURNAL_OR_KMSG:
2003 case LOG_TARGET_SYSLOG_OR_KMSG:
2004 command_line[pos++] = "kmsg";
2007 case LOG_TARGET_CONSOLE:
2009 command_line[pos++] = "console";
2013 if (log_get_show_color())
2014 command_line[pos++] = "--log-color";
2016 if (log_get_show_location())
2017 command_line[pos++] = "--log-location";
2019 assert(pos < ELEMENTSOF(command_line));
2021 if (arm_reboot_watchdog && arg_shutdown_watchdog > 0) {
2024 /* If we reboot let's set the shutdown
2025 * watchdog and tell the shutdown binary to
2026 * repeatedly ping it */
2027 watchdog_set_timeout(&arg_shutdown_watchdog);
2028 watchdog_close(false);
2030 /* Tell the binary how often to ping, ignore failure */
2031 if (asprintf(&e, "WATCHDOG_USEC="USEC_FMT, arg_shutdown_watchdog) > 0)
2032 strv_push(&env_block, e);
2034 watchdog_close(true);
2036 /* Avoid the creation of new processes forked by the
2037 * kernel; at this point, we will not listen to the
2039 if (detect_container(NULL) <= 0)
2040 cg_uninstall_release_agent(SYSTEMD_CGROUP_CONTROLLER);
2042 execve(SYSTEMD_SHUTDOWN_BINARY_PATH, (char **) command_line, env_block);
2043 log_error_errno(errno, "Failed to execute shutdown binary, %s: %m",
2044 getpid() == 1 ? "freezing" : "quitting");
2047 if (getpid() == 1) {
2049 manager_status_printf(NULL, STATUS_TYPE_EMERGENCY,
2050 ANSI_HIGHLIGHT_RED_ON "!!!!!!" ANSI_HIGHLIGHT_OFF,
2051 "%s, freezing.", error_message);