chiark / gitweb /
core: populate unit file set with preset data if we boot with empty /etc
[elogind.git] / src / core / main.c
1 /*-*- Mode: C; c-basic-offset: 8; indent-tabs-mode: nil -*-*/
2
3 /***
4   This file is part of systemd.
5
6   Copyright 2010 Lennart Poettering
7
8   systemd is free software; you can redistribute it and/or modify it
9   under the terms of the GNU Lesser General Public License as published by
10   the Free Software Foundation; either version 2.1 of the License, or
11   (at your option) any later version.
12
13   systemd is distributed in the hope that it will be useful, but
14   WITHOUT ANY WARRANTY; without even the implied warranty of
15   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
16   Lesser General Public License for more details.
17
18   You should have received a copy of the GNU Lesser General Public License
19   along with systemd; If not, see <http://www.gnu.org/licenses/>.
20 ***/
21
22 #include <stdio.h>
23 #include <errno.h>
24 #include <string.h>
25 #include <unistd.h>
26 #include <sys/types.h>
27 #include <sys/stat.h>
28 #include <getopt.h>
29 #include <signal.h>
30 #include <sys/wait.h>
31 #include <fcntl.h>
32 #include <sys/prctl.h>
33 #include <sys/mount.h>
34
35 #ifdef HAVE_VALGRIND_VALGRIND_H
36 #include <valgrind/valgrind.h>
37 #endif
38 #ifdef HAVE_SECCOMP
39 #include <seccomp.h>
40 #endif
41
42 #include "sd-daemon.h"
43 #include "sd-messages.h"
44 #include "sd-bus.h"
45 #include "manager.h"
46 #include "log.h"
47 #include "load-fragment.h"
48 #include "fdset.h"
49 #include "special.h"
50 #include "conf-parser.h"
51 #include "missing.h"
52 #include "label.h"
53 #include "build.h"
54 #include "strv.h"
55 #include "def.h"
56 #include "virt.h"
57 #include "architecture.h"
58 #include "watchdog.h"
59 #include "path-util.h"
60 #include "switch-root.h"
61 #include "capability.h"
62 #include "killall.h"
63 #include "env-util.h"
64 #include "clock-util.h"
65 #include "fileio.h"
66 #include "dbus-manager.h"
67 #include "bus-error.h"
68 #include "bus-util.h"
69
70 #include "mount-setup.h"
71 #include "loopback-setup.h"
72 #include "hostname-setup.h"
73 #include "machine-id-setup.h"
74 #include "selinux-setup.h"
75 #include "ima-setup.h"
76 #include "smack-setup.h"
77 #ifdef HAVE_KMOD
78 #include "kmod-setup.h"
79 #endif
80
/* What this invocation has been asked to do; defaults to ACTION_RUN. */
81 static enum {
82         ACTION_RUN,
83         ACTION_HELP,
84         ACTION_VERSION,
85         ACTION_TEST,
86         ACTION_DUMP_CONFIGURATION_ITEMS,
87         ACTION_DONE
88 } arg_action = ACTION_RUN;
/* Heap-allocated name of the default unit; only replaced through set_default_unit(). */
89 static char *arg_default_unit = NULL;
/* Selects which configuration file parse_config_file() reads (system.conf vs. user.conf). */
90 static SystemdRunningAs arg_running_as = _SYSTEMD_RUNNING_AS_INVALID;
/* Crash handling knobs read by crash(). Settable via DumpCore=/CrashShell=/CrashChVT=
 * in the [Manager] section and via the systemd.dump_core, systemd.crash_shell and
 * systemd.crash_chvt kernel switches. */
91 static bool arg_dump_core = true;
92 static bool arg_crash_shell = false;
93 static int arg_crash_chvt = -1;
94 static bool arg_confirm_spawn = false;
/* Stays _SHOW_STATUS_UNSET until configured; a bare "quiet" on the kernel command
 * line turns an unset value into SHOW_STATUS_AUTO. */
95 static ShowStatus arg_show_status = _SHOW_STATUS_UNSET;
96 static bool arg_switched_root = false;
/* NULL-terminated array of string vectors; freed and rebuilt by
 * config_parse_join_controllers(). */
97 static char ***arg_join_controllers = NULL;
/* Defaults below may be overridden from the [Manager] section by parse_config_file();
 * the two standard output/error defaults and the default environment can additionally
 * be changed from the kernel command line. */
98 static ExecOutput arg_default_std_output = EXEC_OUTPUT_JOURNAL;
99 static ExecOutput arg_default_std_error = EXEC_OUTPUT_INHERIT;
100 static usec_t arg_default_restart_usec = DEFAULT_RESTART_USEC;
101 static usec_t arg_default_timeout_start_usec = DEFAULT_TIMEOUT_USEC;
102 static usec_t arg_default_timeout_stop_usec = DEFAULT_TIMEOUT_USEC;
103 static usec_t arg_default_start_limit_interval = DEFAULT_START_LIMIT_INTERVAL;
104 static unsigned arg_default_start_limit_burst = DEFAULT_START_LIMIT_BURST;
105 static usec_t arg_runtime_watchdog = 0;
106 static usec_t arg_shutdown_watchdog = 10 * USEC_PER_MINUTE;
107 static char **arg_default_environment = NULL;
/* One slot per resource limit, indexed by RLIMIT_*; filled by the DefaultLimit*= settings. */
108 static struct rlimit *arg_default_rlimit[_RLIMIT_MAX] = {};
109 static uint64_t arg_capability_bounding_set_drop = 0;
110 static nsec_t arg_timer_slack_nsec = (nsec_t) -1;
111 static usec_t arg_default_timer_accuracy_usec = 1 * USEC_PER_MINUTE;
112 static Set* arg_syscall_archs = NULL;
113 static FILE* arg_serialization = NULL;
114 static bool arg_default_cpu_accounting = false;
115 static bool arg_default_blockio_accounting = false;
116 static bool arg_default_memory_accounting = false;
117
/* Signal handler that intentionally does nothing. crash() installs it for
 * SIGCHLD while it waits for the core-dumping child. */
static void nop_handler(int sig) {
        (void) sig;
}
119
120 noreturn static void crash(int sig) {
121
122         if (getpid() != 1)
123                 /* Pass this on immediately, if this is not PID 1 */
124                 raise(sig);
125         else if (!arg_dump_core)
126                 log_error("Caught <%s>, not dumping core.", signal_to_string(sig));
127         else {
128                 struct sigaction sa = {
129                         .sa_handler = nop_handler,
130                         .sa_flags = SA_NOCLDSTOP|SA_RESTART,
131                 };
132                 pid_t pid;
133
134                 /* We want to wait for the core process, hence let's enable SIGCHLD */
135                 sigaction(SIGCHLD, &sa, NULL);
136
137                 pid = fork();
138                 if (pid < 0)
139                         log_error("Caught <%s>, cannot fork for core dump: %m", signal_to_string(sig));
140
141                 else if (pid == 0) {
142                         struct rlimit rl = {};
143
144                         /* Enable default signal handler for core dump */
145                         zero(sa);
146                         sa.sa_handler = SIG_DFL;
147                         sigaction(sig, &sa, NULL);
148
149                         /* Don't limit the core dump size */
150                         rl.rlim_cur = RLIM_INFINITY;
151                         rl.rlim_max = RLIM_INFINITY;
152                         setrlimit(RLIMIT_CORE, &rl);
153
154                         /* Just to be sure... */
155                         chdir("/");
156
157                         /* Raise the signal again */
158                         raise(sig);
159
160                         assert_not_reached("We shouldn't be here...");
161                         _exit(1);
162
163                 } else {
164                         siginfo_t status;
165                         int r;
166
167                         /* Order things nicely. */
168                         r = wait_for_terminate(pid, &status);
169                         if (r < 0)
170                                 log_error("Caught <%s>, waitpid() failed: %s", signal_to_string(sig), strerror(-r));
171                         else if (status.si_code != CLD_DUMPED)
172                                 log_error("Caught <%s>, core dump failed.", signal_to_string(sig));
173                         else
174                                 log_error("Caught <%s>, dumped core as pid "PID_FMT".", signal_to_string(sig), pid);
175                 }
176         }
177
178         if (arg_crash_chvt)
179                 chvt(arg_crash_chvt);
180
181         if (arg_crash_shell) {
182                 struct sigaction sa = {
183                         .sa_handler = SIG_IGN,
184                         .sa_flags = SA_NOCLDSTOP|SA_NOCLDWAIT|SA_RESTART,
185                 };
186                 pid_t pid;
187
188                 log_info("Executing crash shell in 10s...");
189                 sleep(10);
190
191                 /* Let the kernel reap children for us */
192                 assert_se(sigaction(SIGCHLD, &sa, NULL) == 0);
193
194                 pid = fork();
195                 if (pid < 0)
196                         log_error("Failed to fork off crash shell: %m");
197                 else if (pid == 0) {
198                         make_console_stdio();
199                         execl("/bin/sh", "/bin/sh", NULL);
200
201                         log_error("execl() failed: %m");
202                         _exit(1);
203                 }
204
205                 log_info("Successfully spawned crash shell as pid "PID_FMT".", pid);
206         }
207
208         log_info("Freezing execution.");
209         freeze();
210 }
211
212 static void install_crash_handler(void) {
213         struct sigaction sa = {
214                 .sa_handler = crash,
215                 .sa_flags = SA_NODEFER,
216         };
217
218         sigaction_many(&sa, SIGNALS_CRASH_HANDLER, -1);
219 }
220
221 static int console_setup(bool do_reset) {
222         int tty_fd, r;
223
224         /* If we are init, we connect stdin/stdout/stderr to /dev/null
225          * and make sure we don't have a controlling tty. */
226
227         release_terminal();
228
229         if (!do_reset)
230                 return 0;
231
232         tty_fd = open_terminal("/dev/console", O_WRONLY|O_NOCTTY|O_CLOEXEC);
233         if (tty_fd < 0) {
234                 log_error("Failed to open /dev/console: %s", strerror(-tty_fd));
235                 return -tty_fd;
236         }
237
238         /* We don't want to force text mode.
239          * plymouth may be showing pictures already from initrd. */
240         r = reset_terminal_fd(tty_fd, false);
241         if (r < 0)
242                 log_error("Failed to reset /dev/console: %s", strerror(-r));
243
244         safe_close(tty_fd);
245         return r;
246 }
247
248 static int set_default_unit(const char *u) {
249         char *c;
250
251         assert(u);
252
253         c = strdup(u);
254         if (!c)
255                 return -ENOMEM;
256
257         free(arg_default_unit);
258         arg_default_unit = c;
259
260         return 0;
261 }
262
263 static int parse_proc_cmdline_item(const char *key, const char *value) {
264
265         static const char * const rlmap[] = {
266                 "emergency", SPECIAL_EMERGENCY_TARGET,
267                 "-b",        SPECIAL_EMERGENCY_TARGET,
268                 "single",    SPECIAL_RESCUE_TARGET,
269                 "-s",        SPECIAL_RESCUE_TARGET,
270                 "s",         SPECIAL_RESCUE_TARGET,
271                 "S",         SPECIAL_RESCUE_TARGET,
272                 "1",         SPECIAL_RESCUE_TARGET,
273                 "2",         SPECIAL_RUNLEVEL2_TARGET,
274                 "3",         SPECIAL_RUNLEVEL3_TARGET,
275                 "4",         SPECIAL_RUNLEVEL4_TARGET,
276                 "5",         SPECIAL_RUNLEVEL5_TARGET,
277         };
278         int r;
279
280         assert(key);
281
282         if (streq(key, "systemd.unit") && value) {
283
284                 if (!in_initrd())
285                         return set_default_unit(value);
286
287         } else if (streq(key, "rd.systemd.unit") && value) {
288
289                 return set_default_unit(value);
290
291         } else if (streq(key, "systemd.log_target") && value) {
292
293                 if (log_set_target_from_string(value) < 0)
294                         log_warning("Failed to parse log target %s. Ignoring.", value);
295
296         } else if (streq(key, "systemd.log_level") && value) {
297
298                 if (log_set_max_level_from_string(value) < 0)
299                         log_warning("Failed to parse log level %s. Ignoring.", value);
300
301         } else if (streq(key, "systemd.log_color") && value) {
302
303                 if (log_show_color_from_string(value) < 0)
304                         log_warning("Failed to parse log color setting %s. Ignoring.", value);
305
306         } else if (streq(key, "systemd.log_location") && value) {
307
308                 if (log_show_location_from_string(value) < 0)
309                         log_warning("Failed to parse log location setting %s. Ignoring.", value);
310
311         } else if (streq(key, "systemd.dump_core") && value) {
312
313                 r = parse_boolean(value);
314                 if (r < 0)
315                         log_warning("Failed to parse dump core switch %s. Ignoring.", value);
316                 else
317                         arg_dump_core = r;
318
319         } else if (streq(key, "systemd.crash_shell") && value) {
320
321                 r = parse_boolean(value);
322                 if (r < 0)
323                         log_warning("Failed to parse crash shell switch %s. Ignoring.", value);
324                 else
325                         arg_crash_shell = r;
326
327         } else if (streq(key, "systemd.crash_chvt") && value) {
328
329                 if (safe_atoi(value, &r) < 0)
330                         log_warning("Failed to parse crash chvt switch %s. Ignoring.", value);
331                 else
332                         arg_crash_chvt = r;
333
334         } else if (streq(key, "systemd.confirm_spawn") && value) {
335
336                 r = parse_boolean(value);
337                 if (r < 0)
338                         log_warning("Failed to parse confirm spawn switch %s. Ignoring.", value);
339                 else
340                         arg_confirm_spawn = r;
341
342         } else if (streq(key, "systemd.show_status") && value) {
343
344                 r = parse_show_status(value, &arg_show_status);
345                 if (r < 0)
346                         log_warning("Failed to parse show status switch %s. Ignoring.", value);
347
348         } else if (streq(key, "systemd.default_standard_output") && value) {
349
350                 r = exec_output_from_string(value);
351                 if (r < 0)
352                         log_warning("Failed to parse default standard output switch %s. Ignoring.", value);
353                 else
354                         arg_default_std_output = r;
355
356         } else if (streq(key, "systemd.default_standard_error") && value) {
357
358                 r = exec_output_from_string(value);
359                 if (r < 0)
360                         log_warning("Failed to parse default standard error switch %s. Ignoring.", value);
361                 else
362                         arg_default_std_error = r;
363
364         } else if (streq(key, "systemd.setenv") && value) {
365
366                 if (env_assignment_is_valid(value)) {
367                         char **env;
368
369                         env = strv_env_set(arg_default_environment, value);
370                         if (env)
371                                 arg_default_environment = env;
372                         else
373                                 log_warning("Setting environment variable '%s' failed, ignoring: %s", value, strerror(ENOMEM));
374                 } else
375                         log_warning("Environment variable name '%s' is not valid. Ignoring.", value);
376
377         } else if (!streq(key, "systemd.restore_state") &&
378                    !streq(key, "systemd.gpt_auto") &&
379                    (startswith(key, "systemd.") || startswith(key, "rd.systemd."))) {
380
381                 const char *c;
382
383                 /* Ignore systemd.journald.xyz and friends */
384                 c = key;
385                 if (startswith(c, "rd."))
386                         c += 3;
387                 if (startswith(c, "systemd."))
388                         c += 8;
389                 if (c[strcspn(c, ".=")] != '.')  {
390
391                         log_warning("Unknown kernel switch %s. Ignoring.", key);
392
393                         log_info("Supported kernel switches:\n"
394                                  "systemd.unit=UNIT                        Default unit to start\n"
395                                  "rd.systemd.unit=UNIT                     Default unit to start when run in initrd\n"
396                                  "systemd.dump_core=0|1                    Dump core on crash\n"
397                                  "systemd.crash_shell=0|1                  Run shell on crash\n"
398                                  "systemd.crash_chvt=N                     Change to VT #N on crash\n"
399                                  "systemd.confirm_spawn=0|1                Confirm every process spawn\n"
400                                  "systemd.show_status=0|1|auto             Show status updates on the console during bootup\n"
401                                  "systemd.log_target=console|kmsg|journal|journal-or-kmsg|syslog|syslog-or-kmsg|null\n"
402                                  "                                         Log target\n"
403                                  "systemd.log_level=LEVEL                  Log level\n"
404                                  "systemd.log_color=0|1                    Highlight important log messages\n"
405                                  "systemd.log_location=0|1                 Include code location in log messages\n"
406                                  "systemd.default_standard_output=null|tty|syslog|syslog+console|kmsg|kmsg+console|journal|journal+console\n"
407                                  "                                         Set default log output for services\n"
408                                  "systemd.default_standard_error=null|tty|syslog|syslog+console|kmsg|kmsg+console|journal|journal+console\n"
409                                  "                                         Set default log error output for services\n"
410                                  "systemd.setenv=ASSIGNMENT                Set an environment variable for all spawned processes\n"
411                                  "systemd.restore_state=0|1                Restore backlight/rfkill state at boot\n");
412                 }
413
414         } else if (streq(key, "quiet") && !value) {
415
416                 log_set_max_level(LOG_NOTICE);
417
418                 if (arg_show_status == _SHOW_STATUS_UNSET)
419                         arg_show_status = SHOW_STATUS_AUTO;
420
421         } else if (streq(key, "debug") && !value) {
422
423                 log_set_max_level(LOG_DEBUG);
424
425                 if (detect_container(NULL) > 0)
426                         log_set_target(LOG_TARGET_CONSOLE);
427
428         } else if (!in_initrd() && !value) {
429                 unsigned i;
430
431                 /* SysV compatibility */
432                 for (i = 0; i < ELEMENTSOF(rlmap); i += 2)
433                         if (streq(key, rlmap[i]))
434                                 return set_default_unit(rlmap[i+1]);
435         }
436
437         return 0;
438 }
439
/* Generates a configuration parser callback called `name` that feeds the
 * right-hand side of the setting to `func` (a function taking the string and
 * returning a negative errno-style value on failure). Failures are reported
 * through log_syntax() using `descr` to say what was invalid; the callback
 * itself always returns 0 so that a bad value does not abort parsing. */
#define DEFINE_SETTER(name, func, descr)                              \
        static int name(const char *unit,                             \
                        const char *filename,                         \
                        unsigned line,                                \
                        const char *section,                          \
                        unsigned section_line,                        \
                        const char *lvalue,                           \
                        int ltype,                                    \
                        const char *rvalue,                           \
                        void *data,                                   \
                        void *userdata) {                             \
                                                                      \
                int r;                                                \
                                                                      \
                assert(filename);                                     \
                assert(lvalue);                                       \
                assert(rvalue);                                       \
                                                                      \
                r = func(rvalue);                                     \
                if (r < 0)                                            \
                        log_syntax(unit, LOG_ERR, filename, line, -r, \
                                   "Invalid " descr " '%s': %s",      \
                                   rvalue, strerror(-r));             \
                                                                      \
                return 0;                                             \
        }

DEFINE_SETTER(config_parse_level2, log_set_max_level_from_string, "log level")
DEFINE_SETTER(config_parse_target, log_set_target_from_string, "target")
DEFINE_SETTER(config_parse_color, log_show_color_from_string, "color")
DEFINE_SETTER(config_parse_location, log_show_location_from_string, "location")
471
472 static int config_parse_cpu_affinity2(
473                 const char *unit,
474                 const char *filename,
475                 unsigned line,
476                 const char *section,
477                 unsigned section_line,
478                 const char *lvalue,
479                 int ltype,
480                 const char *rvalue,
481                 void *data,
482                 void *userdata) {
483
484         char *w;
485         size_t l;
486         char *state;
487         cpu_set_t *c = NULL;
488         unsigned ncpus = 0;
489
490         assert(filename);
491         assert(lvalue);
492         assert(rvalue);
493
494         FOREACH_WORD_QUOTED(w, l, rvalue, state) {
495                 char *t;
496                 int r;
497                 unsigned cpu;
498
499                 if (!(t = strndup(w, l)))
500                         return log_oom();
501
502                 r = safe_atou(t, &cpu);
503                 free(t);
504
505                 if (!c)
506                         if (!(c = cpu_set_malloc(&ncpus)))
507                                 return log_oom();
508
509                 if (r < 0 || cpu >= ncpus) {
510                         log_syntax(unit, LOG_ERR, filename, line, -r,
511                                    "Failed to parse CPU affinity '%s'", rvalue);
512                         CPU_FREE(c);
513                         return -EBADMSG;
514                 }
515
516                 CPU_SET_S(cpu, CPU_ALLOC_SIZE(ncpus), c);
517         }
518
519         if (c) {
520                 if (sched_setaffinity(0, CPU_ALLOC_SIZE(ncpus), c) < 0)
521                         log_warning_unit(unit, "Failed to set CPU affinity: %m");
522
523                 CPU_FREE(c);
524         }
525
526         return 0;
527 }
528
529 static int config_parse_show_status(
530                 const char* unit,
531                 const char *filename,
532                 unsigned line,
533                 const char *section,
534                 unsigned section_line,
535                 const char *lvalue,
536                 int ltype,
537                 const char *rvalue,
538                 void *data,
539                 void *userdata) {
540
541         int k;
542         ShowStatus *b = data;
543
544         assert(filename);
545         assert(lvalue);
546         assert(rvalue);
547         assert(data);
548
549         k = parse_show_status(rvalue, b);
550         if (k < 0) {
551                 log_syntax(unit, LOG_ERR, filename, line, -k,
552                            "Failed to parse show status setting, ignoring: %s", rvalue);
553                 return 0;
554         }
555
556         return 0;
557 }
558
/* Frees a NULL-terminated array of string vectors: each element is released
 * with strv_free(), then the array itself. A NULL argument is a no-op. */
static void strv_free_free(char ***l) {
        size_t idx = 0;

        if (l) {
                while (l[idx]) {
                        strv_free(l[idx]);
                        idx++;
                }

                free(l);
        }
}
570
571 static void free_join_controllers(void) {
572         strv_free_free(arg_join_controllers);
573         arg_join_controllers = NULL;
574 }
575
576 static int config_parse_join_controllers(const char *unit,
577                                          const char *filename,
578                                          unsigned line,
579                                          const char *section,
580                                          unsigned section_line,
581                                          const char *lvalue,
582                                          int ltype,
583                                          const char *rvalue,
584                                          void *data,
585                                          void *userdata) {
586
587         unsigned n = 0;
588         char *state, *w;
589         size_t length;
590
591         assert(filename);
592         assert(lvalue);
593         assert(rvalue);
594
595         free_join_controllers();
596
597         FOREACH_WORD_QUOTED(w, length, rvalue, state) {
598                 char *s, **l;
599
600                 s = strndup(w, length);
601                 if (!s)
602                         return log_oom();
603
604                 l = strv_split(s, ",");
605                 free(s);
606
607                 strv_uniq(l);
608
609                 if (strv_length(l) <= 1) {
610                         strv_free(l);
611                         continue;
612                 }
613
614                 if (!arg_join_controllers) {
615                         arg_join_controllers = new(char**, 2);
616                         if (!arg_join_controllers) {
617                                 strv_free(l);
618                                 return log_oom();
619                         }
620
621                         arg_join_controllers[0] = l;
622                         arg_join_controllers[1] = NULL;
623
624                         n = 1;
625                 } else {
626                         char ***a;
627                         char ***t;
628
629                         t = new0(char**, n+2);
630                         if (!t) {
631                                 strv_free(l);
632                                 return log_oom();
633                         }
634
635                         n = 0;
636
637                         for (a = arg_join_controllers; *a; a++) {
638
639                                 if (strv_overlap(*a, l)) {
640                                         if (strv_extend_strv(&l, *a) < 0) {
641                                                 strv_free(l);
642                                                 strv_free_free(t);
643                                                 return log_oom();
644                                         }
645
646                                 } else {
647                                         char **c;
648
649                                         c = strv_copy(*a);
650                                         if (!c) {
651                                                 strv_free(l);
652                                                 strv_free_free(t);
653                                                 return log_oom();
654                                         }
655
656                                         t[n++] = c;
657                                 }
658                         }
659
660                         t[n++] = strv_uniq(l);
661
662                         strv_free_free(arg_join_controllers);
663                         arg_join_controllers = t;
664                 }
665         }
666
667         return 0;
668 }
669
670 static int parse_config_file(void) {
671
672         const ConfigTableItem items[] = {
673                 { "Manager", "LogLevel",                  config_parse_level2,           0, NULL                                   },
674                 { "Manager", "LogTarget",                 config_parse_target,           0, NULL                                   },
675                 { "Manager", "LogColor",                  config_parse_color,            0, NULL                                   },
676                 { "Manager", "LogLocation",               config_parse_location,         0, NULL                                   },
677                 { "Manager", "DumpCore",                  config_parse_bool,             0, &arg_dump_core                         },
678                 { "Manager", "CrashShell",                config_parse_bool,             0, &arg_crash_shell                       },
679                 { "Manager", "ShowStatus",                config_parse_show_status,      0, &arg_show_status                       },
680                 { "Manager", "CrashChVT",                 config_parse_int,              0, &arg_crash_chvt                        },
681                 { "Manager", "CPUAffinity",               config_parse_cpu_affinity2,    0, NULL                                   },
682                 { "Manager", "JoinControllers",           config_parse_join_controllers, 0, &arg_join_controllers                  },
683                 { "Manager", "RuntimeWatchdogSec",        config_parse_sec,              0, &arg_runtime_watchdog                  },
684                 { "Manager", "ShutdownWatchdogSec",       config_parse_sec,              0, &arg_shutdown_watchdog                 },
685                 { "Manager", "CapabilityBoundingSet",     config_parse_bounding_set,     0, &arg_capability_bounding_set_drop      },
686 #ifdef HAVE_SECCOMP
687                 { "Manager", "SystemCallArchitectures",   config_parse_syscall_archs,    0, &arg_syscall_archs                     },
688 #endif
689                 { "Manager", "TimerSlackNSec",            config_parse_nsec,             0, &arg_timer_slack_nsec                  },
690                 { "Manager", "DefaultTimerAccuracySec",   config_parse_sec,              0, &arg_default_timer_accuracy_usec       },
691                 { "Manager", "DefaultStandardOutput",     config_parse_output,           0, &arg_default_std_output                },
692                 { "Manager", "DefaultStandardError",      config_parse_output,           0, &arg_default_std_error                 },
693                 { "Manager", "DefaultTimeoutStartSec",    config_parse_sec,              0, &arg_default_timeout_start_usec        },
694                 { "Manager", "DefaultTimeoutStopSec",     config_parse_sec,              0, &arg_default_timeout_stop_usec         },
695                 { "Manager", "DefaultRestartSec",         config_parse_sec,              0, &arg_default_restart_usec              },
696                 { "Manager", "DefaultStartLimitInterval", config_parse_sec,              0, &arg_default_start_limit_interval      },
697                 { "Manager", "DefaultStartLimitBurst",    config_parse_unsigned,         0, &arg_default_start_limit_burst         },
698                 { "Manager", "DefaultEnvironment",        config_parse_environ,          0, &arg_default_environment               },
699                 { "Manager", "DefaultLimitCPU",           config_parse_limit,            0, &arg_default_rlimit[RLIMIT_CPU]        },
700                 { "Manager", "DefaultLimitFSIZE",         config_parse_limit,            0, &arg_default_rlimit[RLIMIT_FSIZE]      },
701                 { "Manager", "DefaultLimitDATA",          config_parse_limit,            0, &arg_default_rlimit[RLIMIT_DATA]       },
702                 { "Manager", "DefaultLimitSTACK",         config_parse_limit,            0, &arg_default_rlimit[RLIMIT_STACK]      },
703                 { "Manager", "DefaultLimitCORE",          config_parse_limit,            0, &arg_default_rlimit[RLIMIT_CORE]       },
704                 { "Manager", "DefaultLimitRSS",           config_parse_limit,            0, &arg_default_rlimit[RLIMIT_RSS]        },
705                 { "Manager", "DefaultLimitNOFILE",        config_parse_limit,            0, &arg_default_rlimit[RLIMIT_NOFILE]     },
706                 { "Manager", "DefaultLimitAS",            config_parse_limit,            0, &arg_default_rlimit[RLIMIT_AS]         },
707                 { "Manager", "DefaultLimitNPROC",         config_parse_limit,            0, &arg_default_rlimit[RLIMIT_NPROC]      },
708                 { "Manager", "DefaultLimitMEMLOCK",       config_parse_limit,            0, &arg_default_rlimit[RLIMIT_MEMLOCK]    },
709                 { "Manager", "DefaultLimitLOCKS",         config_parse_limit,            0, &arg_default_rlimit[RLIMIT_LOCKS]      },
710                 { "Manager", "DefaultLimitSIGPENDING",    config_parse_limit,            0, &arg_default_rlimit[RLIMIT_SIGPENDING] },
711                 { "Manager", "DefaultLimitMSGQUEUE",      config_parse_limit,            0, &arg_default_rlimit[RLIMIT_MSGQUEUE]   },
712                 { "Manager", "DefaultLimitNICE",          config_parse_limit,            0, &arg_default_rlimit[RLIMIT_NICE]       },
713                 { "Manager", "DefaultLimitRTPRIO",        config_parse_limit,            0, &arg_default_rlimit[RLIMIT_RTPRIO]     },
714                 { "Manager", "DefaultLimitRTTIME",        config_parse_limit,            0, &arg_default_rlimit[RLIMIT_RTTIME]     },
715                 { "Manager", "DefaultCPUAccounting",      config_parse_bool,             0, &arg_default_cpu_accounting            },
716                 { "Manager", "DefaultBlockIOAccounting",  config_parse_bool,             0, &arg_default_blockio_accounting        },
717                 { "Manager", "DefaultMemoryAccounting",   config_parse_bool,             0, &arg_default_memory_accounting         },
718                 {}
719         };
720
721         _cleanup_fclose_ FILE *f;
722         const char *fn;
723         int r;
724
725         fn = arg_running_as == SYSTEMD_SYSTEM ? PKGSYSCONFDIR "/system.conf" : PKGSYSCONFDIR "/user.conf";
726         f = fopen(fn, "re");
727         if (!f) {
728                 if (errno == ENOENT)
729                         return 0;
730
731                 log_warning("Failed to open configuration file '%s': %m", fn);
732                 return 0;
733         }
734
735         r = config_parse(NULL, fn, f, "Manager\0", config_item_table_lookup, (void*) items, false, false, NULL);
736         if (r < 0)
737                 log_warning("Failed to parse configuration file: %s", strerror(-r));
738
739         return 0;
740 }
741
742 static int parse_argv(int argc, char *argv[]) {
743
744         enum {
745                 ARG_LOG_LEVEL = 0x100,
746                 ARG_LOG_TARGET,
747                 ARG_LOG_COLOR,
748                 ARG_LOG_LOCATION,
749                 ARG_UNIT,
750                 ARG_SYSTEM,
751                 ARG_USER,
752                 ARG_TEST,
753                 ARG_VERSION,
754                 ARG_DUMP_CONFIGURATION_ITEMS,
755                 ARG_DUMP_CORE,
756                 ARG_CRASH_SHELL,
757                 ARG_CONFIRM_SPAWN,
758                 ARG_SHOW_STATUS,
759                 ARG_DESERIALIZE,
760                 ARG_SWITCHED_ROOT,
761                 ARG_DEFAULT_STD_OUTPUT,
762                 ARG_DEFAULT_STD_ERROR
763         };
764
765         static const struct option options[] = {
766                 { "log-level",                required_argument, NULL, ARG_LOG_LEVEL                },
767                 { "log-target",               required_argument, NULL, ARG_LOG_TARGET               },
768                 { "log-color",                optional_argument, NULL, ARG_LOG_COLOR                },
769                 { "log-location",             optional_argument, NULL, ARG_LOG_LOCATION             },
770                 { "unit",                     required_argument, NULL, ARG_UNIT                     },
771                 { "system",                   no_argument,       NULL, ARG_SYSTEM                   },
772                 { "user",                     no_argument,       NULL, ARG_USER                     },
773                 { "test",                     no_argument,       NULL, ARG_TEST                     },
774                 { "help",                     no_argument,       NULL, 'h'                          },
775                 { "version",                  no_argument,       NULL, ARG_VERSION                  },
776                 { "dump-configuration-items", no_argument,       NULL, ARG_DUMP_CONFIGURATION_ITEMS },
777                 { "dump-core",                optional_argument, NULL, ARG_DUMP_CORE                },
778                 { "crash-shell",              optional_argument, NULL, ARG_CRASH_SHELL              },
779                 { "confirm-spawn",            optional_argument, NULL, ARG_CONFIRM_SPAWN            },
780                 { "show-status",              optional_argument, NULL, ARG_SHOW_STATUS              },
781                 { "deserialize",              required_argument, NULL, ARG_DESERIALIZE              },
782                 { "switched-root",            no_argument,       NULL, ARG_SWITCHED_ROOT            },
783                 { "default-standard-output",  required_argument, NULL, ARG_DEFAULT_STD_OUTPUT,      },
784                 { "default-standard-error",   required_argument, NULL, ARG_DEFAULT_STD_ERROR,       },
785                 {}
786         };
787
788         int c, r;
789
790         assert(argc >= 1);
791         assert(argv);
792
793         if (getpid() == 1)
794                 opterr = 0;
795
796         while ((c = getopt_long(argc, argv, "hDbsz:", options, NULL)) >= 0)
797
798                 switch (c) {
799
800                 case ARG_LOG_LEVEL:
801                         r = log_set_max_level_from_string(optarg);
802                         if (r < 0) {
803                                 log_error("Failed to parse log level %s.", optarg);
804                                 return r;
805                         }
806
807                         break;
808
809                 case ARG_LOG_TARGET:
810                         r = log_set_target_from_string(optarg);
811                         if (r < 0) {
812                                 log_error("Failed to parse log target %s.", optarg);
813                                 return r;
814                         }
815
816                         break;
817
818                 case ARG_LOG_COLOR:
819
820                         if (optarg) {
821                                 r = log_show_color_from_string(optarg);
822                                 if (r < 0) {
823                                         log_error("Failed to parse log color setting %s.", optarg);
824                                         return r;
825                                 }
826                         } else
827                                 log_show_color(true);
828
829                         break;
830
831                 case ARG_LOG_LOCATION:
832                         if (optarg) {
833                                 r = log_show_location_from_string(optarg);
834                                 if (r < 0) {
835                                         log_error("Failed to parse log location setting %s.", optarg);
836                                         return r;
837                                 }
838                         } else
839                                 log_show_location(true);
840
841                         break;
842
843                 case ARG_DEFAULT_STD_OUTPUT:
844                         r = exec_output_from_string(optarg);
845                         if (r < 0) {
846                                 log_error("Failed to parse default standard output setting %s.", optarg);
847                                 return r;
848                         } else
849                                 arg_default_std_output = r;
850                         break;
851
852                 case ARG_DEFAULT_STD_ERROR:
853                         r = exec_output_from_string(optarg);
854                         if (r < 0) {
855                                 log_error("Failed to parse default standard error output setting %s.", optarg);
856                                 return r;
857                         } else
858                                 arg_default_std_error = r;
859                         break;
860
861                 case ARG_UNIT:
862
863                         r = set_default_unit(optarg);
864                         if (r < 0) {
865                                 log_error("Failed to set default unit %s: %s", optarg, strerror(-r));
866                                 return r;
867                         }
868
869                         break;
870
871                 case ARG_SYSTEM:
872                         arg_running_as = SYSTEMD_SYSTEM;
873                         break;
874
875                 case ARG_USER:
876                         arg_running_as = SYSTEMD_USER;
877                         break;
878
879                 case ARG_TEST:
880                         arg_action = ACTION_TEST;
881                         break;
882
883                 case ARG_VERSION:
884                         arg_action = ACTION_VERSION;
885                         break;
886
887                 case ARG_DUMP_CONFIGURATION_ITEMS:
888                         arg_action = ACTION_DUMP_CONFIGURATION_ITEMS;
889                         break;
890
891                 case ARG_DUMP_CORE:
892                         r = optarg ? parse_boolean(optarg) : 1;
893                         if (r < 0) {
894                                 log_error("Failed to parse dump core boolean %s.", optarg);
895                                 return r;
896                         }
897                         arg_dump_core = r;
898                         break;
899
900                 case ARG_CRASH_SHELL:
901                         r = optarg ? parse_boolean(optarg) : 1;
902                         if (r < 0) {
903                                 log_error("Failed to parse crash shell boolean %s.", optarg);
904                                 return r;
905                         }
906                         arg_crash_shell = r;
907                         break;
908
909                 case ARG_CONFIRM_SPAWN:
910                         r = optarg ? parse_boolean(optarg) : 1;
911                         if (r < 0) {
912                                 log_error("Failed to parse confirm spawn boolean %s.", optarg);
913                                 return r;
914                         }
915                         arg_confirm_spawn = r;
916                         break;
917
918                 case ARG_SHOW_STATUS:
919                         if (optarg) {
920                                 r = parse_show_status(optarg, &arg_show_status);
921                                 if (r < 0) {
922                                         log_error("Failed to parse show status boolean %s.", optarg);
923                                         return r;
924                                 }
925                         } else
926                                 arg_show_status = SHOW_STATUS_YES;
927                         break;
928
929                 case ARG_DESERIALIZE: {
930                         int fd;
931                         FILE *f;
932
933                         r = safe_atoi(optarg, &fd);
934                         if (r < 0 || fd < 0) {
935                                 log_error("Failed to parse deserialize option %s.", optarg);
936                                 return r < 0 ? r : -EINVAL;
937                         }
938
939                         fd_cloexec(fd, true);
940
941                         f = fdopen(fd, "r");
942                         if (!f) {
943                                 log_error("Failed to open serialization fd: %m");
944                                 return -errno;
945                         }
946
947                         if (arg_serialization)
948                                 fclose(arg_serialization);
949
950                         arg_serialization = f;
951
952                         break;
953                 }
954
955                 case ARG_SWITCHED_ROOT:
956                         arg_switched_root = true;
957                         break;
958
959                 case 'h':
960                         arg_action = ACTION_HELP;
961                         break;
962
963                 case 'D':
964                         log_set_max_level(LOG_DEBUG);
965                         break;
966
967                 case 'b':
968                 case 's':
969                 case 'z':
970                         /* Just to eat away the sysvinit kernel
971                          * cmdline args without getopt() error
972                          * messages that we'll parse in
973                          * parse_proc_cmdline_word() or ignore. */
974
975                 case '?':
976                 default:
977                         if (getpid() != 1) {
978                                 log_error("Unknown option code %c", c);
979                                 return -EINVAL;
980                         }
981
982                         break;
983                 }
984
985         if (optind < argc && getpid() != 1) {
986                 /* Hmm, when we aren't run as init system
987                  * let's complain about excess arguments */
988
989                 log_error("Excess arguments.");
990                 return -EINVAL;
991         }
992
993         if (detect_container(NULL) > 0) {
994                 char **a;
995
996                 /* All /proc/cmdline arguments the kernel didn't
997                  * understand it passed to us. We're not really
998                  * interested in that usually since /proc/cmdline is
999                  * more interesting and complete. With one exception:
1000                  * if we are run in a container /proc/cmdline is not
1001                  * relevant for the container, hence we rely on argv[]
1002                  * instead. */
1003
1004                 for (a = argv; a < argv + argc; a++) {
1005                         _cleanup_free_ char *w;
1006                         char *value;
1007
1008                         w = strdup(*a);
1009                         if (!w)
1010                                 return log_oom();
1011
1012                         value = strchr(w, '=');
1013                         if (value)
1014                                 *(value++) = 0;
1015
1016                         r = parse_proc_cmdline_item(w, value);
1017                         if (r < 0) {
1018                                 log_error("Failed on cmdline argument %s: %s", *a, strerror(-r));
1019                                 return r;
1020                         }
1021                 }
1022         }
1023
1024         return 0;
1025 }
1026
1027 static int help(void) {
1028
1029         printf("%s [OPTIONS...]\n\n"
1030                "Starts up and maintains the system or user services.\n\n"
1031                "  -h --help                      Show this help\n"
1032                "     --test                      Determine startup sequence, dump it and exit\n"
1033                "     --dump-configuration-items  Dump understood unit configuration items\n"
1034                "     --unit=UNIT                 Set default unit\n"
1035                "     --system                    Run a system instance, even if PID != 1\n"
1036                "     --user                      Run a user instance\n"
1037                "     --dump-core[=0|1]           Dump core on crash\n"
1038                "     --crash-shell[=0|1]         Run shell on crash\n"
1039                "     --confirm-spawn[=0|1]       Ask for confirmation when spawning processes\n"
1040                "     --show-status[=0|1]         Show status updates on the console during bootup\n"
1041                "     --log-target=TARGET         Set log target (console, journal, syslog, kmsg, journal-or-kmsg, syslog-or-kmsg, null)\n"
1042                "     --log-level=LEVEL           Set log level (debug, info, notice, warning, err, crit, alert, emerg)\n"
1043                "     --log-color[=0|1]           Highlight important log messages\n"
1044                "     --log-location[=0|1]        Include code location in log messages\n"
1045                "     --default-standard-output=  Set default standard output for services\n"
1046                "     --default-standard-error=   Set default standard error output for services\n",
1047                program_invocation_short_name);
1048
1049         return 0;
1050 }
1051
1052 static int version(void) {
1053         puts(PACKAGE_STRING);
1054         puts(SYSTEMD_FEATURES);
1055
1056         return 0;
1057 }
1058
1059 static int prepare_reexecute(Manager *m, FILE **_f, FDSet **_fds, bool switching_root) {
1060         FILE *f = NULL;
1061         FDSet *fds = NULL;
1062         int r;
1063
1064         assert(m);
1065         assert(_f);
1066         assert(_fds);
1067
1068         r = manager_open_serialization(m, &f);
1069         if (r < 0) {
1070                 log_error("Failed to create serialization file: %s", strerror(-r));
1071                 goto fail;
1072         }
1073
1074         /* Make sure nothing is really destructed when we shut down */
1075         m->n_reloading ++;
1076         bus_manager_send_reloading(m, true);
1077
1078         fds = fdset_new();
1079         if (!fds) {
1080                 r = -ENOMEM;
1081                 log_error("Failed to allocate fd set: %s", strerror(-r));
1082                 goto fail;
1083         }
1084
1085         r = manager_serialize(m, f, fds, switching_root);
1086         if (r < 0) {
1087                 log_error("Failed to serialize state: %s", strerror(-r));
1088                 goto fail;
1089         }
1090
1091         if (fseeko(f, 0, SEEK_SET) < 0) {
1092                 log_error("Failed to rewind serialization fd: %m");
1093                 goto fail;
1094         }
1095
1096         r = fd_cloexec(fileno(f), false);
1097         if (r < 0) {
1098                 log_error("Failed to disable O_CLOEXEC for serialization: %s", strerror(-r));
1099                 goto fail;
1100         }
1101
1102         r = fdset_cloexec(fds, false);
1103         if (r < 0) {
1104                 log_error("Failed to disable O_CLOEXEC for serialization fds: %s", strerror(-r));
1105                 goto fail;
1106         }
1107
1108         *_f = f;
1109         *_fds = fds;
1110
1111         return 0;
1112
1113 fail:
1114         fdset_free(fds);
1115
1116         if (f)
1117                 fclose(f);
1118
1119         return r;
1120 }
1121
1122 static int bump_rlimit_nofile(struct rlimit *saved_rlimit) {
1123         struct rlimit nl;
1124         int r;
1125
1126         assert(saved_rlimit);
1127
1128         /* Save the original RLIMIT_NOFILE so that we can reset it
1129          * later when transitioning from the initrd to the main
1130          * systemd or suchlike. */
1131         if (getrlimit(RLIMIT_NOFILE, saved_rlimit) < 0) {
1132                 log_error("Reading RLIMIT_NOFILE failed: %m");
1133                 return -errno;
1134         }
1135
1136         /* Make sure forked processes get the default kernel setting */
1137         if (!arg_default_rlimit[RLIMIT_NOFILE]) {
1138                 struct rlimit *rl;
1139
1140                 rl = newdup(struct rlimit, saved_rlimit, 1);
1141                 if (!rl)
1142                         return log_oom();
1143
1144                 arg_default_rlimit[RLIMIT_NOFILE] = rl;
1145         }
1146
1147         /* Bump up the resource limit for ourselves substantially */
1148         nl.rlim_cur = nl.rlim_max = 64*1024;
1149         r = setrlimit_closest(RLIMIT_NOFILE, &nl);
1150         if (r < 0) {
1151                 log_error("Setting RLIMIT_NOFILE failed: %s", strerror(-r));
1152                 return r;
1153         }
1154
1155         return 0;
1156 }
1157
1158 static void test_mtab(void) {
1159
1160         static const char ok[] =
1161                 "/proc/self/mounts\0"
1162                 "/proc/mounts\0"
1163                 "../proc/self/mounts\0"
1164                 "../proc/mounts\0";
1165
1166         _cleanup_free_ char *p = NULL;
1167         int r;
1168
1169         /* Check that /etc/mtab is a symlink to the right place or
1170          * non-existing. But certainly not a file, or a symlink to
1171          * some weird place... */
1172
1173         r = readlink_malloc("/etc/mtab", &p);
1174         if (r == -ENOENT)
1175                 return;
1176         if (r >= 0 && nulstr_contains(ok, p))
1177                 return;
1178
1179         log_warning("/etc/mtab is not a symlink or not pointing to /proc/self/mounts. "
1180                     "This is not supported anymore. "
1181                     "Please make sure to replace this file by a symlink to avoid incorrect or misleading mount(8) output.");
1182 }
1183
/* Logs a warning if /usr turns out to be an empty directory, which is
 * taken as a sign that /usr lives on a separate file system that has
 * not been mounted yet. */
static void test_usr(void) {

        /* Check that /usr is not a separate fs */

        /* Anything but "is empty" (including errors) is fine for us */
        if (dir_is_empty("/usr") <= 0)
                return;

        log_warning("/usr appears to be on its own filesystem and is not already mounted. This is not a supported setup. "
                    "Some things will probably break (sometimes even silently) in mysterious ways. "
                    "Consult http://freedesktop.org/wiki/Software/systemd/separate-usr-is-broken for more information.");
}
1195
1196 static int initialize_join_controllers(void) {
1197         /* By default, mount "cpu" + "cpuacct" together, and "net_cls"
1198          * + "net_prio". We'd like to add "cpuset" to the mix, but
1199          * "cpuset" does't really work for groups with no initialized
1200          * attributes. */
1201
1202         arg_join_controllers = new(char**, 3);
1203         if (!arg_join_controllers)
1204                 return -ENOMEM;
1205
1206         arg_join_controllers[0] = strv_new("cpu", "cpuacct", NULL);
1207         arg_join_controllers[1] = strv_new("net_cls", "net_prio", NULL);
1208         arg_join_controllers[2] = NULL;
1209
1210         if (!arg_join_controllers[0] || !arg_join_controllers[1]) {
1211                 free_join_controllers();
1212                 return -ENOMEM;
1213         }
1214
1215         return 0;
1216 }
1217
1218 static int enforce_syscall_archs(Set *archs) {
1219 #ifdef HAVE_SECCOMP
1220         scmp_filter_ctx *seccomp;
1221         Iterator i;
1222         void *id;
1223         int r;
1224
1225         seccomp = seccomp_init(SCMP_ACT_ALLOW);
1226         if (!seccomp)
1227                 return log_oom();
1228
1229         SET_FOREACH(id, arg_syscall_archs, i) {
1230                 r = seccomp_arch_add(seccomp, PTR_TO_UINT32(id) - 1);
1231                 if (r == -EEXIST)
1232                         continue;
1233                 if (r < 0) {
1234                         log_error("Failed to add architecture to seccomp: %s", strerror(-r));
1235                         goto finish;
1236                 }
1237         }
1238
1239         r = seccomp_attr_set(seccomp, SCMP_FLTATR_CTL_NNP, 0);
1240         if (r < 0) {
1241                 log_error("Failed to unset NO_NEW_PRIVS: %s", strerror(-r));
1242                 goto finish;
1243         }
1244
1245         r = seccomp_load(seccomp);
1246         if (r < 0)
1247                 log_error("Failed to add install architecture seccomp: %s", strerror(-r));
1248
1249 finish:
1250         seccomp_release(seccomp);
1251         return r;
1252 #else
1253         return 0;
1254 #endif
1255 }
1256
1257 static int status_welcome(void) {
1258         _cleanup_free_ char *pretty_name = NULL, *ansi_color = NULL;
1259         int r;
1260
1261         r = parse_env_file("/etc/os-release", NEWLINE,
1262                            "PRETTY_NAME", &pretty_name,
1263                            "ANSI_COLOR", &ansi_color,
1264                            NULL);
1265         if (r == -ENOENT) {
1266                 r = parse_env_file("/usr/lib/os-release", NEWLINE,
1267                                    "PRETTY_NAME", &pretty_name,
1268                                    "ANSI_COLOR", &ansi_color,
1269                                    NULL);
1270         }
1271
1272         if (r < 0 && r != -ENOENT)
1273                 log_warning("Failed to read os-release file: %s", strerror(-r));
1274
1275         return status_printf(NULL, false, false,
1276                              "\nWelcome to \x1B[%sm%s\x1B[0m!\n",
1277                              isempty(ansi_color) ? "1" : ansi_color,
1278                              isempty(pretty_name) ? "Linux" : pretty_name);
1279 }
1280
/* Writes the value of the $container environment variable to
 * /run/systemd/container. Returns 0 without writing anything if the
 * variable is unset or empty, otherwise the result of
 * write_string_file(). */
static int write_container_id(void) {
        const char *id = getenv("container");

        return isempty(id) ? 0 : write_string_file("/run/systemd/container", id);
}
1290
1291 int main(int argc, char *argv[]) {
1292         Manager *m = NULL;
1293         int r, retval = EXIT_FAILURE;
1294         usec_t before_startup, after_startup;
1295         char timespan[FORMAT_TIMESPAN_MAX];
1296         FDSet *fds = NULL;
1297         bool reexecute = false;
1298         const char *shutdown_verb = NULL;
1299         dual_timestamp initrd_timestamp = { 0ULL, 0ULL };
1300         dual_timestamp userspace_timestamp = { 0ULL, 0ULL };
1301         dual_timestamp kernel_timestamp = { 0ULL, 0ULL };
1302         dual_timestamp security_start_timestamp = { 0ULL, 0ULL };
1303         dual_timestamp security_finish_timestamp = { 0ULL, 0ULL };
1304         static char systemd[] = "systemd";
1305         bool skip_setup = false;
1306         unsigned j;
1307         bool loaded_policy = false;
1308         bool arm_reboot_watchdog = false;
1309         bool queue_default_job = false;
1310         bool empty_etc = false;
1311         char *switch_root_dir = NULL, *switch_root_init = NULL;
1312         static struct rlimit saved_rlimit_nofile = { 0, 0 };
1313
1314 #ifdef HAVE_SYSV_COMPAT
1315         if (getpid() != 1 && strstr(program_invocation_short_name, "init")) {
1316                 /* This is compatibility support for SysV, where
1317                  * calling init as a user is identical to telinit. */
1318
1319                 errno = -ENOENT;
1320                 execv(SYSTEMCTL_BINARY_PATH, argv);
1321                 log_error("Failed to exec " SYSTEMCTL_BINARY_PATH ": %m");
1322                 return 1;
1323         }
1324 #endif
1325
1326         dual_timestamp_from_monotonic(&kernel_timestamp, 0);
1327         dual_timestamp_get(&userspace_timestamp);
1328
1329         /* Determine if this is a reexecution or normal bootup. We do
1330          * the full command line parsing much later, so let's just
1331          * have a quick peek here. */
1332         if (strv_find(argv+1, "--deserialize"))
1333                 skip_setup = true;
1334
1335         /* If we have switched root, do all the special setup
1336          * things */
1337         if (strv_find(argv+1, "--switched-root"))
1338                 skip_setup = false;
1339
1340         /* If we get started via the /sbin/init symlink then we are
1341            called 'init'. After a subsequent reexecution we are then
1342            called 'systemd'. That is confusing, hence let's call us
1343            systemd right-away. */
1344         program_invocation_short_name = systemd;
1345         prctl(PR_SET_NAME, systemd);
1346
1347         saved_argv = argv;
1348         saved_argc = argc;
1349
1350         log_show_color(isatty(STDERR_FILENO) > 0);
1351
1352         /* Disable the umask logic */
1353         if (getpid() == 1)
1354                 umask(0);
1355
1356         if (getpid() == 1 && detect_container(NULL) <= 0) {
1357
1358                 /* Running outside of a container as PID 1 */
1359                 arg_running_as = SYSTEMD_SYSTEM;
1360                 make_null_stdio();
1361                 log_set_target(LOG_TARGET_KMSG);
1362                 log_open();
1363
1364                 if (in_initrd())
1365                         initrd_timestamp = userspace_timestamp;
1366
1367                 if (!skip_setup) {
1368                         mount_setup_early();
1369                         dual_timestamp_get(&security_start_timestamp);
1370                         if (selinux_setup(&loaded_policy) < 0)
1371                                 goto finish;
1372                         if (ima_setup() < 0)
1373                                 goto finish;
1374                         if (smack_setup(&loaded_policy) < 0)
1375                                 goto finish;
1376                         dual_timestamp_get(&security_finish_timestamp);
1377                 }
1378
1379                 if (label_init(NULL) < 0)
1380                         goto finish;
1381
1382                 if (!skip_setup) {
1383                         if (clock_is_localtime() > 0) {
1384                                 int min;
1385
1386                                 /* The first-time call to settimeofday() does a time warp in the kernel */
1387                                 r = clock_set_timezone(&min);
1388                                 if (r < 0)
1389                                         log_error("Failed to apply local time delta, ignoring: %s", strerror(-r));
1390                                 else
1391                                         log_info("RTC configured in localtime, applying delta of %i minutes to system time.", min);
1392                         } else if (!in_initrd()) {
1393                                 /*
1394                                  * Do dummy first-time call to seal the kernel's time warp magic
1395                                  *
1396                                  * Do not call this this from inside the initrd. The initrd might not
1397                                  * carry /etc/adjtime with LOCAL, but the real system could be set up
1398                                  * that way. In such case, we need to delay the time-warp or the sealing
1399                                  * until we reach the real system.
1400                                  */
1401                                 clock_reset_timezone();
1402
1403                                 /* Tell the kernel our timezone */
1404                                 r = clock_set_timezone(NULL);
1405                                 if (r < 0)
1406                                         log_error("Failed to set the kernel's timezone, ignoring: %s", strerror(-r));
1407                         }
1408                 }
1409
1410                 /* Set the default for later on, but don't actually
1411                  * open the logs like this for now. Note that if we
1412                  * are transitioning from the initrd there might still
1413                  * be journal fd open, and we shouldn't attempt
1414                  * opening that before we parsed /proc/cmdline which
1415                  * might redirect output elsewhere. */
1416                 log_set_target(LOG_TARGET_JOURNAL_OR_KMSG);
1417
1418         } else if (getpid() == 1) {
1419                 /* Running inside a container, as PID 1 */
1420                 arg_running_as = SYSTEMD_SYSTEM;
1421                 log_set_target(LOG_TARGET_CONSOLE);
1422                 log_close_console(); /* force reopen of /dev/console */
1423                 log_open();
1424
1425                 /* For the later on, see above... */
1426                 log_set_target(LOG_TARGET_JOURNAL);
1427
1428                 /* clear the kernel timestamp,
1429                  * because we are in a container */
1430                 kernel_timestamp.monotonic = 0ULL;
1431                 kernel_timestamp.realtime = 0ULL;
1432
1433         } else {
1434                 /* Running as user instance */
1435                 arg_running_as = SYSTEMD_USER;
1436                 log_set_target(LOG_TARGET_AUTO);
1437                 log_open();
1438
1439                 /* clear the kernel timestamp,
1440                  * because we are not PID 1 */
1441                 kernel_timestamp.monotonic = 0ULL;
1442                 kernel_timestamp.realtime = 0ULL;
1443         }
1444
1445         /* Initialize default unit */
1446         r = set_default_unit(SPECIAL_DEFAULT_TARGET);
1447         if (r < 0) {
1448                 log_error("Failed to set default unit %s: %s", SPECIAL_DEFAULT_TARGET, strerror(-r));
1449                 goto finish;
1450         }
1451
1452         r = initialize_join_controllers();
1453         if (r < 0)
1454                 goto finish;
1455
1456         /* Mount /proc, /sys and friends, so that /proc/cmdline and
1457          * /proc/$PID/fd is available. */
1458         if (getpid() == 1) {
1459                 r = mount_setup(loaded_policy);
1460                 if (r < 0)
1461                         goto finish;
1462         }
1463
1464         /* Reset all signal handlers. */
1465         assert_se(reset_all_signal_handlers() == 0);
1466
1467         ignore_signals(SIGNALS_IGNORE, -1);
1468
1469         if (parse_config_file() < 0)
1470                 goto finish;
1471
1472         if (arg_running_as == SYSTEMD_SYSTEM)
1473                 if (parse_proc_cmdline(parse_proc_cmdline_item) < 0)
1474                         goto finish;
1475
1476         log_parse_environment();
1477
1478         if (parse_argv(argc, argv) < 0)
1479                 goto finish;
1480
1481         if (arg_action == ACTION_TEST &&
1482             geteuid() == 0) {
1483                 log_error("Don't run test mode as root.");
1484                 goto finish;
1485         }
1486
1487         if (arg_running_as == SYSTEMD_USER &&
1488             arg_action == ACTION_RUN &&
1489             sd_booted() <= 0) {
1490                 log_error("Trying to run as user instance, but the system has not been booted with systemd.");
1491                 goto finish;
1492         }
1493
1494         if (arg_running_as == SYSTEMD_SYSTEM &&
1495             arg_action == ACTION_RUN &&
1496             running_in_chroot() > 0) {
1497                 log_error("Cannot be run in a chroot() environment.");
1498                 goto finish;
1499         }
1500
1501         if (arg_action == ACTION_HELP) {
1502                 retval = help();
1503                 goto finish;
1504         } else if (arg_action == ACTION_VERSION) {
1505                 retval = version();
1506                 goto finish;
1507         } else if (arg_action == ACTION_DUMP_CONFIGURATION_ITEMS) {
1508                 unit_dump_config_items(stdout);
1509                 retval = EXIT_SUCCESS;
1510                 goto finish;
1511         } else if (arg_action == ACTION_DONE) {
1512                 retval = EXIT_SUCCESS;
1513                 goto finish;
1514         }
1515
1516         if (arg_running_as == SYSTEMD_USER &&
1517             !getenv("XDG_RUNTIME_DIR")) {
1518                 log_error("Trying to run as user instance, but $XDG_RUNTIME_DIR is not set.");
1519                 goto finish;
1520         }
1521
1522         assert_se(arg_action == ACTION_RUN || arg_action == ACTION_TEST);
1523
1524         /* Close logging fds, in order not to confuse fdset below */
1525         log_close();
1526
1527         /* Remember open file descriptors for later deserialization */
1528         r = fdset_new_fill(&fds);
1529         if (r < 0) {
1530                 log_error("Failed to allocate fd set: %s", strerror(-r));
1531                 goto finish;
1532         } else
1533                 fdset_cloexec(fds, true);
1534
1535         if (arg_serialization)
1536                 assert_se(fdset_remove(fds, fileno(arg_serialization)) >= 0);
1537
1538         if (arg_running_as == SYSTEMD_SYSTEM)
1539                 /* Become a session leader if we aren't one yet. */
1540                 setsid();
1541
1542         /* Move out of the way, so that we won't block unmounts */
1543         assert_se(chdir("/")  == 0);
1544
1545         /* Reset the console, but only if this is really init and we
1546          * are freshly booted */
1547         if (arg_running_as == SYSTEMD_SYSTEM && arg_action == ACTION_RUN)
1548                 console_setup(getpid() == 1 && !skip_setup);
1549
1550         /* Open the logging devices, if possible and necessary */
1551         log_open();
1552
1553         if (arg_show_status == _SHOW_STATUS_UNSET)
1554                 arg_show_status = SHOW_STATUS_YES;
1555
1556         /* Make sure we leave a core dump without panicking the
1557          * kernel. */
1558         if (getpid() == 1) {
1559                 install_crash_handler();
1560
1561                 r = mount_cgroup_controllers(arg_join_controllers);
1562                 if (r < 0)
1563                         goto finish;
1564         }
1565
1566         if (arg_running_as == SYSTEMD_SYSTEM) {
1567                 const char *virtualization = NULL;
1568
1569                 log_info(PACKAGE_STRING " running in system mode. (" SYSTEMD_FEATURES ")");
1570
1571                 detect_virtualization(&virtualization);
1572                 if (virtualization)
1573                         log_info("Detected virtualization '%s'.", virtualization);
1574
1575                 write_container_id();
1576
1577                 log_info("Detected architecture '%s'.", architecture_to_string(uname_architecture()));
1578
1579                 if (in_initrd())
1580                         log_info("Running in initial RAM disk.");
1581
1582                 empty_etc = dir_is_empty("/etc") > 0;
1583                 if (empty_etc)
1584                         log_info("Running with unpopulated /etc.");
1585         } else {
1586                 _cleanup_free_ char *t = uid_to_name(getuid());
1587                 log_debug(PACKAGE_STRING " running in user mode for user "PID_FMT"/%s. (" SYSTEMD_FEATURES ")",
1588                           getuid(), t);
1589         }
1590
1591         if (arg_running_as == SYSTEMD_SYSTEM && !skip_setup) {
1592                 if (arg_show_status > 0 || plymouth_running())
1593                         status_welcome();
1594
1595 #ifdef HAVE_KMOD
1596                 kmod_setup();
1597 #endif
1598                 hostname_setup();
1599                 machine_id_setup(NULL);
1600                 loopback_setup();
1601
1602                 test_mtab();
1603                 test_usr();
1604         }
1605
1606         if (arg_running_as == SYSTEMD_SYSTEM && arg_runtime_watchdog > 0)
1607                 watchdog_set_timeout(&arg_runtime_watchdog);
1608
1609         if (arg_timer_slack_nsec != (nsec_t) -1)
1610                 if (prctl(PR_SET_TIMERSLACK, arg_timer_slack_nsec) < 0)
1611                         log_error("Failed to adjust timer slack: %m");
1612
1613         if (arg_capability_bounding_set_drop) {
1614                 r = capability_bounding_set_drop_usermode(arg_capability_bounding_set_drop);
1615                 if (r < 0) {
1616                         log_error("Failed to drop capability bounding set of usermode helpers: %s", strerror(-r));
1617                         goto finish;
1618                 }
1619                 r = capability_bounding_set_drop(arg_capability_bounding_set_drop, true);
1620                 if (r < 0) {
1621                         log_error("Failed to drop capability bounding set: %s", strerror(-r));
1622                         goto finish;
1623                 }
1624         }
1625
1626         if (arg_syscall_archs) {
1627                 r = enforce_syscall_archs(arg_syscall_archs);
1628                 if (r < 0)
1629                         goto finish;
1630         }
1631
1632         if (arg_running_as == SYSTEMD_USER) {
1633                 /* Become reaper of our children */
1634                 if (prctl(PR_SET_CHILD_SUBREAPER, 1) < 0) {
1635                         log_warning("Failed to make us a subreaper: %m");
1636                         if (errno == EINVAL)
1637                                 log_info("Perhaps the kernel version is too old (< 3.4?)");
1638                 }
1639         }
1640
1641         if (arg_running_as == SYSTEMD_SYSTEM) {
1642                 bump_rlimit_nofile(&saved_rlimit_nofile);
1643
1644                 if (empty_etc) {
1645                         r = unit_file_preset_all(UNIT_FILE_SYSTEM, false, NULL, UNIT_FILE_PRESET_FULL, false, NULL, 0);
1646                         if (r < 0)
1647                                 log_warning("Failed to populate /etc with preset unit settings, ignoring: %s", strerror(-r));
1648                         else
1649                                 log_info("Populated /etc with preset unit settings.");
1650                 }
1651         }
1652
1653         r = manager_new(arg_running_as, &m);
1654         if (r < 0) {
1655                 log_error("Failed to allocate manager object: %s", strerror(-r));
1656                 goto finish;
1657         }
1658
1659         m->confirm_spawn = arg_confirm_spawn;
1660         m->default_timer_accuracy_usec = arg_default_timer_accuracy_usec;
1661         m->default_std_output = arg_default_std_output;
1662         m->default_std_error = arg_default_std_error;
1663         m->default_restart_usec = arg_default_restart_usec;
1664         m->default_timeout_start_usec = arg_default_timeout_start_usec;
1665         m->default_timeout_stop_usec = arg_default_timeout_stop_usec;
1666         m->default_start_limit_interval = arg_default_start_limit_interval;
1667         m->default_start_limit_burst = arg_default_start_limit_burst;
1668         m->default_cpu_accounting = arg_default_cpu_accounting;
1669         m->default_blockio_accounting = arg_default_blockio_accounting;
1670         m->default_memory_accounting = arg_default_memory_accounting;
1671         m->runtime_watchdog = arg_runtime_watchdog;
1672         m->shutdown_watchdog = arg_shutdown_watchdog;
1673         m->userspace_timestamp = userspace_timestamp;
1674         m->kernel_timestamp = kernel_timestamp;
1675         m->initrd_timestamp = initrd_timestamp;
1676         m->security_start_timestamp = security_start_timestamp;
1677         m->security_finish_timestamp = security_finish_timestamp;
1678
1679         manager_set_default_rlimits(m, arg_default_rlimit);
1680         manager_environment_add(m, NULL, arg_default_environment);
1681         manager_set_show_status(m, arg_show_status);
1682
1683         /* Remember whether we should queue the default job */
1684         queue_default_job = !arg_serialization || arg_switched_root;
1685
1686         before_startup = now(CLOCK_MONOTONIC);
1687
1688         r = manager_startup(m, arg_serialization, fds);
1689         if (r < 0)
1690                 log_error("Failed to fully start up daemon: %s", strerror(-r));
1691
1692         /* This will close all file descriptors that were opened, but
1693          * not claimed by any unit. */
1694         fdset_free(fds);
1695         fds = NULL;
1696
1697         if (arg_serialization) {
1698                 fclose(arg_serialization);
1699                 arg_serialization = NULL;
1700         }
1701
1702         if (queue_default_job) {
1703                 _cleanup_bus_error_free_ sd_bus_error error = SD_BUS_ERROR_NULL;
1704                 Unit *target = NULL;
1705                 Job *default_unit_job;
1706
1707                 log_debug("Activating default unit: %s", arg_default_unit);
1708
1709                 r = manager_load_unit(m, arg_default_unit, NULL, &error, &target);
1710                 if (r < 0)
1711                         log_error("Failed to load default target: %s", bus_error_message(&error, r));
1712                 else if (target->load_state == UNIT_ERROR || target->load_state == UNIT_NOT_FOUND)
1713                         log_error("Failed to load default target: %s", strerror(-target->load_error));
1714                 else if (target->load_state == UNIT_MASKED)
1715                         log_error("Default target masked.");
1716
1717                 if (!target || target->load_state != UNIT_LOADED) {
1718                         log_info("Trying to load rescue target...");
1719
1720                         r = manager_load_unit(m, SPECIAL_RESCUE_TARGET, NULL, &error, &target);
1721                         if (r < 0) {
1722                                 log_error("Failed to load rescue target: %s", bus_error_message(&error, r));
1723                                 goto finish;
1724                         } else if (target->load_state == UNIT_ERROR || target->load_state == UNIT_NOT_FOUND) {
1725                                 log_error("Failed to load rescue target: %s", strerror(-target->load_error));
1726                                 goto finish;
1727                         } else if (target->load_state == UNIT_MASKED) {
1728                                 log_error("Rescue target masked.");
1729                                 goto finish;
1730                         }
1731                 }
1732
1733                 assert(target->load_state == UNIT_LOADED);
1734
1735                 if (arg_action == ACTION_TEST) {
1736                         printf("-> By units:\n");
1737                         manager_dump_units(m, stdout, "\t");
1738                 }
1739
1740                 r = manager_add_job(m, JOB_START, target, JOB_ISOLATE, false, &error, &default_unit_job);
1741                 if (r == -EPERM) {
1742                         log_debug("Default target could not be isolated, starting instead: %s", bus_error_message(&error, r));
1743
1744                         r = manager_add_job(m, JOB_START, target, JOB_REPLACE, false, &error, &default_unit_job);
1745                         if (r < 0) {
1746                                 log_error("Failed to start default target: %s", bus_error_message(&error, r));
1747                                 goto finish;
1748                         }
1749                 } else if (r < 0) {
1750                         log_error("Failed to isolate default target: %s", bus_error_message(&error, r));
1751                         goto finish;
1752                 }
1753
1754                 m->default_unit_job_id = default_unit_job->id;
1755
1756                 after_startup = now(CLOCK_MONOTONIC);
1757                 log_full(arg_action == ACTION_TEST ? LOG_INFO : LOG_DEBUG,
1758                          "Loaded units and determined initial transaction in %s.",
1759                          format_timespan(timespan, sizeof(timespan), after_startup - before_startup, 0));
1760
1761                 if (arg_action == ACTION_TEST) {
1762                         printf("-> By jobs:\n");
1763                         manager_dump_jobs(m, stdout, "\t");
1764                         retval = EXIT_SUCCESS;
1765                         goto finish;
1766                 }
1767         }
1768
1769         for (;;) {
1770                 r = manager_loop(m);
1771                 if (r < 0) {
1772                         log_error("Failed to run mainloop: %s", strerror(-r));
1773                         goto finish;
1774                 }
1775
1776                 switch (m->exit_code) {
1777
1778                 case MANAGER_EXIT:
1779                         retval = EXIT_SUCCESS;
1780                         log_debug("Exit.");
1781                         goto finish;
1782
1783                 case MANAGER_RELOAD:
1784                         log_info("Reloading.");
1785                         r = manager_reload(m);
1786                         if (r < 0)
1787                                 log_error("Failed to reload: %s", strerror(-r));
1788                         break;
1789
1790                 case MANAGER_REEXECUTE:
1791
1792                         if (prepare_reexecute(m, &arg_serialization, &fds, false) < 0)
1793                                 goto finish;
1794
1795                         reexecute = true;
1796                         log_notice("Reexecuting.");
1797                         goto finish;
1798
1799                 case MANAGER_SWITCH_ROOT:
1800                         /* Steal the switch root parameters */
1801                         switch_root_dir = m->switch_root;
1802                         switch_root_init = m->switch_root_init;
1803                         m->switch_root = m->switch_root_init = NULL;
1804
1805                         if (!switch_root_init)
1806                                 if (prepare_reexecute(m, &arg_serialization, &fds, true) < 0)
1807                                         goto finish;
1808
1809                         reexecute = true;
1810                         log_notice("Switching root.");
1811                         goto finish;
1812
1813                 case MANAGER_REBOOT:
1814                 case MANAGER_POWEROFF:
1815                 case MANAGER_HALT:
1816                 case MANAGER_KEXEC: {
1817                         static const char * const table[_MANAGER_EXIT_CODE_MAX] = {
1818                                 [MANAGER_REBOOT] = "reboot",
1819                                 [MANAGER_POWEROFF] = "poweroff",
1820                                 [MANAGER_HALT] = "halt",
1821                                 [MANAGER_KEXEC] = "kexec"
1822                         };
1823
1824                         assert_se(shutdown_verb = table[m->exit_code]);
1825                         arm_reboot_watchdog = m->exit_code == MANAGER_REBOOT;
1826
1827                         log_notice("Shutting down.");
1828                         goto finish;
1829                 }
1830
1831                 default:
1832                         assert_not_reached("Unknown exit code.");
1833                 }
1834         }
1835
1836 finish:
1837         if (m) {
1838                 manager_free(m);
1839                 m = NULL;
1840         }
1841
1842         for (j = 0; j < ELEMENTSOF(arg_default_rlimit); j++) {
1843                 free(arg_default_rlimit[j]);
1844                 arg_default_rlimit[j] = NULL;
1845         }
1846
1847         free(arg_default_unit);
1848         arg_default_unit = NULL;
1849
1850         free_join_controllers();
1851
1852         strv_free(arg_default_environment);
1853         arg_default_environment = NULL;
1854
1855         set_free(arg_syscall_archs);
1856         arg_syscall_archs = NULL;
1857
1858         label_finish();
1859
1860         if (reexecute) {
1861                 const char **args;
1862                 unsigned i, args_size;
1863                 sigset_t ss, o_ss;
1864
1865                 /* Close and disarm the watchdog, so that the new
1866                  * instance can reinitialize it, but doesn't get
1867                  * rebooted while we do that */
1868                 watchdog_close(true);
1869
1870                 /* Reset the RLIMIT_NOFILE to the kernel default, so
1871                  * that the new systemd can pass the kernel default to
1872                  * its child processes */
1873                 if (saved_rlimit_nofile.rlim_cur > 0)
1874                         setrlimit(RLIMIT_NOFILE, &saved_rlimit_nofile);
1875
1876                 if (switch_root_dir) {
1877                         /* Kill all remaining processes from the
1878                          * initrd, but don't wait for them, so that we
1879                          * can handle the SIGCHLD for them after
1880                          * deserializing. */
1881                         broadcast_signal(SIGTERM, false, true);
1882
1883                         /* And switch root */
1884                         r = switch_root(switch_root_dir);
1885                         if (r < 0)
1886                                 log_error("Failed to switch root, ignoring: %s", strerror(-r));
1887                 }
1888
1889                 args_size = MAX(6, argc+1);
1890                 args = newa(const char*, args_size);
1891
1892                 if (!switch_root_init) {
1893                         char sfd[16];
1894
1895                         /* First try to spawn ourselves with the right
1896                          * path, and with full serialization. We do
1897                          * this only if the user didn't specify an
1898                          * explicit init to spawn. */
1899
1900                         assert(arg_serialization);
1901                         assert(fds);
1902
1903                         snprintf(sfd, sizeof(sfd), "%i", fileno(arg_serialization));
1904                         char_array_0(sfd);
1905
1906                         i = 0;
1907                         args[i++] = SYSTEMD_BINARY_PATH;
1908                         if (switch_root_dir)
1909                                 args[i++] = "--switched-root";
1910                         args[i++] = arg_running_as == SYSTEMD_SYSTEM ? "--system" : "--user";
1911                         args[i++] = "--deserialize";
1912                         args[i++] = sfd;
1913                         args[i++] = NULL;
1914
1915                         /* do not pass along the environment we inherit from the kernel or initrd */
1916                         if (switch_root_dir)
1917                                 clearenv();
1918
1919                         assert(i <= args_size);
1920                         execv(args[0], (char* const*) args);
1921                 }
1922
1923                 /* Try the fallback, if there is any, without any
1924                  * serialization. We pass the original argv[] and
1925                  * envp[]. (Well, modulo the ordering changes due to
1926                  * getopt() in argv[], and some cleanups in envp[],
1927                  * but let's hope that doesn't matter.) */
1928
1929                 if (arg_serialization) {
1930                         fclose(arg_serialization);
1931                         arg_serialization = NULL;
1932                 }
1933
1934                 if (fds) {
1935                         fdset_free(fds);
1936                         fds = NULL;
1937                 }
1938
1939                 /* Reopen the console */
1940                 make_console_stdio();
1941
1942                 for (j = 1, i = 1; j < (unsigned) argc; j++)
1943                         args[i++] = argv[j];
1944                 args[i++] = NULL;
1945                 assert(i <= args_size);
1946
1947                 /* reenable any blocked signals, especially important
1948                  * if we switch from initial ramdisk to init=... */
1949                 sigemptyset(&ss);
1950                 sigprocmask(SIG_SETMASK, &ss, &o_ss);
1951
1952                 if (switch_root_init) {
1953                         args[0] = switch_root_init;
1954                         execv(args[0], (char* const*) args);
1955                         log_warning("Failed to execute configured init, trying fallback: %m");
1956                 }
1957
1958                 args[0] = "/sbin/init";
1959                 execv(args[0], (char* const*) args);
1960
1961                 if (errno == ENOENT) {
1962                         log_warning("No /sbin/init, trying fallback");
1963
1964                         args[0] = "/bin/sh";
1965                         args[1] = NULL;
1966                         execv(args[0], (char* const*) args);
1967                         log_error("Failed to execute /bin/sh, giving up: %m");
1968                 } else
1969                         log_warning("Failed to execute /sbin/init, giving up: %m");
1970
1971                 sigprocmask(SIG_SETMASK, &o_ss, NULL);
1972         }
1973
1974         if (arg_serialization) {
1975                 fclose(arg_serialization);
1976                 arg_serialization = NULL;
1977         }
1978
1979         if (fds) {
1980                 fdset_free(fds);
1981                 fds = NULL;
1982         }
1983
1984 #ifdef HAVE_VALGRIND_VALGRIND_H
1985         /* If we are PID 1 and running under valgrind, then let's exit
1986          * here explicitly. valgrind will only generate nice output on
1987          * exit(), not on exec(), hence let's do the former not the
1988          * latter here. */
1989         if (getpid() == 1 && RUNNING_ON_VALGRIND)
1990                 return 0;
1991 #endif
1992
1993         if (shutdown_verb) {
1994                 char log_level[DECIMAL_STR_MAX(int) + 1];
1995                 const char* command_line[9] = {
1996                         SYSTEMD_SHUTDOWN_BINARY_PATH,
1997                         shutdown_verb,
1998                         "--log-level", log_level,
1999                         "--log-target",
2000                 };
2001                 unsigned pos = 5;
2002                 _cleanup_strv_free_ char **env_block = NULL;
2003
2004                 assert(command_line[pos] == NULL);
2005                 env_block = strv_copy(environ);
2006
2007                 snprintf(log_level, sizeof(log_level), "%d", log_get_max_level());
2008
2009                 switch (log_get_target()) {
2010                 case LOG_TARGET_KMSG:
2011                 case LOG_TARGET_JOURNAL_OR_KMSG:
2012                 case LOG_TARGET_SYSLOG_OR_KMSG:
2013                         command_line[pos++] = "kmsg";
2014                         break;
2015
2016                 case LOG_TARGET_CONSOLE:
2017                 default:
2018                         command_line[pos++] = "console";
2019                         break;
2020                 };
2021
2022                 if (log_get_show_color())
2023                         command_line[pos++] = "--log-color";
2024
2025                 if (log_get_show_location())
2026                         command_line[pos++] = "--log-location";
2027
2028                 assert(pos < ELEMENTSOF(command_line));
2029
2030                 if (arm_reboot_watchdog && arg_shutdown_watchdog > 0) {
2031                         char *e;
2032
2033                         /* If we reboot let's set the shutdown
2034                          * watchdog and tell the shutdown binary to
2035                          * repeatedly ping it */
2036                         watchdog_set_timeout(&arg_shutdown_watchdog);
2037                         watchdog_close(false);
2038
2039                         /* Tell the binary how often to ping, ignore failure */
2040                         if (asprintf(&e, "WATCHDOG_USEC="USEC_FMT, arg_shutdown_watchdog) > 0)
2041                                 strv_push(&env_block, e);
2042                 } else
2043                         watchdog_close(true);
2044
2045                 /* Avoid the creation of new processes forked by the
2046                  * kernel; at this point, we will not listen to the
2047                  * signals anyway */
2048                 if (detect_container(NULL) <= 0)
2049                         cg_uninstall_release_agent(SYSTEMD_CGROUP_CONTROLLER);
2050
2051                 execve(SYSTEMD_SHUTDOWN_BINARY_PATH, (char **) command_line, env_block);
2052                 log_error("Failed to execute shutdown binary, %s: %m",
2053                           getpid() == 1 ? "freezing" : "quitting");
2054         }
2055
2056         if (getpid() == 1)
2057                 freeze();
2058
2059         return retval;
2060 }