chiark / gitweb /
main: minor code modernization for initializing the console
[elogind.git] / src / core / main.c
1 /*-*- Mode: C; c-basic-offset: 8; indent-tabs-mode: nil -*-*/
2
3 /***
4   This file is part of systemd.
5
6   Copyright 2010 Lennart Poettering
7
8   systemd is free software; you can redistribute it and/or modify it
9   under the terms of the GNU Lesser General Public License as published by
10   the Free Software Foundation; either version 2.1 of the License, or
11   (at your option) any later version.
12
13   systemd is distributed in the hope that it will be useful, but
14   WITHOUT ANY WARRANTY; without even the implied warranty of
15   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
16   Lesser General Public License for more details.
17
18   You should have received a copy of the GNU Lesser General Public License
19   along with systemd; If not, see <http://www.gnu.org/licenses/>.
20 ***/
21
22 #include <stdio.h>
23 #include <errno.h>
24 #include <string.h>
25 #include <unistd.h>
26 #include <sys/types.h>
27 #include <sys/stat.h>
28 #include <getopt.h>
29 #include <signal.h>
30 #include <sys/wait.h>
31 #include <fcntl.h>
32 #include <sys/prctl.h>
33 #include <sys/mount.h>
34
35 #ifdef HAVE_VALGRIND_VALGRIND_H
36 #include <valgrind/valgrind.h>
37 #endif
38 #ifdef HAVE_SECCOMP
39 #include <seccomp.h>
40 #endif
41
42 #include "sd-daemon.h"
43 #include "sd-messages.h"
44 #include "sd-bus.h"
45 #include "manager.h"
46 #include "log.h"
47 #include "load-fragment.h"
48 #include "fdset.h"
49 #include "special.h"
50 #include "conf-parser.h"
51 #include "missing.h"
52 #include "label.h"
53 #include "pager.h"
54 #include "build.h"
55 #include "strv.h"
56 #include "def.h"
57 #include "virt.h"
58 #include "architecture.h"
59 #include "watchdog.h"
60 #include "path-util.h"
61 #include "switch-root.h"
62 #include "capability.h"
63 #include "killall.h"
64 #include "env-util.h"
65 #include "clock-util.h"
66 #include "fileio.h"
67 #include "dbus-manager.h"
68 #include "bus-error.h"
69 #include "bus-util.h"
70
71 #include "mount-setup.h"
72 #include "loopback-setup.h"
73 #include "hostname-setup.h"
74 #include "machine-id-setup.h"
75 #include "selinux-setup.h"
76 #include "ima-setup.h"
77 #include "smack-setup.h"
78 #ifdef HAVE_KMOD
79 #include "kmod-setup.h"
80 #endif
81
82 static enum {
83         ACTION_RUN,
84         ACTION_HELP,
85         ACTION_VERSION,
86         ACTION_TEST,
87         ACTION_DUMP_CONFIGURATION_ITEMS,
88         ACTION_DONE
89 } arg_action = ACTION_RUN;
90 static char *arg_default_unit = NULL;
91 static SystemdRunningAs arg_running_as = _SYSTEMD_RUNNING_AS_INVALID;
92 static bool arg_dump_core = true;
93 static bool arg_crash_shell = false;
94 static int arg_crash_chvt = -1;
95 static bool arg_confirm_spawn = false;
96 static ShowStatus arg_show_status = _SHOW_STATUS_UNSET;
97 static bool arg_switched_root = false;
98 static int arg_no_pager = -1;
99 static char ***arg_join_controllers = NULL;
100 static ExecOutput arg_default_std_output = EXEC_OUTPUT_JOURNAL;
101 static ExecOutput arg_default_std_error = EXEC_OUTPUT_INHERIT;
102 static usec_t arg_default_restart_usec = DEFAULT_RESTART_USEC;
103 static usec_t arg_default_timeout_start_usec = DEFAULT_TIMEOUT_USEC;
104 static usec_t arg_default_timeout_stop_usec = DEFAULT_TIMEOUT_USEC;
105 static usec_t arg_default_start_limit_interval = DEFAULT_START_LIMIT_INTERVAL;
106 static unsigned arg_default_start_limit_burst = DEFAULT_START_LIMIT_BURST;
107 static usec_t arg_runtime_watchdog = 0;
108 static usec_t arg_shutdown_watchdog = 10 * USEC_PER_MINUTE;
109 static char **arg_default_environment = NULL;
110 static struct rlimit *arg_default_rlimit[_RLIMIT_MAX] = {};
111 static uint64_t arg_capability_bounding_set_drop = 0;
112 static nsec_t arg_timer_slack_nsec = NSEC_INFINITY;
113 static usec_t arg_default_timer_accuracy_usec = 1 * USEC_PER_MINUTE;
114 static Set* arg_syscall_archs = NULL;
115 static FILE* arg_serialization = NULL;
116 static bool arg_default_cpu_accounting = false;
117 static bool arg_default_blockio_accounting = false;
118 static bool arg_default_memory_accounting = false;
119
/* Signal handler that deliberately does nothing; crash() installs it for SIGCHLD. */
static void nop_handler(int sig) {
        /* intentionally empty */
}
121
122 static void pager_open_if_enabled(void) {
123
124         if (arg_no_pager <= 0)
125                 return;
126
127         pager_open(false);
128 }
129
130 noreturn static void crash(int sig) {
131
132         if (getpid() != 1)
133                 /* Pass this on immediately, if this is not PID 1 */
134                 raise(sig);
135         else if (!arg_dump_core)
136                 log_error("Caught <%s>, not dumping core.", signal_to_string(sig));
137         else {
138                 struct sigaction sa = {
139                         .sa_handler = nop_handler,
140                         .sa_flags = SA_NOCLDSTOP|SA_RESTART,
141                 };
142                 pid_t pid;
143
144                 /* We want to wait for the core process, hence let's enable SIGCHLD */
145                 sigaction(SIGCHLD, &sa, NULL);
146
147                 pid = fork();
148                 if (pid < 0)
149                         log_error("Caught <%s>, cannot fork for core dump: %m", signal_to_string(sig));
150
151                 else if (pid == 0) {
152                         struct rlimit rl = {};
153
154                         /* Enable default signal handler for core dump */
155                         zero(sa);
156                         sa.sa_handler = SIG_DFL;
157                         sigaction(sig, &sa, NULL);
158
159                         /* Don't limit the core dump size */
160                         rl.rlim_cur = RLIM_INFINITY;
161                         rl.rlim_max = RLIM_INFINITY;
162                         setrlimit(RLIMIT_CORE, &rl);
163
164                         /* Just to be sure... */
165                         chdir("/");
166
167                         /* Raise the signal again */
168                         raise(sig);
169
170                         assert_not_reached("We shouldn't be here...");
171                         _exit(1);
172
173                 } else {
174                         siginfo_t status;
175                         int r;
176
177                         /* Order things nicely. */
178                         r = wait_for_terminate(pid, &status);
179                         if (r < 0)
180                                 log_error("Caught <%s>, waitpid() failed: %s", signal_to_string(sig), strerror(-r));
181                         else if (status.si_code != CLD_DUMPED)
182                                 log_error("Caught <%s>, core dump failed.", signal_to_string(sig));
183                         else
184                                 log_error("Caught <%s>, dumped core as pid "PID_FMT".", signal_to_string(sig), pid);
185                 }
186         }
187
188         if (arg_crash_chvt)
189                 chvt(arg_crash_chvt);
190
191         if (arg_crash_shell) {
192                 struct sigaction sa = {
193                         .sa_handler = SIG_IGN,
194                         .sa_flags = SA_NOCLDSTOP|SA_NOCLDWAIT|SA_RESTART,
195                 };
196                 pid_t pid;
197
198                 log_info("Executing crash shell in 10s...");
199                 sleep(10);
200
201                 /* Let the kernel reap children for us */
202                 assert_se(sigaction(SIGCHLD, &sa, NULL) == 0);
203
204                 pid = fork();
205                 if (pid < 0)
206                         log_error("Failed to fork off crash shell: %m");
207                 else if (pid == 0) {
208                         make_console_stdio();
209                         execl("/bin/sh", "/bin/sh", NULL);
210
211                         log_error("execl() failed: %m");
212                         _exit(1);
213                 }
214
215                 log_info("Successfully spawned crash shell as pid "PID_FMT".", pid);
216         }
217
218         log_info("Freezing execution.");
219         freeze();
220 }
221
222 static void install_crash_handler(void) {
223         struct sigaction sa = {
224                 .sa_handler = crash,
225                 .sa_flags = SA_NODEFER,
226         };
227
228         sigaction_many(&sa, SIGNALS_CRASH_HANDLER, -1);
229 }
230
231 static int console_setup(void) {
232         _cleanup_close_ int tty_fd = -1;
233         int r;
234
235         tty_fd = open_terminal("/dev/console", O_WRONLY|O_NOCTTY|O_CLOEXEC);
236         if (tty_fd < 0) {
237                 log_error("Failed to open /dev/console: %s", strerror(-tty_fd));
238                 return tty_fd;
239         }
240
241         /* We don't want to force text mode.  plymouth may be showing
242          * pictures already from initrd. */
243         r = reset_terminal_fd(tty_fd, false);
244         if (r < 0) {
245                 log_error("Failed to reset /dev/console: %s", strerror(-r));
246                 return r;
247         }
248
249         return 0;
250 }
251
252 static int set_default_unit(const char *u) {
253         char *c;
254
255         assert(u);
256
257         c = strdup(u);
258         if (!c)
259                 return -ENOMEM;
260
261         free(arg_default_unit);
262         arg_default_unit = c;
263
264         return 0;
265 }
266
267 static int parse_proc_cmdline_item(const char *key, const char *value) {
268
269         static const char * const rlmap[] = {
270                 "emergency", SPECIAL_EMERGENCY_TARGET,
271                 "-b",        SPECIAL_EMERGENCY_TARGET,
272                 "single",    SPECIAL_RESCUE_TARGET,
273                 "-s",        SPECIAL_RESCUE_TARGET,
274                 "s",         SPECIAL_RESCUE_TARGET,
275                 "S",         SPECIAL_RESCUE_TARGET,
276                 "1",         SPECIAL_RESCUE_TARGET,
277                 "2",         SPECIAL_RUNLEVEL2_TARGET,
278                 "3",         SPECIAL_RUNLEVEL3_TARGET,
279                 "4",         SPECIAL_RUNLEVEL4_TARGET,
280                 "5",         SPECIAL_RUNLEVEL5_TARGET,
281         };
282         int r;
283
284         assert(key);
285
286         if (streq(key, "systemd.unit") && value) {
287
288                 if (!in_initrd())
289                         return set_default_unit(value);
290
291         } else if (streq(key, "rd.systemd.unit") && value) {
292
293                 if (in_initrd())
294                         return set_default_unit(value);
295
296         } else if (streq(key, "systemd.log_target") && value) {
297
298                 if (log_set_target_from_string(value) < 0)
299                         log_warning("Failed to parse log target %s. Ignoring.", value);
300
301         } else if (streq(key, "systemd.log_level") && value) {
302
303                 if (log_set_max_level_from_string(value) < 0)
304                         log_warning("Failed to parse log level %s. Ignoring.", value);
305
306         } else if (streq(key, "systemd.log_color") && value) {
307
308                 if (log_show_color_from_string(value) < 0)
309                         log_warning("Failed to parse log color setting %s. Ignoring.", value);
310
311         } else if (streq(key, "systemd.log_location") && value) {
312
313                 if (log_show_location_from_string(value) < 0)
314                         log_warning("Failed to parse log location setting %s. Ignoring.", value);
315
316         } else if (streq(key, "systemd.dump_core") && value) {
317
318                 r = parse_boolean(value);
319                 if (r < 0)
320                         log_warning("Failed to parse dump core switch %s. Ignoring.", value);
321                 else
322                         arg_dump_core = r;
323
324         } else if (streq(key, "systemd.crash_shell") && value) {
325
326                 r = parse_boolean(value);
327                 if (r < 0)
328                         log_warning("Failed to parse crash shell switch %s. Ignoring.", value);
329                 else
330                         arg_crash_shell = r;
331
332         } else if (streq(key, "systemd.crash_chvt") && value) {
333
334                 if (safe_atoi(value, &r) < 0)
335                         log_warning("Failed to parse crash chvt switch %s. Ignoring.", value);
336                 else
337                         arg_crash_chvt = r;
338
339         } else if (streq(key, "systemd.confirm_spawn") && value) {
340
341                 r = parse_boolean(value);
342                 if (r < 0)
343                         log_warning("Failed to parse confirm spawn switch %s. Ignoring.", value);
344                 else
345                         arg_confirm_spawn = r;
346
347         } else if (streq(key, "systemd.show_status") && value) {
348
349                 r = parse_show_status(value, &arg_show_status);
350                 if (r < 0)
351                         log_warning("Failed to parse show status switch %s. Ignoring.", value);
352
353         } else if (streq(key, "systemd.default_standard_output") && value) {
354
355                 r = exec_output_from_string(value);
356                 if (r < 0)
357                         log_warning("Failed to parse default standard output switch %s. Ignoring.", value);
358                 else
359                         arg_default_std_output = r;
360
361         } else if (streq(key, "systemd.default_standard_error") && value) {
362
363                 r = exec_output_from_string(value);
364                 if (r < 0)
365                         log_warning("Failed to parse default standard error switch %s. Ignoring.", value);
366                 else
367                         arg_default_std_error = r;
368
369         } else if (streq(key, "systemd.setenv") && value) {
370
371                 if (env_assignment_is_valid(value)) {
372                         char **env;
373
374                         env = strv_env_set(arg_default_environment, value);
375                         if (env)
376                                 arg_default_environment = env;
377                         else
378                                 log_warning("Setting environment variable '%s' failed, ignoring: %s", value, strerror(ENOMEM));
379                 } else
380                         log_warning("Environment variable name '%s' is not valid. Ignoring.", value);
381
382         } else if (streq(key, "quiet") && !value) {
383
384                 log_set_max_level(LOG_NOTICE);
385
386                 if (arg_show_status == _SHOW_STATUS_UNSET)
387                         arg_show_status = SHOW_STATUS_AUTO;
388
389         } else if (streq(key, "debug") && !value) {
390
391                 log_set_max_level(LOG_DEBUG);
392
393                 if (detect_container(NULL) > 0)
394                         log_set_target(LOG_TARGET_CONSOLE);
395
396         } else if (!in_initrd() && !value) {
397                 unsigned i;
398
399                 /* SysV compatibility */
400                 for (i = 0; i < ELEMENTSOF(rlmap); i += 2)
401                         if (streq(key, rlmap[i]))
402                                 return set_default_unit(rlmap[i+1]);
403         }
404
405         return 0;
406 }
407
/*
 * DEFINE_SETTER(name, func, descr) expands to a static configuration
 * callback called `name` that feeds the right-hand side of a setting to
 * func(). If func() returns a negative value the problem is reported via
 * log_syntax(), using `descr` to say what kind of value was rejected.
 * The generated callback always returns 0, i.e. a bad value is logged
 * and otherwise ignored.
 *
 * The message now has a space between `descr` and the quoted value;
 * it used to come out as e.g. "Invalid log level'foo'".
 */
#define DEFINE_SETTER(name, func, descr)                              \
        static int name(const char *unit,                             \
                        const char *filename,                         \
                        unsigned line,                                \
                        const char *section,                          \
                        unsigned section_line,                        \
                        const char *lvalue,                           \
                        int ltype,                                    \
                        const char *rvalue,                           \
                        void *data,                                   \
                        void *userdata) {                             \
                                                                      \
                int r;                                                \
                                                                      \
                assert(filename);                                     \
                assert(lvalue);                                       \
                assert(rvalue);                                       \
                                                                      \
                r = func(rvalue);                                     \
                if (r < 0)                                            \
                        log_syntax(unit, LOG_ERR, filename, line, -r, \
                                   "Invalid " descr " '%s': %s",      \
                                   rvalue, strerror(-r));             \
                                                                      \
                return 0;                                             \
        }

DEFINE_SETTER(config_parse_level2, log_set_max_level_from_string, "log level")
DEFINE_SETTER(config_parse_target, log_set_target_from_string, "target")
DEFINE_SETTER(config_parse_color, log_show_color_from_string, "color")
DEFINE_SETTER(config_parse_location, log_show_location_from_string, "location")
439
440 static int config_parse_cpu_affinity2(
441                 const char *unit,
442                 const char *filename,
443                 unsigned line,
444                 const char *section,
445                 unsigned section_line,
446                 const char *lvalue,
447                 int ltype,
448                 const char *rvalue,
449                 void *data,
450                 void *userdata) {
451
452         const char *word, *state;
453         size_t l;
454         cpu_set_t *c = NULL;
455         unsigned ncpus = 0;
456
457         assert(filename);
458         assert(lvalue);
459         assert(rvalue);
460
461         FOREACH_WORD_QUOTED(word, l, rvalue, state) {
462                 char *t;
463                 int r;
464                 unsigned cpu;
465
466                 if (!(t = strndup(word, l)))
467                         return log_oom();
468
469                 r = safe_atou(t, &cpu);
470                 free(t);
471
472                 if (!c)
473                         if (!(c = cpu_set_malloc(&ncpus)))
474                                 return log_oom();
475
476                 if (r < 0 || cpu >= ncpus) {
477                         log_syntax(unit, LOG_ERR, filename, line, -r,
478                                    "Failed to parse CPU affinity '%s'", rvalue);
479                         CPU_FREE(c);
480                         return -EBADMSG;
481                 }
482
483                 CPU_SET_S(cpu, CPU_ALLOC_SIZE(ncpus), c);
484         }
485         if (!isempty(state))
486                 log_syntax(unit, LOG_ERR, filename, line, EINVAL,
487                            "Trailing garbage, ignoring.");
488
489         if (c) {
490                 if (sched_setaffinity(0, CPU_ALLOC_SIZE(ncpus), c) < 0)
491                         log_warning_unit(unit, "Failed to set CPU affinity: %m");
492
493                 CPU_FREE(c);
494         }
495
496         return 0;
497 }
498
499 static int config_parse_show_status(
500                 const char* unit,
501                 const char *filename,
502                 unsigned line,
503                 const char *section,
504                 unsigned section_line,
505                 const char *lvalue,
506                 int ltype,
507                 const char *rvalue,
508                 void *data,
509                 void *userdata) {
510
511         int k;
512         ShowStatus *b = data;
513
514         assert(filename);
515         assert(lvalue);
516         assert(rvalue);
517         assert(data);
518
519         k = parse_show_status(rvalue, b);
520         if (k < 0) {
521                 log_syntax(unit, LOG_ERR, filename, line, -k,
522                            "Failed to parse show status setting, ignoring: %s", rvalue);
523                 return 0;
524         }
525
526         return 0;
527 }
528
/*
 * Releases a NULL-terminated array of string vectors: strv_free() is
 * called on every element, then the array itself is freed. A NULL
 * argument is accepted and ignored.
 */
static void strv_free_free(char ***l) {
        size_t idx;

        if (l == NULL)
                return;

        for (idx = 0; l[idx] != NULL; idx++)
                strv_free(l[idx]);

        free(l);
}
540
541 static void free_join_controllers(void) {
542         strv_free_free(arg_join_controllers);
543         arg_join_controllers = NULL;
544 }
545
546 static int config_parse_join_controllers(const char *unit,
547                                          const char *filename,
548                                          unsigned line,
549                                          const char *section,
550                                          unsigned section_line,
551                                          const char *lvalue,
552                                          int ltype,
553                                          const char *rvalue,
554                                          void *data,
555                                          void *userdata) {
556
557         unsigned n = 0;
558         const char *word, *state;
559         size_t length;
560
561         assert(filename);
562         assert(lvalue);
563         assert(rvalue);
564
565         free_join_controllers();
566
567         FOREACH_WORD_QUOTED(word, length, rvalue, state) {
568                 char *s, **l;
569
570                 s = strndup(word, length);
571                 if (!s)
572                         return log_oom();
573
574                 l = strv_split(s, ",");
575                 free(s);
576
577                 strv_uniq(l);
578
579                 if (strv_length(l) <= 1) {
580                         strv_free(l);
581                         continue;
582                 }
583
584                 if (!arg_join_controllers) {
585                         arg_join_controllers = new(char**, 2);
586                         if (!arg_join_controllers) {
587                                 strv_free(l);
588                                 return log_oom();
589                         }
590
591                         arg_join_controllers[0] = l;
592                         arg_join_controllers[1] = NULL;
593
594                         n = 1;
595                 } else {
596                         char ***a;
597                         char ***t;
598
599                         t = new0(char**, n+2);
600                         if (!t) {
601                                 strv_free(l);
602                                 return log_oom();
603                         }
604
605                         n = 0;
606
607                         for (a = arg_join_controllers; *a; a++) {
608
609                                 if (strv_overlap(*a, l)) {
610                                         if (strv_extend_strv(&l, *a) < 0) {
611                                                 strv_free(l);
612                                                 strv_free_free(t);
613                                                 return log_oom();
614                                         }
615
616                                 } else {
617                                         char **c;
618
619                                         c = strv_copy(*a);
620                                         if (!c) {
621                                                 strv_free(l);
622                                                 strv_free_free(t);
623                                                 return log_oom();
624                                         }
625
626                                         t[n++] = c;
627                                 }
628                         }
629
630                         t[n++] = strv_uniq(l);
631
632                         strv_free_free(arg_join_controllers);
633                         arg_join_controllers = t;
634                 }
635         }
636         if (!isempty(state))
637                 log_syntax(unit, LOG_ERR, filename, line, EINVAL,
638                            "Trailing garbage, ignoring.");
639
640         return 0;
641 }
642
643 static int parse_config_file(void) {
644
645         const ConfigTableItem items[] = {
646                 { "Manager", "LogLevel",                  config_parse_level2,           0, NULL                                   },
647                 { "Manager", "LogTarget",                 config_parse_target,           0, NULL                                   },
648                 { "Manager", "LogColor",                  config_parse_color,            0, NULL                                   },
649                 { "Manager", "LogLocation",               config_parse_location,         0, NULL                                   },
650                 { "Manager", "DumpCore",                  config_parse_bool,             0, &arg_dump_core                         },
651                 { "Manager", "CrashShell",                config_parse_bool,             0, &arg_crash_shell                       },
652                 { "Manager", "ShowStatus",                config_parse_show_status,      0, &arg_show_status                       },
653                 { "Manager", "CrashChVT",                 config_parse_int,              0, &arg_crash_chvt                        },
654                 { "Manager", "CPUAffinity",               config_parse_cpu_affinity2,    0, NULL                                   },
655                 { "Manager", "JoinControllers",           config_parse_join_controllers, 0, &arg_join_controllers                  },
656                 { "Manager", "RuntimeWatchdogSec",        config_parse_sec,              0, &arg_runtime_watchdog                  },
657                 { "Manager", "ShutdownWatchdogSec",       config_parse_sec,              0, &arg_shutdown_watchdog                 },
658                 { "Manager", "CapabilityBoundingSet",     config_parse_bounding_set,     0, &arg_capability_bounding_set_drop      },
659 #ifdef HAVE_SECCOMP
660                 { "Manager", "SystemCallArchitectures",   config_parse_syscall_archs,    0, &arg_syscall_archs                     },
661 #endif
662                 { "Manager", "TimerSlackNSec",            config_parse_nsec,             0, &arg_timer_slack_nsec                  },
663                 { "Manager", "DefaultTimerAccuracySec",   config_parse_sec,              0, &arg_default_timer_accuracy_usec       },
664                 { "Manager", "DefaultStandardOutput",     config_parse_output,           0, &arg_default_std_output                },
665                 { "Manager", "DefaultStandardError",      config_parse_output,           0, &arg_default_std_error                 },
666                 { "Manager", "DefaultTimeoutStartSec",    config_parse_sec,              0, &arg_default_timeout_start_usec        },
667                 { "Manager", "DefaultTimeoutStopSec",     config_parse_sec,              0, &arg_default_timeout_stop_usec         },
668                 { "Manager", "DefaultRestartSec",         config_parse_sec,              0, &arg_default_restart_usec              },
669                 { "Manager", "DefaultStartLimitInterval", config_parse_sec,              0, &arg_default_start_limit_interval      },
670                 { "Manager", "DefaultStartLimitBurst",    config_parse_unsigned,         0, &arg_default_start_limit_burst         },
671                 { "Manager", "DefaultEnvironment",        config_parse_environ,          0, &arg_default_environment               },
672                 { "Manager", "DefaultLimitCPU",           config_parse_limit,            0, &arg_default_rlimit[RLIMIT_CPU]        },
673                 { "Manager", "DefaultLimitFSIZE",         config_parse_limit,            0, &arg_default_rlimit[RLIMIT_FSIZE]      },
674                 { "Manager", "DefaultLimitDATA",          config_parse_limit,            0, &arg_default_rlimit[RLIMIT_DATA]       },
675                 { "Manager", "DefaultLimitSTACK",         config_parse_limit,            0, &arg_default_rlimit[RLIMIT_STACK]      },
676                 { "Manager", "DefaultLimitCORE",          config_parse_limit,            0, &arg_default_rlimit[RLIMIT_CORE]       },
677                 { "Manager", "DefaultLimitRSS",           config_parse_limit,            0, &arg_default_rlimit[RLIMIT_RSS]        },
678                 { "Manager", "DefaultLimitNOFILE",        config_parse_limit,            0, &arg_default_rlimit[RLIMIT_NOFILE]     },
679                 { "Manager", "DefaultLimitAS",            config_parse_limit,            0, &arg_default_rlimit[RLIMIT_AS]         },
680                 { "Manager", "DefaultLimitNPROC",         config_parse_limit,            0, &arg_default_rlimit[RLIMIT_NPROC]      },
681                 { "Manager", "DefaultLimitMEMLOCK",       config_parse_limit,            0, &arg_default_rlimit[RLIMIT_MEMLOCK]    },
682                 { "Manager", "DefaultLimitLOCKS",         config_parse_limit,            0, &arg_default_rlimit[RLIMIT_LOCKS]      },
683                 { "Manager", "DefaultLimitSIGPENDING",    config_parse_limit,            0, &arg_default_rlimit[RLIMIT_SIGPENDING] },
684                 { "Manager", "DefaultLimitMSGQUEUE",      config_parse_limit,            0, &arg_default_rlimit[RLIMIT_MSGQUEUE]   },
685                 { "Manager", "DefaultLimitNICE",          config_parse_limit,            0, &arg_default_rlimit[RLIMIT_NICE]       },
686                 { "Manager", "DefaultLimitRTPRIO",        config_parse_limit,            0, &arg_default_rlimit[RLIMIT_RTPRIO]     },
687                 { "Manager", "DefaultLimitRTTIME",        config_parse_limit,            0, &arg_default_rlimit[RLIMIT_RTTIME]     },
688                 { "Manager", "DefaultCPUAccounting",      config_parse_bool,             0, &arg_default_cpu_accounting            },
689                 { "Manager", "DefaultBlockIOAccounting",  config_parse_bool,             0, &arg_default_blockio_accounting        },
690                 { "Manager", "DefaultMemoryAccounting",   config_parse_bool,             0, &arg_default_memory_accounting         },
691                 {}
692         };
693
694         const char *fn;
695
696         fn = arg_running_as == SYSTEMD_SYSTEM ? PKGSYSCONFDIR "/system.conf" : PKGSYSCONFDIR "/user.conf";
697         config_parse(NULL, fn, NULL,
698                      "Manager\0",
699                      config_item_table_lookup, items,
700                      false, false, true, NULL);
701
702         return 0;
703 }
704
705 static int parse_argv(int argc, char *argv[]) {
706
707         enum {
708                 ARG_LOG_LEVEL = 0x100,
709                 ARG_LOG_TARGET,
710                 ARG_LOG_COLOR,
711                 ARG_LOG_LOCATION,
712                 ARG_UNIT,
713                 ARG_SYSTEM,
714                 ARG_USER,
715                 ARG_TEST,
716                 ARG_NO_PAGER,
717                 ARG_VERSION,
718                 ARG_DUMP_CONFIGURATION_ITEMS,
719                 ARG_DUMP_CORE,
720                 ARG_CRASH_SHELL,
721                 ARG_CONFIRM_SPAWN,
722                 ARG_SHOW_STATUS,
723                 ARG_DESERIALIZE,
724                 ARG_SWITCHED_ROOT,
725                 ARG_DEFAULT_STD_OUTPUT,
726                 ARG_DEFAULT_STD_ERROR
727         };
728
729         static const struct option options[] = {
730                 { "log-level",                required_argument, NULL, ARG_LOG_LEVEL                },
731                 { "log-target",               required_argument, NULL, ARG_LOG_TARGET               },
732                 { "log-color",                optional_argument, NULL, ARG_LOG_COLOR                },
733                 { "log-location",             optional_argument, NULL, ARG_LOG_LOCATION             },
734                 { "unit",                     required_argument, NULL, ARG_UNIT                     },
735                 { "system",                   no_argument,       NULL, ARG_SYSTEM                   },
736                 { "user",                     no_argument,       NULL, ARG_USER                     },
737                 { "test",                     no_argument,       NULL, ARG_TEST                     },
738                 { "no-pager",                 no_argument,       NULL, ARG_NO_PAGER                 },
739                 { "help",                     no_argument,       NULL, 'h'                          },
740                 { "version",                  no_argument,       NULL, ARG_VERSION                  },
741                 { "dump-configuration-items", no_argument,       NULL, ARG_DUMP_CONFIGURATION_ITEMS },
742                 { "dump-core",                optional_argument, NULL, ARG_DUMP_CORE                },
743                 { "crash-shell",              optional_argument, NULL, ARG_CRASH_SHELL              },
744                 { "confirm-spawn",            optional_argument, NULL, ARG_CONFIRM_SPAWN            },
745                 { "show-status",              optional_argument, NULL, ARG_SHOW_STATUS              },
746                 { "deserialize",              required_argument, NULL, ARG_DESERIALIZE              },
747                 { "switched-root",            no_argument,       NULL, ARG_SWITCHED_ROOT            },
748                 { "default-standard-output",  required_argument, NULL, ARG_DEFAULT_STD_OUTPUT,      },
749                 { "default-standard-error",   required_argument, NULL, ARG_DEFAULT_STD_ERROR,       },
750                 {}
751         };
752
753         int c, r;
754
755         assert(argc >= 1);
756         assert(argv);
757
758         if (getpid() == 1)
759                 opterr = 0;
760
761         while ((c = getopt_long(argc, argv, "hDbsz:", options, NULL)) >= 0)
762
763                 switch (c) {
764
765                 case ARG_LOG_LEVEL:
766                         r = log_set_max_level_from_string(optarg);
767                         if (r < 0) {
768                                 log_error("Failed to parse log level %s.", optarg);
769                                 return r;
770                         }
771
772                         break;
773
774                 case ARG_LOG_TARGET:
775                         r = log_set_target_from_string(optarg);
776                         if (r < 0) {
777                                 log_error("Failed to parse log target %s.", optarg);
778                                 return r;
779                         }
780
781                         break;
782
783                 case ARG_LOG_COLOR:
784
785                         if (optarg) {
786                                 r = log_show_color_from_string(optarg);
787                                 if (r < 0) {
788                                         log_error("Failed to parse log color setting %s.", optarg);
789                                         return r;
790                                 }
791                         } else
792                                 log_show_color(true);
793
794                         break;
795
796                 case ARG_LOG_LOCATION:
797                         if (optarg) {
798                                 r = log_show_location_from_string(optarg);
799                                 if (r < 0) {
800                                         log_error("Failed to parse log location setting %s.", optarg);
801                                         return r;
802                                 }
803                         } else
804                                 log_show_location(true);
805
806                         break;
807
808                 case ARG_DEFAULT_STD_OUTPUT:
809                         r = exec_output_from_string(optarg);
810                         if (r < 0) {
811                                 log_error("Failed to parse default standard output setting %s.", optarg);
812                                 return r;
813                         } else
814                                 arg_default_std_output = r;
815                         break;
816
817                 case ARG_DEFAULT_STD_ERROR:
818                         r = exec_output_from_string(optarg);
819                         if (r < 0) {
820                                 log_error("Failed to parse default standard error output setting %s.", optarg);
821                                 return r;
822                         } else
823                                 arg_default_std_error = r;
824                         break;
825
826                 case ARG_UNIT:
827
828                         r = set_default_unit(optarg);
829                         if (r < 0) {
830                                 log_error("Failed to set default unit %s: %s", optarg, strerror(-r));
831                                 return r;
832                         }
833
834                         break;
835
836                 case ARG_SYSTEM:
837                         arg_running_as = SYSTEMD_SYSTEM;
838                         break;
839
840                 case ARG_USER:
841                         arg_running_as = SYSTEMD_USER;
842                         break;
843
844                 case ARG_TEST:
845                         arg_action = ACTION_TEST;
846                         if (arg_no_pager < 0)
847                                 arg_no_pager = true;
848                         break;
849
850                 case ARG_NO_PAGER:
851                         arg_no_pager = true;
852                         break;
853
854                 case ARG_VERSION:
855                         arg_action = ACTION_VERSION;
856                         break;
857
858                 case ARG_DUMP_CONFIGURATION_ITEMS:
859                         arg_action = ACTION_DUMP_CONFIGURATION_ITEMS;
860                         break;
861
862                 case ARG_DUMP_CORE:
863                         r = optarg ? parse_boolean(optarg) : 1;
864                         if (r < 0) {
865                                 log_error("Failed to parse dump core boolean %s.", optarg);
866                                 return r;
867                         }
868                         arg_dump_core = r;
869                         break;
870
871                 case ARG_CRASH_SHELL:
872                         r = optarg ? parse_boolean(optarg) : 1;
873                         if (r < 0) {
874                                 log_error("Failed to parse crash shell boolean %s.", optarg);
875                                 return r;
876                         }
877                         arg_crash_shell = r;
878                         break;
879
880                 case ARG_CONFIRM_SPAWN:
881                         r = optarg ? parse_boolean(optarg) : 1;
882                         if (r < 0) {
883                                 log_error("Failed to parse confirm spawn boolean %s.", optarg);
884                                 return r;
885                         }
886                         arg_confirm_spawn = r;
887                         break;
888
889                 case ARG_SHOW_STATUS:
890                         if (optarg) {
891                                 r = parse_show_status(optarg, &arg_show_status);
892                                 if (r < 0) {
893                                         log_error("Failed to parse show status boolean %s.", optarg);
894                                         return r;
895                                 }
896                         } else
897                                 arg_show_status = SHOW_STATUS_YES;
898                         break;
899
900                 case ARG_DESERIALIZE: {
901                         int fd;
902                         FILE *f;
903
904                         r = safe_atoi(optarg, &fd);
905                         if (r < 0 || fd < 0) {
906                                 log_error("Failed to parse deserialize option %s.", optarg);
907                                 return r < 0 ? r : -EINVAL;
908                         }
909
910                         fd_cloexec(fd, true);
911
912                         f = fdopen(fd, "r");
913                         if (!f) {
914                                 log_error("Failed to open serialization fd: %m");
915                                 return -errno;
916                         }
917
918                         if (arg_serialization)
919                                 fclose(arg_serialization);
920
921                         arg_serialization = f;
922
923                         break;
924                 }
925
926                 case ARG_SWITCHED_ROOT:
927                         arg_switched_root = true;
928                         break;
929
930                 case 'h':
931                         arg_action = ACTION_HELP;
932                         if (arg_no_pager < 0)
933                                 arg_no_pager = true;
934                         break;
935
936                 case 'D':
937                         log_set_max_level(LOG_DEBUG);
938                         break;
939
940                 case 'b':
941                 case 's':
942                 case 'z':
943                         /* Just to eat away the sysvinit kernel
944                          * cmdline args without getopt() error
945                          * messages that we'll parse in
946                          * parse_proc_cmdline_word() or ignore. */
947
948                 case '?':
949                         if (getpid() != 1)
950                                 return -EINVAL;
951                         else
952                                 return 0;
953
954                 default:
955                         assert_not_reached("Unhandled option code.");
956                 }
957
958         if (optind < argc && getpid() != 1) {
959                 /* Hmm, when we aren't run as init system
960                  * let's complain about excess arguments */
961
962                 log_error("Excess arguments.");
963                 return -EINVAL;
964         }
965
966         if (detect_container(NULL) > 0) {
967                 char **a;
968
969                 /* All /proc/cmdline arguments the kernel didn't
970                  * understand it passed to us. We're not really
971                  * interested in that usually since /proc/cmdline is
972                  * more interesting and complete. With one exception:
973                  * if we are run in a container /proc/cmdline is not
974                  * relevant for the container, hence we rely on argv[]
975                  * instead. */
976
977                 for (a = argv; a < argv + argc; a++) {
978                         _cleanup_free_ char *w;
979                         char *value;
980
981                         w = strdup(*a);
982                         if (!w)
983                                 return log_oom();
984
985                         value = strchr(w, '=');
986                         if (value)
987                                 *(value++) = 0;
988
989                         r = parse_proc_cmdline_item(w, value);
990                         if (r < 0) {
991                                 log_error("Failed on cmdline argument %s: %s", *a, strerror(-r));
992                                 return r;
993                         }
994                 }
995         }
996
997         return 0;
998 }
999
1000 static int help(void) {
1001
1002         printf("%s [OPTIONS...]\n\n"
1003                "Starts up and maintains the system or user services.\n\n"
1004                "  -h --help                      Show this help\n"
1005                "     --test                      Determine startup sequence, dump it and exit\n"
1006                "     --no-pager                  Do not pipe output into a pager\n"
1007                "     --dump-configuration-items  Dump understood unit configuration items\n"
1008                "     --unit=UNIT                 Set default unit\n"
1009                "     --system                    Run a system instance, even if PID != 1\n"
1010                "     --user                      Run a user instance\n"
1011                "     --dump-core[=0|1]           Dump core on crash\n"
1012                "     --crash-shell[=0|1]         Run shell on crash\n"
1013                "     --confirm-spawn[=0|1]       Ask for confirmation when spawning processes\n"
1014                "     --show-status[=0|1]         Show status updates on the console during bootup\n"
1015                "     --log-target=TARGET         Set log target (console, journal, kmsg, journal-or-kmsg, null)\n"
1016                "     --log-level=LEVEL           Set log level (debug, info, notice, warning, err, crit, alert, emerg)\n"
1017                "     --log-color[=0|1]           Highlight important log messages\n"
1018                "     --log-location[=0|1]        Include code location in log messages\n"
1019                "     --default-standard-output=  Set default standard output for services\n"
1020                "     --default-standard-error=   Set default standard error output for services\n",
1021                program_invocation_short_name);
1022
1023         return 0;
1024 }
1025
1026 static int version(void) {
1027         puts(PACKAGE_STRING);
1028         puts(SYSTEMD_FEATURES);
1029
1030         return 0;
1031 }
1032
1033 static int prepare_reexecute(Manager *m, FILE **_f, FDSet **_fds, bool switching_root) {
1034         FILE *f = NULL;
1035         FDSet *fds = NULL;
1036         int r;
1037
1038         assert(m);
1039         assert(_f);
1040         assert(_fds);
1041
1042         r = manager_open_serialization(m, &f);
1043         if (r < 0) {
1044                 log_error("Failed to create serialization file: %s", strerror(-r));
1045                 goto fail;
1046         }
1047
1048         /* Make sure nothing is really destructed when we shut down */
1049         m->n_reloading ++;
1050         bus_manager_send_reloading(m, true);
1051
1052         fds = fdset_new();
1053         if (!fds) {
1054                 r = -ENOMEM;
1055                 log_error("Failed to allocate fd set: %s", strerror(-r));
1056                 goto fail;
1057         }
1058
1059         r = manager_serialize(m, f, fds, switching_root);
1060         if (r < 0) {
1061                 log_error("Failed to serialize state: %s", strerror(-r));
1062                 goto fail;
1063         }
1064
1065         if (fseeko(f, 0, SEEK_SET) < 0) {
1066                 log_error("Failed to rewind serialization fd: %m");
1067                 goto fail;
1068         }
1069
1070         r = fd_cloexec(fileno(f), false);
1071         if (r < 0) {
1072                 log_error("Failed to disable O_CLOEXEC for serialization: %s", strerror(-r));
1073                 goto fail;
1074         }
1075
1076         r = fdset_cloexec(fds, false);
1077         if (r < 0) {
1078                 log_error("Failed to disable O_CLOEXEC for serialization fds: %s", strerror(-r));
1079                 goto fail;
1080         }
1081
1082         *_f = f;
1083         *_fds = fds;
1084
1085         return 0;
1086
1087 fail:
1088         fdset_free(fds);
1089
1090         if (f)
1091                 fclose(f);
1092
1093         return r;
1094 }
1095
1096 static int bump_rlimit_nofile(struct rlimit *saved_rlimit) {
1097         struct rlimit nl;
1098         int r;
1099
1100         assert(saved_rlimit);
1101
1102         /* Save the original RLIMIT_NOFILE so that we can reset it
1103          * later when transitioning from the initrd to the main
1104          * systemd or suchlike. */
1105         if (getrlimit(RLIMIT_NOFILE, saved_rlimit) < 0) {
1106                 log_error("Reading RLIMIT_NOFILE failed: %m");
1107                 return -errno;
1108         }
1109
1110         /* Make sure forked processes get the default kernel setting */
1111         if (!arg_default_rlimit[RLIMIT_NOFILE]) {
1112                 struct rlimit *rl;
1113
1114                 rl = newdup(struct rlimit, saved_rlimit, 1);
1115                 if (!rl)
1116                         return log_oom();
1117
1118                 arg_default_rlimit[RLIMIT_NOFILE] = rl;
1119         }
1120
1121         /* Bump up the resource limit for ourselves substantially */
1122         nl.rlim_cur = nl.rlim_max = 64*1024;
1123         r = setrlimit_closest(RLIMIT_NOFILE, &nl);
1124         if (r < 0) {
1125                 log_error("Setting RLIMIT_NOFILE failed: %s", strerror(-r));
1126                 return r;
1127         }
1128
1129         return 0;
1130 }
1131
1132 static void test_mtab(void) {
1133
1134         static const char ok[] =
1135                 "/proc/self/mounts\0"
1136                 "/proc/mounts\0"
1137                 "../proc/self/mounts\0"
1138                 "../proc/mounts\0";
1139
1140         _cleanup_free_ char *p = NULL;
1141         int r;
1142
1143         /* Check that /etc/mtab is a symlink to the right place or
1144          * non-existing. But certainly not a file, or a symlink to
1145          * some weird place... */
1146
1147         r = readlink_malloc("/etc/mtab", &p);
1148         if (r == -ENOENT)
1149                 return;
1150         if (r >= 0 && nulstr_contains(ok, p))
1151                 return;
1152
1153         log_warning("/etc/mtab is not a symlink or not pointing to /proc/self/mounts. "
1154                     "This is not supported anymore. "
1155                     "Please make sure to replace this file by a symlink to avoid incorrect or misleading mount(8) output.");
1156 }
1157
/* Warns if /usr looks like a separate file system that has not been
 * mounted yet, which is detected by /usr being an empty directory.
 * Nothing is logged if dir_is_empty() reports a non-empty directory
 * or fails. */
static void test_usr(void) {

        /* Check that /usr is not a separate fs */

        if (dir_is_empty("/usr") <= 0)
                return;

        log_warning("/usr appears to be on its own filesystem and is not already mounted. This is not a supported setup. "
                    "Some things will probably break (sometimes even silently) in mysterious ways. "
                    "Consult http://freedesktop.org/wiki/Software/systemd/separate-usr-is-broken for more information.");
}
1169
1170 static int initialize_join_controllers(void) {
1171         /* By default, mount "cpu" + "cpuacct" together, and "net_cls"
1172          * + "net_prio". We'd like to add "cpuset" to the mix, but
1173          * "cpuset" does't really work for groups with no initialized
1174          * attributes. */
1175
1176         arg_join_controllers = new(char**, 3);
1177         if (!arg_join_controllers)
1178                 return -ENOMEM;
1179
1180         arg_join_controllers[0] = strv_new("cpu", "cpuacct", NULL);
1181         arg_join_controllers[1] = strv_new("net_cls", "net_prio", NULL);
1182         arg_join_controllers[2] = NULL;
1183
1184         if (!arg_join_controllers[0] || !arg_join_controllers[1]) {
1185                 free_join_controllers();
1186                 return -ENOMEM;
1187         }
1188
1189         return 0;
1190 }
1191
1192 static int enforce_syscall_archs(Set *archs) {
1193 #ifdef HAVE_SECCOMP
1194         scmp_filter_ctx *seccomp;
1195         Iterator i;
1196         void *id;
1197         int r;
1198
1199         seccomp = seccomp_init(SCMP_ACT_ALLOW);
1200         if (!seccomp)
1201                 return log_oom();
1202
1203         SET_FOREACH(id, arg_syscall_archs, i) {
1204                 r = seccomp_arch_add(seccomp, PTR_TO_UINT32(id) - 1);
1205                 if (r == -EEXIST)
1206                         continue;
1207                 if (r < 0) {
1208                         log_error("Failed to add architecture to seccomp: %s", strerror(-r));
1209                         goto finish;
1210                 }
1211         }
1212
1213         r = seccomp_attr_set(seccomp, SCMP_FLTATR_CTL_NNP, 0);
1214         if (r < 0) {
1215                 log_error("Failed to unset NO_NEW_PRIVS: %s", strerror(-r));
1216                 goto finish;
1217         }
1218
1219         r = seccomp_load(seccomp);
1220         if (r < 0)
1221                 log_error("Failed to add install architecture seccomp: %s", strerror(-r));
1222
1223 finish:
1224         seccomp_release(seccomp);
1225         return r;
1226 #else
1227         return 0;
1228 #endif
1229 }
1230
1231 static int status_welcome(void) {
1232         _cleanup_free_ char *pretty_name = NULL, *ansi_color = NULL;
1233         int r;
1234
1235         r = parse_env_file("/etc/os-release", NEWLINE,
1236                            "PRETTY_NAME", &pretty_name,
1237                            "ANSI_COLOR", &ansi_color,
1238                            NULL);
1239         if (r == -ENOENT) {
1240                 r = parse_env_file("/usr/lib/os-release", NEWLINE,
1241                                    "PRETTY_NAME", &pretty_name,
1242                                    "ANSI_COLOR", &ansi_color,
1243                                    NULL);
1244         }
1245
1246         if (r < 0 && r != -ENOENT)
1247                 log_warning("Failed to read os-release file: %s", strerror(-r));
1248
1249         return status_printf(NULL, false, false,
1250                              "\nWelcome to \x1B[%sm%s\x1B[0m!\n",
1251                              isempty(ansi_color) ? "1" : ansi_color,
1252                              isempty(pretty_name) ? "Linux" : pretty_name);
1253 }
1254
/* Writes the value of the $container environment variable to
 * /run/systemd/container.
 *
 * Returns 0 without writing anything if the variable is unset or
 * empty, otherwise the result of write_string_file(). */
static int write_container_id(void) {
        const char *id = getenv("container");

        if (!isempty(id))
                return write_string_file("/run/systemd/container", id);

        return 0;
}
1264
1265 int main(int argc, char *argv[]) {
1266         Manager *m = NULL;
1267         int r, retval = EXIT_FAILURE;
1268         usec_t before_startup, after_startup;
1269         char timespan[FORMAT_TIMESPAN_MAX];
1270         FDSet *fds = NULL;
1271         bool reexecute = false;
1272         const char *shutdown_verb = NULL;
1273         dual_timestamp initrd_timestamp = { 0ULL, 0ULL };
1274         dual_timestamp userspace_timestamp = { 0ULL, 0ULL };
1275         dual_timestamp kernel_timestamp = { 0ULL, 0ULL };
1276         dual_timestamp security_start_timestamp = { 0ULL, 0ULL };
1277         dual_timestamp security_finish_timestamp = { 0ULL, 0ULL };
1278         static char systemd[] = "systemd";
1279         bool skip_setup = false;
1280         unsigned j;
1281         bool loaded_policy = false;
1282         bool arm_reboot_watchdog = false;
1283         bool queue_default_job = false;
1284         bool empty_etc = false;
1285         char *switch_root_dir = NULL, *switch_root_init = NULL;
1286         static struct rlimit saved_rlimit_nofile = { 0, 0 };
1287
1288 #ifdef HAVE_SYSV_COMPAT
1289         if (getpid() != 1 && strstr(program_invocation_short_name, "init")) {
1290                 /* This is compatibility support for SysV, where
1291                  * calling init as a user is identical to telinit. */
1292
1293                 errno = -ENOENT;
1294                 execv(SYSTEMCTL_BINARY_PATH, argv);
1295                 log_error("Failed to exec " SYSTEMCTL_BINARY_PATH ": %m");
1296                 return 1;
1297         }
1298 #endif
1299
1300         dual_timestamp_from_monotonic(&kernel_timestamp, 0);
1301         dual_timestamp_get(&userspace_timestamp);
1302
1303         /* Determine if this is a reexecution or normal bootup. We do
1304          * the full command line parsing much later, so let's just
1305          * have a quick peek here. */
1306         if (strv_find(argv+1, "--deserialize"))
1307                 skip_setup = true;
1308
1309         /* If we have switched root, do all the special setup
1310          * things */
1311         if (strv_find(argv+1, "--switched-root"))
1312                 skip_setup = false;
1313
1314         /* If we get started via the /sbin/init symlink then we are
1315            called 'init'. After a subsequent reexecution we are then
1316            called 'systemd'. That is confusing, hence let's call us
1317            systemd right-away. */
1318         program_invocation_short_name = systemd;
1319         prctl(PR_SET_NAME, systemd);
1320
1321         saved_argv = argv;
1322         saved_argc = argc;
1323
1324         log_show_color(isatty(STDERR_FILENO) > 0);
1325         log_set_upgrade_syslog_to_journal(true);
1326
1327         /* Disable the umask logic */
1328         if (getpid() == 1)
1329                 umask(0);
1330
1331         if (getpid() == 1 && detect_container(NULL) <= 0) {
1332
1333                 /* Running outside of a container as PID 1 */
1334                 arg_running_as = SYSTEMD_SYSTEM;
1335                 make_null_stdio();
1336                 log_set_target(LOG_TARGET_KMSG);
1337                 log_open();
1338
1339                 if (in_initrd())
1340                         initrd_timestamp = userspace_timestamp;
1341
1342                 if (!skip_setup) {
1343                         mount_setup_early();
1344                         dual_timestamp_get(&security_start_timestamp);
1345                         if (selinux_setup(&loaded_policy) < 0)
1346                                 goto finish;
1347                         if (ima_setup() < 0)
1348                                 goto finish;
1349                         if (smack_setup(&loaded_policy) < 0)
1350                                 goto finish;
1351                         dual_timestamp_get(&security_finish_timestamp);
1352                 }
1353
1354                 if (label_init(NULL) < 0)
1355                         goto finish;
1356
1357                 if (!skip_setup) {
1358                         if (clock_is_localtime() > 0) {
1359                                 int min;
1360
1361                                 /*
1362                                  * The very first call of settimeofday() also does a time warp in the kernel.
1363                                  *
1364                                  * In the rtc-in-local time mode, we set the kernel's timezone, and rely on
1365                                  * external tools to take care of maintaining the RTC and do all adjustments.
1366                                  * This matches the behavior of Windows, which leaves the RTC alone if the
1367                                  * registry tells that the RTC runs in UTC.
1368                                  */
1369                                 r = clock_set_timezone(&min);
1370                                 if (r < 0)
1371                                         log_error("Failed to apply local time delta, ignoring: %s", strerror(-r));
1372                                 else
1373                                         log_info("RTC configured in localtime, applying delta of %i minutes to system time.", min);
1374                         } else if (!in_initrd()) {
1375                                 /*
1376                                  * Do a dummy very first call to seal the kernel's time warp magic.
1377                                  *
1378                                  * Do not call this this from inside the initrd. The initrd might not
1379                                  * carry /etc/adjtime with LOCAL, but the real system could be set up
1380                                  * that way. In such case, we need to delay the time-warp or the sealing
1381                                  * until we reach the real system.
1382                                  *
1383                                  * Do no set the kernel's timezone. The concept of local time cannot
1384                                  * be supported reliably, the time will jump or be incorrect at every daylight
1385                                  * saving time change. All kernel local time concepts will be treated
1386                                  * as UTC that way.
1387                                  */
1388                                 clock_reset_timewarp();
1389                         }
1390                 }
1391
1392                 /* Set the default for later on, but don't actually
1393                  * open the logs like this for now. Note that if we
1394                  * are transitioning from the initrd there might still
1395                  * be journal fd open, and we shouldn't attempt
1396                  * opening that before we parsed /proc/cmdline which
1397                  * might redirect output elsewhere. */
1398                 log_set_target(LOG_TARGET_JOURNAL_OR_KMSG);
1399
1400         } else if (getpid() == 1) {
1401                 /* Running inside a container, as PID 1 */
1402                 arg_running_as = SYSTEMD_SYSTEM;
1403                 log_set_target(LOG_TARGET_CONSOLE);
1404                 log_close_console(); /* force reopen of /dev/console */
1405                 log_open();
1406
1407                 /* For the later on, see above... */
1408                 log_set_target(LOG_TARGET_JOURNAL);
1409
1410                 /* clear the kernel timestamp,
1411                  * because we are in a container */
1412                 kernel_timestamp.monotonic = 0ULL;
1413                 kernel_timestamp.realtime = 0ULL;
1414
1415         } else {
1416                 /* Running as user instance */
1417                 arg_running_as = SYSTEMD_USER;
1418                 log_set_target(LOG_TARGET_AUTO);
1419                 log_open();
1420
1421                 /* clear the kernel timestamp,
1422                  * because we are not PID 1 */
1423                 kernel_timestamp.monotonic = 0ULL;
1424                 kernel_timestamp.realtime = 0ULL;
1425         }
1426
1427         /* Initialize default unit */
1428         r = set_default_unit(SPECIAL_DEFAULT_TARGET);
1429         if (r < 0) {
1430                 log_error("Failed to set default unit %s: %s", SPECIAL_DEFAULT_TARGET, strerror(-r));
1431                 goto finish;
1432         }
1433
1434         r = initialize_join_controllers();
1435         if (r < 0)
1436                 goto finish;
1437
1438         /* Mount /proc, /sys and friends, so that /proc/cmdline and
1439          * /proc/$PID/fd is available. */
1440         if (getpid() == 1) {
1441                 r = mount_setup(loaded_policy);
1442                 if (r < 0)
1443                         goto finish;
1444         }
1445
1446         /* Reset all signal handlers. */
1447         assert_se(reset_all_signal_handlers() == 0);
1448
1449         ignore_signals(SIGNALS_IGNORE, -1);
1450
1451         if (parse_config_file() < 0)
1452                 goto finish;
1453
1454         if (arg_running_as == SYSTEMD_SYSTEM)
1455                 if (parse_proc_cmdline(parse_proc_cmdline_item) < 0)
1456                         goto finish;
1457
1458         log_parse_environment();
1459
1460         if (parse_argv(argc, argv) < 0)
1461                 goto finish;
1462
1463         if (arg_action == ACTION_TEST &&
1464             geteuid() == 0) {
1465                 log_error("Don't run test mode as root.");
1466                 goto finish;
1467         }
1468
1469         if (arg_running_as == SYSTEMD_USER &&
1470             arg_action == ACTION_RUN &&
1471             sd_booted() <= 0) {
1472                 log_error("Trying to run as user instance, but the system has not been booted with systemd.");
1473                 goto finish;
1474         }
1475
1476         if (arg_running_as == SYSTEMD_SYSTEM &&
1477             arg_action == ACTION_RUN &&
1478             running_in_chroot() > 0) {
1479                 log_error("Cannot be run in a chroot() environment.");
1480                 goto finish;
1481         }
1482
1483         if (arg_action == ACTION_TEST)
1484                 skip_setup = true;
1485
1486         pager_open_if_enabled();
1487
1488         if (arg_action == ACTION_HELP) {
1489                 retval = help();
1490                 goto finish;
1491         } else if (arg_action == ACTION_VERSION) {
1492                 retval = version();
1493                 goto finish;
1494         } else if (arg_action == ACTION_DUMP_CONFIGURATION_ITEMS) {
1495                 unit_dump_config_items(stdout);
1496                 retval = EXIT_SUCCESS;
1497                 goto finish;
1498         } else if (arg_action == ACTION_DONE) {
1499                 retval = EXIT_SUCCESS;
1500                 goto finish;
1501         }
1502
1503         if (arg_running_as == SYSTEMD_USER &&
1504             !getenv("XDG_RUNTIME_DIR")) {
1505                 log_error("Trying to run as user instance, but $XDG_RUNTIME_DIR is not set.");
1506                 goto finish;
1507         }
1508
1509         assert_se(arg_action == ACTION_RUN || arg_action == ACTION_TEST);
1510
1511         /* Close logging fds, in order not to confuse fdset below */
1512         log_close();
1513
1514         /* Remember open file descriptors for later deserialization */
1515         r = fdset_new_fill(&fds);
1516         if (r < 0) {
1517                 log_error("Failed to allocate fd set: %s", strerror(-r));
1518                 goto finish;
1519         } else
1520                 fdset_cloexec(fds, true);
1521
1522         if (arg_serialization)
1523                 assert_se(fdset_remove(fds, fileno(arg_serialization)) >= 0);
1524
1525         if (arg_running_as == SYSTEMD_SYSTEM)
1526                 /* Become a session leader if we aren't one yet. */
1527                 setsid();
1528
1529         /* Move out of the way, so that we won't block unmounts */
1530         assert_se(chdir("/")  == 0);
1531
1532         /* Reset the console, but only if this is really init and we
1533          * are freshly booted */
1534         if (arg_running_as == SYSTEMD_SYSTEM && arg_action == ACTION_RUN) {
1535
1536                 /* If we are init, we connect stdin/stdout/stderr to
1537                  * /dev/null and make sure we don't have a controlling
1538                  * tty. */
1539                 release_terminal();
1540
1541                 if (getpid() == 1 && !skip_setup)
1542                         console_setup();
1543         }
1544
1545         /* Open the logging devices, if possible and necessary */
1546         log_open();
1547
1548         if (arg_show_status == _SHOW_STATUS_UNSET)
1549                 arg_show_status = SHOW_STATUS_YES;
1550
1551         /* Make sure we leave a core dump without panicking the
1552          * kernel. */
1553         if (getpid() == 1) {
1554                 install_crash_handler();
1555
1556                 r = mount_cgroup_controllers(arg_join_controllers);
1557                 if (r < 0)
1558                         goto finish;
1559         }
1560
1561         if (arg_running_as == SYSTEMD_SYSTEM) {
1562                 const char *virtualization = NULL;
1563
1564                 log_info(PACKAGE_STRING " running in %ssystem mode. (" SYSTEMD_FEATURES ")",
1565                          arg_action == ACTION_TEST ? "test " : "" );
1566
1567                 detect_virtualization(&virtualization);
1568                 if (virtualization)
1569                         log_info("Detected virtualization '%s'.", virtualization);
1570
1571                 write_container_id();
1572
1573                 log_info("Detected architecture '%s'.", architecture_to_string(uname_architecture()));
1574
1575                 if (in_initrd())
1576                         log_info("Running in initial RAM disk.");
1577
1578                 /* Let's check whether /etc is already populated. We
1579                  * don't actually really check for that, but use
1580                  * /etc/machine-id as flag file. This allows container
1581                  * managers and installers to provision a couple of
1582                  * files already. If the container manager wants to
1583                  * provision the machine ID itself it should pass
1584                  * $container_uuid to PID 1.*/
1585
1586                 empty_etc = access("/etc/machine-id", F_OK) < 0;
1587                 if (empty_etc)
1588                         log_info("Running with unpopulated /etc.");
1589         } else {
1590                 _cleanup_free_ char *t;
1591
1592                 t = uid_to_name(getuid());
1593                 log_debug(PACKAGE_STRING " running in %suser mode for user "UID_FMT"/%s. (" SYSTEMD_FEATURES ")",
1594                           arg_action == ACTION_TEST ? " test" : "", getuid(), t);
1595         }
1596
1597         if (arg_running_as == SYSTEMD_SYSTEM && !skip_setup) {
1598                 if (arg_show_status > 0 || plymouth_running())
1599                         status_welcome();
1600
1601 #ifdef HAVE_KMOD
1602                 kmod_setup();
1603 #endif
1604                 hostname_setup();
1605                 machine_id_setup(NULL);
1606                 loopback_setup();
1607
1608                 test_mtab();
1609                 test_usr();
1610         }
1611
1612         if (arg_running_as == SYSTEMD_SYSTEM && arg_runtime_watchdog > 0)
1613                 watchdog_set_timeout(&arg_runtime_watchdog);
1614
1615         if (arg_timer_slack_nsec != NSEC_INFINITY)
1616                 if (prctl(PR_SET_TIMERSLACK, arg_timer_slack_nsec) < 0)
1617                         log_error("Failed to adjust timer slack: %m");
1618
1619         if (arg_capability_bounding_set_drop) {
1620                 r = capability_bounding_set_drop_usermode(arg_capability_bounding_set_drop);
1621                 if (r < 0) {
1622                         log_error("Failed to drop capability bounding set of usermode helpers: %s", strerror(-r));
1623                         goto finish;
1624                 }
1625                 r = capability_bounding_set_drop(arg_capability_bounding_set_drop, true);
1626                 if (r < 0) {
1627                         log_error("Failed to drop capability bounding set: %s", strerror(-r));
1628                         goto finish;
1629                 }
1630         }
1631
1632         if (arg_syscall_archs) {
1633                 r = enforce_syscall_archs(arg_syscall_archs);
1634                 if (r < 0)
1635                         goto finish;
1636         }
1637
1638         if (arg_running_as == SYSTEMD_USER) {
1639                 /* Become reaper of our children */
1640                 if (prctl(PR_SET_CHILD_SUBREAPER, 1) < 0) {
1641                         log_warning("Failed to make us a subreaper: %m");
1642                         if (errno == EINVAL)
1643                                 log_info("Perhaps the kernel version is too old (< 3.4?)");
1644                 }
1645         }
1646
1647         if (arg_running_as == SYSTEMD_SYSTEM) {
1648                 bump_rlimit_nofile(&saved_rlimit_nofile);
1649
1650                 if (empty_etc) {
1651                         r = unit_file_preset_all(UNIT_FILE_SYSTEM, false, NULL, UNIT_FILE_PRESET_FULL, false, NULL, 0);
1652                         if (r < 0)
1653                                 log_warning("Failed to populate /etc with preset unit settings, ignoring: %s", strerror(-r));
1654                         else
1655                                 log_info("Populated /etc with preset unit settings.");
1656                 }
1657         }
1658
1659         r = manager_new(arg_running_as, arg_action == ACTION_TEST, &m);
1660         if (r < 0) {
1661                 log_error("Failed to allocate manager object: %s", strerror(-r));
1662                 goto finish;
1663         }
1664
1665         m->confirm_spawn = arg_confirm_spawn;
1666         m->default_timer_accuracy_usec = arg_default_timer_accuracy_usec;
1667         m->default_std_output = arg_default_std_output;
1668         m->default_std_error = arg_default_std_error;
1669         m->default_restart_usec = arg_default_restart_usec;
1670         m->default_timeout_start_usec = arg_default_timeout_start_usec;
1671         m->default_timeout_stop_usec = arg_default_timeout_stop_usec;
1672         m->default_start_limit_interval = arg_default_start_limit_interval;
1673         m->default_start_limit_burst = arg_default_start_limit_burst;
1674         m->default_cpu_accounting = arg_default_cpu_accounting;
1675         m->default_blockio_accounting = arg_default_blockio_accounting;
1676         m->default_memory_accounting = arg_default_memory_accounting;
1677         m->runtime_watchdog = arg_runtime_watchdog;
1678         m->shutdown_watchdog = arg_shutdown_watchdog;
1679         m->userspace_timestamp = userspace_timestamp;
1680         m->kernel_timestamp = kernel_timestamp;
1681         m->initrd_timestamp = initrd_timestamp;
1682         m->security_start_timestamp = security_start_timestamp;
1683         m->security_finish_timestamp = security_finish_timestamp;
1684
1685         manager_set_default_rlimits(m, arg_default_rlimit);
1686         manager_environment_add(m, NULL, arg_default_environment);
1687         manager_set_show_status(m, arg_show_status);
1688         manager_set_first_boot(m, empty_etc);
1689
1690         /* Remember whether we should queue the default job */
1691         queue_default_job = !arg_serialization || arg_switched_root;
1692
1693         before_startup = now(CLOCK_MONOTONIC);
1694
1695         r = manager_startup(m, arg_serialization, fds);
1696         if (r < 0)
1697                 log_error("Failed to fully start up daemon: %s", strerror(-r));
1698
1699         /* This will close all file descriptors that were opened, but
1700          * not claimed by any unit. */
1701         fdset_free(fds);
1702         fds = NULL;
1703
1704         if (arg_serialization) {
1705                 fclose(arg_serialization);
1706                 arg_serialization = NULL;
1707         }
1708
1709         if (queue_default_job) {
1710                 _cleanup_bus_error_free_ sd_bus_error error = SD_BUS_ERROR_NULL;
1711                 Unit *target = NULL;
1712                 Job *default_unit_job;
1713
1714                 log_debug("Activating default unit: %s", arg_default_unit);
1715
1716                 r = manager_load_unit(m, arg_default_unit, NULL, &error, &target);
1717                 if (r < 0)
1718                         log_error("Failed to load default target: %s", bus_error_message(&error, r));
1719                 else if (target->load_state == UNIT_ERROR || target->load_state == UNIT_NOT_FOUND)
1720                         log_error("Failed to load default target: %s", strerror(-target->load_error));
1721                 else if (target->load_state == UNIT_MASKED)
1722                         log_error("Default target masked.");
1723
1724                 if (!target || target->load_state != UNIT_LOADED) {
1725                         log_info("Trying to load rescue target...");
1726
1727                         r = manager_load_unit(m, SPECIAL_RESCUE_TARGET, NULL, &error, &target);
1728                         if (r < 0) {
1729                                 log_error("Failed to load rescue target: %s", bus_error_message(&error, r));
1730                                 goto finish;
1731                         } else if (target->load_state == UNIT_ERROR || target->load_state == UNIT_NOT_FOUND) {
1732                                 log_error("Failed to load rescue target: %s", strerror(-target->load_error));
1733                                 goto finish;
1734                         } else if (target->load_state == UNIT_MASKED) {
1735                                 log_error("Rescue target masked.");
1736                                 goto finish;
1737                         }
1738                 }
1739
1740                 assert(target->load_state == UNIT_LOADED);
1741
1742                 if (arg_action == ACTION_TEST) {
1743                         printf("-> By units:\n");
1744                         manager_dump_units(m, stdout, "\t");
1745                 }
1746
1747                 r = manager_add_job(m, JOB_START, target, JOB_ISOLATE, false, &error, &default_unit_job);
1748                 if (r == -EPERM) {
1749                         log_debug("Default target could not be isolated, starting instead: %s", bus_error_message(&error, r));
1750
1751                         r = manager_add_job(m, JOB_START, target, JOB_REPLACE, false, &error, &default_unit_job);
1752                         if (r < 0) {
1753                                 log_error("Failed to start default target: %s", bus_error_message(&error, r));
1754                                 goto finish;
1755                         }
1756                 } else if (r < 0) {
1757                         log_error("Failed to isolate default target: %s", bus_error_message(&error, r));
1758                         goto finish;
1759                 }
1760
1761                 m->default_unit_job_id = default_unit_job->id;
1762
1763                 after_startup = now(CLOCK_MONOTONIC);
1764                 log_full(arg_action == ACTION_TEST ? LOG_INFO : LOG_DEBUG,
1765                          "Loaded units and determined initial transaction in %s.",
1766                          format_timespan(timespan, sizeof(timespan), after_startup - before_startup, 0));
1767
1768                 if (arg_action == ACTION_TEST) {
1769                         printf("-> By jobs:\n");
1770                         manager_dump_jobs(m, stdout, "\t");
1771                         retval = EXIT_SUCCESS;
1772                         goto finish;
1773                 }
1774         }
1775
1776         for (;;) {
1777                 r = manager_loop(m);
1778                 if (r < 0) {
1779                         log_error("Failed to run mainloop: %s", strerror(-r));
1780                         goto finish;
1781                 }
1782
1783                 switch (m->exit_code) {
1784
1785                 case MANAGER_EXIT:
1786                         retval = EXIT_SUCCESS;
1787                         log_debug("Exit.");
1788                         goto finish;
1789
1790                 case MANAGER_RELOAD:
1791                         log_info("Reloading.");
1792                         r = manager_reload(m);
1793                         if (r < 0)
1794                                 log_error("Failed to reload: %s", strerror(-r));
1795                         break;
1796
1797                 case MANAGER_REEXECUTE:
1798
1799                         if (prepare_reexecute(m, &arg_serialization, &fds, false) < 0)
1800                                 goto finish;
1801
1802                         reexecute = true;
1803                         log_notice("Reexecuting.");
1804                         goto finish;
1805
1806                 case MANAGER_SWITCH_ROOT:
1807                         /* Steal the switch root parameters */
1808                         switch_root_dir = m->switch_root;
1809                         switch_root_init = m->switch_root_init;
1810                         m->switch_root = m->switch_root_init = NULL;
1811
1812                         if (!switch_root_init)
1813                                 if (prepare_reexecute(m, &arg_serialization, &fds, true) < 0)
1814                                         goto finish;
1815
1816                         reexecute = true;
1817                         log_notice("Switching root.");
1818                         goto finish;
1819
1820                 case MANAGER_REBOOT:
1821                 case MANAGER_POWEROFF:
1822                 case MANAGER_HALT:
1823                 case MANAGER_KEXEC: {
1824                         static const char * const table[_MANAGER_EXIT_CODE_MAX] = {
1825                                 [MANAGER_REBOOT] = "reboot",
1826                                 [MANAGER_POWEROFF] = "poweroff",
1827                                 [MANAGER_HALT] = "halt",
1828                                 [MANAGER_KEXEC] = "kexec"
1829                         };
1830
1831                         assert_se(shutdown_verb = table[m->exit_code]);
1832                         arm_reboot_watchdog = m->exit_code == MANAGER_REBOOT;
1833
1834                         log_notice("Shutting down.");
1835                         goto finish;
1836                 }
1837
1838                 default:
1839                         assert_not_reached("Unknown exit code.");
1840                 }
1841         }
1842
1843 finish:
1844         pager_close();
1845
1846         if (m) {
1847                 manager_free(m);
1848                 m = NULL;
1849         }
1850
1851         for (j = 0; j < ELEMENTSOF(arg_default_rlimit); j++) {
1852                 free(arg_default_rlimit[j]);
1853                 arg_default_rlimit[j] = NULL;
1854         }
1855
1856         free(arg_default_unit);
1857         arg_default_unit = NULL;
1858
1859         free_join_controllers();
1860
1861         strv_free(arg_default_environment);
1862         arg_default_environment = NULL;
1863
1864         set_free(arg_syscall_archs);
1865         arg_syscall_archs = NULL;
1866
1867         label_finish();
1868
1869         if (reexecute) {
1870                 const char **args;
1871                 unsigned i, args_size;
1872                 sigset_t ss;
1873
1874                 /* Close and disarm the watchdog, so that the new
1875                  * instance can reinitialize it, but doesn't get
1876                  * rebooted while we do that */
1877                 watchdog_close(true);
1878
1879                 /* Reset the RLIMIT_NOFILE to the kernel default, so
1880                  * that the new systemd can pass the kernel default to
1881                  * its child processes */
1882                 if (saved_rlimit_nofile.rlim_cur > 0)
1883                         setrlimit(RLIMIT_NOFILE, &saved_rlimit_nofile);
1884
1885                 if (switch_root_dir) {
1886                         /* Kill all remaining processes from the
1887                          * initrd, but don't wait for them, so that we
1888                          * can handle the SIGCHLD for them after
1889                          * deserializing. */
1890                         broadcast_signal(SIGTERM, false, true);
1891
1892                         /* And switch root */
1893                         r = switch_root(switch_root_dir);
1894                         if (r < 0)
1895                                 log_error("Failed to switch root, ignoring: %s", strerror(-r));
1896                 }
1897
1898                 args_size = MAX(6, argc+1);
1899                 args = newa(const char*, args_size);
1900
1901                 if (!switch_root_init) {
1902                         char sfd[16];
1903
1904                         /* First try to spawn ourselves with the right
1905                          * path, and with full serialization. We do
1906                          * this only if the user didn't specify an
1907                          * explicit init to spawn. */
1908
1909                         assert(arg_serialization);
1910                         assert(fds);
1911
1912                         snprintf(sfd, sizeof(sfd), "%i", fileno(arg_serialization));
1913                         char_array_0(sfd);
1914
1915                         i = 0;
1916                         args[i++] = SYSTEMD_BINARY_PATH;
1917                         if (switch_root_dir)
1918                                 args[i++] = "--switched-root";
1919                         args[i++] = arg_running_as == SYSTEMD_SYSTEM ? "--system" : "--user";
1920                         args[i++] = "--deserialize";
1921                         args[i++] = sfd;
1922                         args[i++] = NULL;
1923
1924                         /* do not pass along the environment we inherit from the kernel or initrd */
1925                         if (switch_root_dir)
1926                                 clearenv();
1927
1928                         assert(i <= args_size);
1929                         execv(args[0], (char* const*) args);
1930                 }
1931
1932                 /* Try the fallback, if there is any, without any
1933                  * serialization. We pass the original argv[] and
1934                  * envp[]. (Well, modulo the ordering changes due to
1935                  * getopt() in argv[], and some cleanups in envp[],
1936                  * but let's hope that doesn't matter.) */
1937
1938                 if (arg_serialization) {
1939                         fclose(arg_serialization);
1940                         arg_serialization = NULL;
1941                 }
1942
1943                 if (fds) {
1944                         fdset_free(fds);
1945                         fds = NULL;
1946                 }
1947
1948                 /* Reopen the console */
1949                 make_console_stdio();
1950
1951                 for (j = 1, i = 1; j < (unsigned) argc; j++)
1952                         args[i++] = argv[j];
1953                 args[i++] = NULL;
1954                 assert(i <= args_size);
1955
1956                 /* reenable any blocked signals, especially important
1957                  * if we switch from initial ramdisk to init=... */
1958                 reset_all_signal_handlers();
1959
1960                 assert_se(sigemptyset(&ss) == 0);
1961                 assert_se(sigprocmask(SIG_SETMASK, &ss, NULL) == 0);
1962
1963                 if (switch_root_init) {
1964                         args[0] = switch_root_init;
1965                         execv(args[0], (char* const*) args);
1966                         log_warning("Failed to execute configured init, trying fallback: %m");
1967                 }
1968
1969                 args[0] = "/sbin/init";
1970                 execv(args[0], (char* const*) args);
1971
1972                 if (errno == ENOENT) {
1973                         log_warning("No /sbin/init, trying fallback");
1974
1975                         args[0] = "/bin/sh";
1976                         args[1] = NULL;
1977                         execv(args[0], (char* const*) args);
1978                         log_error("Failed to execute /bin/sh, giving up: %m");
1979                 } else
1980                         log_warning("Failed to execute /sbin/init, giving up: %m");
1981         }
1982
1983         if (arg_serialization) {
1984                 fclose(arg_serialization);
1985                 arg_serialization = NULL;
1986         }
1987
1988         if (fds) {
1989                 fdset_free(fds);
1990                 fds = NULL;
1991         }
1992
1993 #ifdef HAVE_VALGRIND_VALGRIND_H
1994         /* If we are PID 1 and running under valgrind, then let's exit
1995          * here explicitly. valgrind will only generate nice output on
1996          * exit(), not on exec(), hence let's do the former not the
1997          * latter here. */
1998         if (getpid() == 1 && RUNNING_ON_VALGRIND)
1999                 return 0;
2000 #endif
2001
2002         if (shutdown_verb) {
2003                 char log_level[DECIMAL_STR_MAX(int) + 1];
2004                 const char* command_line[9] = {
2005                         SYSTEMD_SHUTDOWN_BINARY_PATH,
2006                         shutdown_verb,
2007                         "--log-level", log_level,
2008                         "--log-target",
2009                 };
2010                 unsigned pos = 5;
2011                 _cleanup_strv_free_ char **env_block = NULL;
2012
2013                 assert(command_line[pos] == NULL);
2014                 env_block = strv_copy(environ);
2015
2016                 snprintf(log_level, sizeof(log_level), "%d", log_get_max_level());
2017
2018                 switch (log_get_target()) {
2019                 case LOG_TARGET_KMSG:
2020                 case LOG_TARGET_JOURNAL_OR_KMSG:
2021                 case LOG_TARGET_SYSLOG_OR_KMSG:
2022                         command_line[pos++] = "kmsg";
2023                         break;
2024
2025                 case LOG_TARGET_CONSOLE:
2026                 default:
2027                         command_line[pos++] = "console";
2028                         break;
2029                 };
2030
2031                 if (log_get_show_color())
2032                         command_line[pos++] = "--log-color";
2033
2034                 if (log_get_show_location())
2035                         command_line[pos++] = "--log-location";
2036
2037                 assert(pos < ELEMENTSOF(command_line));
2038
2039                 if (arm_reboot_watchdog && arg_shutdown_watchdog > 0) {
2040                         char *e;
2041
2042                         /* If we reboot let's set the shutdown
2043                          * watchdog and tell the shutdown binary to
2044                          * repeatedly ping it */
2045                         watchdog_set_timeout(&arg_shutdown_watchdog);
2046                         watchdog_close(false);
2047
2048                         /* Tell the binary how often to ping, ignore failure */
2049                         if (asprintf(&e, "WATCHDOG_USEC="USEC_FMT, arg_shutdown_watchdog) > 0)
2050                                 strv_push(&env_block, e);
2051                 } else
2052                         watchdog_close(true);
2053
2054                 /* Avoid the creation of new processes forked by the
2055                  * kernel; at this point, we will not listen to the
2056                  * signals anyway */
2057                 if (detect_container(NULL) <= 0)
2058                         cg_uninstall_release_agent(SYSTEMD_CGROUP_CONTROLLER);
2059
2060                 execve(SYSTEMD_SHUTDOWN_BINARY_PATH, (char **) command_line, env_block);
2061                 log_error("Failed to execute shutdown binary, %s: %m",
2062                           getpid() == 1 ? "freezing" : "quitting");
2063         }
2064
2065         if (getpid() == 1)
2066                 freeze();
2067
2068         return retval;
2069 }