1 /*-*- Mode: C; c-basic-offset: 8; indent-tabs-mode: nil -*-*/
4 This file is part of systemd.
6 Copyright 2010 Lennart Poettering
8 systemd is free software; you can redistribute it and/or modify it
9 under the terms of the GNU Lesser General Public License as published by
10 the Free Software Foundation; either version 2.1 of the License, or
11 (at your option) any later version.
13 systemd is distributed in the hope that it will be useful, but
14 WITHOUT ANY WARRANTY; without even the implied warranty of
15 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
16 Lesser General Public License for more details.
18 You should have received a copy of the GNU Lesser General Public License
19 along with systemd; If not, see <http://www.gnu.org/licenses/>.
31 #include <sys/resource.h>
32 #include <linux/sched.h>
33 #include <sys/types.h>
37 #include <sys/ioctl.h>
39 #include <linux/tiocl.h>
42 #include <sys/inotify.h>
45 #include <sys/prctl.h>
46 #include <sys/utsname.h>
48 #include <netinet/ip.h>
57 #include <sys/mount.h>
58 #include <linux/magic.h>
62 #include <sys/personality.h>
66 #ifdef HAVE_SYS_AUXV_H
78 #include "path-util.h"
79 #include "exit-status.h"
83 #include "device-nodes.h"
90 char **saved_argv = NULL;
92 static volatile unsigned cached_columns = 0;
93 static volatile unsigned cached_lines = 0;
95 size_t page_size(void) {
96 static thread_local size_t pgsz = 0;
99 if (_likely_(pgsz > 0))
102 r = sysconf(_SC_PAGESIZE);
109 bool streq_ptr(const char *a, const char *b) {
111 /* Like streq(), but tries to make sense of NULL pointers */
122 char* endswith(const char *s, const char *postfix) {
129 pl = strlen(postfix);
132 return (char*) s + sl;
137 if (memcmp(s + sl - pl, postfix, pl) != 0)
140 return (char*) s + sl - pl;
143 bool first_word(const char *s, const char *word) {
158 if (memcmp(s, word, wl) != 0)
162 strchr(WHITESPACE, s[wl]);
165 int close_nointr(int fd) {
172 else if (errno == EINTR)
174 * Just ignore EINTR; a retry loop is the wrong
175 * thing to do on Linux.
177 * http://lkml.indiana.edu/hypermail/linux/kernel/0509.1/0877.html
178 * https://bugzilla.gnome.org/show_bug.cgi?id=682819
179 * http://utcc.utoronto.ca/~cks/space/blog/unix/CloseEINTR
180 * https://sites.google.com/site/michaelsafyan/software-engineering/checkforeintrwheninvokingclosethinkagain
187 int safe_close(int fd) {
190 * Like close_nointr() but cannot fail. Guarantees errno is
191 * unchanged. Is a NOP with negative fds passed, and returns
192 * -1, so that it can be used in this syntax:
194 * fd = safe_close(fd);
200 /* The kernel might return pretty much any error code
201 * via close(), but the fd will be closed anyway. The
202 * only condition we want to check for here is whether
203 * the fd was invalid at all... */
205 assert_se(close_nointr(fd) != -EBADF);
211 void close_many(const int fds[], unsigned n_fd) {
214 assert(fds || n_fd <= 0);
216 for (i = 0; i < n_fd; i++)
220 int unlink_noerrno(const char *path) {
231 int parse_boolean(const char *v) {
234 if (streq(v, "1") || v[0] == 'y' || v[0] == 'Y' || v[0] == 't' || v[0] == 'T' || strcaseeq(v, "on"))
236 else if (streq(v, "0") || v[0] == 'n' || v[0] == 'N' || v[0] == 'f' || v[0] == 'F' || strcaseeq(v, "off"))
242 int parse_pid(const char *s, pid_t* ret_pid) {
243 unsigned long ul = 0;
250 r = safe_atolu(s, &ul);
256 if ((unsigned long) pid != ul)
266 int parse_uid(const char *s, uid_t* ret_uid) {
267 unsigned long ul = 0;
274 r = safe_atolu(s, &ul);
280 if ((unsigned long) uid != ul)
283 /* Some libc APIs use (uid_t) -1 as special placeholder */
284 if (uid == (uid_t) 0xFFFFFFFF)
287 /* A long time ago UIDs were 16bit, hence explicitly avoid the 16bit -1 too */
288 if (uid == (uid_t) 0xFFFF)
295 int safe_atou(const char *s, unsigned *ret_u) {
303 l = strtoul(s, &x, 0);
305 if (!x || x == s || *x || errno)
306 return errno > 0 ? -errno : -EINVAL;
308 if ((unsigned long) (unsigned) l != l)
311 *ret_u = (unsigned) l;
315 int safe_atoi(const char *s, int *ret_i) {
323 l = strtol(s, &x, 0);
325 if (!x || x == s || *x || errno)
326 return errno > 0 ? -errno : -EINVAL;
328 if ((long) (int) l != l)
335 int safe_atollu(const char *s, long long unsigned *ret_llu) {
337 unsigned long long l;
343 l = strtoull(s, &x, 0);
345 if (!x || x == s || *x || errno)
346 return errno ? -errno : -EINVAL;
352 int safe_atolli(const char *s, long long int *ret_lli) {
360 l = strtoll(s, &x, 0);
362 if (!x || x == s || *x || errno)
363 return errno ? -errno : -EINVAL;
369 int safe_atod(const char *s, double *ret_d) {
376 RUN_WITH_LOCALE(LC_NUMERIC_MASK, "C") {
381 if (!x || x == s || *x || errno)
382 return errno ? -errno : -EINVAL;
388 static size_t strcspn_escaped(const char *s, const char *reject) {
389 bool escaped = false;
392 for (n=0; s[n]; n++) {
395 else if (s[n] == '\\')
397 else if (strchr(reject, s[n]))
403 /* Split a string into words. */
404 char *split(const char *c, size_t *l, const char *separator, bool quoted, char **state) {
407 current = *state ? *state : (char*) c;
409 if (!*current || *c == 0)
412 current += strspn(current, separator);
416 if (quoted && strchr("\'\"", *current)) {
417 char quotechar = *(current++);
418 *l = strcspn_escaped(current, (char[]){quotechar, '\0'});
419 *state = current+*l+1;
421 *l = strcspn_escaped(current, separator);
424 *l = strcspn(current, separator);
428 return (char*) current;
431 int get_parent_of_pid(pid_t pid, pid_t *_ppid) {
433 _cleanup_free_ char *line = NULL;
445 p = procfs_file_alloca(pid, "stat");
446 r = read_one_line_file(p, &line);
450 /* Let's skip the pid and comm fields. The latter is enclosed
451 * in () but does not escape any () in its value, so let's
452 * skip over it manually */
454 p = strrchr(line, ')');
466 if ((long unsigned) (pid_t) ppid != ppid)
469 *_ppid = (pid_t) ppid;
474 int get_starttime_of_pid(pid_t pid, unsigned long long *st) {
476 _cleanup_free_ char *line = NULL;
482 p = procfs_file_alloca(pid, "stat");
483 r = read_one_line_file(p, &line);
487 /* Let's skip the pid and comm fields. The latter is enclosed
488 * in () but does not escape any () in its value, so let's
489 * skip over it manually */
491 p = strrchr(line, ')');
513 "%*d " /* priority */
515 "%*d " /* num_threads */
516 "%*d " /* itrealvalue */
517 "%llu " /* starttime */,
524 int fchmod_umask(int fd, mode_t m) {
529 r = fchmod(fd, m & (~u)) < 0 ? -errno : 0;
535 char *truncate_nl(char *s) {
538 s[strcspn(s, NEWLINE)] = 0;
542 int get_process_state(pid_t pid) {
546 _cleanup_free_ char *line = NULL;
550 p = procfs_file_alloca(pid, "stat");
551 r = read_one_line_file(p, &line);
555 p = strrchr(line, ')');
561 if (sscanf(p, " %c", &state) != 1)
564 return (unsigned char) state;
567 int get_process_comm(pid_t pid, char **name) {
574 p = procfs_file_alloca(pid, "comm");
576 r = read_one_line_file(p, name);
583 int get_process_cmdline(pid_t pid, size_t max_length, bool comm_fallback, char **line) {
584 _cleanup_fclose_ FILE *f = NULL;
592 p = procfs_file_alloca(pid, "cmdline");
598 if (max_length == 0) {
599 size_t len = 0, allocated = 0;
601 while ((c = getc(f)) != EOF) {
603 if (!GREEDY_REALLOC(r, allocated, len+2)) {
608 r[len++] = isprint(c) ? c : ' ';
618 r = new(char, max_length);
624 while ((c = getc(f)) != EOF) {
646 size_t n = MIN(left-1, 3U);
653 /* Kernel threads have no argv[] */
654 if (r == NULL || r[0] == 0) {
655 _cleanup_free_ char *t = NULL;
663 h = get_process_comm(pid, &t);
667 r = strjoin("[", t, "]", NULL);
676 int is_kernel_thread(pid_t pid) {
688 p = procfs_file_alloca(pid, "cmdline");
693 count = fread(&c, 1, 1, f);
697 /* Kernel threads have an empty cmdline */
700 return eof ? 1 : -errno;
705 int get_process_capeff(pid_t pid, char **capeff) {
711 p = procfs_file_alloca(pid, "status");
713 return get_status_field(p, "\nCapEff:", capeff);
716 int get_process_exe(pid_t pid, char **name) {
724 p = procfs_file_alloca(pid, "exe");
726 r = readlink_malloc(p, name);
728 return r == -ENOENT ? -ESRCH : r;
730 d = endswith(*name, " (deleted)");
737 static int get_process_id(pid_t pid, const char *field, uid_t *uid) {
738 _cleanup_fclose_ FILE *f = NULL;
748 p = procfs_file_alloca(pid, "status");
753 FOREACH_LINE(line, f, return -errno) {
758 if (startswith(l, field)) {
760 l += strspn(l, WHITESPACE);
762 l[strcspn(l, WHITESPACE)] = 0;
764 return parse_uid(l, uid);
771 int get_process_uid(pid_t pid, uid_t *uid) {
772 return get_process_id(pid, "Uid:", uid);
775 int get_process_gid(pid_t pid, gid_t *gid) {
776 assert_cc(sizeof(uid_t) == sizeof(gid_t));
777 return get_process_id(pid, "Gid:", gid);
780 char *strnappend(const char *s, const char *suffix, size_t b) {
788 return strndup(suffix, b);
797 if (b > ((size_t) -1) - a)
800 r = new(char, a+b+1);
805 memcpy(r+a, suffix, b);
811 char *strappend(const char *s, const char *suffix) {
812 return strnappend(s, suffix, suffix ? strlen(suffix) : 0);
815 int readlinkat_malloc(int fd, const char *p, char **ret) {
830 n = readlinkat(fd, p, c, l-1);
837 if ((size_t) n < l-1) {
848 int readlink_malloc(const char *p, char **ret) {
849 return readlinkat_malloc(AT_FDCWD, p, ret);
852 int readlink_and_make_absolute(const char *p, char **r) {
853 _cleanup_free_ char *target = NULL;
860 j = readlink_malloc(p, &target);
864 k = file_in_same_dir(p, target);
872 int readlink_and_canonicalize(const char *p, char **r) {
879 j = readlink_and_make_absolute(p, &t);
883 s = canonicalize_file_name(t);
890 path_kill_slashes(*r);
895 int reset_all_signal_handlers(void) {
898 for (sig = 1; sig < _NSIG; sig++) {
899 struct sigaction sa = {
900 .sa_handler = SIG_DFL,
901 .sa_flags = SA_RESTART,
904 if (sig == SIGKILL || sig == SIGSTOP)
907 /* On Linux the first two RT signals are reserved by
908 * glibc, and sigaction() will return EINVAL for them. */
909 if ((sigaction(sig, &sa, NULL) < 0))
917 char *strstrip(char *s) {
920 /* Drops trailing whitespace. Modifies the string in
921 * place. Returns pointer to first non-space character */
923 s += strspn(s, WHITESPACE);
925 for (e = strchr(s, 0); e > s; e --)
926 if (!strchr(WHITESPACE, e[-1]))
934 char *delete_chars(char *s, const char *bad) {
937 /* Drops all whitespace, regardless where in the string */
939 for (f = s, t = s; *f; f++) {
951 char *file_in_same_dir(const char *path, const char *filename) {
958 /* This removes the last component of path and appends
959 * filename, unless the latter is absolute anyway or the
962 if (path_is_absolute(filename))
963 return strdup(filename);
965 if (!(e = strrchr(path, '/')))
966 return strdup(filename);
968 k = strlen(filename);
969 if (!(r = new(char, e-path+1+k+1)))
972 memcpy(r, path, e-path+1);
973 memcpy(r+(e-path)+1, filename, k+1);
978 int rmdir_parents(const char *path, const char *stop) {
987 /* Skip trailing slashes */
988 while (l > 0 && path[l-1] == '/')
994 /* Skip last component */
995 while (l > 0 && path[l-1] != '/')
998 /* Skip trailing slashes */
999 while (l > 0 && path[l-1] == '/')
1005 if (!(t = strndup(path, l)))
1008 if (path_startswith(stop, t)) {
1017 if (errno != ENOENT)
1024 char hexchar(int x) {
1025 static const char table[16] = "0123456789abcdef";
1027 return table[x & 15];
1030 int unhexchar(char c) {
1032 if (c >= '0' && c <= '9')
1035 if (c >= 'a' && c <= 'f')
1036 return c - 'a' + 10;
1038 if (c >= 'A' && c <= 'F')
1039 return c - 'A' + 10;
1044 char *hexmem(const void *p, size_t l) {
1048 z = r = malloc(l * 2 + 1);
1052 for (x = p; x < (const uint8_t*) p + l; x++) {
1053 *(z++) = hexchar(*x >> 4);
1054 *(z++) = hexchar(*x & 15);
1061 void *unhexmem(const char *p, size_t l) {
1067 z = r = malloc((l + 1) / 2 + 1);
1071 for (x = p; x < p + l; x += 2) {
1074 a = unhexchar(x[0]);
1076 b = unhexchar(x[1]);
1080 *(z++) = (uint8_t) a << 4 | (uint8_t) b;
1087 char octchar(int x) {
1088 return '0' + (x & 7);
1091 int unoctchar(char c) {
1093 if (c >= '0' && c <= '7')
1099 char decchar(int x) {
1100 return '0' + (x % 10);
1103 int undecchar(char c) {
1105 if (c >= '0' && c <= '9')
1111 char *cescape(const char *s) {
1117 /* Does C style string escaping. */
1119 r = new(char, strlen(s)*4 + 1);
1123 for (f = s, t = r; *f; f++)
1169 /* For special chars we prefer octal over
1170 * hexadecimal encoding, simply because glib's
1171 * g_strescape() does the same */
1172 if ((*f < ' ') || (*f >= 127)) {
1174 *(t++) = octchar((unsigned char) *f >> 6);
1175 *(t++) = octchar((unsigned char) *f >> 3);
1176 *(t++) = octchar((unsigned char) *f);
1187 char *cunescape_length_with_prefix(const char *s, size_t length, const char *prefix) {
1194 /* Undoes C style string escaping, and optionally prefixes it. */
1196 pl = prefix ? strlen(prefix) : 0;
1198 r = new(char, pl+length+1);
1203 memcpy(r, prefix, pl);
1205 for (f = s, t = r + pl; f < s + length; f++) {
1248 /* This is an extension of the XDG syntax files */
1253 /* hexadecimal encoding */
1256 a = unhexchar(f[1]);
1257 b = unhexchar(f[2]);
1259 if (a < 0 || b < 0 || (a == 0 && b == 0)) {
1260 /* Invalid escape code, let's take it literal then */
1264 *(t++) = (char) ((a << 4) | b);
1279 /* octal encoding */
1282 a = unoctchar(f[0]);
1283 b = unoctchar(f[1]);
1284 c = unoctchar(f[2]);
1286 if (a < 0 || b < 0 || c < 0 || (a == 0 && b == 0 && c == 0)) {
1287 /* Invalid escape code, let's take it literal then */
1291 *(t++) = (char) ((a << 6) | (b << 3) | c);
1299 /* premature end of string.*/
1304 /* Invalid escape code, let's take it literal then */
1316 char *cunescape_length(const char *s, size_t length) {
1317 return cunescape_length_with_prefix(s, length, NULL);
1320 char *cunescape(const char *s) {
1323 return cunescape_length(s, strlen(s));
1326 char *xescape(const char *s, const char *bad) {
1330 /* Escapes all chars in bad, in addition to \ and all special
1331 * chars, in \xFF style escaping. May be reversed with
1334 r = new(char, strlen(s) * 4 + 1);
1338 for (f = s, t = r; *f; f++) {
1340 if ((*f < ' ') || (*f >= 127) ||
1341 (*f == '\\') || strchr(bad, *f)) {
1344 *(t++) = hexchar(*f >> 4);
1345 *(t++) = hexchar(*f);
1355 char *ascii_strlower(char *t) {
1360 for (p = t; *p; p++)
1361 if (*p >= 'A' && *p <= 'Z')
1362 *p = *p - 'A' + 'a';
1367 _pure_ static bool ignore_file_allow_backup(const char *filename) {
1371 filename[0] == '.' ||
1372 streq(filename, "lost+found") ||
1373 streq(filename, "aquota.user") ||
1374 streq(filename, "aquota.group") ||
1375 endswith(filename, ".rpmnew") ||
1376 endswith(filename, ".rpmsave") ||
1377 endswith(filename, ".rpmorig") ||
1378 endswith(filename, ".dpkg-old") ||
1379 endswith(filename, ".dpkg-new") ||
1380 endswith(filename, ".swp");
1383 bool ignore_file(const char *filename) {
1386 if (endswith(filename, "~"))
1389 return ignore_file_allow_backup(filename);
1392 int fd_nonblock(int fd, bool nonblock) {
1397 flags = fcntl(fd, F_GETFL, 0);
1402 nflags = flags | O_NONBLOCK;
1404 nflags = flags & ~O_NONBLOCK;
1406 if (nflags == flags)
1409 if (fcntl(fd, F_SETFL, nflags) < 0)
1415 int fd_cloexec(int fd, bool cloexec) {
1420 flags = fcntl(fd, F_GETFD, 0);
1425 nflags = flags | FD_CLOEXEC;
1427 nflags = flags & ~FD_CLOEXEC;
1429 if (nflags == flags)
1432 if (fcntl(fd, F_SETFD, nflags) < 0)
1438 _pure_ static bool fd_in_set(int fd, const int fdset[], unsigned n_fdset) {
1441 assert(n_fdset == 0 || fdset);
1443 for (i = 0; i < n_fdset; i++)
1450 int close_all_fds(const int except[], unsigned n_except) {
1451 _cleanup_closedir_ DIR *d = NULL;
1455 assert(n_except == 0 || except);
1457 d = opendir("/proc/self/fd");
1462 /* When /proc isn't available (for example in chroots)
1463 * the fallback is brute forcing through the fd
1466 assert_se(getrlimit(RLIMIT_NOFILE, &rl) >= 0);
1467 for (fd = 3; fd < (int) rl.rlim_max; fd ++) {
1469 if (fd_in_set(fd, except, n_except))
1472 if (close_nointr(fd) < 0)
1473 if (errno != EBADF && r == 0)
1480 while ((de = readdir(d))) {
1483 if (ignore_file(de->d_name))
1486 if (safe_atoi(de->d_name, &fd) < 0)
1487 /* Let's better ignore this, just in case */
1496 if (fd_in_set(fd, except, n_except))
1499 if (close_nointr(fd) < 0) {
1500 /* Valgrind has its own FD and doesn't want to have it closed */
1501 if (errno != EBADF && r == 0)
1509 bool chars_intersect(const char *a, const char *b) {
1512 /* Returns true if any of the chars in a are in b. */
1513 for (p = a; *p; p++)
1520 bool fstype_is_network(const char *fstype) {
1521 static const char table[] =
1535 x = startswith(fstype, "fuse.");
1539 return nulstr_contains(table, fstype);
1543 _cleanup_close_ int fd;
1545 fd = open_terminal("/dev/tty0", O_RDWR|O_NOCTTY|O_CLOEXEC);
1551 TIOCL_GETKMSGREDIRECT,
1555 if (ioctl(fd, TIOCLINUX, tiocl) < 0)
1558 vt = tiocl[0] <= 0 ? 1 : tiocl[0];
1561 if (ioctl(fd, VT_ACTIVATE, vt) < 0)
1567 int read_one_char(FILE *f, char *ret, usec_t t, bool *need_nl) {
1568 struct termios old_termios, new_termios;
1569 char c, line[LINE_MAX];
1574 if (tcgetattr(fileno(f), &old_termios) >= 0) {
1575 new_termios = old_termios;
1577 new_termios.c_lflag &= ~ICANON;
1578 new_termios.c_cc[VMIN] = 1;
1579 new_termios.c_cc[VTIME] = 0;
1581 if (tcsetattr(fileno(f), TCSADRAIN, &new_termios) >= 0) {
1584 if (t != (usec_t) -1) {
1585 if (fd_wait_for_event(fileno(f), POLLIN, t) <= 0) {
1586 tcsetattr(fileno(f), TCSADRAIN, &old_termios);
1591 k = fread(&c, 1, 1, f);
1593 tcsetattr(fileno(f), TCSADRAIN, &old_termios);
1599 *need_nl = c != '\n';
1606 if (t != (usec_t) -1) {
1607 if (fd_wait_for_event(fileno(f), POLLIN, t) <= 0)
1612 if (!fgets(line, sizeof(line), f))
1613 return errno ? -errno : -EIO;
1617 if (strlen(line) != 1)
1627 int ask_char(char *ret, const char *replies, const char *text, ...) {
1637 bool need_nl = true;
1640 fputs(ANSI_HIGHLIGHT_ON, stdout);
1647 fputs(ANSI_HIGHLIGHT_OFF, stdout);
1651 r = read_one_char(stdin, &c, (usec_t) -1, &need_nl);
1654 if (r == -EBADMSG) {
1655 puts("Bad input, please try again.");
1666 if (strchr(replies, c)) {
1671 puts("Read unexpected character, please try again.");
1675 int ask_string(char **ret, const char *text, ...) {
1680 char line[LINE_MAX];
1684 fputs(ANSI_HIGHLIGHT_ON, stdout);
1691 fputs(ANSI_HIGHLIGHT_OFF, stdout);
1696 if (!fgets(line, sizeof(line), stdin))
1697 return errno ? -errno : -EIO;
1699 if (!endswith(line, "\n"))
1718 int reset_terminal_fd(int fd, bool switch_to_text) {
1719 struct termios termios;
1722 /* Set terminal to some sane defaults */
1726 /* We leave locked terminal attributes untouched, so that
1727 * Plymouth may set whatever it wants to set, and we don't
1728 * interfere with that. */
1730 /* Disable exclusive mode, just in case */
1731 ioctl(fd, TIOCNXCL);
1733 /* Switch to text mode */
1735 ioctl(fd, KDSETMODE, KD_TEXT);
1737 /* Enable console unicode mode */
1738 ioctl(fd, KDSKBMODE, K_UNICODE);
1740 if (tcgetattr(fd, &termios) < 0) {
1745 /* We only reset the stuff that matters to the software. How
1746 * hardware is set up we don't touch assuming that somebody
1747 * else will do that for us */
1749 termios.c_iflag &= ~(IGNBRK | BRKINT | ISTRIP | INLCR | IGNCR | IUCLC);
1750 termios.c_iflag |= ICRNL | IMAXBEL | IUTF8;
1751 termios.c_oflag |= ONLCR;
1752 termios.c_cflag |= CREAD;
1753 termios.c_lflag = ISIG | ICANON | IEXTEN | ECHO | ECHOE | ECHOK | ECHOCTL | ECHOPRT | ECHOKE;
1755 termios.c_cc[VINTR] = 03; /* ^C */
1756 termios.c_cc[VQUIT] = 034; /* ^\ */
1757 termios.c_cc[VERASE] = 0177;
1758 termios.c_cc[VKILL] = 025; /* ^X */
1759 termios.c_cc[VEOF] = 04; /* ^D */
1760 termios.c_cc[VSTART] = 021; /* ^Q */
1761 termios.c_cc[VSTOP] = 023; /* ^S */
1762 termios.c_cc[VSUSP] = 032; /* ^Z */
1763 termios.c_cc[VLNEXT] = 026; /* ^V */
1764 termios.c_cc[VWERASE] = 027; /* ^W */
1765 termios.c_cc[VREPRINT] = 022; /* ^R */
1766 termios.c_cc[VEOL] = 0;
1767 termios.c_cc[VEOL2] = 0;
1769 termios.c_cc[VTIME] = 0;
1770 termios.c_cc[VMIN] = 1;
1772 if (tcsetattr(fd, TCSANOW, &termios) < 0)
1776 /* Just in case, flush all crap out */
1777 tcflush(fd, TCIOFLUSH);
1782 int reset_terminal(const char *name) {
1783 _cleanup_close_ int fd = -1;
1785 fd = open_terminal(name, O_RDWR|O_NOCTTY|O_CLOEXEC);
1789 return reset_terminal_fd(fd, true);
1792 int open_terminal(const char *name, int mode) {
1797 * If a TTY is in the process of being closed opening it might
1798 * cause EIO. This is horribly awful, but unlikely to be
1799 * changed in the kernel. Hence we work around this problem by
1800 * retrying a couple of times.
1802 * https://bugs.launchpad.net/ubuntu/+source/linux/+bug/554172/comments/245
1805 assert(!(mode & O_CREAT));
1808 fd = open(name, mode, 0);
1815 /* Max 1s in total */
1819 usleep(50 * USEC_PER_MSEC);
1840 int flush_fd(int fd) {
1841 struct pollfd pollfd = {
1851 r = poll(&pollfd, 1, 0);
1861 l = read(fd, buf, sizeof(buf));
1867 if (errno == EAGAIN)
1876 int acquire_terminal(
1880 bool ignore_tiocstty_eperm,
1883 int fd = -1, notify = -1, r = 0, wd = -1;
1888 /* We use inotify to be notified when the tty is closed. We
1889 * create the watch before checking if we can actually acquire
1890 * it, so that we don't lose any event.
1892 * Note: strictly speaking this actually watches for the
1893 * device being closed, it does *not* really watch whether a
1894 * tty loses its controlling process. However, unless some
1895 * rogue process uses TIOCNOTTY on /dev/tty *after* closing
1896 * its tty otherwise this will not become a problem. As long
1897 * as the administrator makes sure not to configure any service
1898 * on the same tty as an untrusted user this should not be a
1899 * problem. (Which he probably should not do anyway.) */
1901 if (timeout != (usec_t) -1)
1902 ts = now(CLOCK_MONOTONIC);
1904 if (!fail && !force) {
1905 notify = inotify_init1(IN_CLOEXEC | (timeout != (usec_t) -1 ? IN_NONBLOCK : 0));
1911 wd = inotify_add_watch(notify, name, IN_CLOSE);
1919 struct sigaction sa_old, sa_new = {
1920 .sa_handler = SIG_IGN,
1921 .sa_flags = SA_RESTART,
1925 r = flush_fd(notify);
1930 /* We pass here O_NOCTTY only so that we can check the return
1931 * value TIOCSCTTY and have a reliable way to figure out if we
1932 * successfully became the controlling process of the tty */
1933 fd = open_terminal(name, O_RDWR|O_NOCTTY|O_CLOEXEC);
1937 /* Temporarily ignore SIGHUP, so that we don't get SIGHUP'ed
1938 * if we already own the tty. */
1939 assert_se(sigaction(SIGHUP, &sa_new, &sa_old) == 0);
1941 /* First, try to get the tty */
1942 if (ioctl(fd, TIOCSCTTY, force) < 0)
1945 assert_se(sigaction(SIGHUP, &sa_old, NULL) == 0);
1947 /* Sometimes it makes sense to ignore TIOCSCTTY
1948 * returning EPERM, i.e. when very likely we already
1949 * have this controlling terminal. */
1950 if (r < 0 && r == -EPERM && ignore_tiocstty_eperm)
1953 if (r < 0 && (force || fail || r != -EPERM)) {
1962 assert(notify >= 0);
1965 uint8_t inotify_buffer[sizeof(struct inotify_event) + FILENAME_MAX];
1967 struct inotify_event *e;
1969 if (timeout != (usec_t) -1) {
1972 n = now(CLOCK_MONOTONIC);
1973 if (ts + timeout < n) {
1978 r = fd_wait_for_event(fd, POLLIN, ts + timeout - n);
1988 l = read(notify, inotify_buffer, sizeof(inotify_buffer));
1991 if (errno == EINTR || errno == EAGAIN)
1998 e = (struct inotify_event*) inotify_buffer;
2003 if (e->wd != wd || !(e->mask & IN_CLOSE)) {
2008 step = sizeof(struct inotify_event) + e->len;
2009 assert(step <= (size_t) l);
2011 e = (struct inotify_event*) ((uint8_t*) e + step);
2018 /* We close the tty fd here since if the old session
2019 * ended our handle will be dead. It's important that
2020 * we do this after sleeping, so that we don't enter
2021 * an endless loop. */
2027 r = reset_terminal_fd(fd, true);
2029 log_warning("Failed to reset terminal: %s", strerror(-r));
2040 int release_terminal(void) {
2042 struct sigaction sa_old, sa_new = {
2043 .sa_handler = SIG_IGN,
2044 .sa_flags = SA_RESTART,
2046 _cleanup_close_ int fd;
2048 fd = open("/dev/tty", O_RDWR|O_NOCTTY|O_NDELAY|O_CLOEXEC);
2052 /* Temporarily ignore SIGHUP, so that we don't get SIGHUP'ed
2053 * by our own TIOCNOTTY */
2054 assert_se(sigaction(SIGHUP, &sa_new, &sa_old) == 0);
2056 if (ioctl(fd, TIOCNOTTY) < 0)
2059 assert_se(sigaction(SIGHUP, &sa_old, NULL) == 0);
2064 int sigaction_many(const struct sigaction *sa, ...) {
2069 while ((sig = va_arg(ap, int)) > 0)
2070 if (sigaction(sig, sa, NULL) < 0)
2077 int ignore_signals(int sig, ...) {
2078 struct sigaction sa = {
2079 .sa_handler = SIG_IGN,
2080 .sa_flags = SA_RESTART,
2085 if (sigaction(sig, &sa, NULL) < 0)
2089 while ((sig = va_arg(ap, int)) > 0)
2090 if (sigaction(sig, &sa, NULL) < 0)
2097 int default_signals(int sig, ...) {
2098 struct sigaction sa = {
2099 .sa_handler = SIG_DFL,
2100 .sa_flags = SA_RESTART,
2105 if (sigaction(sig, &sa, NULL) < 0)
2109 while ((sig = va_arg(ap, int)) > 0)
2110 if (sigaction(sig, &sa, NULL) < 0)
2117 void safe_close_pair(int p[]) {
2121 /* Special case pairs which use the same fd in both
2123 p[0] = p[1] = safe_close(p[0]);
2127 p[0] = safe_close(p[0]);
2128 p[1] = safe_close(p[1]);
2131 ssize_t loop_read(int fd, void *buf, size_t nbytes, bool do_poll) {
2138 while (nbytes > 0) {
2141 k = read(fd, p, nbytes);
2142 if (k < 0 && errno == EINTR)
2145 if (k < 0 && errno == EAGAIN && do_poll) {
2147 /* We knowingly ignore any return value here,
2148 * and expect that any error/EOF is reported
2151 fd_wait_for_event(fd, POLLIN, (usec_t) -1);
2156 return n > 0 ? n : (k < 0 ? -errno : 0);
2166 ssize_t loop_write(int fd, const void *buf, size_t nbytes, bool do_poll) {
2167 const uint8_t *p = buf;
2173 while (nbytes > 0) {
2176 k = write(fd, p, nbytes);
2177 if (k < 0 && errno == EINTR)
2180 if (k < 0 && errno == EAGAIN && do_poll) {
2182 /* We knowingly ignore any return value here,
2183 * and expect that any error/EOF is reported
2186 fd_wait_for_event(fd, POLLOUT, (usec_t) -1);
2191 return n > 0 ? n : (k < 0 ? -errno : 0);
2201 int parse_size(const char *t, off_t base, off_t *size) {
2203 /* So, sometimes we want to parse IEC binary suffixes, and
2204 * sometimes SI decimal suffixes. This function can parse
2205 * both. Which one is the right way depends on the
2206 * context. Wikipedia suggests that SI is customary for
2207 * hardware metrics and network speeds, while IEC is
2208 * customary for most data sizes used by software and volatile
2209 * (RAM) memory. Hence be careful which one you pick!
2211 * In either case we use just K, M, G as suffix, and not Ki,
2212 * Mi, Gi or so (as IEC would suggest). That's because that's
2213 * frickin' ugly. But this means you really need to make sure
2214 * to document which base you are parsing when you use this
2219 unsigned long long factor;
2222 static const struct table iec[] = {
2223 { "E", 1024ULL*1024ULL*1024ULL*1024ULL*1024ULL*1024ULL },
2224 { "P", 1024ULL*1024ULL*1024ULL*1024ULL*1024ULL },
2225 { "T", 1024ULL*1024ULL*1024ULL*1024ULL },
2226 { "G", 1024ULL*1024ULL*1024ULL },
2227 { "M", 1024ULL*1024ULL },
2233 static const struct table si[] = {
2234 { "E", 1000ULL*1000ULL*1000ULL*1000ULL*1000ULL*1000ULL },
2235 { "P", 1000ULL*1000ULL*1000ULL*1000ULL*1000ULL },
2236 { "T", 1000ULL*1000ULL*1000ULL*1000ULL },
2237 { "G", 1000ULL*1000ULL*1000ULL },
2238 { "M", 1000ULL*1000ULL },
2244 const struct table *table;
2246 unsigned long long r = 0;
2247 unsigned n_entries, start_pos = 0;
2250 assert(base == 1000 || base == 1024);
2255 n_entries = ELEMENTSOF(si);
2258 n_entries = ELEMENTSOF(iec);
2264 unsigned long long l2;
2270 l = strtoll(p, &e, 10);
2283 if (*e >= '0' && *e <= '9') {
2286 /* strtoull itself would accept space/+/- */
2287 l2 = strtoull(e, &e2, 10);
2289 if (errno == ERANGE)
2292 /* Ignore failure. E.g. 10.M is valid */
2299 e += strspn(e, WHITESPACE);
2301 for (i = start_pos; i < n_entries; i++)
2302 if (startswith(e, table[i].suffix)) {
2303 unsigned long long tmp;
2304 if ((unsigned long long) l + (frac > 0) > ULLONG_MAX / table[i].factor)
2306 tmp = l * table[i].factor + (unsigned long long) (frac * table[i].factor);
2307 if (tmp > ULLONG_MAX - r)
2311 if ((unsigned long long) (off_t) r != r)
2314 p = e + strlen(table[i].suffix);
2330 int make_stdio(int fd) {
2335 r = dup3(fd, STDIN_FILENO, 0);
2336 s = dup3(fd, STDOUT_FILENO, 0);
2337 t = dup3(fd, STDERR_FILENO, 0);
2342 if (r < 0 || s < 0 || t < 0)
2345 /* We rely here that the new fd has O_CLOEXEC not set */
2350 int make_null_stdio(void) {
2353 null_fd = open("/dev/null", O_RDWR|O_NOCTTY);
2357 return make_stdio(null_fd);
2360 bool is_device_path(const char *path) {
2362 /* Returns true on paths that refer to a device, either in
2363 * sysfs or in /dev */
2366 path_startswith(path, "/dev/") ||
2367 path_startswith(path, "/sys/");
2370 int dir_is_empty(const char *path) {
2371 _cleanup_closedir_ DIR *d;
2382 if (!de && errno != 0)
2388 if (!ignore_file(de->d_name))
2393 char* dirname_malloc(const char *path) {
2394 char *d, *dir, *dir2;
2411 int dev_urandom(void *p, size_t n) {
2412 _cleanup_close_ int fd;
2415 fd = open("/dev/urandom", O_RDONLY|O_CLOEXEC|O_NOCTTY);
2417 return errno == ENOENT ? -ENOSYS : -errno;
2419 k = loop_read(fd, p, n, true);
2422 if ((size_t) k != n)
2428 void random_bytes(void *p, size_t n) {
2429 static bool srand_called = false;
2433 r = dev_urandom(p, n);
2437 /* If some idiot made /dev/urandom unavailable to us, he'll
2438 * get a PRNG instead. */
2440 if (!srand_called) {
2443 #ifdef HAVE_SYS_AUXV_H
2444 /* The kernel provides us with a bit of entropy in
2445 * auxv, so let's try to make use of that to seed the
2446 * pseudo-random generator. It's better than
2451 auxv = (void*) getauxval(AT_RANDOM);
2453 x ^= *(unsigned*) auxv;
2456 x ^= (unsigned) now(CLOCK_REALTIME);
2457 x ^= (unsigned) gettid();
2460 srand_called = true;
2463 for (q = p; q < (uint8_t*) p + n; q ++)
2467 void rename_process(const char name[8]) {
2470 /* This is like a poor man's setproctitle(). It changes the
2471 * comm field, argv[0], and also the glibc's internally used
2472 * name of the process. For the first one a limit of 16 chars
2473 * applies, to the second one usually one of 10 (i.e. length
2474 * of "/sbin/init"), to the third one one of 7 (i.e. length of
2475 * "systemd"). If you pass a longer string it will be
2478 prctl(PR_SET_NAME, name);
2480 if (program_invocation_name)
2481 strncpy(program_invocation_name, name, strlen(program_invocation_name));
2483 if (saved_argc > 0) {
2487 strncpy(saved_argv[0], name, strlen(saved_argv[0]));
2489 for (i = 1; i < saved_argc; i++) {
2493 memzero(saved_argv[i], strlen(saved_argv[i]));
2498 void sigset_add_many(sigset_t *ss, ...) {
2505 while ((sig = va_arg(ap, int)) > 0)
2506 assert_se(sigaddset(ss, sig) == 0);
2510 int sigprocmask_many(int how, ...) {
2515 assert_se(sigemptyset(&ss) == 0);
2518 while ((sig = va_arg(ap, int)) > 0)
2519 assert_se(sigaddset(&ss, sig) == 0);
2522 if (sigprocmask(how, &ss, NULL) < 0)
2528 char* gethostname_malloc(void) {
2531 assert_se(uname(&u) >= 0);
2533 if (!isempty(u.nodename) && !streq(u.nodename, "(none)"))
2534 return strdup(u.nodename);
2536 return strdup(u.sysname);
2539 bool hostname_is_set(void) {
2542 assert_se(uname(&u) >= 0);
2544 return !isempty(u.nodename) && !streq(u.nodename, "(none)");
2547 static char *lookup_uid(uid_t uid) {
2550 _cleanup_free_ char *buf = NULL;
2551 struct passwd pwbuf, *pw = NULL;
2553 /* Shortcut things to avoid NSS lookups */
2555 return strdup("root");
2557 bufsize = sysconf(_SC_GETPW_R_SIZE_MAX);
2561 buf = malloc(bufsize);
2565 if (getpwuid_r(uid, &pwbuf, buf, bufsize, &pw) == 0 && pw)
2566 return strdup(pw->pw_name);
2568 if (asprintf(&name, UID_FMT, uid) < 0)
2574 char* getlogname_malloc(void) {
2578 if (isatty(STDIN_FILENO) && fstat(STDIN_FILENO, &st) >= 0)
2583 return lookup_uid(uid);
2586 char *getusername_malloc(void) {
2593 return lookup_uid(getuid());
2596 int getttyname_malloc(int fd, char **r) {
2597 char path[PATH_MAX], *c;
2602 k = ttyname_r(fd, path, sizeof(path));
2608 c = strdup(startswith(path, "/dev/") ? path + 5 : path);
2616 int getttyname_harder(int fd, char **r) {
2620 k = getttyname_malloc(fd, &s);
2624 if (streq(s, "tty")) {
2626 return get_ctty(0, NULL, r);
2633 int get_ctty_devnr(pid_t pid, dev_t *d) {
2635 _cleanup_free_ char *line = NULL;
2637 unsigned long ttynr;
2641 p = procfs_file_alloca(pid, "stat");
2642 r = read_one_line_file(p, &line);
2646 p = strrchr(line, ')');
2656 "%*d " /* session */
2661 if (major(ttynr) == 0 && minor(ttynr) == 0)
2670 int get_ctty(pid_t pid, dev_t *_devnr, char **r) {
2671 char fn[sizeof("/dev/char/")-1 + 2*DECIMAL_STR_MAX(unsigned) + 1 + 1], *b = NULL;
2672 _cleanup_free_ char *s = NULL;
2679 k = get_ctty_devnr(pid, &devnr);
2683 snprintf(fn, sizeof(fn), "/dev/char/%u:%u", major(devnr), minor(devnr));
2685 k = readlink_malloc(fn, &s);
2691 /* This is an ugly hack */
2692 if (major(devnr) == 136) {
2693 asprintf(&b, "pts/%u", minor(devnr));
2697 /* Probably something like the ptys which have no
2698 * symlink in /dev/char. Let's return something
2699 * vaguely useful. */
2705 if (startswith(s, "/dev/"))
2707 else if (startswith(s, "../"))
2725 int rm_rf_children_dangerous(int fd, bool only_dirs, bool honour_sticky, struct stat *root_dev) {
2726 _cleanup_closedir_ DIR *d = NULL;
2731 /* This returns the first error we run into, but nevertheless
2732 * tries to go on. This closes the passed fd. */
2738 return errno == ENOENT ? 0 : -errno;
2743 bool is_dir, keep_around;
2750 if (errno != 0 && ret == 0)
2755 if (streq(de->d_name, ".") || streq(de->d_name, ".."))
2758 if (de->d_type == DT_UNKNOWN ||
2760 (de->d_type == DT_DIR && root_dev)) {
2761 if (fstatat(fd, de->d_name, &st, AT_SYMLINK_NOFOLLOW) < 0) {
2762 if (ret == 0 && errno != ENOENT)
2767 is_dir = S_ISDIR(st.st_mode);
2770 (st.st_uid == 0 || st.st_uid == getuid()) &&
2771 (st.st_mode & S_ISVTX);
2773 is_dir = de->d_type == DT_DIR;
2774 keep_around = false;
2780 /* if root_dev is set, remove subdirectories only, if device is same as dir */
2781 if (root_dev && st.st_dev != root_dev->st_dev)
2784 subdir_fd = openat(fd, de->d_name,
2785 O_RDONLY|O_NONBLOCK|O_DIRECTORY|O_CLOEXEC|O_NOFOLLOW|O_NOATIME);
2786 if (subdir_fd < 0) {
2787 if (ret == 0 && errno != ENOENT)
2792 r = rm_rf_children_dangerous(subdir_fd, only_dirs, honour_sticky, root_dev);
2793 if (r < 0 && ret == 0)
2797 if (unlinkat(fd, de->d_name, AT_REMOVEDIR) < 0) {
2798 if (ret == 0 && errno != ENOENT)
2802 } else if (!only_dirs && !keep_around) {
2804 if (unlinkat(fd, de->d_name, 0) < 0) {
2805 if (ret == 0 && errno != ENOENT)
2812 _pure_ static int is_temporary_fs(struct statfs *s) {
2815 return F_TYPE_EQUAL(s->f_type, TMPFS_MAGIC) ||
2816 F_TYPE_EQUAL(s->f_type, RAMFS_MAGIC);
2819 int rm_rf_children(int fd, bool only_dirs, bool honour_sticky, struct stat *root_dev) {
2824 if (fstatfs(fd, &s) < 0) {
2829 /* We refuse to clean disk file systems with this call. This
2830 * is extra paranoia just to be sure we never ever remove
2832 if (!is_temporary_fs(&s)) {
2833 log_error("Attempted to remove disk file system, and we can't allow that.");
2838 return rm_rf_children_dangerous(fd, only_dirs, honour_sticky, root_dev);
2841 static int rm_rf_internal(const char *path, bool only_dirs, bool delete_root, bool honour_sticky, bool dangerous) {
2847 /* We refuse to clean the root file system with this
2848 * call. This is extra paranoia to never cause a really
2849 * seriously broken system. */
2850 if (path_equal(path, "/")) {
2851 log_error("Attempted to remove entire root file system, and we can't allow that.");
2855 fd = open(path, O_RDONLY|O_NONBLOCK|O_DIRECTORY|O_CLOEXEC|O_NOFOLLOW|O_NOATIME);
2858 if (errno != ENOTDIR)
2862 if (statfs(path, &s) < 0)
2865 if (!is_temporary_fs(&s)) {
2866 log_error("Attempted to remove disk file system, and we can't allow that.");
2871 if (delete_root && !only_dirs)
2872 if (unlink(path) < 0 && errno != ENOENT)
2879 if (fstatfs(fd, &s) < 0) {
2884 if (!is_temporary_fs(&s)) {
2885 log_error("Attempted to remove disk file system, and we can't allow that.");
2891 r = rm_rf_children_dangerous(fd, only_dirs, honour_sticky, NULL);
2894 if (honour_sticky && file_is_priv_sticky(path) > 0)
2897 if (rmdir(path) < 0 && errno != ENOENT) {
/* Forwards to rm_rf_internal() with its 'dangerous' argument set to
 * false; the return value is passed through unchanged. */
int rm_rf(const char *path, bool only_dirs, bool delete_root, bool honour_sticky) {
        const bool dangerous = false;

        return rm_rf_internal(path, only_dirs, delete_root, honour_sticky, dangerous);
}
/* Forwards to rm_rf_internal() with its 'dangerous' argument set to
 * true; the return value is passed through unchanged. */
int rm_rf_dangerous(const char *path, bool only_dirs, bool delete_root, bool honour_sticky) {
        const bool dangerous = true;

        return rm_rf_internal(path, only_dirs, delete_root, honour_sticky, dangerous);
}
/* Applies an access mode and/or ownership to 'path'.
 *
 * A mode of (mode_t) -1 skips the chmod(); the chown() is skipped only
 * if both uid and gid are -1. Returns 0 on success or -errno from the
 * first call that fails. */
int chmod_and_chown(const char *path, mode_t mode, uid_t uid, gid_t gid) {
        bool want_chown;

        assert(path);

        /* The mode is set before ownership is handed out: assuming we
         * run privileged, this avoids a window in which the new owner
         * could use the file with a too permissive mode. */
        if (mode != (mode_t) -1 && chmod(path, mode) < 0)
                return -errno;

        want_chown = uid != (uid_t) -1 || gid != (gid_t) -1;
        if (want_chown && chown(path, uid, gid) < 0)
                return -errno;

        return 0;
}
/* Applies an access mode and/or ownership to the open file 'fd'.
 *
 * A mode of (mode_t) -1 skips the fchmod(); the fchown() is skipped
 * only if both uid and gid are -1. Returns 0 on success or -errno from
 * the first call that fails. */
int fchmod_and_fchown(int fd, mode_t mode, uid_t uid, gid_t gid) {
        bool want_chown;

        assert(fd >= 0);

        /* The mode is set before ownership is handed out: assuming we
         * run privileged, this avoids a window in which the new owner
         * could use the file with a too permissive mode. */
        if (mode != (mode_t) -1 && fchmod(fd, mode) < 0)
                return -errno;

        want_chown = uid != (uid_t) -1 || gid != (gid_t) -1;
        if (want_chown && fchown(fd, uid, gid) < 0)
                return -errno;

        return 0;
}
2950 cpu_set_t* cpu_set_malloc(unsigned *ncpus) {
2954 /* Allocates the cpuset in the right size */
2957 if (!(r = CPU_ALLOC(n)))
2960 if (sched_getaffinity(0, CPU_ALLOC_SIZE(n), r) >= 0) {
2961 CPU_ZERO_S(CPU_ALLOC_SIZE(n), r);
2971 if (errno != EINVAL)
2978 int status_vprintf(const char *status, bool ellipse, bool ephemeral, const char *format, va_list ap) {
2979 static const char status_indent[] = " "; /* "[" STATUS "] " */
2980 _cleanup_free_ char *s = NULL;
2981 _cleanup_close_ int fd = -1;
2982 struct iovec iovec[6] = {};
2984 static bool prev_ephemeral;
2988 /* This is independent of logging, as status messages are
2989 * optional and go exclusively to the console. */
2991 if (vasprintf(&s, format, ap) < 0)
2994 fd = open_terminal("/dev/console", O_WRONLY|O_NOCTTY|O_CLOEXEC);
3007 sl = status ? sizeof(status_indent)-1 : 0;
3013 e = ellipsize(s, emax, 75);
3021 IOVEC_SET_STRING(iovec[n++], "\r" ANSI_ERASE_TO_END_OF_LINE);
3022 prev_ephemeral = ephemeral;
3025 if (!isempty(status)) {
3026 IOVEC_SET_STRING(iovec[n++], "[");
3027 IOVEC_SET_STRING(iovec[n++], status);
3028 IOVEC_SET_STRING(iovec[n++], "] ");
3030 IOVEC_SET_STRING(iovec[n++], status_indent);
3033 IOVEC_SET_STRING(iovec[n++], s);
3035 IOVEC_SET_STRING(iovec[n++], "\n");
3037 if (writev(fd, iovec, n) < 0)
3043 int status_printf(const char *status, bool ellipse, bool ephemeral, const char *format, ...) {
3049 va_start(ap, format);
3050 r = status_vprintf(status, ellipse, ephemeral, format, ap);
3056 char *replace_env(const char *format, char **env) {
3063 const char *e, *word = format;
3068 for (e = format; *e; e ++) {
3079 if (!(k = strnappend(r, word, e-word-1)))
3088 } else if (*e == '$') {
3089 if (!(k = strnappend(r, word, e-word)))
3105 t = strempty(strv_env_get_n(env, word+2, e-word-2));
3107 k = strappend(r, t);
3121 if (!(k = strnappend(r, word, e-word)))
3132 char **replace_env_argv(char **argv, char **env) {
3134 unsigned k = 0, l = 0;
3136 l = strv_length(argv);
3138 if (!(r = new(char*, l+1)))
3141 STRV_FOREACH(i, argv) {
3143 /* If $FOO appears as single word, replace it by the split up variable */
3144 if ((*i)[0] == '$' && (*i)[1] != '{') {
3149 e = strv_env_get(env, *i+1);
3152 if (!(m = strv_split_quoted(e))) {
3163 if (!(w = realloc(r, sizeof(char*) * (l+1)))) {
3172 memcpy(r + k, m, q * sizeof(char*));
3180 /* If ${FOO} appears as part of a word, replace it by the variable as-is */
3181 if (!(r[k++] = replace_env(*i, env))) {
3191 int fd_columns(int fd) {
3192 struct winsize ws = {};
3194 if (ioctl(fd, TIOCGWINSZ, &ws) < 0)
3203 unsigned columns(void) {
3207 if (_likely_(cached_columns > 0))
3208 return cached_columns;
3211 e = getenv("COLUMNS");
3216 c = fd_columns(STDOUT_FILENO);
3225 int fd_lines(int fd) {
3226 struct winsize ws = {};
3228 if (ioctl(fd, TIOCGWINSZ, &ws) < 0)
3237 unsigned lines(void) {
3241 if (_likely_(cached_lines > 0))
3242 return cached_lines;
3245 e = getenv("LINES");
3250 l = fd_lines(STDOUT_FILENO);
3256 return cached_lines;
3259 /* intended to be used as a SIGWINCH sighandler */
3260 void columns_lines_cache_reset(int signum) {
3266 static int cached_on_tty = -1;
3268 if (_unlikely_(cached_on_tty < 0))
3269 cached_on_tty = isatty(STDOUT_FILENO) > 0;
3271 return cached_on_tty;
/* Checks whether two paths refer to the same file by comparing the
 * device and inode numbers stat() reports for them.
 *
 * Returns 1 if they match, 0 if they differ, or -errno if either
 * stat() call fails (filea is checked first). */
int files_same(const char *filea, const char *fileb) {
        struct stat sta, stb;

        if (stat(filea, &sta) < 0)
                return -errno;

        if (stat(fileb, &stb) < 0)
                return -errno;

        if (sta.st_dev != stb.st_dev)
                return 0;

        return sta.st_ino == stb.st_ino;
}
3287 int running_in_chroot(void) {
3290 ret = files_same("/proc/1/root", "/");
3297 static char *ascii_ellipsize_mem(const char *s, size_t old_length, size_t new_length, unsigned percent) {
3302 assert(percent <= 100);
3303 assert(new_length >= 3);
3305 if (old_length <= 3 || old_length <= new_length)
3306 return strndup(s, old_length);
3308 r = new0(char, new_length+1);
3312 x = (new_length * percent) / 100;
3314 if (x > new_length - 3)
3322 s + old_length - (new_length - x - 3),
3323 new_length - x - 3);
3328 char *ellipsize_mem(const char *s, size_t old_length, size_t new_length, unsigned percent) {
3332 unsigned k, len, len2;
3335 assert(percent <= 100);
3336 assert(new_length >= 3);
3338 /* if no multibyte characters use ascii_ellipsize_mem for speed */
3339 if (ascii_is_valid(s))
3340 return ascii_ellipsize_mem(s, old_length, new_length, percent);
3342 if (old_length <= 3 || old_length <= new_length)
3343 return strndup(s, old_length);
3345 x = (new_length * percent) / 100;
3347 if (x > new_length - 3)
3351 for (i = s; k < x && i < s + old_length; i = utf8_next_char(i)) {
3354 c = utf8_encoded_to_unichar(i);
3357 k += unichar_iswide(c) ? 2 : 1;
3360 if (k > x) /* last character was wide and went over quota */
3363 for (j = s + old_length; k < new_length && j > i; ) {
3366 j = utf8_prev_char(j);
3367 c = utf8_encoded_to_unichar(j);
3370 k += unichar_iswide(c) ? 2 : 1;
3374 /* we don't actually need to ellipsize */
3376 return memdup(s, old_length + 1);
3378 /* make space for ellipsis */
3379 j = utf8_next_char(j);
3382 len2 = s + old_length - j;
3383 e = new(char, len + 3 + len2 + 1);
3388 printf("old_length=%zu new_length=%zu x=%zu len=%u len2=%u k=%u\n",
3389 old_length, new_length, x, len, len2, k);
3393 e[len] = 0xe2; /* tri-dot ellipsis: … */
3397 memcpy(e + len + 3, j, len2 + 1);
/* Convenience wrapper around ellipsize_mem() for NUL-terminated
 * strings: the input length is taken from strlen(s). */
char *ellipsize(const char *s, size_t length, unsigned percent) {
        size_t old_length = strlen(s);

        return ellipsize_mem(s, old_length, length, percent);
}
3406 int touch_file(const char *path, bool parents, usec_t stamp, uid_t uid, gid_t gid, mode_t mode) {
3407 _cleanup_close_ int fd;
3413 mkdir_parents(path, 0755);
3415 fd = open(path, O_WRONLY|O_CREAT|O_CLOEXEC|O_NOCTTY, mode > 0 ? mode : 0644);
3420 r = fchmod(fd, mode);
3425 if (uid != (uid_t) -1 || gid != (gid_t) -1) {
3426 r = fchown(fd, uid, gid);
3431 if (stamp != (usec_t) -1) {
3432 struct timespec ts[2];
3434 timespec_store(&ts[0], stamp);
3436 r = futimens(fd, ts);
3438 r = futimens(fd, NULL);
3445 int touch(const char *path) {
3446 return touch_file(path, false, (usec_t) -1, (uid_t) -1, (gid_t) -1, 0);
3449 char *unquote(const char *s, const char* quotes) {
3453 /* This is rather stupid, simply removes the heading and
3454 * trailing quotes if there is one. Doesn't care about
3455 * escaping or anything. We should make this smarter one
3462 if (strchr(quotes, s[0]) && s[l-1] == s[0])
3463 return strndup(s+1, l-2);
3468 char *normalize_env_assignment(const char *s) {
3469 _cleanup_free_ char *name = NULL, *value = NULL, *p = NULL;
3472 eq = strchr(s, '=');
3484 memmove(r, t, strlen(t) + 1);
3488 name = strndup(s, eq - s);
3496 value = unquote(strstrip(p), QUOTES);
3500 if (asprintf(&r, "%s=%s", strstrip(name), value) < 0)
3506 int wait_for_terminate(pid_t pid, siginfo_t *status) {
3517 if (waitid(P_PID, pid, status, WEXITED) < 0) {
3531 * < 0 : wait_for_terminate() failed to get the state of the
3532 * process, the process was terminated by a signal, or
3533 * failed for an unknown reason.
3534 * >=0 : The process terminated normally, and its exit code is
3537 * That is, success is indicated by a return value of zero, and an
3538 * error is indicated by a non-zero value.
3540 int wait_for_terminate_and_warn(const char *name, pid_t pid) {
3547 r = wait_for_terminate(pid, &status);
3549 log_warning("Failed to wait for %s: %s", name, strerror(-r));
3553 if (status.si_code == CLD_EXITED) {
3554 if (status.si_status != 0) {
3555 log_warning("%s failed with error code %i.", name, status.si_status);
3556 return status.si_status;
3559 log_debug("%s succeeded.", name);
3562 } else if (status.si_code == CLD_KILLED ||
3563 status.si_code == CLD_DUMPED) {
3565 log_warning("%s terminated by signal %s.", name, signal_to_string(status.si_status));
3569 log_warning("%s failed due to unknown reason.", name);
3573 noreturn void freeze(void) {
3575 /* Make sure nobody waits for us on a socket anymore */
3576 close_all_fds(NULL, 0);
/* Returns true if *st describes a character or block device, or a
 * regular file whose size is <= 0. Returns false for everything
 * else. */
bool null_or_empty(struct stat *st) {
        mode_t m;

        assert(st);

        m = st->st_mode;

        if (S_ISCHR(m) || S_ISBLK(m))
                return true;

        return S_ISREG(m) && st->st_size <= 0;
}
/* stat()s 'fn' and applies null_or_empty() to the result.
 *
 * Returns the null_or_empty() verdict (0 or 1), or -errno if stat()
 * fails. */
int null_or_empty_path(const char *fn) {
        struct stat st;

        assert(fn);

        return stat(fn, &st) < 0 ? -errno : null_or_empty(&st);
}
/* fstat()s 'fd' and applies null_or_empty() to the result.
 *
 * Returns the null_or_empty() verdict (0 or 1), or -errno if fstat()
 * fails. */
int null_or_empty_fd(int fd) {
        struct stat st;

        assert(fd >= 0);

        return fstat(fd, &st) < 0 ? -errno : null_or_empty(&st);
}
3618 DIR *xopendirat(int fd, const char *name, int flags) {
3622 assert(!(flags & O_CREAT));
3624 nfd = openat(fd, name, O_RDONLY|O_NONBLOCK|O_DIRECTORY|O_CLOEXEC|flags, 0);
3637 int signal_from_string_try_harder(const char *s) {
3641 signo = signal_from_string(s);
3643 if (startswith(s, "SIG"))
3644 return signal_from_string(s+3);
3649 static char *tag_to_udev_node(const char *tagvalue, const char *by) {
3650 _cleanup_free_ char *t = NULL, *u = NULL;
3653 u = unquote(tagvalue, "\"\'");
3657 enc_len = strlen(u) * 4 + 1;
3658 t = new(char, enc_len);
3662 if (encode_devnode_name(u, t, enc_len) < 0)
3665 return strjoin("/dev/disk/by-", by, "/", t, NULL);
/* Translates an fstab-style device specification into a device node
 * path. Specifications starting with LABEL=, UUID=, PARTUUID= or
 * PARTLABEL= are handed to tag_to_udev_node() with the matching
 * by-<kind> name; anything else is returned as a plain copy.
 *
 * The result is newly allocated; NULL is returned if the copy or
 * tag_to_udev_node() yields NULL. */
char *fstab_node_to_udev_node(const char *p) {
        static const struct {
                const char *prefix;
                const char *by;
        } tags[] = {
                { "LABEL=",     "label"     },
                { "UUID=",      "uuid"      },
                { "PARTUUID=",  "partuuid"  },
                { "PARTLABEL=", "partlabel" },
        };
        size_t i;

        assert(p);

        for (i = 0; i < ELEMENTSOF(tags); i++)
                if (startswith(p, tags[i].prefix))
                        return tag_to_udev_node(p + strlen(tags[i].prefix), tags[i].by);

        return strdup(p);
}
/* Returns true if vtnr_from_tty() yields a non-negative value for
 * 'tty'. */
bool tty_is_vc(const char *tty) {
        int vtnr;

        assert(tty);

        vtnr = vtnr_from_tty(tty);
        return vtnr >= 0;
}
/* Returns true if 'tty' is "console", with or without a leading
 * "/dev/". */
bool tty_is_console(const char *tty) {
        const char *name;

        assert(tty);

        /* Skip the 5-character "/dev/" prefix if present */
        name = startswith(tty, "/dev/") ? tty + 5 : tty;

        return streq(name, "console");
}
3701 int vtnr_from_tty(const char *tty) {
3706 if (startswith(tty, "/dev/"))
3709 if (!startswith(tty, "tty") )
3712 if (tty[3] < '0' || tty[3] > '9')
3715 r = safe_atoi(tty+3, &i);
3719 if (i < 0 || i > 63)
3725 char *resolve_dev_console(char **active) {
3728 /* Resolve where /dev/console is pointing to, if /sys is actually ours
3729 * (i.e. not read-only-mounted which is a sign for container setups) */
3731 if (path_is_read_only_fs("/sys") > 0)
3734 if (read_one_line_file("/sys/class/tty/console/active", active) < 0)
3737 /* If multiple log outputs are configured the last one is what
3738 * /dev/console points to */
3739 tty = strrchr(*active, ' ');
3745 if (streq(tty, "tty0")) {
3748 /* Get the active VC (e.g. tty1) */
3749 if (read_one_line_file("/sys/class/tty/tty0/active", &tmp) >= 0) {
3751 tty = *active = tmp;
3758 bool tty_is_vc_resolve(const char *tty) {
3759 _cleanup_free_ char *active = NULL;
3763 if (startswith(tty, "/dev/"))
3766 if (streq(tty, "console")) {
3767 tty = resolve_dev_console(&active);
3772 return tty_is_vc(tty);
/* Returns a static "TERM=..." assignment for 'tty': "TERM=linux" if
 * tty_is_vc_resolve() accepts it, "TERM=vt102" otherwise. */
const char *default_term_for_tty(const char *tty) {
        assert(tty);

        if (tty_is_vc_resolve(tty))
                return "TERM=linux";

        return "TERM=vt102";
}
/* Returns true if the directory entry is not rejected by ignore_file()
 * and its type is regular file, symlink or unknown. */
bool dirent_is_file(const struct dirent *de) {
        assert(de);

        if (ignore_file(de->d_name))
                return false;

        switch (de->d_type) {

        case DT_REG:
        case DT_LNK:
        case DT_UNKNOWN:
                return true;

        default:
                return false;
        }
}
/* Returns true if the directory entry has type regular file, symlink
 * or unknown, is not rejected by ignore_file_allow_backup(), and its
 * name ends in 'suffix'. */
bool dirent_is_file_with_suffix(const struct dirent *de, const char *suffix) {
        assert(de);

        switch (de->d_type) {

        case DT_REG:
        case DT_LNK:
        case DT_UNKNOWN:
                break;

        default:
                return false;
        }

        if (ignore_file_allow_backup(de->d_name))
                return false;

        return endswith(de->d_name, suffix) != NULL;
}
3809 void execute_directory(const char *directory, DIR *d, usec_t timeout, char *argv[]) {
3815 /* Executes all binaries in a directory in parallel and waits
3816 * for them to finish. Optionally a timeout is applied. */
3818 executor_pid = fork();
3819 if (executor_pid < 0) {
3820 log_error("Failed to fork: %m");
3823 } else if (executor_pid == 0) {
3824 _cleanup_hashmap_free_free_ Hashmap *pids = NULL;
3825 _cleanup_closedir_ DIR *_d = NULL;
3829 /* We fork this all off from a child process so that
3830 * we can somewhat cleanly make use of SIGALRM to set
3833 reset_all_signal_handlers();
3835 assert_se(sigemptyset(&ss) == 0);
3836 assert_se(sigprocmask(SIG_SETMASK, &ss, NULL) == 0);
3838 assert_se(prctl(PR_SET_PDEATHSIG, SIGTERM) == 0);
3841 d = _d = opendir(directory);
3843 if (errno == ENOENT)
3844 _exit(EXIT_SUCCESS);
3846 log_error("Failed to enumerate directory %s: %m", directory);
3847 _exit(EXIT_FAILURE);
3851 pids = hashmap_new(NULL, NULL);
3854 _exit(EXIT_FAILURE);
3857 FOREACH_DIRENT(de, d, break) {
3858 _cleanup_free_ char *path = NULL;
3861 if (!dirent_is_file(de))
3864 path = strjoin(directory, "/", de->d_name, NULL);
3867 _exit(EXIT_FAILURE);
3872 log_error("Failed to fork: %m");
3874 } else if (pid == 0) {
3877 assert_se(prctl(PR_SET_PDEATHSIG, SIGTERM) == 0);
3887 log_error("Failed to execute %s: %m", path);
3888 _exit(EXIT_FAILURE);
3892 log_debug("Spawned %s as " PID_FMT ".", path, pid);
3894 r = hashmap_put(pids, UINT_TO_PTR(pid), path);
3897 _exit(EXIT_FAILURE);
3903 /* Abort execution of this process after the
3904 * timeout. We simply rely on SIGALRM as default action
3905 * terminating the process, and turn on alarm(). */
3907 if (timeout != (usec_t) -1)
3908 alarm((timeout + USEC_PER_SEC - 1) / USEC_PER_SEC);
3910 while (!hashmap_isempty(pids)) {
3911 _cleanup_free_ char *path = NULL;
3914 pid = PTR_TO_UINT(hashmap_first_key(pids));
3917 path = hashmap_remove(pids, UINT_TO_PTR(pid));
3920 wait_for_terminate_and_warn(path, pid);
3923 _exit(EXIT_SUCCESS);
3926 wait_for_terminate_and_warn(directory, executor_pid);
3929 int kill_and_sigcont(pid_t pid, int sig) {
3932 r = kill(pid, sig) < 0 ? -errno : 0;
3940 bool nulstr_contains(const char*nulstr, const char *needle) {
3946 NULSTR_FOREACH(i, nulstr)
3947 if (streq(i, needle))
/* Returns true if /run/plymouth/pid exists (as seen by access() with
 * F_OK). */
bool plymouth_running(void) {
        if (access("/run/plymouth/pid", F_OK) < 0)
                return false;

        return true;
}
3957 char* strshorten(char *s, size_t l) {
3966 static bool hostname_valid_char(char c) {
3968 (c >= 'a' && c <= 'z') ||
3969 (c >= 'A' && c <= 'Z') ||
3970 (c >= '0' && c <= '9') ||
3976 bool hostname_is_valid(const char *s) {
3983 for (p = s, dot = true; *p; p++) {
3990 if (!hostname_valid_char(*p))
4000 if (p-s > HOST_NAME_MAX)
4006 char* hostname_cleanup(char *s, bool lowercase) {
4010 for (p = s, d = s, dot = true; *p; p++) {
4017 } else if (hostname_valid_char(*p)) {
4018 *(d++) = lowercase ? tolower(*p) : *p;
4029 strshorten(s, HOST_NAME_MAX);
4034 bool machine_name_is_valid(const char *s) {
4036 if (!hostname_is_valid(s))
4039 /* Machine names should be useful hostnames, but also be
4040 * useful in unit names, hence we enforce a stricter length
4049 int pipe_eof(int fd) {
4050 struct pollfd pollfd = {
4052 .events = POLLIN|POLLHUP,
4057 r = poll(&pollfd, 1, 0);
4064 return pollfd.revents & POLLHUP;
4067 int fd_wait_for_event(int fd, int event, usec_t t) {
4069 struct pollfd pollfd = {
4077 r = ppoll(&pollfd, 1, t == (usec_t) -1 ? NULL : timespec_store(&ts, t), NULL);
4084 return pollfd.revents;
4087 int fopen_temporary(const char *path, FILE **_f, char **_temp_path) {
4096 t = tempfn_xxxxxx(path);
4100 fd = mkostemp_safe(t, O_WRONLY|O_CLOEXEC);
4106 f = fdopen(fd, "we");
/* Issues the TIOCVHANGUP ioctl on 'fd'. Returns 0 on success, -errno
 * on failure. */
int terminal_vhangup_fd(int fd) {
        assert(fd >= 0);

        return ioctl(fd, TIOCVHANGUP) < 0 ? -errno : 0;
}
4128 int terminal_vhangup(const char *name) {
4129 _cleanup_close_ int fd;
4131 fd = open_terminal(name, O_RDWR|O_NOCTTY|O_CLOEXEC);
4135 return terminal_vhangup_fd(fd);
4138 int vt_disallocate(const char *name) {
4142 /* Deallocate the VT if possible. If not possible
4143 * (i.e. because it is the active one), at least clear it
4144 * entirely (including the scrollback buffer) */
4146 if (!startswith(name, "/dev/"))
4149 if (!tty_is_vc(name)) {
4150 /* So this is not a VT. I guess we cannot deallocate
4151 * it then. But let's at least clear the screen */
4153 fd = open_terminal(name, O_RDWR|O_NOCTTY|O_CLOEXEC);
4158 "\033[r" /* clear scrolling region */
4159 "\033[H" /* move home */
4160 "\033[2J", /* clear screen */
4167 if (!startswith(name, "/dev/tty"))
4170 r = safe_atou(name+8, &u);
4177 /* Try to deallocate */
4178 fd = open_terminal("/dev/tty0", O_RDWR|O_NOCTTY|O_CLOEXEC);
4182 r = ioctl(fd, VT_DISALLOCATE, u);
4191 /* Couldn't deallocate, so let's clear it fully with
4193 fd = open_terminal(name, O_RDWR|O_NOCTTY|O_CLOEXEC);
4198 "\033[r" /* clear scrolling region */
4199 "\033[H" /* move home */
4200 "\033[3J", /* clear screen including scrollback, requires Linux 2.6.40 */
4207 int symlink_atomic(const char *from, const char *to) {
4208 _cleanup_free_ char *t = NULL;
4213 t = tempfn_random(to);
4217 if (symlink(from, t) < 0)
4220 if (rename(t, to) < 0) {
4228 int mknod_atomic(const char *path, mode_t mode, dev_t dev) {
4229 _cleanup_free_ char *t = NULL;
4233 t = tempfn_random(path);
4237 if (mknod(t, mode, dev) < 0)
4240 if (rename(t, path) < 0) {
4248 int mkfifo_atomic(const char *path, mode_t mode) {
4249 _cleanup_free_ char *t = NULL;
4253 t = tempfn_random(path);
4257 if (mkfifo(t, mode) < 0)
4260 if (rename(t, path) < 0) {
/* Returns true if 'display' starts with a colon immediately followed
 * by a decimal digit (e.g. ":0"). */
bool display_is_local(const char *display) {
        assert(display);

        if (display[0] != ':')
                return false;

        return display[1] >= '0' && display[1] <= '9';
}
4277 int socket_from_display(const char *display, char **path) {
4284 if (!display_is_local(display))
4287 k = strspn(display+1, "0123456789");
4289 f = new(char, strlen("/tmp/.X11-unix/X") + k + 1);
4293 c = stpcpy(f, "/tmp/.X11-unix/X");
4294 memcpy(c, display+1, k);
4303 const char **username,
4304 uid_t *uid, gid_t *gid,
4306 const char **shell) {
4314 /* We enforce some special rules for uid=0: in order to avoid
4315 * NSS lookups for root we hardcode its data. */
4317 if (streq(*username, "root") || streq(*username, "0")) {
4335 if (parse_uid(*username, &u) >= 0) {
4339 /* If there are multiple users with the same id, make
4340 * sure to leave $USER to the configured value instead
4341 * of the first occurrence in the database. However if
4342 * the uid was configured by a numeric uid, then let's
4343 * pick the real username from /etc/passwd. */
4345 *username = p->pw_name;
4348 p = getpwnam(*username);
4352 return errno > 0 ? -errno : -ESRCH;
4364 *shell = p->pw_shell;
4369 char* uid_to_name(uid_t uid) {
4374 return strdup("root");
4378 return strdup(p->pw_name);
4380 if (asprintf(&r, UID_FMT, uid) < 0)
4386 char* gid_to_name(gid_t gid) {
4391 return strdup("root");
4395 return strdup(p->gr_name);
4397 if (asprintf(&r, GID_FMT, gid) < 0)
4403 int get_group_creds(const char **groupname, gid_t *gid) {
4409 /* We enforce some special rules for gid=0: in order to avoid
4410 * NSS lookups for root we hardcode its data. */
4412 if (streq(*groupname, "root") || streq(*groupname, "0")) {
4413 *groupname = "root";
4421 if (parse_gid(*groupname, &id) >= 0) {
4426 *groupname = g->gr_name;
4429 g = getgrnam(*groupname);
4433 return errno > 0 ? -errno : -ESRCH;
4441 int in_gid(gid_t gid) {
4443 int ngroups_max, r, i;
4445 if (getgid() == gid)
4448 if (getegid() == gid)
4451 ngroups_max = sysconf(_SC_NGROUPS_MAX);
4452 assert(ngroups_max > 0);
4454 gids = alloca(sizeof(gid_t) * ngroups_max);
4456 r = getgroups(ngroups_max, gids);
4460 for (i = 0; i < r; i++)
4467 int in_group(const char *name) {
4471 r = get_group_creds(&name, &gid);
4478 int glob_exists(const char *path) {
4479 _cleanup_globfree_ glob_t g = {};
4485 k = glob(path, GLOB_NOSORT|GLOB_BRACE, NULL, &g);
4487 if (k == GLOB_NOMATCH)
4489 else if (k == GLOB_NOSPACE)
4492 return !strv_isempty(g.gl_pathv);
4494 return errno ? -errno : -EIO;
4497 int glob_extend(char ***strv, const char *path) {
4498 _cleanup_globfree_ glob_t g = {};
4503 k = glob(path, GLOB_NOSORT|GLOB_BRACE, NULL, &g);
4505 if (k == GLOB_NOMATCH)
4507 else if (k == GLOB_NOSPACE)
4509 else if (k != 0 || strv_isempty(g.gl_pathv))
4510 return errno ? -errno : -EIO;
4512 STRV_FOREACH(p, g.gl_pathv) {
4513 k = strv_extend(strv, *p);
4521 int dirent_ensure_type(DIR *d, struct dirent *de) {
4527 if (de->d_type != DT_UNKNOWN)
4530 if (fstatat(dirfd(d), de->d_name, &st, AT_SYMLINK_NOFOLLOW) < 0)
4534 S_ISREG(st.st_mode) ? DT_REG :
4535 S_ISDIR(st.st_mode) ? DT_DIR :
4536 S_ISLNK(st.st_mode) ? DT_LNK :
4537 S_ISFIFO(st.st_mode) ? DT_FIFO :
4538 S_ISSOCK(st.st_mode) ? DT_SOCK :
4539 S_ISCHR(st.st_mode) ? DT_CHR :
4540 S_ISBLK(st.st_mode) ? DT_BLK :
4546 int get_files_in_directory(const char *path, char ***list) {
4547 _cleanup_closedir_ DIR *d = NULL;
4548 size_t bufsize = 0, n = 0;
4549 _cleanup_strv_free_ char **l = NULL;
4553 /* Returns all files in a directory in *list, and the number
4554 * of files as return value. If list is NULL returns only the
4566 if (!de && errno != 0)
4571 dirent_ensure_type(d, de);
4573 if (!dirent_is_file(de))
4577 /* one extra slot is needed for the terminating NULL */
4578 if (!GREEDY_REALLOC(l, bufsize, n + 2))
4581 l[n] = strdup(de->d_name);
4592 l = NULL; /* avoid freeing */
4598 char *strjoin(const char *x, ...) {
4612 t = va_arg(ap, const char *);
4617 if (n > ((size_t) -1) - l) {
4641 t = va_arg(ap, const char *);
4655 bool is_main_thread(void) {
4656 static thread_local int cached = 0;
4658 if (_unlikely_(cached == 0))
4659 cached = getpid() == gettid() ? 1 : -1;
4664 int block_get_whole_disk(dev_t d, dev_t *ret) {
4671 /* If it has a queue this is good enough for us */
4672 if (asprintf(&p, "/sys/dev/block/%u:%u/queue", major(d), minor(d)) < 0)
4675 r = access(p, F_OK);
4683 /* If it is a partition find the originating device */
4684 if (asprintf(&p, "/sys/dev/block/%u:%u/partition", major(d), minor(d)) < 0)
4687 r = access(p, F_OK);
4693 /* Get parent dev_t */
4694 if (asprintf(&p, "/sys/dev/block/%u:%u/../dev", major(d), minor(d)) < 0)
4697 r = read_one_line_file(p, &s);
4703 r = sscanf(s, "%u:%u", &m, &n);
4709 /* Only return this if it is really good enough for us. */
4710 if (asprintf(&p, "/sys/dev/block/%u:%u/queue", m, n) < 0)
4713 r = access(p, F_OK);
4717 *ret = makedev(m, n);
/* lstat()s 'p' and reports whether it has the sticky bit set and is
 * owned by root or by the calling user.
 *
 * Returns 1 if both conditions hold, 0 if not, or -errno if lstat()
 * fails. */
int file_is_priv_sticky(const char *p) {
        struct stat st;

        assert(p);

        if (lstat(p, &st) < 0)
                return -errno;

        if (!(st.st_mode & S_ISVTX))
                return 0;

        return st.st_uid == 0 || st.st_uid == getuid();
}
4737 static const char *const ioprio_class_table[] = {
4738 [IOPRIO_CLASS_NONE] = "none",
4739 [IOPRIO_CLASS_RT] = "realtime",
4740 [IOPRIO_CLASS_BE] = "best-effort",
4741 [IOPRIO_CLASS_IDLE] = "idle"
4744 DEFINE_STRING_TABLE_LOOKUP_WITH_FALLBACK(ioprio_class, int, INT_MAX);
4746 static const char *const sigchld_code_table[] = {
4747 [CLD_EXITED] = "exited",
4748 [CLD_KILLED] = "killed",
4749 [CLD_DUMPED] = "dumped",
4750 [CLD_TRAPPED] = "trapped",
4751 [CLD_STOPPED] = "stopped",
4752 [CLD_CONTINUED] = "continued",
4755 DEFINE_STRING_TABLE_LOOKUP(sigchld_code, int);
4757 static const char *const log_facility_unshifted_table[LOG_NFACILITIES] = {
4758 [LOG_FAC(LOG_KERN)] = "kern",
4759 [LOG_FAC(LOG_USER)] = "user",
4760 [LOG_FAC(LOG_MAIL)] = "mail",
4761 [LOG_FAC(LOG_DAEMON)] = "daemon",
4762 [LOG_FAC(LOG_AUTH)] = "auth",
4763 [LOG_FAC(LOG_SYSLOG)] = "syslog",
4764 [LOG_FAC(LOG_LPR)] = "lpr",
4765 [LOG_FAC(LOG_NEWS)] = "news",
4766 [LOG_FAC(LOG_UUCP)] = "uucp",
4767 [LOG_FAC(LOG_CRON)] = "cron",
4768 [LOG_FAC(LOG_AUTHPRIV)] = "authpriv",
4769 [LOG_FAC(LOG_FTP)] = "ftp",
4770 [LOG_FAC(LOG_LOCAL0)] = "local0",
4771 [LOG_FAC(LOG_LOCAL1)] = "local1",
4772 [LOG_FAC(LOG_LOCAL2)] = "local2",
4773 [LOG_FAC(LOG_LOCAL3)] = "local3",
4774 [LOG_FAC(LOG_LOCAL4)] = "local4",
4775 [LOG_FAC(LOG_LOCAL5)] = "local5",
4776 [LOG_FAC(LOG_LOCAL6)] = "local6",
4777 [LOG_FAC(LOG_LOCAL7)] = "local7"
4780 DEFINE_STRING_TABLE_LOOKUP_WITH_FALLBACK(log_facility_unshifted, int, LOG_FAC(~0));
4782 static const char *const log_level_table[] = {
4783 [LOG_EMERG] = "emerg",
4784 [LOG_ALERT] = "alert",
4785 [LOG_CRIT] = "crit",
4787 [LOG_WARNING] = "warning",
4788 [LOG_NOTICE] = "notice",
4789 [LOG_INFO] = "info",
4790 [LOG_DEBUG] = "debug"
4793 DEFINE_STRING_TABLE_LOOKUP_WITH_FALLBACK(log_level, int, LOG_DEBUG);
4795 static const char* const sched_policy_table[] = {
4796 [SCHED_OTHER] = "other",
4797 [SCHED_BATCH] = "batch",
4798 [SCHED_IDLE] = "idle",
4799 [SCHED_FIFO] = "fifo",
4803 DEFINE_STRING_TABLE_LOOKUP_WITH_FALLBACK(sched_policy, int, INT_MAX);
4805 static const char* const rlimit_table[_RLIMIT_MAX] = {
4806 [RLIMIT_CPU] = "LimitCPU",
4807 [RLIMIT_FSIZE] = "LimitFSIZE",
4808 [RLIMIT_DATA] = "LimitDATA",
4809 [RLIMIT_STACK] = "LimitSTACK",
4810 [RLIMIT_CORE] = "LimitCORE",
4811 [RLIMIT_RSS] = "LimitRSS",
4812 [RLIMIT_NOFILE] = "LimitNOFILE",
4813 [RLIMIT_AS] = "LimitAS",
4814 [RLIMIT_NPROC] = "LimitNPROC",
4815 [RLIMIT_MEMLOCK] = "LimitMEMLOCK",
4816 [RLIMIT_LOCKS] = "LimitLOCKS",
4817 [RLIMIT_SIGPENDING] = "LimitSIGPENDING",
4818 [RLIMIT_MSGQUEUE] = "LimitMSGQUEUE",
4819 [RLIMIT_NICE] = "LimitNICE",
4820 [RLIMIT_RTPRIO] = "LimitRTPRIO",
4821 [RLIMIT_RTTIME] = "LimitRTTIME"
4824 DEFINE_STRING_TABLE_LOOKUP(rlimit, int);
4826 static const char* const ip_tos_table[] = {
4827 [IPTOS_LOWDELAY] = "low-delay",
4828 [IPTOS_THROUGHPUT] = "throughput",
4829 [IPTOS_RELIABILITY] = "reliability",
4830 [IPTOS_LOWCOST] = "low-cost",
4833 DEFINE_STRING_TABLE_LOOKUP_WITH_FALLBACK(ip_tos, int, 0xff);
4835 static const char *const __signal_table[] = {
4852 [SIGSTKFLT] = "STKFLT", /* Linux on SPARC doesn't know SIGSTKFLT */
4863 [SIGVTALRM] = "VTALRM",
4865 [SIGWINCH] = "WINCH",
4871 DEFINE_PRIVATE_STRING_TABLE_LOOKUP(__signal, int);
4873 const char *signal_to_string(int signo) {
4874 static thread_local char buf[sizeof("RTMIN+")-1 + DECIMAL_STR_MAX(int) + 1];
4877 name = __signal_to_string(signo);
4881 if (signo >= SIGRTMIN && signo <= SIGRTMAX)
4882 snprintf(buf, sizeof(buf), "RTMIN+%d", signo - SIGRTMIN);
4884 snprintf(buf, sizeof(buf), "%d", signo);
4889 int signal_from_string(const char *s) {
4894 signo = __signal_from_string(s);
4898 if (startswith(s, "RTMIN+")) {
4902 if (safe_atou(s, &u) >= 0) {
4903 signo = (int) u + offset;
4904 if (signo > 0 && signo < _NSIG)
4910 bool kexec_loaded(void) {
4911 bool loaded = false;
4914 if (read_one_line_file("/sys/kernel/kexec_loaded", &s) >= 0) {
4922 int strdup_or_null(const char *a, char **b) {
4940 int prot_from_flags(int flags) {
4942 switch (flags & O_ACCMODE) {
4951 return PROT_READ|PROT_WRITE;
4958 char *format_bytes(char *buf, size_t l, off_t t) {
4961 static const struct {
4965 { "E", 1024ULL*1024ULL*1024ULL*1024ULL*1024ULL*1024ULL },
4966 { "P", 1024ULL*1024ULL*1024ULL*1024ULL*1024ULL },
4967 { "T", 1024ULL*1024ULL*1024ULL*1024ULL },
4968 { "G", 1024ULL*1024ULL*1024ULL },
4969 { "M", 1024ULL*1024ULL },
4973 for (i = 0; i < ELEMENTSOF(table); i++) {
4975 if (t >= table[i].factor) {
4978 (unsigned long long) (t / table[i].factor),
4979 (unsigned long long) (((t*10ULL) / table[i].factor) % 10ULL),
4986 snprintf(buf, l, "%lluB", (unsigned long long) t);
4994 void* memdup(const void *p, size_t l) {
5007 int fd_inc_sndbuf(int fd, size_t n) {
5009 socklen_t l = sizeof(value);
5011 r = getsockopt(fd, SOL_SOCKET, SO_SNDBUF, &value, &l);
5012 if (r >= 0 && l == sizeof(value) && (size_t) value >= n*2)
5015 /* If we have the privileges we will ignore the kernel limit. */
5018 if (setsockopt(fd, SOL_SOCKET, SO_SNDBUFFORCE, &value, sizeof(value)) < 0)
5019 if (setsockopt(fd, SOL_SOCKET, SO_SNDBUF, &value, sizeof(value)) < 0)
/* Tries to enlarge the receive buffer (SO_RCVBUF) of socket fd to n bytes.
 * The current size is queried first; if it already is at least n*2 nothing
 * more appears to be needed (presumably because the kernel reports twice the
 * configured value, see socket(7) -- confirm). Otherwise SO_RCVBUFFORCE is
 * tried before falling back to plain SO_RCVBUF. */
5025 int fd_inc_rcvbuf(int fd, size_t n) {
5027 socklen_t l = sizeof(value);
5029 r = getsockopt(fd, SOL_SOCKET, SO_RCVBUF, &value, &l);
5030 if (r >= 0 && l == sizeof(value) && (size_t) value >= n*2)
5033 /* If we have the privileges we will ignore the kernel limit. */
5036 if (setsockopt(fd, SOL_SOCKET, SO_RCVBUFFORCE, &value, sizeof(value)) < 0)
5037 if (setsockopt(fd, SOL_SOCKET, SO_RCVBUF, &value, sizeof(value)) < 0)
/* Forks off a helper ("agent") process that runs path with the
 * NULL-terminated variadic argument list. Visible child-side steps: arrange
 * for SIGTERM when the parent dies, exit if the parent is already gone,
 * close every fd not listed in except[], point stdout and stderr at /dev/tty
 * when either of them is not a TTY, then assemble the argument vector on the
 * stack. NOTE(review): the fork and exec calls themselves are not part of
 * this excerpt. */
5042 int fork_agent(pid_t *pid, const int except[], unsigned n_except, const char *path, ...) {
5043 pid_t parent_pid, agent_pid;
5045 bool stdout_is_tty, stderr_is_tty;
5053 parent_pid = getpid();
5055 /* Spawns a temporary TTY agent, making sure it goes away when
5062 if (agent_pid != 0) {
5069 * Make sure the agent goes away when the parent dies */
5070 if (prctl(PR_SET_PDEATHSIG, SIGTERM) < 0)
5071 _exit(EXIT_FAILURE);
5073 /* Check whether our parent died before we were able
5074 * to set the death signal */
5075 if (getppid() != parent_pid)
5076 _exit(EXIT_SUCCESS);
5078 /* Don't leak fds to the agent */
5079 close_all_fds(except, n_except);
5081 stdout_is_tty = isatty(STDOUT_FILENO);
5082 stderr_is_tty = isatty(STDERR_FILENO);
5084 if (!stdout_is_tty || !stderr_is_tty) {
5085 /* Detach from stdout/stderr and reopen
5086 * /dev/tty for them. This is important to
5087 * ensure that when systemctl is started via
5088 * popen() or a similar call that expects to
5089 * read EOF we actually do generate EOF and
5090 * not delay this indefinitely because we
5091 * keep an unused copy of stdin around
5091 * (NOTE(review): the code below replaces
5091 * stdout/stderr, not stdin). */
5092 fd = open("/dev/tty", O_WRONLY);
5094 log_error("Failed to open /dev/tty: %m");
5095 _exit(EXIT_FAILURE);
5099 dup2(fd, STDOUT_FILENO);
5102 dup2(fd, STDERR_FILENO);
5108 /* Count arguments */
5110 for (n = 0; va_arg(ap, char*); n++)
5115 l = alloca(sizeof(char *) * (n + 1));
5117 /* Fill in arguments */
5119 for (i = 0; i <= n; i++)
5120 l[i] = va_arg(ap, char*);
5124 _exit(EXIT_FAILURE);
/* Applies the resource limit rlim. If setrlimit() refuses it, the current
 * limits are queried and both the soft and the hard value are clamped to
 * the current hard limit (highest.rlim_max) before trying once more. */
5127 int setrlimit_closest(int resource, const struct rlimit *rlim) {
5128 struct rlimit highest, fixed;
5132 if (setrlimit(resource, rlim) >= 0)
5138 /* So we failed to set the desired setrlimit, then let's try
5139 * to get as close as we can */
5140 assert_se(getrlimit(resource, &highest) == 0);
5142 fixed.rlim_cur = MIN(rlim->rlim_cur, highest.rlim_max);
5143 fixed.rlim_max = MIN(rlim->rlim_max, highest.rlim_max);
5145 if (setrlimit(resource, &fixed) < 0)
/* Looks up the environment variable field of process pid by reading the
 * "environ" file of that process in procfs. Entries are collected into a
 * LINE_MAX sized buffer, at most sizeof(line)-1 bytes each. When an entry
 * starts with field followed by '=', the text after the '=' is duplicated
 * with strdup(), presumably to be handed back through _value. */
5151 int getenv_for_pid(pid_t pid, const char *field, char **_value) {
5152 _cleanup_fclose_ FILE *f = NULL;
5163 path = procfs_file_alloca(pid, "environ");
5165 f = fopen(path, "re");
5173 char line[LINE_MAX];
5176 for (i = 0; i < sizeof(line)-1; i++) {
5180 if (_unlikely_(c == EOF)) {
5190 if (memcmp(line, field, l) == 0 && line[l] == '=') {
5191 value = strdup(line + l + 1);
/* Recognizes documentation URLs that start with one of the schemes http://,
 * https://, file:, info: or man: and have at least one more character after
 * the scheme prefix (presumably returning true for those). */
5205 bool is_valid_documentation_url(const char *url) {
5208 if (startswith(url, "http://") && url[7])
5211 if (startswith(url, "https://") && url[8])
5214 if (startswith(url, "file:") && url[5])
5217 if (startswith(url, "info:") && url[5])
5220 if (startswith(url, "man:") && url[4])
/* Tells whether we are running in an initrd. The answer is kept in the
 * static variable saved, which starts out as -1 (presumably meaning "not
 * determined yet") and is assigned the combined result of the checks
 * described below. */
5226 bool in_initrd(void) {
5227 static int saved = -1;
5233 /* We make two checks here:
5235 * 1. the flag file /etc/initrd-release must exist
5236 * 2. the root file system must be a memory file system
5238 * The second check is extra paranoia, since misdetecting an
5239 * initrd can have bad bad consequences due the initrd
5240 * emptying when transititioning to the main systemd.
5243 saved = access("/etc/initrd-release", F_OK) >= 0 &&
5244 statfs("/", &s) >= 0 &&
5245 is_temporary_fs(&s);
/* Plays a short warning tune on the console: three tones of 125ms each are
 * requested via the KIOCSOUND ioctl on /dev/console, with arguments
 * 1193180/440, 1193180/220 and 1193180/220 (presumably clock divisors for
 * 440Hz and 220Hz, see console_ioctl(4)), then the sound is switched off
 * again by passing 0. */
5250 void warn_melody(void) {
5251 _cleanup_close_ int fd = -1;
5253 fd = open("/dev/console", O_WRONLY|O_CLOEXEC|O_NOCTTY);
5257 /* Yeah, this is synchronous. Kinda sucks. But well... */
5259 ioctl(fd, KIOCSOUND, (int)(1193180/440));
5260 usleep(125*USEC_PER_MSEC);
5262 ioctl(fd, KIOCSOUND, (int)(1193180/220));
5263 usleep(125*USEC_PER_MSEC);
5265 ioctl(fd, KIOCSOUND, (int)(1193180/220));
5266 usleep(125*USEC_PER_MSEC);
5268 ioctl(fd, KIOCSOUND, 0);
/* Acquires /dev/console via acquire_terminal() and then duplicates the
 * resulting fd (onto stdin/stdout/stderr, going by the comment below).
 * A failure of either step is logged with log_error(). */
5271 int make_console_stdio(void) {
5274 /* Make /dev/console the controlling terminal and stdin/stdout/stderr */
5276 fd = acquire_terminal("/dev/console", false, true, true, (usec_t) -1);
5278 log_error("Failed to acquire terminal: %s", strerror(-fd));
5284 log_error("Failed to duplicate terminal fd: %s", strerror(-r));
/* Determines the home directory of the calling user as a newly allocated
 * string (presumably returned through _h). Sources in order of appearance:
 * $HOME read with secure_getenv() and used only if absolute, the fixed path
 * /root for root, and finally the user database, whose pw_dir must be an
 * absolute path. A failed database lookup yields -errno, or -ESRCH if errno
 * is not set. */
5291 int get_home_dir(char **_h) {
5299 /* Take the user specified one */
5300 e = secure_getenv("HOME");
5301 if (e && path_is_absolute(e)) {
5310 /* Hardcode home directory for root to avoid NSS */
5313 h = strdup("/root");
5321 /* Check the database... */
5325 return errno > 0 ? -errno : -ESRCH;
5327 if (!path_is_absolute(p->pw_dir))
5330 h = strdup(p->pw_dir);
/* Determines the login shell of the calling user as a newly allocated
 * string (presumably returned through _s). Sources in order of appearance:
 * $SHELL, the fixed path /bin/sh for root, and finally the user database,
 * whose pw_shell must be an absolute path. A failed database lookup yields
 * -errno, or -ESRCH if errno is not set.
 * NOTE(review): $SHELL is read with plain getenv() here, whereas
 * get_home_dir() uses secure_getenv() -- confirm this is intended. */
5338 int get_shell(char **_s) {
5346 /* Take the user specified one */
5347 e = getenv("SHELL");
5357 /* Hardcode shell for root to avoid NSS */
5360 s = strdup("/bin/sh");
5368 /* Check the database... */
5372 return errno > 0 ? -errno : -ESRCH;
5374 if (!path_is_absolute(p->pw_shell))
5377 s = strdup(p->pw_shell);
/* Validates a single file name. The only check visible in this excerpt is
 * the length limit: names longer than FILENAME_MAX are singled out
 * (presumably rejected by returning false). */
5385 bool filename_is_safe(const char *p) {
5399 if (strlen(p) > FILENAME_MAX)
/* Checks every character of p: control characters (0 < c < ' ') and the
 * characters listed in the strchr() set below (backslash, double quote,
 * single quote) are singled out, presumably marking the string as unsafe.
 * NOTE(review): the set literal ends in \0x7f, which is a NUL byte followed
 * by the text x7f. strchr() stops at that NUL, so DEL (0x7f) is never
 * matched; \x7f was probably intended. */
5405 bool string_is_safe(const char *p) {
5411 for (t = p; *t; t++) {
5412 if (*t > 0 && *t < ' ')
5415 if (strchr("\\\"\'\0x7f", *t))
5423 * Check if a string contains control characters. If 'ok' is non-NULL
5424 * it may be a string containing additional CCs to be considered OK.
/* Scans p for control characters (0 < c < ' '). Characters contained in the
 * optional string ok are tested for first, presumably to exempt them. */
5426 bool string_has_cc(const char *p, const char *ok) {
5431 for (t = p; *t; t++) {
5432 if (ok && strchr(ok, *t))
5435 if (*t > 0 && *t < ' ')
/* Sanity-checks the path p. The conditions tested are: a ".." component
 * anywhere, a length above PATH_MAX, a "." component anywhere, and a doubled
 * slash (each presumably making the path unsafe). */
5445 bool path_is_safe(const char *p) {
5450 if (streq(p, "..") || startswith(p, "../") || endswith(p, "/..") || strstr(p, "/../"))
5453 if (strlen(p) > PATH_MAX)
5456 /* The following two checks are not really dangerous, but hey, they still are confusing */
5457 if (streq(p, ".") || startswith(p, "./") || endswith(p, "/.") || strstr(p, "/./"))
5460 if (strstr(p, "//"))
5466 /* hey glibc, APIs with callbacks without a user pointer are so useless */
/* Search over the nmemb elements of the given size at base, using a
 * comparison callback that receives the extra user pointer arg. Each probe
 * addresses element idx as base + idx * size and compares key against it;
 * the sign of the result steers the search (presumably a binary search,
 * which requires sorted input -- confirm). */
5467 void *xbsearch_r(const void *key, const void *base, size_t nmemb, size_t size,
5468 int (*compar) (const void *, const void *, void *), void *arg) {
5477 p = (void *)(((const char *) base) + (idx * size));
5478 comparison = compar(key, p, arg);
5481 else if (comparison > 0)
/* Reports whether the current locale uses UTF-8. The answer is cached in a
 * static variable (-1 until determined) and reused on later calls. True is
 * assumed when setlocale() fails and when nl_langinfo(CODESET) reports
 * "UTF-8"; further special handling exists for the C locale. */
5489 bool is_locale_utf8(void) {
5491 static int cached_answer = -1;
5493 if (cached_answer >= 0)
5496 if (!setlocale(LC_ALL, "")) {
5497 cached_answer = true;
5501 set = nl_langinfo(CODESET);
5503 cached_answer = true;
5507 if (streq(set, "UTF-8")) {
5508 cached_answer = true;
5512 /* For LC_CTYPE=="C" return true, because CTYPE is effectively
5513 * unset and everything can do UTF-8 nowadays. */
5514 set = setlocale(LC_CTYPE, NULL);
5516 cached_answer = true;
5520 /* Check result, but ignore the result if C was set
5524 !getenv("LC_ALL") &&
5525 !getenv("LC_CTYPE") &&
5529 return (bool) cached_answer;
/* Returns the string used to draw the special character ch. The table has
 * two rows, UTF-8 byte sequences and an ASCII fallback; the row index is
 * !is_locale_utf8(), i.e. 0 in UTF-8 locales and 1 otherwise. */
5532 const char *draw_special_char(DrawSpecialChar ch) {
5533 static const char *draw_table[2][_DRAW_SPECIAL_CHAR_MAX] = {
5536 [DRAW_TREE_VERTICAL] = "\342\224\202 ", /* │ */
5537 [DRAW_TREE_BRANCH] = "\342\224\234\342\224\200", /* ├─ */
5538 [DRAW_TREE_RIGHT] = "\342\224\224\342\224\200", /* └─ */
5539 [DRAW_TREE_SPACE] = " ", /* */
5540 [DRAW_TRIANGULAR_BULLET] = "\342\200\243", /* ‣ */
5541 [DRAW_BLACK_CIRCLE] = "\342\227\217", /* ● */
5542 [DRAW_ARROW] = "\342\206\222", /* → */
5543 [DRAW_DASH] = "\342\200\223", /* – */
5546 /* ASCII fallback */ {
5547 [DRAW_TREE_VERTICAL] = "| ",
5548 [DRAW_TREE_BRANCH] = "|-",
5549 [DRAW_TREE_RIGHT] = "`-",
5550 [DRAW_TREE_SPACE] = " ",
5551 [DRAW_TRIANGULAR_BULLET] = ">",
5552 [DRAW_BLACK_CIRCLE] = "*",
5553 [DRAW_ARROW] = "->",
5558 return draw_table[!is_locale_utf8()][ch];
/* Builds a new string from text in which occurrences of old_string are
 * replaced by new_string. At each match the output buffer is resized with
 * realloc() to l - old_len + new_len (+1) bytes before new_string is copied
 * in with stpcpy(). */
5561 char *strreplace(const char *text, const char *old_string, const char *new_string) {
5564 size_t l, old_len, new_len;
5570 old_len = strlen(old_string);
5571 new_len = strlen(new_string);
5584 if (!startswith(f, old_string)) {
5590 nl = l - old_len + new_len;
5591 a = realloc(r, nl + 1);
5599 t = stpcpy(t, new_string);
/* Filters the buffer *ibuf as described in the comment below. The input
 * length is *_isz if _isz is given, otherwise strlen(*ibuf). Output is
 * written through an open_memstream() stream by a small state machine
 * (STATE_OTHER, STATE_ESCAPE, STATE_BRACKET) that deliberately iterates one
 * position past the end of the input so that end-of-text (EOT) is handled
 * in every state. Inside a bracket sequence only digits, ';' and the final
 * 'm' are accepted. */
5611 char *strip_tab_ansi(char **ibuf, size_t *_isz) {
5612 const char *i, *begin = NULL;
5617 } state = STATE_OTHER;
5619 size_t osz = 0, isz;
5625 /* Strips ANSI color and replaces TABs by 8 spaces */
5627 isz = _isz ? *_isz : strlen(*ibuf);
5629 f = open_memstream(&obuf, &osz);
5633 for (i = *ibuf; i < *ibuf + isz + 1; i++) {
5638 if (i >= *ibuf + isz) /* EOT */
5640 else if (*i == '\x1B')
5641 state = STATE_ESCAPE;
5642 else if (*i == '\t')
5649 if (i >= *ibuf + isz) { /* EOT */
5652 } else if (*i == '[') {
5653 state = STATE_BRACKET;
5658 state = STATE_OTHER;
5665 if (i >= *ibuf + isz || /* EOT */
5666 (!(*i >= '0' && *i <= '9') && *i != ';' && *i != 'm')) {
5669 state = STATE_OTHER;
5671 } else if (*i == 'm')
5672 state = STATE_OTHER;
/* Determines whether the system runs on AC power by scanning the entries of
 * /sys/class/power_supply. For each entry the "type" attribute is compared
 * against "Mains\n", and the "online" attribute is expected to be a single
 * character followed by a newline, where 1 counts as online and 0 as
 * offline. The result is true if some supply was found online, or if no
 * offline supply was seen at all. */
5694 int on_ac_power(void) {
5695 bool found_offline = false, found_online = false;
5696 _cleanup_closedir_ DIR *d = NULL;
5698 d = opendir("/sys/class/power_supply");
5704 _cleanup_close_ int fd = -1, device = -1;
5710 if (!de && errno != 0)
5716 if (ignore_file(de->d_name))
5719 device = openat(dirfd(d), de->d_name, O_DIRECTORY|O_RDONLY|O_CLOEXEC|O_NOCTTY);
5721 if (errno == ENOENT || errno == ENOTDIR)
5727 fd = openat(device, "type", O_RDONLY|O_CLOEXEC|O_NOCTTY);
5729 if (errno == ENOENT)
5735 n = read(fd, contents, sizeof(contents));
5739 if (n != 6 || memcmp(contents, "Mains\n", 6))
5743 fd = openat(device, "online", O_RDONLY|O_CLOEXEC|O_NOCTTY);
5745 if (errno == ENOENT)
5751 n = read(fd, contents, sizeof(contents));
5755 if (n != 2 || contents[1] != '\n')
5758 if (contents[0] == '1') {
5759 found_online = true;
5761 } else if (contents[0] == '0')
5762 found_offline = true;
5767 return found_online || !found_offline;
/* Helper for the search_and_fopen() variants. The search list is first
 * passed through path_strv_resolve_uniq(); then for each directory a
 * candidate path is built as [root] + dir + "/" + path. An errno other than
 * ENOENT is treated specially (presumably it ends the search with an
 * error). */
5770 static int search_and_fopen_internal(const char *path, const char *mode, const char *root, char **search, FILE **_f) {
5777 if (!path_strv_resolve_uniq(search, root))
5780 STRV_FOREACH(i, search) {
5781 _cleanup_free_ char *p = NULL;
5785 p = strjoin(root, *i, "/", path, NULL);
5787 p = strjoin(*i, "/", path, NULL);
5797 if (errno != ENOENT)
/* Opens path with the given fopen() mode. An absolute path is opened
 * directly; otherwise a private copy of the search string vector is made and
 * handed to search_and_fopen_internal(), which may modify it. */
5804 int search_and_fopen(const char *path, const char *mode, const char *root, const char **search, FILE **_f) {
5805 _cleanup_strv_free_ char **copy = NULL;
5811 if (path_is_absolute(path)) {
5814 f = fopen(path, mode);
5823 copy = strv_copy((char**) search);
5827 return search_and_fopen_internal(path, mode, root, copy, _f);
/* Same as search_and_fopen(), except that the search directories are given
 * as a NUL-separated string list, which is converted with
 * strv_split_nulstr() before calling search_and_fopen_internal(). */
5830 int search_and_fopen_nulstr(const char *path, const char *mode, const char *root, const char *search, FILE **_f) {
5831 _cleanup_strv_free_ char **s = NULL;
5833 if (path_is_absolute(path)) {
5836 f = fopen(path, mode);
5845 s = strv_split_nulstr(search);
5849 return search_and_fopen_internal(path, mode, root, s, _f);
/* Appends the variadic list of strings to *x, which may be NULL (treated as
 * length 0). The argument list is walked twice: first to add up the total
 * length, with a guard against size_t overflow, then again after *x has been
 * resized with a single realloc() to l+1 bytes.
 * NOTE(review): the list terminator is not visible here; presumably NULL. */
5852 char *strextend(char **x, ...) {
5859 l = f = *x ? strlen(*x) : 0;
5866 t = va_arg(ap, const char *);
5871 if (n > ((size_t) -1) - l) {
5880 r = realloc(*x, l+1);
5890 t = va_arg(ap, const char *);
/* Returns a newly allocated buffer of l * n + 1 bytes that is filled in a
 * loop of n iterations, i.e. s repeated n times (l presumably being
 * strlen(s)).
 * NOTE(review): l * n is not checked for overflow in the lines shown. */
5904 char *strrep(const char *s, unsigned n) {
5912 p = r = malloc(l * n + 1);
5916 for (i = 0; i < n; i++)
/* Grows the array *p so that it can hold at least need elements of the given
 * size. Nothing needs to be done if *allocated already suffices. Otherwise
 * the new element count is the larger of need * 2 and 64u / size, the byte
 * count is checked against overflow, and *allocated is updated to the new
 * element count. */
5923 void* greedy_realloc(void **p, size_t *allocated, size_t need, size_t size) {
5930 if (*allocated >= need)
5933 newalloc = MAX(need * 2, 64u / size);
5934 a = newalloc * size;
5936 /* check for overflows */
5937 if (a < size * need)
5945 *allocated = newalloc;
/* Wrapper around greedy_realloc() that additionally zeroes the elements
 * gained by the call: when *allocated has grown beyond its previous value
 * prev, the bytes from prev * size up to the new end are cleared. */
5949 void* greedy_realloc0(void **p, size_t *allocated, size_t need, size_t size) {
5958 q = greedy_realloc(p, allocated, need, size);
5962 if (*allocated > prev)
5963 memzero(q + prev * size, (*allocated - prev) * size);
/* Validates the textual form of a 128bit ID. Two layouts are handled: the
 * plain hex string, and the 36 character UUID form in which positions 8, 13,
 * 18 and 23 are treated separately (presumably as dash separators).
 * NOTE(review): the character checks accept all of a-z and A-Z rather than
 * only the hex digits a-f and A-F -- confirm whether this is intended. */
5968 bool id128_is_valid(const char *s) {
5974 /* Simple formatted 128bit hex string */
5976 for (i = 0; i < l; i++) {
5979 if (!(c >= '0' && c <= '9') &&
5980 !(c >= 'a' && c <= 'z') &&
5981 !(c >= 'A' && c <= 'Z'))
5985 } else if (l == 36) {
5987 /* Formatted UUID */
5989 for (i = 0; i < l; i++) {
5992 if ((i == 8 || i == 13 || i == 18 || i == 23)) {
5996 if (!(c >= '0' && c <= '9') &&
5997 !(c >= 'a' && c <= 'z') &&
5998 !(c >= 'A' && c <= 'Z'))
/* Splits s at position x into two newly allocated strings: the part before
 * x, and the part that starts strlen(sep) characters after x. Presumably x
 * is where sep was found in s and the halves are returned through l and
 * r. */
6009 int split_pair(const char *s, const char *sep, char **l, char **r) {
6024 a = strndup(s, x - s);
6028 b = strdup(x + strlen(sep));
/* Evaluates the command line option systemd.restore_state=, whose value is
 * parsed with parse_boolean(). The command line comes from proc_cmdline();
 * a return value of 0 from it is treated as the container case. */
6040 int shall_restore_state(void) {
6041 _cleanup_free_ char *line = NULL;
6046 r = proc_cmdline(&line);
6049 if (r == 0) /* Container ... */
6054 FOREACH_WORD_QUOTED(w, l, line, state) {
6062 e = startswith(n, "systemd.restore_state=");
6066 k = parse_boolean(e);
/* Reads the command line. In a container (detect_container() > 0) the full
 * content of /proc/1/cmdline is read and post-processed byte by byte;
 * otherwise the first line of /proc/cmdline is read into *ret. */
6074 int proc_cmdline(char **ret) {
6077 if (detect_container(NULL) > 0) {
6078 char *buf = NULL, *p;
6081 r = read_full_file("/proc/1/cmdline", &buf, &sz);
6085 for (p = buf; p + 1 < buf + sz; p++)
6094 r = read_one_line_file("/proc/cmdline", ret);
/* Walks the words of the command line obtained from proc_cmdline() and hands
 * each one to parse_item(). A word is split at its first '=' to obtain the
 * value. Words starting with "rd." are singled out when not running in an
 * initrd (presumably skipped). Failure to read the command line is logged as
 * a warning only. */
6101 int parse_proc_cmdline(int (*parse_item)(const char *key, const char *value)) {
6102 _cleanup_free_ char *line = NULL;
6109 r = proc_cmdline(&line);
6111 log_warning("Failed to read /proc/cmdline, ignoring: %s", strerror(-r));
6115 FOREACH_WORD_QUOTED(w, l, line, state) {
6116 char word[l+1], *value;
6121 /* Filter out arguments that are intended only for the
6123 if (!in_initrd() && startswith(word, "rd."))
6126 value = strchr(word, '=');
6130 r = parse_item(word, value);
/* Looks up the leader PID of the given machine by parsing the LEADER and
 * CLASS fields from the file /run/systemd/machines/<machine>. Entries whose
 * class is not "container" are singled out (presumably rejected); the LEADER
 * value is converted with parse_pid(). */
6138 int container_get_leader(const char *machine, pid_t *pid) {
6139 _cleanup_free_ char *s = NULL, *class = NULL;
6147 p = strappenda("/run/systemd/machines/", machine);
6148 r = parse_env_file(p, NEWLINE, "LEADER", &s, "CLASS", &class, NULL);
6156 if (!streq_ptr(class, "container"))
6159 r = parse_pid(s, &leader);
/* Opens the namespace files ns/mnt, ns/pid and ns/net as well as the root
 * directory of process pid in procfs, and passes the descriptors to the
 * caller through the output parameters. The local auto-closing variables are
 * reset to -1 at the end so that the descriptors handed out stay open. */
6169 int namespace_open(pid_t pid, int *pidns_fd, int *mntns_fd, int *netns_fd, int *root_fd) {
6170 _cleanup_close_ int pidnsfd = -1, mntnsfd = -1, netnsfd = -1;
6178 mntns = procfs_file_alloca(pid, "ns/mnt");
6179 mntnsfd = open(mntns, O_RDONLY|O_NOCTTY|O_CLOEXEC);
6187 pidns = procfs_file_alloca(pid, "ns/pid");
6188 pidnsfd = open(pidns, O_RDONLY|O_NOCTTY|O_CLOEXEC);
6196 netns = procfs_file_alloca(pid, "ns/net");
6197 netnsfd = open(netns, O_RDONLY|O_NOCTTY|O_CLOEXEC);
6205 root = procfs_file_alloca(pid, "root");
6206 rfd = open(root, O_RDONLY|O_NOCTTY|O_CLOEXEC|O_DIRECTORY);
6212 *pidns_fd = pidnsfd;
6215 *mntns_fd = mntnsfd;
6218 *netns_fd = netnsfd;
6223 pidnsfd = mntnsfd = netnsfd = -1;
/* Moves the calling process into the given PID, mount and network namespaces
 * via setns(), changes the root directory to root_fd (fchdir() followed by
 * chroot(".")), and finally sets the group IDs to 0, clears the
 * supplementary groups and sets the user IDs to 0. */
6228 int namespace_enter(int pidns_fd, int mntns_fd, int netns_fd, int root_fd) {
6231 if (setns(pidns_fd, CLONE_NEWPID) < 0)
6235 if (setns(mntns_fd, CLONE_NEWNS) < 0)
6239 if (setns(netns_fd, CLONE_NEWNET) < 0)
6243 if (fchdir(root_fd) < 0)
6246 if (chroot(".") < 0)
6250 if (setresgid(0, 0, 0) < 0)
6253 if (setgroups(0, NULL) < 0)
6256 if (setresuid(0, 0, 0) < 0)
/* Probes pid with kill(pid, 0). If the probe fails, the PID still counts as
 * existing unless errno is ESRCH; a successful probe presumably yields
 * true. */
6262 bool pid_is_unwaited(pid_t pid) {
6263 /* Checks whether a PID is still valid at all, including a zombie */
6268 if (kill(pid, 0) >= 0)
6271 return errno != ESRCH;
/* Queries get_process_state() for pid and singles out the results -ENOENT
 * and 'Z' (zombie), presumably reporting the process as not alive in those
 * cases. */
6274 bool pid_is_alive(pid_t pid) {
6277 /* Checks whether a PID is still valid and not a zombie */
6282 r = get_process_state(pid);
6283 if (r == -ENOENT || r == 'Z')
/* Fetches the credentials of the peer of socket fd with SO_PEERCRED into a
 * local struct and verifies that exactly sizeof(struct ucred) bytes were
 * returned before the plausibility check mentioned below. */
6289 int getpeercred(int fd, struct ucred *ucred) {
6290 socklen_t n = sizeof(struct ucred);
6297 r = getsockopt(fd, SOL_SOCKET, SO_PEERCRED, &u, &n);
6301 if (n != sizeof(struct ucred))
6304 /* Check if the data is actually useful and not suppressed due
6305 * to namespacing issues */
/* Fetches the security label of the peer of socket fd with SO_PEERSEC. The
 * query appears twice: a first failure is examined for ERANGE and the call
 * is then repeated (presumably with a buffer of the size reported in n). */
6313 int getpeersec(int fd, char **ret) {
6325 r = getsockopt(fd, SOL_SOCKET, SO_PEERSEC, s, &n);
6329 if (errno != ERANGE)
6336 r = getsockopt(fd, SOL_SOCKET, SO_PEERSEC, s, &n);
6352 /* This is much like mkostemp() but is subject to umask(). */
/* Thin wrapper that calls mkostemp(pattern, flags). The variable u carries
 * the _cleanup_umask_ attribute, so the umask in effect is presumably
 * changed for the call and restored when u goes out of scope -- confirm
 * against the lines not shown here. */
6353 int mkostemp_safe(char *pattern, int flags) {
6354 _cleanup_umask_ mode_t u;
6361 fd = mkostemp(pattern, flags);
/* Creates a temporary file in the directory path. O_TMPFILE is tried first
 * with mode S_IRUSR|S_IWUSR; the fallback creates a file from the template
 * path + "/systemd-tmp-XXXXXX" via mkostemp_safe() and, going by the comment
 * below, unlinks it afterwards. */
6368 int open_tmpfile(const char *path, int flags) {
6375 /* Try O_TMPFILE first, if it is supported */
6376 fd = open(path, flags|O_TMPFILE, S_IRUSR|S_IWUSR);
6381 /* Fall back to unguessable name + unlinking */
6382 p = strappenda(path, "/systemd-tmp-XXXXXX");
6384 fd = mkostemp_safe(p, flags);
/* Logs warnings about questionable permissions of the configuration file
 * open as fd; path is only used in the messages. Three conditions are
 * checked on the fstat() result: any executable bit (0111), the
 * world-writable bit (0002) and, only when running as PID 1, group or other
 * read permission missing, i.e. (st_mode & 0044) != 0044. */
6392 int fd_warn_permissions(const char *path, int fd) {
6395 if (fstat(fd, &st) < 0)
6398 if (st.st_mode & 0111)
6399 log_warning("Configuration file %s is marked executable. Please remove executable permission bits. Proceeding anyway.", path);
6401 if (st.st_mode & 0002)
6402 log_warning("Configuration file %s is marked world-writable. Please remove world writability permission bits. Proceeding anyway.", path);
6404 if (getpid() == 1 && (st.st_mode & 0044) != 0044)
6405 log_warning("Configuration file %s is marked world-inaccessible. This has no effect as configuration data is accessible via APIs without restrictions. Proceeding anyway.", path);
/* Maps an architecture name to a personality value. When built for x86-64
 * the names "x86" and "x86-64" are recognized, when built for i386 only
 * "x86". Anything else yields 0xffffffffUL as error indicator. */
6410 unsigned long personality_from_string(const char *p) {
6412 /* Parse a personality specifier. We introduce our own
6413 * identifiers that indicate specific ABIs, rather than just
6414 * hints regarding the register size, since we want to keep
6415 * things open for multiple locally supported ABIs for the
6416 * same register size. We try to reuse the ABI identifiers
6417 * used by libseccomp. */
6419 #if defined(__x86_64__)
6421 if (streq(p, "x86"))
6424 if (streq(p, "x86-64"))
6427 #elif defined(__i386__)
6429 if (streq(p, "x86"))
6433 /* personality(7) documents that 0xffffffffUL is used for
6434 * querying the current personality, hence let's use that here
6435 * as error indicator. */
6436 return 0xffffffffUL;
/* Maps a personality value back to a name. Only the architecture
 * conditionals and a comparison against PER_LINUX32 (in the x86-64 branch)
 * are visible in this excerpt. */
6439 const char* personality_to_string(unsigned long p) {
6441 #if defined(__x86_64__)
6443 if (p == PER_LINUX32)
6449 #elif defined(__i386__)
/* Returns the amount of physical memory in bytes, computed as
 * sysconf(_SC_PHYS_PAGES) multiplied by page_size(), with both factors
 * widened to uint64_t before the multiplication. */
6458 uint64_t physical_memory(void) {
6461 /* We return this as uint64_t in case we are running as 32bit
6462 * process on a 64bit kernel with huge amounts of memory */
6464 mem = sysconf(_SC_PHYS_PAGES);
6467 return (uint64_t) mem * (uint64_t) page_size();
/* Searches the mount option string haystack for the option needle. The
 * string is wrapped in a struct mntent (as mnt_opts) so that hasmntopt() can
 * be used; its result is returned as is. */
6470 char* mount_test_option(const char *haystack, const char *needle) {
6472 struct mntent me = {
6473 .mnt_opts = (char*) haystack
6478 /* Like glibc's hasmntopt(), but works on a string, not a
6484 return hasmntopt(&me, needle);
/* Writes a hex dump of the s bytes at p to f. Each row starts with a four
 * digit hex offset, followed by up to 16 bytes as two digit hex values and
 * then the same bytes as characters, with non-printable ones shown as a
 * dot. p may only be NULL when s is 0. */
6487 void hexdump(FILE *f, const void *p, size_t s) {
6488 const uint8_t *b = p;
6491 assert(s == 0 || b);
6496 fprintf(f, "%04x ", n);
6498 for (i = 0; i < 16; i++) {
6503 fprintf(f, "%02x ", b[i]);
6511 for (i = 0; i < 16; i++) {
6516 fputc(isprint(b[i]) ? (char) b[i] : '.', f);
/* Stores param in REBOOT_PARAM_FILE via write_string_file() and logs an
 * error if that fails. A separate path removes the file with unlink()
 * (presumably taken when no parameter is given). */
6530 int update_reboot_param_file(const char *param) {
6535 r = write_string_file(REBOOT_PARAM_FILE, param);
6537 log_error("Failed to write reboot param to "
6538 REBOOT_PARAM_FILE": %s", strerror(-r));
6540 unlink(REBOOT_PARAM_FILE);
/* Unmounts the mount points below prefix, passing flags to umount2().
 * /proc/self/mountinfo is parsed with fscanf(), extracting only the mount
 * point field (5) of each line. That field is unescaped with cunescape() and
 * unmounted if path_startswith(p, prefix) holds. */
6545 int umount_recursive(const char *prefix, int flags) {
6549 /* Try to umount everything recursively below a
6550 * directory. Also, take care of stacked mounts, and keep
6551 * unmounting them until they are gone. */
6554 _cleanup_fclose_ FILE *proc_self_mountinfo = NULL;
6559 proc_self_mountinfo = fopen("/proc/self/mountinfo", "re");
6560 if (!proc_self_mountinfo)
6564 _cleanup_free_ char *path = NULL, *p = NULL;
6567 k = fscanf(proc_self_mountinfo,
6568 "%*s " /* (1) mount id */
6569 "%*s " /* (2) parent id */
6570 "%*s " /* (3) major:minor */
6571 "%*s " /* (4) root */
6572 "%ms " /* (5) mount point */
6573 "%*s" /* (6) mount options */
6574 "%*[^-]" /* (7) optional fields */
6575 "- " /* (8) separator */
6576 "%*s " /* (9) file system type */
6577 "%*s" /* (10) mount source */
6578 "%*s" /* (11) mount options 2 */
6579 "%*[^\n]", /* some rubbish at the end */
6588 p = cunescape(path);
6592 if (!path_startswith(p, prefix))
6595 if (umount2(p, flags) < 0) {
/* Remounts prefix and the mounts below it read-only (ro true) or read-write
 * (ro false); the strategy is described in the comment below. A copy of
 * prefix with redundant slashes removed (cleaned) is used for comparisons.
 * Mount points already handled are kept in the set done, pending ones in the
 * set todo, both keyed by path string. */
6611 int bind_remount_recursive(const char *prefix, bool ro) {
6612 _cleanup_set_free_free_ Set *done = NULL;
6613 _cleanup_free_ char *cleaned = NULL;
6616 /* Recursively remount a directory (and all its submounts)
6617 * read-only or read-write. If the directory is already
6618 * mounted, we reuse the mount and simply mark it
6619 * MS_BIND|MS_RDONLY (or remove the MS_RDONLY for read-write
6620 * operation). If it isn't we first make it one. Afterwards we
6621 * apply MS_BIND|MS_RDONLY (or remove MS_RDONLY) to all
6622 * submounts we can access, too. When mounts are stacked on
6623 * the same mount point we only care for each individual
6624 * "top-level" mount on each point, as we cannot
6625 * influence/access the underlying mounts anyway. We do not
6626 * have any effect on future submounts that might get
6627 * propagated, they might be writable. This includes future
6628 * submounts that have been triggered via autofs. */
6630 cleaned = strdup(prefix);
6634 path_kill_slashes(cleaned);
6636 done = set_new(string_hash_func, string_compare_func);
6641 _cleanup_fclose_ FILE *proc_self_mountinfo = NULL;
6642 _cleanup_set_free_free_ Set *todo = NULL;
6643 bool top_autofs = false;
6646 todo = set_new(string_hash_func, string_compare_func);
6650 proc_self_mountinfo = fopen("/proc/self/mountinfo", "re");
6651 if (!proc_self_mountinfo)
6655 _cleanup_free_ char *path = NULL, *p = NULL, *type = NULL;
6658 k = fscanf(proc_self_mountinfo,
6659 "%*s " /* (1) mount id */
6660 "%*s " /* (2) parent id */
6661 "%*s " /* (3) major:minor */
6662 "%*s " /* (4) root */
6663 "%ms " /* (5) mount point */
6664 "%*s" /* (6) mount options (superblock) */
6665 "%*[^-]" /* (7) optional fields */
6666 "- " /* (8) separator */
6667 "%ms " /* (9) file system type */
6668 "%*s" /* (10) mount source */
6669 "%*s" /* (11) mount options (bind mount) */
6670 "%*[^\n]", /* some rubbish at the end */
6680 p = cunescape(path);
6684 /* Let's ignore autofs mounts. If they aren't
6685 * triggered yet, we want to avoid triggering
6686 * them, as we don't make any guarantees for
6687 * future submounts anyway. If they are
6688 * already triggered, then we will find
6689 * another entry for this. */
6690 if (streq(type, "autofs")) {
6691 top_autofs = top_autofs || path_equal(cleaned, p);
6695 if (path_startswith(p, cleaned) &&
6696 !set_contains(done, p)) {
6698 r = set_consume(todo, p);
6708 /* If we have no submounts to process anymore and if
6709 * the root is either already done, or an autofs, we
6711 if (set_isempty(todo) &&
6712 (top_autofs || set_contains(done, cleaned)))
6715 if (!set_contains(done, cleaned) &&
6716 !set_contains(todo, cleaned)) {
6717 /* The prefix directory itself is not yet a
6718 * mount, make it one. */
6719 if (mount(cleaned, cleaned, NULL, MS_BIND|MS_REC, NULL) < 0)
/* NOTE(review): this remount is given prefix while the bind mount just above
 * and the bookkeeping below use cleaned -- confirm this is intended. */
6722 if (mount(NULL, prefix, NULL, MS_BIND|MS_REMOUNT|(ro ? MS_RDONLY : 0), NULL) < 0)
6725 x = strdup(cleaned);
6729 r = set_consume(done, x);
6734 while ((x = set_steal_first(todo))) {
6736 r = set_consume(done, x);
6742 if (mount(NULL, x, NULL, MS_BIND|MS_REMOUNT|(ro ? MS_RDONLY : 0), NULL) < 0) {
6744 /* Deal with mount points that are
6745 * obstructed by a later mount */
6747 if (errno != ENOENT)
/* Going by the name, flushes f and checks the stream for errors; the body is
 * mostly outside this excerpt. On the visible error path the result is
 * -errno, or -EIO if errno is not set. */
6755 int fflush_and_check(FILE *f) {
6762 return errno ? -errno : -EIO;
/* Builds a temporary file name template from p in a new buffer of
 * strlen(p) + 1 + 6 + 1 bytes: the first k bytes of p, a dot, fn and the
 * suffix XXXXXX. NOTE(review): k and fn are set up in lines not shown here;
 * presumably the directory part length and the file name part of p. */
6767 char *tempfn_xxxxxx(const char *p) {
6774 t = new(char, strlen(p) + 1 + 6 + 1);
6781 strcpy(stpcpy(stpcpy(mempcpy(t, p, k), "."), fn), "XXXXXX");
/* Builds a temporary file name from p in a new buffer of
 * strlen(p) + 1 + 16 + 1 bytes: the first k bytes of p, a dot, fn, and then
 * 16 hex digits produced from the low nibbles of u (presumably a random
 * 64bit value that is shifted in the loop). NOTE(review): k, fn and u are
 * set up in lines not shown here. */
6786 char *tempfn_random(const char *p) {
6795 t = new(char, strlen(p) + 1 + 16 + 1);
6802 x = stpcpy(stpcpy(mempcpy(t, p, k), "."), fn);
6805 for (i = 0; i < 16; i++) {
6806 *(x++) = hexchar(u & 0xF);
6815 /* Returns true if hostname refers to the local host: "localhost"
 * itself, or any name ending in ".localhost" or ".localdomain", each
 * with or without a trailing dot. */
6816 bool is_localhost(const char *hostname) {
6819 /* This tries to identify local hostnames described in RFC6761
6820 * plus the redhatism of .localdomain */
6822 return streq(hostname, "localhost") ||
6823 streq(hostname, "localhost.") ||
6824 endswith(hostname, ".localhost") ||
6825 endswith(hostname, ".localhost.") ||
6826 endswith(hostname, ".localdomain") ||
6827 endswith(hostname, ".localdomain.");
6830 int take_password_lock(const char *root) {
6832 struct flock flock = {
6834 .l_whence = SEEK_SET,
6842 /* This is roughly the same as lckpwdf(), but not as awful. We
6843 * don't want to use alarm() and signals, hence we implement
6844 * our own trivial version of this.
6846 * Note that shadow-utils also takes per-database locks in
6847 * addition to lckpwdf(). However, we don't, given that they
6848 * are redundant as they invoke lckpwdf() first and keep
6849 * it during everything they do. The per-database locks are
6850 * awfully racy, and thus we just won't do them. */
6853 path = strappenda(root, "/etc/.pwd.lock");
6855 path = "/etc/.pwd.lock";
6857 fd = open(path, O_WRONLY|O_CREAT|O_CLOEXEC|O_NOCTTY|O_NOFOLLOW, 0600);
6861 r = fcntl(fd, F_SETLKW, &flock);