1 /*-*- Mode: C; c-basic-offset: 8; indent-tabs-mode: nil -*-*/
4 This file is part of systemd.
6 Copyright 2010 Lennart Poettering
8 systemd is free software; you can redistribute it and/or modify it
9 under the terms of the GNU Lesser General Public License as published by
10 the Free Software Foundation; either version 2.1 of the License, or
11 (at your option) any later version.
13 systemd is distributed in the hope that it will be useful, but
14 WITHOUT ANY WARRANTY; without even the implied warranty of
15 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
16 Lesser General Public License for more details.
18 You should have received a copy of the GNU Lesser General Public License
19 along with systemd; If not, see <http://www.gnu.org/licenses/>.
31 #include <sys/resource.h>
32 #include <linux/sched.h>
33 #include <sys/types.h>
37 #include <sys/ioctl.h>
39 #include <linux/tiocl.h>
44 #include <sys/prctl.h>
45 #include <sys/utsname.h>
47 #include <netinet/ip.h>
56 #include <sys/mount.h>
57 #include <linux/magic.h>
61 #include <sys/personality.h>
62 #include <sys/xattr.h>
64 #include <sys/statvfs.h>
69 #ifdef HAVE_SYS_AUXV_H
81 #include "path-util.h"
82 #include "exit-status.h"
86 #include "device-nodes.h"
91 #include "sparse-endian.h"
94 char **saved_argv = NULL;
96 static volatile unsigned cached_columns = 0;
97 static volatile unsigned cached_lines = 0;
99 size_t page_size(void) {
100 static thread_local size_t pgsz = 0;
103 if (_likely_(pgsz > 0))
106 r = sysconf(_SC_PAGESIZE);
113 bool streq_ptr(const char *a, const char *b) {
115 /* Like streq(), but tries to make sense of NULL pointers */
126 char* endswith(const char *s, const char *postfix) {
133 pl = strlen(postfix);
136 return (char*) s + sl;
141 if (memcmp(s + sl - pl, postfix, pl) != 0)
144 return (char*) s + sl - pl;
147 char* first_word(const char *s, const char *word) {
154 /* Checks if the string starts with the specified word, either
155 * followed by NUL or by whitespace. Returns a pointer to the
156 * NUL or the first character after the whitespace. */
167 if (memcmp(s, word, wl) != 0)
174 if (!strchr(WHITESPACE, *p))
177 p += strspn(p, WHITESPACE);
181 static size_t cescape_char(char c, char *buf) {
182 char * buf_old = buf;
228 /* For special chars we prefer octal over
229 * hexadecimal encoding, simply because glib's
230 * g_strescape() does the same */
231 if ((c < ' ') || (c >= 127)) {
233 *(buf++) = octchar((unsigned char) c >> 6);
234 *(buf++) = octchar((unsigned char) c >> 3);
235 *(buf++) = octchar((unsigned char) c);
241 return buf - buf_old;
244 int close_nointr(int fd) {
251 * Just ignore EINTR; a retry loop is the wrong thing to do on
254 * http://lkml.indiana.edu/hypermail/linux/kernel/0509.1/0877.html
255 * https://bugzilla.gnome.org/show_bug.cgi?id=682819
256 * http://utcc.utoronto.ca/~cks/space/blog/unix/CloseEINTR
257 * https://sites.google.com/site/michaelsafyan/software-engineering/checkforeintrwheninvokingclosethinkagain
265 int safe_close(int fd) {
268 * Like close_nointr() but cannot fail. Guarantees errno is
269 * unchanged. Is a NOP with negative fds passed, and returns
270 * -1, so that it can be used in this syntax:
272 * fd = safe_close(fd);
278 /* The kernel might return pretty much any error code
279 * via close(), but the fd will be closed anyway. The
280 * only condition we want to check for here is whether
281 * the fd was invalid at all... */
283 assert_se(close_nointr(fd) != -EBADF);
289 void close_many(const int fds[], unsigned n_fd) {
292 assert(fds || n_fd <= 0);
294 for (i = 0; i < n_fd; i++)
298 int unlink_noerrno(const char *path) {
309 int parse_boolean(const char *v) {
312 if (streq(v, "1") || strcaseeq(v, "yes") || strcaseeq(v, "y") || strcaseeq(v, "true") || strcaseeq(v, "t") || strcaseeq(v, "on"))
314 else if (streq(v, "0") || strcaseeq(v, "no") || strcaseeq(v, "n") || strcaseeq(v, "false") || strcaseeq(v, "f") || strcaseeq(v, "off"))
320 int parse_pid(const char *s, pid_t* ret_pid) {
321 unsigned long ul = 0;
328 r = safe_atolu(s, &ul);
334 if ((unsigned long) pid != ul)
344 int parse_uid(const char *s, uid_t* ret_uid) {
345 unsigned long ul = 0;
352 r = safe_atolu(s, &ul);
358 if ((unsigned long) uid != ul)
361 /* Some libc APIs use UID_INVALID as special placeholder */
362 if (uid == (uid_t) 0xFFFFFFFF)
365 /* A long time ago UIDs were 16bit, hence explicitly avoid the 16bit -1 too */
366 if (uid == (uid_t) 0xFFFF)
373 int safe_atou(const char *s, unsigned *ret_u) {
381 l = strtoul(s, &x, 0);
383 if (!x || x == s || *x || errno)
384 return errno > 0 ? -errno : -EINVAL;
386 if ((unsigned long) (unsigned) l != l)
389 *ret_u = (unsigned) l;
393 int safe_atoi(const char *s, int *ret_i) {
401 l = strtol(s, &x, 0);
403 if (!x || x == s || *x || errno)
404 return errno > 0 ? -errno : -EINVAL;
406 if ((long) (int) l != l)
413 int safe_atou8(const char *s, uint8_t *ret) {
421 l = strtoul(s, &x, 0);
423 if (!x || x == s || *x || errno)
424 return errno > 0 ? -errno : -EINVAL;
426 if ((unsigned long) (uint8_t) l != l)
433 int safe_atou16(const char *s, uint16_t *ret) {
441 l = strtoul(s, &x, 0);
443 if (!x || x == s || *x || errno)
444 return errno > 0 ? -errno : -EINVAL;
446 if ((unsigned long) (uint16_t) l != l)
453 int safe_atoi16(const char *s, int16_t *ret) {
461 l = strtol(s, &x, 0);
463 if (!x || x == s || *x || errno)
464 return errno > 0 ? -errno : -EINVAL;
466 if ((long) (int16_t) l != l)
473 int safe_atollu(const char *s, long long unsigned *ret_llu) {
475 unsigned long long l;
481 l = strtoull(s, &x, 0);
483 if (!x || x == s || *x || errno)
484 return errno ? -errno : -EINVAL;
490 int safe_atolli(const char *s, long long int *ret_lli) {
498 l = strtoll(s, &x, 0);
500 if (!x || x == s || *x || errno)
501 return errno ? -errno : -EINVAL;
507 int safe_atod(const char *s, double *ret_d) {
515 loc = newlocale(LC_NUMERIC_MASK, "C", (locale_t) 0);
516 if (loc == (locale_t) 0)
520 d = strtod_l(s, &x, loc);
522 if (!x || x == s || *x || errno) {
524 return errno ? -errno : -EINVAL;
532 static size_t strcspn_escaped(const char *s, const char *reject) {
533 bool escaped = false;
536 for (n=0; s[n]; n++) {
539 else if (s[n] == '\\')
541 else if (strchr(reject, s[n]))
545 /* if s ends in \, return index of previous char */
549 /* Split a string into words. */
550 const char* split(const char **state, size_t *l, const char *separator, bool quoted) {
556 assert(**state == '\0');
560 current += strspn(current, separator);
566 if (quoted && strchr("\'\"", *current)) {
567 char quotechars[2] = {*current, '\0'};
569 *l = strcspn_escaped(current + 1, quotechars);
570 if (current[*l + 1] == '\0' ||
571 (current[*l + 2] && !strchr(separator, current[*l + 2]))) {
572 /* right quote missing or garbage at the end */
576 assert(current[*l + 1] == quotechars[0]);
577 *state = current++ + *l + 2;
579 *l = strcspn_escaped(current, separator);
580 if (current[*l] && !strchr(separator, current[*l])) {
581 /* unfinished escape */
585 *state = current + *l;
587 *l = strcspn(current, separator);
588 *state = current + *l;
594 int get_parent_of_pid(pid_t pid, pid_t *_ppid) {
596 _cleanup_free_ char *line = NULL;
608 p = procfs_file_alloca(pid, "stat");
609 r = read_one_line_file(p, &line);
613 /* Let's skip the pid and comm fields. The latter is enclosed
614 * in () but does not escape any () in its value, so let's
615 * skip over it manually */
617 p = strrchr(line, ')');
629 if ((long unsigned) (pid_t) ppid != ppid)
632 *_ppid = (pid_t) ppid;
637 int fchmod_umask(int fd, mode_t m) {
642 r = fchmod(fd, m & (~u)) < 0 ? -errno : 0;
648 char *truncate_nl(char *s) {
651 s[strcspn(s, NEWLINE)] = 0;
655 int get_process_state(pid_t pid) {
659 _cleanup_free_ char *line = NULL;
663 p = procfs_file_alloca(pid, "stat");
664 r = read_one_line_file(p, &line);
668 p = strrchr(line, ')');
674 if (sscanf(p, " %c", &state) != 1)
677 return (unsigned char) state;
680 int get_process_comm(pid_t pid, char **name) {
687 p = procfs_file_alloca(pid, "comm");
689 r = read_one_line_file(p, name);
696 int get_process_cmdline(pid_t pid, size_t max_length, bool comm_fallback, char **line) {
697 _cleanup_fclose_ FILE *f = NULL;
705 p = procfs_file_alloca(pid, "cmdline");
711 if (max_length == 0) {
712 size_t len = 0, allocated = 0;
714 while ((c = getc(f)) != EOF) {
716 if (!GREEDY_REALLOC(r, allocated, len+2)) {
721 r[len++] = isprint(c) ? c : ' ';
731 r = new(char, max_length);
737 while ((c = getc(f)) != EOF) {
759 size_t n = MIN(left-1, 3U);
766 /* Kernel threads have no argv[] */
768 _cleanup_free_ char *t = NULL;
776 h = get_process_comm(pid, &t);
780 r = strjoin("[", t, "]", NULL);
789 int is_kernel_thread(pid_t pid) {
801 p = procfs_file_alloca(pid, "cmdline");
806 count = fread(&c, 1, 1, f);
810 /* Kernel threads have an empty cmdline */
813 return eof ? 1 : -errno;
818 int get_process_capeff(pid_t pid, char **capeff) {
824 p = procfs_file_alloca(pid, "status");
826 return get_status_field(p, "\nCapEff:", capeff);
829 static int get_process_link_contents(const char *proc_file, char **name) {
835 r = readlink_malloc(proc_file, name);
837 return r == -ENOENT ? -ESRCH : r;
842 int get_process_exe(pid_t pid, char **name) {
849 p = procfs_file_alloca(pid, "exe");
850 r = get_process_link_contents(p, name);
854 d = endswith(*name, " (deleted)");
861 static int get_process_id(pid_t pid, const char *field, uid_t *uid) {
862 _cleanup_fclose_ FILE *f = NULL;
872 p = procfs_file_alloca(pid, "status");
877 FOREACH_LINE(line, f, return -errno) {
882 if (startswith(l, field)) {
884 l += strspn(l, WHITESPACE);
886 l[strcspn(l, WHITESPACE)] = 0;
888 return parse_uid(l, uid);
895 int get_process_uid(pid_t pid, uid_t *uid) {
896 return get_process_id(pid, "Uid:", uid);
899 int get_process_gid(pid_t pid, gid_t *gid) {
900 assert_cc(sizeof(uid_t) == sizeof(gid_t));
901 return get_process_id(pid, "Gid:", gid);
904 int get_process_cwd(pid_t pid, char **cwd) {
909 p = procfs_file_alloca(pid, "cwd");
911 return get_process_link_contents(p, cwd);
914 int get_process_root(pid_t pid, char **root) {
919 p = procfs_file_alloca(pid, "root");
921 return get_process_link_contents(p, root);
924 int get_process_environ(pid_t pid, char **env) {
925 _cleanup_fclose_ FILE *f = NULL;
926 _cleanup_free_ char *outcome = NULL;
929 size_t allocated = 0, sz = 0;
934 p = procfs_file_alloca(pid, "environ");
940 while ((c = fgetc(f)) != EOF) {
941 if (!GREEDY_REALLOC(outcome, allocated, sz + 5))
945 outcome[sz++] = '\n';
947 sz += cescape_char(c, outcome + sz);
957 char *strnappend(const char *s, const char *suffix, size_t b) {
965 return strndup(suffix, b);
974 if (b > ((size_t) -1) - a)
977 r = new(char, a+b+1);
982 memcpy(r+a, suffix, b);
988 char *strappend(const char *s, const char *suffix) {
989 return strnappend(s, suffix, suffix ? strlen(suffix) : 0);
992 int readlinkat_malloc(int fd, const char *p, char **ret) {
1007 n = readlinkat(fd, p, c, l-1);
1014 if ((size_t) n < l-1) {
1025 int readlink_malloc(const char *p, char **ret) {
1026 return readlinkat_malloc(AT_FDCWD, p, ret);
1029 int readlink_value(const char *p, char **ret) {
1030 _cleanup_free_ char *link = NULL;
1034 r = readlink_malloc(p, &link);
1038 value = basename(link);
1042 value = strdup(value);
1051 int readlink_and_make_absolute(const char *p, char **r) {
1052 _cleanup_free_ char *target = NULL;
1059 j = readlink_malloc(p, &target);
1063 k = file_in_same_dir(p, target);
1071 int readlink_and_canonicalize(const char *p, char **r) {
1078 j = readlink_and_make_absolute(p, &t);
1082 s = canonicalize_file_name(t);
1089 path_kill_slashes(*r);
1094 int reset_all_signal_handlers(void) {
1097 for (sig = 1; sig < _NSIG; sig++) {
1098 struct sigaction sa = {
1099 .sa_handler = SIG_DFL,
1100 .sa_flags = SA_RESTART,
1103 /* These two cannot be caught... */
1104 if (sig == SIGKILL || sig == SIGSTOP)
1107 /* On Linux the first two RT signals are reserved by
1108 * glibc, and sigaction() will return EINVAL for them. */
1109 if ((sigaction(sig, &sa, NULL) < 0))
1110 if (errno != EINVAL && r == 0)
1117 int reset_signal_mask(void) {
1120 if (sigemptyset(&ss) < 0)
1123 if (sigprocmask(SIG_SETMASK, &ss, NULL) < 0)
1129 char *strstrip(char *s) {
1132 /* Drops trailing whitespace. Modifies the string in
1133 * place. Returns pointer to first non-space character */
1135 s += strspn(s, WHITESPACE);
1137 for (e = strchr(s, 0); e > s; e --)
1138 if (!strchr(WHITESPACE, e[-1]))
1146 char *delete_chars(char *s, const char *bad) {
1149 /* Drops all characters listed in bad, regardless of where in the string */
1151 for (f = s, t = s; *f; f++) {
1152 if (strchr(bad, *f))
1163 char *file_in_same_dir(const char *path, const char *filename) {
1170 /* This removes the last component of path and appends
1171 * filename, unless the latter is absolute anyway or the
1174 if (path_is_absolute(filename))
1175 return strdup(filename);
1177 e = strrchr(path, '/');
1179 return strdup(filename);
1181 k = strlen(filename);
1182 ret = new(char, (e + 1 - path) + k + 1);
1186 memcpy(mempcpy(ret, path, e + 1 - path), filename, k + 1);
1190 int rmdir_parents(const char *path, const char *stop) {
1199 /* Skip trailing slashes */
1200 while (l > 0 && path[l-1] == '/')
1206 /* Skip last component */
1207 while (l > 0 && path[l-1] != '/')
1210 /* Skip trailing slashes */
1211 while (l > 0 && path[l-1] == '/')
1217 if (!(t = strndup(path, l)))
1220 if (path_startswith(stop, t)) {
1229 if (errno != ENOENT)
1236 char hexchar(int x) {
1237 static const char table[16] = "0123456789abcdef";
1239 return table[x & 15];
1242 int unhexchar(char c) {
1244 if (c >= '0' && c <= '9')
1247 if (c >= 'a' && c <= 'f')
1248 return c - 'a' + 10;
1250 if (c >= 'A' && c <= 'F')
1251 return c - 'A' + 10;
1256 char *hexmem(const void *p, size_t l) {
1260 z = r = malloc(l * 2 + 1);
1264 for (x = p; x < (const uint8_t*) p + l; x++) {
1265 *(z++) = hexchar(*x >> 4);
1266 *(z++) = hexchar(*x & 15);
1273 void *unhexmem(const char *p, size_t l) {
1279 z = r = malloc((l + 1) / 2 + 1);
1283 for (x = p; x < p + l; x += 2) {
1286 a = unhexchar(x[0]);
1288 b = unhexchar(x[1]);
1292 *(z++) = (uint8_t) a << 4 | (uint8_t) b;
1299 char octchar(int x) {
1300 return '0' + (x & 7);
1303 int unoctchar(char c) {
1305 if (c >= '0' && c <= '7')
1311 char decchar(int x) {
1312 return '0' + (x % 10);
1315 int undecchar(char c) {
1317 if (c >= '0' && c <= '9')
1323 char *cescape(const char *s) {
1329 /* Does C style string escaping. */
1331 r = new(char, strlen(s)*4 + 1);
1335 for (f = s, t = r; *f; f++)
1336 t += cescape_char(*f, t);
1343 char *cunescape_length_with_prefix(const char *s, size_t length, const char *prefix) {
1350 /* Undoes C style string escaping, and optionally prefixes it. */
1352 pl = prefix ? strlen(prefix) : 0;
1354 r = new(char, pl+length+1);
1359 memcpy(r, prefix, pl);
1361 for (f = s, t = r + pl; f < s + length; f++) {
1362 size_t remaining = s + length - f;
1363 assert(remaining > 0);
1365 if (*f != '\\') { /* a literal literal */
1370 if (--remaining == 0) { /* copy trailing backslash verbatim */
1411 /* This is an extension of the XDG syntax files */
1416 /* hexadecimal encoding */
1419 if (remaining >= 2) {
1420 a = unhexchar(f[1]);
1421 b = unhexchar(f[2]);
1424 if (a < 0 || b < 0 || (a == 0 && b == 0)) {
1425 /* Invalid escape code, let's take it literal then */
1429 *(t++) = (char) ((a << 4) | b);
1444 /* octal encoding */
1445 int a = -1, b = -1, c = -1;
1447 if (remaining >= 3) {
1448 a = unoctchar(f[0]);
1449 b = unoctchar(f[1]);
1450 c = unoctchar(f[2]);
1453 if (a < 0 || b < 0 || c < 0 || (a == 0 && b == 0 && c == 0)) {
1454 /* Invalid escape code, let's take it literal then */
1458 *(t++) = (char) ((a << 6) | (b << 3) | c);
1466 /* Invalid escape code, let's take it literal then */
1477 char *cunescape_length(const char *s, size_t length) {
1478 return cunescape_length_with_prefix(s, length, NULL);
1481 char *cunescape(const char *s) {
1484 return cunescape_length(s, strlen(s));
1487 char *xescape(const char *s, const char *bad) {
1491 /* Escapes all chars in bad, in addition to \ and all special
1492 * chars, in \xFF style escaping. May be reversed with
1495 r = new(char, strlen(s) * 4 + 1);
1499 for (f = s, t = r; *f; f++) {
1501 if ((*f < ' ') || (*f >= 127) ||
1502 (*f == '\\') || strchr(bad, *f)) {
1505 *(t++) = hexchar(*f >> 4);
1506 *(t++) = hexchar(*f);
1516 char *ascii_strlower(char *t) {
1521 for (p = t; *p; p++)
1522 if (*p >= 'A' && *p <= 'Z')
1523 *p = *p - 'A' + 'a';
1528 _pure_ static bool hidden_file_allow_backup(const char *filename) {
1532 filename[0] == '.' ||
1533 streq(filename, "lost+found") ||
1534 streq(filename, "aquota.user") ||
1535 streq(filename, "aquota.group") ||
1536 endswith(filename, ".rpmnew") ||
1537 endswith(filename, ".rpmsave") ||
1538 endswith(filename, ".rpmorig") ||
1539 endswith(filename, ".dpkg-old") ||
1540 endswith(filename, ".dpkg-new") ||
1541 endswith(filename, ".dpkg-tmp") ||
1542 endswith(filename, ".swp");
1545 bool hidden_file(const char *filename) {
1548 if (endswith(filename, "~"))
1551 return hidden_file_allow_backup(filename);
1554 int fd_nonblock(int fd, bool nonblock) {
1559 flags = fcntl(fd, F_GETFL, 0);
1564 nflags = flags | O_NONBLOCK;
1566 nflags = flags & ~O_NONBLOCK;
1568 if (nflags == flags)
1571 if (fcntl(fd, F_SETFL, nflags) < 0)
1577 int fd_cloexec(int fd, bool cloexec) {
1582 flags = fcntl(fd, F_GETFD, 0);
1587 nflags = flags | FD_CLOEXEC;
1589 nflags = flags & ~FD_CLOEXEC;
1591 if (nflags == flags)
1594 if (fcntl(fd, F_SETFD, nflags) < 0)
1600 _pure_ static bool fd_in_set(int fd, const int fdset[], unsigned n_fdset) {
1603 assert(n_fdset == 0 || fdset);
1605 for (i = 0; i < n_fdset; i++)
1612 int close_all_fds(const int except[], unsigned n_except) {
1613 _cleanup_closedir_ DIR *d = NULL;
1617 assert(n_except == 0 || except);
1619 d = opendir("/proc/self/fd");
1624 /* When /proc isn't available (for example in chroots)
1625 * the fallback is brute forcing through the fd
1628 assert_se(getrlimit(RLIMIT_NOFILE, &rl) >= 0);
1629 for (fd = 3; fd < (int) rl.rlim_max; fd ++) {
1631 if (fd_in_set(fd, except, n_except))
1634 if (close_nointr(fd) < 0)
1635 if (errno != EBADF && r == 0)
1642 while ((de = readdir(d))) {
1645 if (hidden_file(de->d_name))
1648 if (safe_atoi(de->d_name, &fd) < 0)
1649 /* Let's better ignore this, just in case */
1658 if (fd_in_set(fd, except, n_except))
1661 if (close_nointr(fd) < 0) {
1662 /* Valgrind has its own FD and doesn't want to have it closed */
1663 if (errno != EBADF && r == 0)
1671 bool chars_intersect(const char *a, const char *b) {
1674 /* Returns true if any of the chars in a are in b. */
1675 for (p = a; *p; p++)
1682 bool fstype_is_network(const char *fstype) {
1683 static const char table[] =
1697 x = startswith(fstype, "fuse.");
1701 return nulstr_contains(table, fstype);
1705 _cleanup_close_ int fd;
1707 fd = open_terminal("/dev/tty0", O_RDWR|O_NOCTTY|O_CLOEXEC);
1713 TIOCL_GETKMSGREDIRECT,
1717 if (ioctl(fd, TIOCLINUX, tiocl) < 0)
1720 vt = tiocl[0] <= 0 ? 1 : tiocl[0];
1723 if (ioctl(fd, VT_ACTIVATE, vt) < 0)
1729 int read_one_char(FILE *f, char *ret, usec_t t, bool *need_nl) {
1730 struct termios old_termios, new_termios;
1731 char c, line[LINE_MAX];
1736 if (tcgetattr(fileno(f), &old_termios) >= 0) {
1737 new_termios = old_termios;
1739 new_termios.c_lflag &= ~ICANON;
1740 new_termios.c_cc[VMIN] = 1;
1741 new_termios.c_cc[VTIME] = 0;
1743 if (tcsetattr(fileno(f), TCSADRAIN, &new_termios) >= 0) {
1746 if (t != USEC_INFINITY) {
1747 if (fd_wait_for_event(fileno(f), POLLIN, t) <= 0) {
1748 tcsetattr(fileno(f), TCSADRAIN, &old_termios);
1753 k = fread(&c, 1, 1, f);
1755 tcsetattr(fileno(f), TCSADRAIN, &old_termios);
1761 *need_nl = c != '\n';
1768 if (t != USEC_INFINITY) {
1769 if (fd_wait_for_event(fileno(f), POLLIN, t) <= 0)
1774 if (!fgets(line, sizeof(line), f))
1775 return errno ? -errno : -EIO;
1779 if (strlen(line) != 1)
1789 int ask_char(char *ret, const char *replies, const char *text, ...) {
1799 bool need_nl = true;
1802 fputs(ANSI_HIGHLIGHT_ON, stdout);
1809 fputs(ANSI_HIGHLIGHT_OFF, stdout);
1813 r = read_one_char(stdin, &c, USEC_INFINITY, &need_nl);
1816 if (r == -EBADMSG) {
1817 puts("Bad input, please try again.");
1828 if (strchr(replies, c)) {
1833 puts("Read unexpected character, please try again.");
1837 int ask_string(char **ret, const char *text, ...) {
1842 char line[LINE_MAX];
1846 fputs(ANSI_HIGHLIGHT_ON, stdout);
1853 fputs(ANSI_HIGHLIGHT_OFF, stdout);
1858 if (!fgets(line, sizeof(line), stdin))
1859 return errno ? -errno : -EIO;
1861 if (!endswith(line, "\n"))
1880 int reset_terminal_fd(int fd, bool switch_to_text) {
1881 struct termios termios;
1884 /* Set terminal to some sane defaults */
1888 /* We leave locked terminal attributes untouched, so that
1889 * Plymouth may set whatever it wants to set, and we don't
1890 * interfere with that. */
1892 /* Disable exclusive mode, just in case */
1893 ioctl(fd, TIOCNXCL);
1895 /* Switch to text mode */
1897 ioctl(fd, KDSETMODE, KD_TEXT);
1899 /* Enable console unicode mode */
1900 ioctl(fd, KDSKBMODE, K_UNICODE);
1902 if (tcgetattr(fd, &termios) < 0) {
1907 /* We only reset the stuff that matters to the software. How
1908 * hardware is set up we don't touch assuming that somebody
1909 * else will do that for us */
1911 termios.c_iflag &= ~(IGNBRK | BRKINT | ISTRIP | INLCR | IGNCR | IUCLC);
1912 termios.c_iflag |= ICRNL | IMAXBEL | IUTF8;
1913 termios.c_oflag |= ONLCR;
1914 termios.c_cflag |= CREAD;
1915 termios.c_lflag = ISIG | ICANON | IEXTEN | ECHO | ECHOE | ECHOK | ECHOCTL | ECHOPRT | ECHOKE;
1917 termios.c_cc[VINTR] = 03; /* ^C */
1918 termios.c_cc[VQUIT] = 034; /* ^\ */
1919 termios.c_cc[VERASE] = 0177;
1920 termios.c_cc[VKILL] = 025; /* ^U */
1921 termios.c_cc[VEOF] = 04; /* ^D */
1922 termios.c_cc[VSTART] = 021; /* ^Q */
1923 termios.c_cc[VSTOP] = 023; /* ^S */
1924 termios.c_cc[VSUSP] = 032; /* ^Z */
1925 termios.c_cc[VLNEXT] = 026; /* ^V */
1926 termios.c_cc[VWERASE] = 027; /* ^W */
1927 termios.c_cc[VREPRINT] = 022; /* ^R */
1928 termios.c_cc[VEOL] = 0;
1929 termios.c_cc[VEOL2] = 0;
1931 termios.c_cc[VTIME] = 0;
1932 termios.c_cc[VMIN] = 1;
1934 if (tcsetattr(fd, TCSANOW, &termios) < 0)
1938 /* Just in case, flush all crap out */
1939 tcflush(fd, TCIOFLUSH);
1944 int reset_terminal(const char *name) {
1945 _cleanup_close_ int fd = -1;
1947 fd = open_terminal(name, O_RDWR|O_NOCTTY|O_CLOEXEC);
1951 return reset_terminal_fd(fd, true);
1954 int open_terminal(const char *name, int mode) {
1959 * If a TTY is in the process of being closed opening it might
1960 * cause EIO. This is horribly awful, but unlikely to be
1961 * changed in the kernel. Hence we work around this problem by
1962 * retrying a couple of times.
1964 * https://bugs.launchpad.net/ubuntu/+source/linux/+bug/554172/comments/245
1967 assert(!(mode & O_CREAT));
1970 fd = open(name, mode, 0);
1977 /* Max 1s in total */
1981 usleep(50 * USEC_PER_MSEC);
1999 int flush_fd(int fd) {
2000 struct pollfd pollfd = {
2010 r = poll(&pollfd, 1, 0);
2020 l = read(fd, buf, sizeof(buf));
2026 if (errno == EAGAIN)
2035 int acquire_terminal(
2039 bool ignore_tiocstty_eperm,
2042 int fd = -1, notify = -1, r = 0, wd = -1;
2047 /* We use inotify to be notified when the tty is closed. We
2048 * create the watch before checking if we can actually acquire
2049 * it, so that we don't lose any event.
2051 * Note: strictly speaking this actually watches for the
2052 * device being closed, it does *not* really watch whether a
2053 * tty loses its controlling process. However, unless some
2054 * rogue process uses TIOCNOTTY on /dev/tty *after* closing
2055 * its tty otherwise this will not become a problem. As long
2056 * as the administrator makes sure not to configure any service
2057 * on the same tty as an untrusted user this should not be a
2058 * problem. (Which he probably should not do anyway.) */
2060 if (timeout != USEC_INFINITY)
2061 ts = now(CLOCK_MONOTONIC);
2063 if (!fail && !force) {
2064 notify = inotify_init1(IN_CLOEXEC | (timeout != USEC_INFINITY ? IN_NONBLOCK : 0));
2070 wd = inotify_add_watch(notify, name, IN_CLOSE);
2078 struct sigaction sa_old, sa_new = {
2079 .sa_handler = SIG_IGN,
2080 .sa_flags = SA_RESTART,
2084 r = flush_fd(notify);
2089 /* We pass here O_NOCTTY only so that we can check the return
2090 * value of TIOCSCTTY and have a reliable way to figure out if we
2091 * successfully became the controlling process of the tty */
2092 fd = open_terminal(name, O_RDWR|O_NOCTTY|O_CLOEXEC);
2096 /* Temporarily ignore SIGHUP, so that we don't get SIGHUP'ed
2097 * if we already own the tty. */
2098 assert_se(sigaction(SIGHUP, &sa_new, &sa_old) == 0);
2100 /* First, try to get the tty */
2101 if (ioctl(fd, TIOCSCTTY, force) < 0)
2104 assert_se(sigaction(SIGHUP, &sa_old, NULL) == 0);
2106 /* Sometimes it makes sense to ignore TIOCSCTTY
2107 * returning EPERM, i.e. when very likely we already
2108 * have this controlling terminal. */
2109 if (r < 0 && r == -EPERM && ignore_tiocstty_eperm)
2112 if (r < 0 && (force || fail || r != -EPERM)) {
2121 assert(notify >= 0);
2124 union inotify_event_buffer buffer;
2125 struct inotify_event *e;
2128 if (timeout != USEC_INFINITY) {
2131 n = now(CLOCK_MONOTONIC);
2132 if (ts + timeout < n) {
2137 r = fd_wait_for_event(fd, POLLIN, ts + timeout - n);
2147 l = read(notify, &buffer, sizeof(buffer));
2149 if (errno == EINTR || errno == EAGAIN)
2156 FOREACH_INOTIFY_EVENT(e, buffer, l) {
2157 if (e->wd != wd || !(e->mask & IN_CLOSE)) {
2166 /* We close the tty fd here since if the old session
2167 * ended our handle will be dead. It's important that
2168 * we do this after sleeping, so that we don't enter
2169 * an endless loop. */
2170 fd = safe_close(fd);
2175 r = reset_terminal_fd(fd, true);
2177 log_warning_errno(r, "Failed to reset terminal: %m");
2188 int release_terminal(void) {
2189 static const struct sigaction sa_new = {
2190 .sa_handler = SIG_IGN,
2191 .sa_flags = SA_RESTART,
2194 _cleanup_close_ int fd = -1;
2195 struct sigaction sa_old;
2198 fd = open("/dev/tty", O_RDWR|O_NOCTTY|O_NDELAY|O_CLOEXEC);
2202 /* Temporarily ignore SIGHUP, so that we don't get SIGHUP'ed
2203 * by our own TIOCNOTTY */
2204 assert_se(sigaction(SIGHUP, &sa_new, &sa_old) == 0);
2206 if (ioctl(fd, TIOCNOTTY) < 0)
2209 assert_se(sigaction(SIGHUP, &sa_old, NULL) == 0);
2214 int sigaction_many(const struct sigaction *sa, ...) {
2219 while ((sig = va_arg(ap, int)) > 0)
2220 if (sigaction(sig, sa, NULL) < 0)
2227 int ignore_signals(int sig, ...) {
2228 struct sigaction sa = {
2229 .sa_handler = SIG_IGN,
2230 .sa_flags = SA_RESTART,
2235 if (sigaction(sig, &sa, NULL) < 0)
2239 while ((sig = va_arg(ap, int)) > 0)
2240 if (sigaction(sig, &sa, NULL) < 0)
2247 int default_signals(int sig, ...) {
2248 struct sigaction sa = {
2249 .sa_handler = SIG_DFL,
2250 .sa_flags = SA_RESTART,
2255 if (sigaction(sig, &sa, NULL) < 0)
2259 while ((sig = va_arg(ap, int)) > 0)
2260 if (sigaction(sig, &sa, NULL) < 0)
2267 void safe_close_pair(int p[]) {
2271 /* Special case pairs which use the same fd in both
2273 p[0] = p[1] = safe_close(p[0]);
2277 p[0] = safe_close(p[0]);
2278 p[1] = safe_close(p[1]);
2281 ssize_t loop_read(int fd, void *buf, size_t nbytes, bool do_poll) {
2288 while (nbytes > 0) {
2291 k = read(fd, p, nbytes);
2296 if (errno == EAGAIN && do_poll) {
2298 /* We knowingly ignore any return value here,
2299 * and expect that any error/EOF is reported
2302 fd_wait_for_event(fd, POLLIN, USEC_INFINITY);
2306 return n > 0 ? n : -errno;
2320 int loop_write(int fd, const void *buf, size_t nbytes, bool do_poll) {
2321 const uint8_t *p = buf;
2328 while (nbytes > 0) {
2331 k = write(fd, p, nbytes);
2336 if (errno == EAGAIN && do_poll) {
2337 /* We knowingly ignore any return value here,
2338 * and expect that any error/EOF is reported
2341 fd_wait_for_event(fd, POLLOUT, USEC_INFINITY);
2348 if (k == 0) /* Can't really happen */
2358 int parse_size(const char *t, off_t base, off_t *size) {
2360 /* So, sometimes we want to parse IEC binary suffixes, and
2361 * sometimes SI decimal suffixes. This function can parse
2362 * both. Which one is the right way depends on the
2363 * context. Wikipedia suggests that SI is customary for
2364 * hardware metrics and network speeds, while IEC is
2365 * customary for most data sizes used by software and volatile
2366 * (RAM) memory. Hence be careful which one you pick!
2368 * In either case we use just K, M, G as suffix, and not Ki,
2369 * Mi, Gi or so (as IEC would suggest). That's because that's
2370 * frickin' ugly. But this means you really need to make sure
2371 * to document which base you are parsing when you use this
2376 unsigned long long factor;
2379 static const struct table iec[] = {
2380 { "E", 1024ULL*1024ULL*1024ULL*1024ULL*1024ULL*1024ULL },
2381 { "P", 1024ULL*1024ULL*1024ULL*1024ULL*1024ULL },
2382 { "T", 1024ULL*1024ULL*1024ULL*1024ULL },
2383 { "G", 1024ULL*1024ULL*1024ULL },
2384 { "M", 1024ULL*1024ULL },
2390 static const struct table si[] = {
2391 { "E", 1000ULL*1000ULL*1000ULL*1000ULL*1000ULL*1000ULL },
2392 { "P", 1000ULL*1000ULL*1000ULL*1000ULL*1000ULL },
2393 { "T", 1000ULL*1000ULL*1000ULL*1000ULL },
2394 { "G", 1000ULL*1000ULL*1000ULL },
2395 { "M", 1000ULL*1000ULL },
2401 const struct table *table;
2403 unsigned long long r = 0;
2404 unsigned n_entries, start_pos = 0;
2407 assert(base == 1000 || base == 1024);
2412 n_entries = ELEMENTSOF(si);
2415 n_entries = ELEMENTSOF(iec);
2421 unsigned long long l2;
2427 l = strtoll(p, &e, 10);
2440 if (*e >= '0' && *e <= '9') {
2443 /* strtoull itself would accept space/+/- */
2444 l2 = strtoull(e, &e2, 10);
2446 if (errno == ERANGE)
2449 /* Ignore failure. E.g. 10.M is valid */
2456 e += strspn(e, WHITESPACE);
2458 for (i = start_pos; i < n_entries; i++)
2459 if (startswith(e, table[i].suffix)) {
2460 unsigned long long tmp;
2461 if ((unsigned long long) l + (frac > 0) > ULLONG_MAX / table[i].factor)
2463 tmp = l * table[i].factor + (unsigned long long) (frac * table[i].factor);
2464 if (tmp > ULLONG_MAX - r)
2468 if ((unsigned long long) (off_t) r != r)
2471 p = e + strlen(table[i].suffix);
2487 int make_stdio(int fd) {
2492 r = dup2(fd, STDIN_FILENO);
2493 s = dup2(fd, STDOUT_FILENO);
2494 t = dup2(fd, STDERR_FILENO);
2499 if (r < 0 || s < 0 || t < 0)
2502 /* Explicitly unset O_CLOEXEC, since if fd was < 3, then
2503 * dup2() was a NOP and the bit hence possibly set. */
2504 fd_cloexec(STDIN_FILENO, false);
2505 fd_cloexec(STDOUT_FILENO, false);
2506 fd_cloexec(STDERR_FILENO, false);
2511 int make_null_stdio(void) {
2514 null_fd = open("/dev/null", O_RDWR|O_NOCTTY);
2518 return make_stdio(null_fd);
2521 bool is_device_path(const char *path) {
2523 /* Returns true on paths that refer to a device, either in
2524 * sysfs or in /dev */
2527 path_startswith(path, "/dev/") ||
2528 path_startswith(path, "/sys/");
2531 int dir_is_empty(const char *path) {
2532 _cleanup_closedir_ DIR *d;
2543 if (!de && errno != 0)
2549 if (!hidden_file(de->d_name))
2554 char* dirname_malloc(const char *path) {
2555 char *d, *dir, *dir2;
2572 int dev_urandom(void *p, size_t n) {
2573 static int have_syscall = -1;
2577 /* Gathers some randomness from the kernel. This call will
2578 * never block, and will always return some data from the
2579 * kernel, regardless if the random pool is fully initialized
2580 * or not. It thus makes no guarantee for the quality of the
2581 * returned entropy, but is good enough for our usual use cases
2582 * of seeding the hash functions for hashtable */
2584 /* Use the getrandom() syscall unless we know we don't have
2585 * it, or when the requested size is too large for it. */
2586 if (have_syscall != 0 || (size_t) (int) n != n) {
2587 r = getrandom(p, n, GRND_NONBLOCK);
2589 have_syscall = true;
2594 if (errno == ENOSYS)
2595 /* we lack the syscall, continue with
2596 * reading from /dev/urandom */
2597 have_syscall = false;
2598 else if (errno == EAGAIN)
2599 /* not enough entropy for now. Let's
2600 * remember to use the syscall the
2601 * next time, again, but also read
2602 * from /dev/urandom for now, which
2603 * doesn't care about the current
2604 * amount of entropy. */
2605 have_syscall = true;
2609 /* too short read? */
2613 fd = open("/dev/urandom", O_RDONLY|O_CLOEXEC|O_NOCTTY);
2615 return errno == ENOENT ? -ENOSYS : -errno;
2617 k = loop_read(fd, p, n, true);
2622 if ((size_t) k != n)
2628 void initialize_srand(void) {
2629 static bool srand_called = false;
2631 #ifdef HAVE_SYS_AUXV_H
2640 #ifdef HAVE_SYS_AUXV_H
2641 /* The kernel provides us with a bit of entropy in auxv, so
2642 * let's try to make use of that to seed the pseudo-random
2643 * generator. It's better than nothing... */
2645 auxv = (void*) getauxval(AT_RANDOM);
2647 x ^= *(unsigned*) auxv;
2650 x ^= (unsigned) now(CLOCK_REALTIME);
2651 x ^= (unsigned) gettid();
2654 srand_called = true;
2657 void random_bytes(void *p, size_t n) {
2661 r = dev_urandom(p, n);
2665 /* If some idiot made /dev/urandom unavailable to us, he'll
2666 * get a PRNG instead. */
2670 for (q = p; q < (uint8_t*) p + n; q ++)
2674 void rename_process(const char name[8]) {
2677 /* This is like a poor man's setproctitle(). It changes the
2678 * comm field, argv[0], and also the glibc's internally used
2679 * name of the process. For the first one a limit of 16 chars
2680 * applies, to the second one usually one of 10 (i.e. length
2681 * of "/sbin/init"), to the third one one of 7 (i.e. length of
2682 * "systemd"). If you pass a longer string it will be
2685 prctl(PR_SET_NAME, name);
2687 if (program_invocation_name)
2688 strncpy(program_invocation_name, name, strlen(program_invocation_name));
2690 if (saved_argc > 0) {
2694 strncpy(saved_argv[0], name, strlen(saved_argv[0]));
2696 for (i = 1; i < saved_argc; i++) {
2700 memzero(saved_argv[i], strlen(saved_argv[i]));
2705 void sigset_add_many(sigset_t *ss, ...) {
2712 while ((sig = va_arg(ap, int)) > 0)
2713 assert_se(sigaddset(ss, sig) == 0);
2717 int sigprocmask_many(int how, ...) {
2722 assert_se(sigemptyset(&ss) == 0);
2725 while ((sig = va_arg(ap, int)) > 0)
2726 assert_se(sigaddset(&ss, sig) == 0);
2729 if (sigprocmask(how, &ss, NULL) < 0)
/* Returns a strdup()ed copy of the node name reported by uname(). If the
 * node name is empty or the placeholder "(none)", a copy of the system name
 * (u.sysname) is returned instead. As with any strdup() result, the return
 * value is NULL if the allocation fails. */
2735 char* gethostname_malloc(void) {
/* uname() failing is treated as a programming error (assert_se). */
2738 assert_se(uname(&u) >= 0);
2740 if (!isempty(u.nodename) && !streq(u.nodename, "(none)"))
2741 return strdup(u.nodename);
2743 return strdup(u.sysname);
/* Returns true if the node name reported by uname() is neither empty nor the
 * placeholder string "(none)". */
2746 bool hostname_is_set(void) {
2749 assert_se(uname(&u) >= 0);
2751 return !isempty(u.nodename) && !streq(u.nodename, "(none)");
2754 char *lookup_uid(uid_t uid) {
2757 _cleanup_free_ char *buf = NULL;
2758 struct passwd pwbuf, *pw = NULL;
2760 /* Shortcut things to avoid NSS lookups */
2762 return strdup("root");
2764 bufsize = sysconf(_SC_GETPW_R_SIZE_MAX);
2768 buf = malloc(bufsize);
2772 if (getpwuid_r(uid, &pwbuf, buf, bufsize, &pw) == 0 && pw)
2773 return strdup(pw->pw_name);
2775 if (asprintf(&name, UID_FMT, uid) < 0)
2781 char* getlogname_malloc(void) {
2785 if (isatty(STDIN_FILENO) && fstat(STDIN_FILENO, &st) >= 0)
2790 return lookup_uid(uid);
2793 char *getusername_malloc(void) {
2800 return lookup_uid(getuid());
2803 int getttyname_malloc(int fd, char **ret) {
2813 r = ttyname_r(fd, path, sizeof(path));
2818 p = startswith(path, "/dev/");
2819 c = strdup(p ?: path);
2836 int getttyname_harder(int fd, char **r) {
2840 k = getttyname_malloc(fd, &s);
2844 if (streq(s, "tty")) {
2846 return get_ctty(0, NULL, r);
2853 int get_ctty_devnr(pid_t pid, dev_t *d) {
2855 _cleanup_free_ char *line = NULL;
2857 unsigned long ttynr;
2861 p = procfs_file_alloca(pid, "stat");
2862 r = read_one_line_file(p, &line);
2866 p = strrchr(line, ')');
2876 "%*d " /* session */
2881 if (major(ttynr) == 0 && minor(ttynr) == 0)
2890 int get_ctty(pid_t pid, dev_t *_devnr, char **r) {
2891 char fn[sizeof("/dev/char/")-1 + 2*DECIMAL_STR_MAX(unsigned) + 1 + 1], *b = NULL;
2892 _cleanup_free_ char *s = NULL;
2899 k = get_ctty_devnr(pid, &devnr);
2903 sprintf(fn, "/dev/char/%u:%u", major(devnr), minor(devnr));
2905 k = readlink_malloc(fn, &s);
2911 /* This is an ugly hack */
2912 if (major(devnr) == 136) {
2913 asprintf(&b, "pts/%u", minor(devnr));
2917 /* Probably something like the ptys which have no
2918 * symlink in /dev/char. Let's return something
2919 * vaguely useful. */
2925 if (startswith(s, "/dev/"))
2927 else if (startswith(s, "../"))
2945 int rm_rf_children_dangerous(int fd, bool only_dirs, bool honour_sticky, struct stat *root_dev) {
2946 _cleanup_closedir_ DIR *d = NULL;
2951 /* This returns the first error we run into, but nevertheless
2952 * tries to go on. This closes the passed fd. */
2958 return errno == ENOENT ? 0 : -errno;
2963 bool is_dir, keep_around;
2970 if (errno != 0 && ret == 0)
2975 if (streq(de->d_name, ".") || streq(de->d_name, ".."))
2978 if (de->d_type == DT_UNKNOWN ||
2980 (de->d_type == DT_DIR && root_dev)) {
2981 if (fstatat(fd, de->d_name, &st, AT_SYMLINK_NOFOLLOW) < 0) {
2982 if (ret == 0 && errno != ENOENT)
2987 is_dir = S_ISDIR(st.st_mode);
2990 (st.st_uid == 0 || st.st_uid == getuid()) &&
2991 (st.st_mode & S_ISVTX);
2993 is_dir = de->d_type == DT_DIR;
2994 keep_around = false;
3000 /* if root_dev is set, remove subdirectories only, if device is same as dir */
3001 if (root_dev && st.st_dev != root_dev->st_dev)
3004 subdir_fd = openat(fd, de->d_name,
3005 O_RDONLY|O_NONBLOCK|O_DIRECTORY|O_CLOEXEC|O_NOFOLLOW|O_NOATIME);
3006 if (subdir_fd < 0) {
3007 if (ret == 0 && errno != ENOENT)
3012 r = rm_rf_children_dangerous(subdir_fd, only_dirs, honour_sticky, root_dev);
3013 if (r < 0 && ret == 0)
3017 if (unlinkat(fd, de->d_name, AT_REMOVEDIR) < 0) {
3018 if (ret == 0 && errno != ENOENT)
3022 } else if (!only_dirs && !keep_around) {
3024 if (unlinkat(fd, de->d_name, 0) < 0) {
3025 if (ret == 0 && errno != ENOENT)
/* Returns non-zero if the file system type recorded in *s is tmpfs or
 * ramfs, judged by comparing f_type against TMPFS_MAGIC and RAMFS_MAGIC. */
3032 _pure_ static int is_temporary_fs(struct statfs *s) {
3035 return F_TYPE_EQUAL(s->f_type, TMPFS_MAGIC) ||
3036 F_TYPE_EQUAL(s->f_type, RAMFS_MAGIC);
/* Queries the file system behind fd with fstatfs() and returns the verdict
 * of is_temporary_fs() for it. */
3039 int is_fd_on_temporary_fs(int fd) {
/* NOTE(review): the handling of an fstatfs() failure is not visible here;
 * presumably a negative errno is returned -- confirm. */
3042 if (fstatfs(fd, &s) < 0)
3045 return is_temporary_fs(&s);
3048 int rm_rf_children(int fd, bool only_dirs, bool honour_sticky, struct stat *root_dev) {
3053 if (fstatfs(fd, &s) < 0) {
3058 /* We refuse to clean disk file systems with this call. This
3059 * is extra paranoia just to be sure we never ever remove
3061 if (!is_temporary_fs(&s)) {
3062 log_error("Attempted to remove disk file system, and we can't allow that.");
3067 return rm_rf_children_dangerous(fd, only_dirs, honour_sticky, root_dev);
3070 static int file_is_priv_sticky(const char *p) {
3075 if (lstat(p, &st) < 0)
3079 (st.st_uid == 0 || st.st_uid == getuid()) &&
3080 (st.st_mode & S_ISVTX);
3083 static int rm_rf_internal(const char *path, bool only_dirs, bool delete_root, bool honour_sticky, bool dangerous) {
3089 /* We refuse to clean the root file system with this
3090 * call. This is extra paranoia to never cause a really
3091 * seriously broken system. */
3092 if (path_equal(path, "/")) {
3093 log_error("Attempted to remove entire root file system, and we can't allow that.");
3097 fd = open(path, O_RDONLY|O_NONBLOCK|O_DIRECTORY|O_CLOEXEC|O_NOFOLLOW|O_NOATIME);
3100 if (errno != ENOTDIR && errno != ELOOP)
3104 if (statfs(path, &s) < 0)
3107 if (!is_temporary_fs(&s)) {
3108 log_error("Attempted to remove disk file system, and we can't allow that.");
3113 if (delete_root && !only_dirs)
3114 if (unlink(path) < 0 && errno != ENOENT)
3121 if (fstatfs(fd, &s) < 0) {
3126 if (!is_temporary_fs(&s)) {
3127 log_error("Attempted to remove disk file system, and we can't allow that.");
3133 r = rm_rf_children_dangerous(fd, only_dirs, honour_sticky, NULL);
3136 if (honour_sticky && file_is_priv_sticky(path) > 0)
3139 if (rmdir(path) < 0 && errno != ENOENT) {
/* Thin wrapper around rm_rf_internal() that passes false for its final
 * "dangerous" argument; all other arguments are forwarded unchanged. */
3148 int rm_rf(const char *path, bool only_dirs, bool delete_root, bool honour_sticky) {
3149 return rm_rf_internal(path, only_dirs, delete_root, honour_sticky, false);
/* Thin wrapper around rm_rf_internal() that passes true for its final
 * "dangerous" argument; all other arguments are forwarded unchanged. */
3152 int rm_rf_dangerous(const char *path, bool only_dirs, bool delete_root, bool honour_sticky) {
3153 return rm_rf_internal(path, only_dirs, delete_root, honour_sticky, true);
/* Applies an access mode and an owner to the file at path, in that order.
 *
 * mode: new access mode; MODE_INVALID skips the chmod() step.
 * uid, gid: new owner; chown() is skipped only if uid is UID_INVALID and
 *           gid is GID_INVALID at the same time. */
3156 int chmod_and_chown(const char *path, mode_t mode, uid_t uid, gid_t gid) {
3159 /* Under the assumption that we are running privileged we
3160 * first change the access mode and only then hand out
3161 * ownership to avoid a window where access is too open. */
3163 if (mode != MODE_INVALID)
3164 if (chmod(path, mode) < 0)
3167 if (uid != UID_INVALID || gid != GID_INVALID)
3168 if (chown(path, uid, gid) < 0)
/* File-descriptor variant of chmod_and_chown(): applies an access mode and
 * an owner to the file open at fd, in that order.
 *
 * mode: new access mode; MODE_INVALID skips the fchmod() step.
 * uid, gid: new owner; fchown() is skipped only if uid is UID_INVALID and
 *           gid is GID_INVALID at the same time. */
3174 int fchmod_and_fchown(int fd, mode_t mode, uid_t uid, gid_t gid) {
3177 /* Under the assumption that we are running privileged we
3178 * first change the access mode and only then hand out
3179 * ownership to avoid a window where access is too open. */
3181 if (mode != MODE_INVALID)
3182 if (fchmod(fd, mode) < 0)
3185 if (uid != UID_INVALID || gid != GID_INVALID)
3186 if (fchown(fd, uid, gid) < 0)
3192 cpu_set_t* cpu_set_malloc(unsigned *ncpus) {
3196 /* Allocates the cpuset in the right size */
3199 if (!(r = CPU_ALLOC(n)))
3202 if (sched_getaffinity(0, CPU_ALLOC_SIZE(n), r) >= 0) {
3203 CPU_ZERO_S(CPU_ALLOC_SIZE(n), r);
3213 if (errno != EINVAL)
3220 int status_vprintf(const char *status, bool ellipse, bool ephemeral, const char *format, va_list ap) {
3221 static const char status_indent[] = " "; /* "[" STATUS "] " */
3222 _cleanup_free_ char *s = NULL;
3223 _cleanup_close_ int fd = -1;
3224 struct iovec iovec[6] = {};
3226 static bool prev_ephemeral;
3230 /* This is independent of logging, as status messages are
3231 * optional and go exclusively to the console. */
3233 if (vasprintf(&s, format, ap) < 0)
3236 fd = open_terminal("/dev/console", O_WRONLY|O_NOCTTY|O_CLOEXEC);
3249 sl = status ? sizeof(status_indent)-1 : 0;
3255 e = ellipsize(s, emax, 50);
3263 IOVEC_SET_STRING(iovec[n++], "\r" ANSI_ERASE_TO_END_OF_LINE);
3264 prev_ephemeral = ephemeral;
3267 if (!isempty(status)) {
3268 IOVEC_SET_STRING(iovec[n++], "[");
3269 IOVEC_SET_STRING(iovec[n++], status);
3270 IOVEC_SET_STRING(iovec[n++], "] ");
3272 IOVEC_SET_STRING(iovec[n++], status_indent);
3275 IOVEC_SET_STRING(iovec[n++], s);
3277 IOVEC_SET_STRING(iovec[n++], "\n");
3279 if (writev(fd, iovec, n) < 0)
3285 int status_printf(const char *status, bool ellipse, bool ephemeral, const char *format, ...) {
3291 va_start(ap, format);
3292 r = status_vprintf(status, ellipse, ephemeral, format, ap);
3298 char *replace_env(const char *format, char **env) {
3305 const char *e, *word = format;
3310 for (e = format; *e; e ++) {
3321 k = strnappend(r, word, e-word-1);
3331 } else if (*e == '$') {
3332 k = strnappend(r, word, e-word);
3349 t = strempty(strv_env_get_n(env, word+2, e-word-2));
3351 k = strappend(r, t);
3365 k = strnappend(r, word, e-word);
3377 char **replace_env_argv(char **argv, char **env) {
3379 unsigned k = 0, l = 0;
3381 l = strv_length(argv);
3383 ret = new(char*, l+1);
3387 STRV_FOREACH(i, argv) {
3389 /* If $FOO appears as single word, replace it by the split up variable */
3390 if ((*i)[0] == '$' && (*i)[1] != '{') {
3395 e = strv_env_get(env, *i+1);
3399 r = strv_split_quoted(&m, e, true);
3411 w = realloc(ret, sizeof(char*) * (l+1));
3421 memcpy(ret + k, m, q * sizeof(char*));
3429 /* If ${FOO} appears as part of a word, replace it by the variable as-is */
3430 ret[k] = replace_env(*i, env);
3442 int fd_columns(int fd) {
3443 struct winsize ws = {};
3445 if (ioctl(fd, TIOCGWINSZ, &ws) < 0)
3454 unsigned columns(void) {
3458 if (_likely_(cached_columns > 0))
3459 return cached_columns;
3462 e = getenv("COLUMNS");
3464 (void) safe_atoi(e, &c);
3467 c = fd_columns(STDOUT_FILENO);
3473 return cached_columns;
3476 int fd_lines(int fd) {
3477 struct winsize ws = {};
3479 if (ioctl(fd, TIOCGWINSZ, &ws) < 0)
3488 unsigned lines(void) {
3492 if (_likely_(cached_lines > 0))
3493 return cached_lines;
3496 e = getenv("LINES");
3498 (void) safe_atoi(e, &l);
3501 l = fd_lines(STDOUT_FILENO);
3507 return cached_lines;
3510 /* intended to be used as a SIGWINCH sighandler */
3511 void columns_lines_cache_reset(int signum) {
3517 static int cached_on_tty = -1;
3519 if (_unlikely_(cached_on_tty < 0))
3520 cached_on_tty = isatty(STDOUT_FILENO) > 0;
3522 return cached_on_tty;
/* Checks whether two paths refer to the same file. Both paths are examined
 * with stat() (so symlinks are followed) and the result is non-zero when
 * device number and inode number both match. */
3525 int files_same(const char *filea, const char *fileb) {
3528 if (stat(filea, &a) < 0)
3531 if (stat(fileb, &b) < 0)
3534 return a.st_dev == b.st_dev &&
3535 a.st_ino == b.st_ino;
3538 int running_in_chroot(void) {
3541 ret = files_same("/proc/1/root", "/");
3548 static char *ascii_ellipsize_mem(const char *s, size_t old_length, size_t new_length, unsigned percent) {
3553 assert(percent <= 100);
3554 assert(new_length >= 3);
3556 if (old_length <= 3 || old_length <= new_length)
3557 return strndup(s, old_length);
3559 r = new0(char, new_length+1);
3563 x = (new_length * percent) / 100;
3565 if (x > new_length - 3)
3573 s + old_length - (new_length - x - 3),
3574 new_length - x - 3);
3579 char *ellipsize_mem(const char *s, size_t old_length, size_t new_length, unsigned percent) {
3583 unsigned k, len, len2;
3586 assert(percent <= 100);
3587 assert(new_length >= 3);
3589 /* if no multibyte characters use ascii_ellipsize_mem for speed */
3590 if (ascii_is_valid(s))
3591 return ascii_ellipsize_mem(s, old_length, new_length, percent);
3593 if (old_length <= 3 || old_length <= new_length)
3594 return strndup(s, old_length);
3596 x = (new_length * percent) / 100;
3598 if (x > new_length - 3)
3602 for (i = s; k < x && i < s + old_length; i = utf8_next_char(i)) {
3605 c = utf8_encoded_to_unichar(i);
3608 k += unichar_iswide(c) ? 2 : 1;
3611 if (k > x) /* last character was wide and went over quota */
3614 for (j = s + old_length; k < new_length && j > i; ) {
3617 j = utf8_prev_char(j);
3618 c = utf8_encoded_to_unichar(j);
3621 k += unichar_iswide(c) ? 2 : 1;
3625 /* we don't actually need to ellipsize */
3627 return memdup(s, old_length + 1);
3629 /* make space for ellipsis */
3630 j = utf8_next_char(j);
3633 len2 = s + old_length - j;
3634 e = new(char, len + 3 + len2 + 1);
3639 printf("old_length=%zu new_length=%zu x=%zu len=%u len2=%u k=%u\n",
3640 old_length, new_length, x, len, len2, k);
3644 e[len] = 0xe2; /* tri-dot ellipsis: … */
3648 memcpy(e + len + 3, j, len2 + 1);
/* Convenience wrapper for NUL-terminated strings: measures s with strlen()
 * and forwards to ellipsize_mem(), passing length as the new length and
 * percent unchanged. */
3653 char *ellipsize(const char *s, size_t length, unsigned percent) {
3654 return ellipsize_mem(s, strlen(s), length, percent);
3657 int touch_file(const char *path, bool parents, usec_t stamp, uid_t uid, gid_t gid, mode_t mode) {
3658 _cleanup_close_ int fd;
3664 mkdir_parents(path, 0755);
3666 fd = open(path, O_WRONLY|O_CREAT|O_CLOEXEC|O_NOCTTY, mode > 0 ? mode : 0644);
3671 r = fchmod(fd, mode);
3676 if (uid != UID_INVALID || gid != GID_INVALID) {
3677 r = fchown(fd, uid, gid);
3682 if (stamp != USEC_INFINITY) {
3683 struct timespec ts[2];
3685 timespec_store(&ts[0], stamp);
3687 r = futimens(fd, ts);
3689 r = futimens(fd, NULL);
/* Shorthand for touch_file() with parents=false, stamp=USEC_INFINITY,
 * uid=UID_INVALID, gid=GID_INVALID and mode=0. */
3696 int touch(const char *path) {
3697 return touch_file(path, false, USEC_INFINITY, UID_INVALID, GID_INVALID, 0);
3700 char *unquote(const char *s, const char* quotes) {
3704 /* This is rather stupid, simply removes the leading and
3705 * trailing quotes if there are any. Doesn't care about
3706 * escaping or anything. We should make this smarter one
3713 if (strchr(quotes, s[0]) && s[l-1] == s[0])
3714 return strndup(s+1, l-2);
3719 char *normalize_env_assignment(const char *s) {
3720 _cleanup_free_ char *value = NULL;
3724 eq = strchr(s, '=');
3734 memmove(r, t, strlen(t) + 1);
3739 name = strndupa(s, eq - s);
3740 p = strdupa(eq + 1);
3742 value = unquote(strstrip(p), QUOTES);
3746 return strjoin(strstrip(name), "=", value, NULL);
3749 int wait_for_terminate(pid_t pid, siginfo_t *status) {
3760 if (waitid(P_PID, pid, status, WEXITED) < 0) {
3774 * < 0 : wait_for_terminate() failed to get the state of the
3775 * process, the process was terminated by a signal, or
3776 * failed for an unknown reason.
3777 * >=0 : The process terminated normally, and its exit code is
3780 * That is, success is indicated by a return value of zero, and an
3781 * error is indicated by a non-zero value.
3783 * A warning is emitted if the process terminates abnormally, and
3784 * also if it returns non-zero while check_exit_code is true (with check_exit_code false that case is only logged at debug level).
/* Waits for process pid via wait_for_terminate() and logs how it ended;
 * name is only used to label the log messages. */
3786 int wait_for_terminate_and_warn(const char *name, pid_t pid, bool check_exit_code) {
3793 r = wait_for_terminate(pid, &status);
3795 return log_warning_errno(r, "Failed to wait for %s: %m", name);
/* Regular exit: the exit code is handed back to the caller as-is. */
3797 if (status.si_code == CLD_EXITED) {
3798 if (status.si_status != 0)
/* A non-zero exit code is a warning only when check_exit_code is set;
 * otherwise it is logged at debug level. */
3799 log_full(check_exit_code ? LOG_WARNING : LOG_DEBUG,
3800 "%s failed with error code %i.", name, status.si_status);
3802 log_debug("%s succeeded.", name);
3804 return status.si_status;
/* Killed by a signal, with or without a core dump. */
3805 } else if (status.si_code == CLD_KILLED ||
3806 status.si_code == CLD_DUMPED) {
3808 log_warning("%s terminated by signal %s.", name, signal_to_string(status.si_status));
3812 log_warning("%s failed due to unknown reason.", name);
3816 noreturn void freeze(void) {
3818 /* Make sure nobody waits for us on a socket anymore */
3819 close_all_fds(NULL, 0);
3827 bool null_or_empty(struct stat *st) {
3830 if (S_ISREG(st->st_mode) && st->st_size <= 0)
3833 if (S_ISCHR(st->st_mode) || S_ISBLK(st->st_mode))
/* Path-based front end for null_or_empty(): examines fn with stat() (so
 * symlinks are followed) and returns null_or_empty()'s verdict for it. */
3839 int null_or_empty_path(const char *fn) {
3844 if (stat(fn, &st) < 0)
3847 return null_or_empty(&st);
/* File-descriptor front end for null_or_empty(): examines fd with fstat()
 * and returns null_or_empty()'s verdict for it. */
3850 int null_or_empty_fd(int fd) {
3855 if (fstat(fd, &st) < 0)
3858 return null_or_empty(&st);
3861 DIR *xopendirat(int fd, const char *name, int flags) {
3865 assert(!(flags & O_CREAT));
3867 nfd = openat(fd, name, O_RDONLY|O_NONBLOCK|O_DIRECTORY|O_CLOEXEC|flags, 0);
3880 int signal_from_string_try_harder(const char *s) {
3884 signo = signal_from_string(s);
3886 if (startswith(s, "SIG"))
3887 return signal_from_string(s+3);
/* Builds the path "/dev/disk/by-<by>/<encoded tagvalue>" for a tag value.
 * The result is produced by strjoin(). */
3892 static char *tag_to_udev_node(const char *tagvalue, const char *by) {
3893 _cleanup_free_ char *t = NULL, *u = NULL;
/* Strip one pair of surrounding double or single quotes, if present. */
3896 u = unquote(tagvalue, "\"\'");
/* The output buffer is sized at four bytes per input byte plus the
 * terminating NUL. */
3900 enc_len = strlen(u) * 4 + 1;
3901 t = new(char, enc_len);
3905 if (encode_devnode_name(u, t, enc_len) < 0)
3908 return strjoin("/dev/disk/by-", by, "/", t, NULL);
/* Translates an fstab-style tag specification into a /dev/disk/by-* path.
 * The prefixes LABEL=, UUID=, PARTUUID= and PARTLABEL= are recognized; the
 * text after the prefix is handed to tag_to_udev_node() together with the
 * matching directory suffix ("label", "uuid", "partuuid", "partlabel").
 * NOTE(review): what is returned for strings without one of these prefixes
 * is not visible here -- confirm. */
3911 char *fstab_node_to_udev_node(const char *p) {
3914 if (startswith(p, "LABEL="))
3915 return tag_to_udev_node(p+6, "label");
3917 if (startswith(p, "UUID="))
3918 return tag_to_udev_node(p+5, "uuid");
3920 if (startswith(p, "PARTUUID="))
3921 return tag_to_udev_node(p+9, "partuuid");
3923 if (startswith(p, "PARTLABEL="))
3924 return tag_to_udev_node(p+10, "partlabel");
/* Returns true if vtnr_from_tty() yields a non-negative result for tty. */
3929 bool tty_is_vc(const char *tty) {
3932 return vtnr_from_tty(tty) >= 0;
3935 bool tty_is_console(const char *tty) {
3938 if (startswith(tty, "/dev/"))
3941 return streq(tty, "console");
3944 int vtnr_from_tty(const char *tty) {
3949 if (startswith(tty, "/dev/"))
3952 if (!startswith(tty, "tty") )
3955 if (tty[3] < '0' || tty[3] > '9')
3958 r = safe_atoi(tty+3, &i);
3962 if (i < 0 || i > 63)
3968 char *resolve_dev_console(char **active) {
3971 /* Resolve where /dev/console is pointing to, if /sys is actually ours
3972 * (i.e. not read-only-mounted which is a sign for container setups) */
3974 if (path_is_read_only_fs("/sys") > 0)
3977 if (read_one_line_file("/sys/class/tty/console/active", active) < 0)
3980 /* If multiple log outputs are configured the last one is what
3981 * /dev/console points to */
3982 tty = strrchr(*active, ' ');
3988 if (streq(tty, "tty0")) {
3991 /* Get the active VC (e.g. tty1) */
3992 if (read_one_line_file("/sys/class/tty/tty0/active", &tmp) >= 0) {
3994 tty = *active = tmp;
4001 bool tty_is_vc_resolve(const char *tty) {
4002 _cleanup_free_ char *active = NULL;
4006 if (startswith(tty, "/dev/"))
4009 if (streq(tty, "console")) {
4010 tty = resolve_dev_console(&active);
4015 return tty_is_vc(tty);
/* Returns a "TERM=..." assignment for tty: "TERM=linux" when
 * tty_is_vc_resolve() reports true for it, "TERM=vt220" otherwise. The
 * result is a string literal and must not be freed. */
4018 const char *default_term_for_tty(const char *tty) {
4021 return tty_is_vc_resolve(tty) ? "TERM=linux" : "TERM=vt220";
4024 bool dirent_is_file(const struct dirent *de) {
4027 if (hidden_file(de->d_name))
4030 if (de->d_type != DT_REG &&
4031 de->d_type != DT_LNK &&
4032 de->d_type != DT_UNKNOWN)
4038 bool dirent_is_file_with_suffix(const struct dirent *de, const char *suffix) {
4041 if (de->d_type != DT_REG &&
4042 de->d_type != DT_LNK &&
4043 de->d_type != DT_UNKNOWN)
4046 if (hidden_file_allow_backup(de->d_name))
4049 return endswith(de->d_name, suffix);
4052 static int do_execute(char **directories, usec_t timeout, char *argv[]) {
4053 _cleanup_hashmap_free_free_ Hashmap *pids = NULL;
4054 _cleanup_set_free_free_ Set *seen = NULL;
4057 /* We fork this all off from a child process so that we can
4058 * somewhat cleanly make use of SIGALRM to set a time limit */
4060 reset_all_signal_handlers();
4061 reset_signal_mask();
4063 assert_se(prctl(PR_SET_PDEATHSIG, SIGTERM) == 0);
4065 pids = hashmap_new(NULL);
4069 seen = set_new(&string_hash_ops);
4073 STRV_FOREACH(directory, directories) {
4074 _cleanup_closedir_ DIR *d;
4077 d = opendir(*directory);
4079 if (errno == ENOENT)
4082 return log_error_errno(errno, "Failed to open directory %s: %m", *directory);
4085 FOREACH_DIRENT(de, d, break) {
4086 _cleanup_free_ char *path = NULL;
4090 if (!dirent_is_file(de))
4093 if (set_contains(seen, de->d_name)) {
4094 log_debug("%1$s/%2$s skipped (%2$s was already seen).", *directory, de->d_name);
4098 r = set_put_strdup(seen, de->d_name);
4102 path = strjoin(*directory, "/", de->d_name, NULL);
4106 if (null_or_empty_path(path)) {
4107 log_debug("%s is empty (a mask).", path);
4110 log_debug("%s will be executed.", path);
4114 log_error_errno(errno, "Failed to fork: %m");
4116 } else if (pid == 0) {
4119 assert_se(prctl(PR_SET_PDEATHSIG, SIGTERM) == 0);
4129 return log_error_errno(errno, "Failed to execute %s: %m", path);
4132 log_debug("Spawned %s as " PID_FMT ".", path, pid);
4134 r = hashmap_put(pids, UINT_TO_PTR(pid), path);
4141 /* Abort execution of this process after the timeout. We simply
4142 * rely on SIGALRM as default action terminating the process,
4143 * and turn on alarm(). */
4145 if (timeout != USEC_INFINITY)
4146 alarm((timeout + USEC_PER_SEC - 1) / USEC_PER_SEC);
4148 while (!hashmap_isempty(pids)) {
4149 _cleanup_free_ char *path = NULL;
4152 pid = PTR_TO_UINT(hashmap_first_key(pids));
4155 path = hashmap_remove(pids, UINT_TO_PTR(pid));
4158 wait_for_terminate_and_warn(path, pid, true);
/* Forks a helper process that runs do_execute() on the given directories
 * and waits for that helper to finish. Nothing is returned; problems are
 * only logged. */
4164 void execute_directories(const char* const* directories, usec_t timeout, char *argv[]) {
4168 char **dirs = (char**) directories;
4170 assert(!strv_isempty(dirs));
/* The last path component of the first directory labels the helper in the
 * messages logged by wait_for_terminate_and_warn() below. */
4172 name = basename(dirs[0]);
4173 assert(!isempty(name));
4175 /* Executes all binaries in the directories in parallel and waits
4176 * for them to finish. Optionally a timeout is applied. If a file
4177 * with the same name exists in more than one directory, the
4178 * earliest one wins. */
4180 executor_pid = fork();
4181 if (executor_pid < 0) {
4182 log_error_errno(errno, "Failed to fork: %m");
4185 } else if (executor_pid == 0) {
/* Child: do the work, then leave via _exit() with EXIT_FAILURE if
 * do_execute() returned a negative value and EXIT_SUCCESS otherwise. */
4186 r = do_execute(dirs, timeout, argv);
4187 _exit(r < 0 ? EXIT_FAILURE : EXIT_SUCCESS);
4190 wait_for_terminate_and_warn(name, executor_pid, true);
4193 int kill_and_sigcont(pid_t pid, int sig) {
4196 r = kill(pid, sig) < 0 ? -errno : 0;
4204 bool nulstr_contains(const char*nulstr, const char *needle) {
4210 NULSTR_FOREACH(i, nulstr)
4211 if (streq(i, needle))
/* Returns true if /run/plymouth/pid exists, as tested with
 * access(F_OK). */
4217 bool plymouth_running(void) {
4218 return access("/run/plymouth/pid", F_OK) >= 0;
4221 char* strshorten(char *s, size_t l) {
4230 static bool hostname_valid_char(char c) {
4232 (c >= 'a' && c <= 'z') ||
4233 (c >= 'A' && c <= 'Z') ||
4234 (c >= '0' && c <= '9') ||
4240 bool hostname_is_valid(const char *s) {
4247 for (p = s, dot = true; *p; p++) {
4254 if (!hostname_valid_char(*p))
4264 if (p-s > HOST_NAME_MAX)
4270 char* hostname_cleanup(char *s, bool lowercase) {
4274 for (p = s, d = s, dot = true; *p; p++) {
4281 } else if (hostname_valid_char(*p)) {
4282 *(d++) = lowercase ? tolower(*p) : *p;
4293 strshorten(s, HOST_NAME_MAX);
4298 bool machine_name_is_valid(const char *s) {
4300 if (!hostname_is_valid(s))
4303 /* Machine names should be useful hostnames, but also be
4304 * useful in unit names, hence we enforce a stricter length
/* Checks, without blocking, whether a hang-up is pending on fd. Returns a
 * non-zero value if poll() reported POLLHUP for it. */
4313 int pipe_eof(int fd) {
4314 struct pollfd pollfd = {
4316 .events = POLLIN|POLLHUP,
/* A timeout of 0 makes poll() return immediately. */
4321 r = poll(&pollfd, 1, 0);
4328 return pollfd.revents & POLLHUP;
/* Waits with ppoll() on a single pollfd and returns the events it reported
 * (pollfd.revents). t is the timeout; USEC_INFINITY means wait without a
 * time limit. */
4331 int fd_wait_for_event(int fd, int event, usec_t t) {
4333 struct pollfd pollfd = {
/* ppoll() takes a NULL timespec to mean "no timeout". */
4341 r = ppoll(&pollfd, 1, t == USEC_INFINITY ? NULL : timespec_store(&ts, t), NULL);
4348 return pollfd.revents;
4351 int fopen_temporary(const char *path, FILE **_f, char **_temp_path) {
4360 r = tempfn_xxxxxx(path, &t);
4364 fd = mkostemp_safe(t, O_WRONLY|O_CLOEXEC);
4370 f = fdopen(fd, "we");
/* Issues the TIOCVHANGUP ioctl on the terminal open at fd. */
4383 int terminal_vhangup_fd(int fd) {
4386 if (ioctl(fd, TIOCVHANGUP) < 0)
/* Path-based variant of terminal_vhangup_fd(): opens the terminal called
 * name with open_terminal() and returns terminal_vhangup_fd()'s result for
 * the resulting descriptor. */
4392 int terminal_vhangup(const char *name) {
4393 _cleanup_close_ int fd;
/* O_NOCTTY: the terminal must not become our controlling terminal. */
4395 fd = open_terminal(name, O_RDWR|O_NOCTTY|O_CLOEXEC);
4399 return terminal_vhangup_fd(fd);
4402 int vt_disallocate(const char *name) {
4406 /* Deallocate the VT if possible. If not possible
4407 * (i.e. because it is the active one), at least clear it
4408 * entirely (including the scrollback buffer) */
4410 if (!startswith(name, "/dev/"))
4413 if (!tty_is_vc(name)) {
4414 /* So this is not a VT. I guess we cannot deallocate
4415 * it then. But let's at least clear the screen */
4417 fd = open_terminal(name, O_RDWR|O_NOCTTY|O_CLOEXEC);
4422 "\033[r" /* clear scrolling region */
4423 "\033[H" /* move home */
4424 "\033[2J", /* clear screen */
4431 if (!startswith(name, "/dev/tty"))
4434 r = safe_atou(name+8, &u);
4441 /* Try to deallocate */
4442 fd = open_terminal("/dev/tty0", O_RDWR|O_NOCTTY|O_CLOEXEC);
4446 r = ioctl(fd, VT_DISALLOCATE, u);
4455 /* Couldn't deallocate, so let's clear it fully with
4457 fd = open_terminal(name, O_RDWR|O_NOCTTY|O_CLOEXEC);
4462 "\033[r" /* clear scrolling region */
4463 "\033[H" /* move home */
4464 "\033[3J", /* clear screen including scrollback, requires Linux 2.6.40 */
4471 int symlink_atomic(const char *from, const char *to) {
4472 _cleanup_free_ char *t = NULL;
4478 r = tempfn_random(to, &t);
4482 if (symlink(from, t) < 0)
4485 if (rename(t, to) < 0) {
4493 int mknod_atomic(const char *path, mode_t mode, dev_t dev) {
4494 _cleanup_free_ char *t = NULL;
4499 r = tempfn_random(path, &t);
4503 if (mknod(t, mode, dev) < 0)
4506 if (rename(t, path) < 0) {
4514 int mkfifo_atomic(const char *path, mode_t mode) {
4515 _cleanup_free_ char *t = NULL;
4520 r = tempfn_random(path, &t);
4524 if (mkfifo(t, mode) < 0)
4527 if (rename(t, path) < 0) {
4535 bool display_is_local(const char *display) {
4539 display[0] == ':' &&
4540 display[1] >= '0' &&
4544 int socket_from_display(const char *display, char **path) {
4551 if (!display_is_local(display))
4554 k = strspn(display+1, "0123456789");
4556 f = new(char, strlen("/tmp/.X11-unix/X") + k + 1);
4560 c = stpcpy(f, "/tmp/.X11-unix/X");
4561 memcpy(c, display+1, k);
4570 const char **username,
4571 uid_t *uid, gid_t *gid,
4573 const char **shell) {
4581 /* We enforce some special rules for uid=0: in order to avoid
4582 * NSS lookups for root we hardcode its data. */
4584 if (streq(*username, "root") || streq(*username, "0")) {
4602 if (parse_uid(*username, &u) >= 0) {
4606 /* If there are multiple users with the same id, make
4607 * sure to leave $USER to the configured value instead
4608 * of the first occurrence in the database. However if
4609 * the uid was configured by a numeric uid, then let's
4610 * pick the real username from /etc/passwd. */
4612 *username = p->pw_name;
4615 p = getpwnam(*username);
4619 return errno > 0 ? -errno : -ESRCH;
4631 *shell = p->pw_shell;
4636 char* uid_to_name(uid_t uid) {
4641 return strdup("root");
4645 return strdup(p->pw_name);
4647 if (asprintf(&r, UID_FMT, uid) < 0)
4653 char* gid_to_name(gid_t gid) {
4658 return strdup("root");
4662 return strdup(p->gr_name);
4664 if (asprintf(&r, GID_FMT, gid) < 0)
4670 int get_group_creds(const char **groupname, gid_t *gid) {
4676 /* We enforce some special rules for gid=0: in order to avoid
4677 * NSS lookups for root we hardcode its data. */
4679 if (streq(*groupname, "root") || streq(*groupname, "0")) {
4680 *groupname = "root";
4688 if (parse_gid(*groupname, &id) >= 0) {
4693 *groupname = g->gr_name;
4696 g = getgrnam(*groupname);
4700 return errno > 0 ? -errno : -ESRCH;
4708 int in_gid(gid_t gid) {
4710 int ngroups_max, r, i;
4712 if (getgid() == gid)
4715 if (getegid() == gid)
4718 ngroups_max = sysconf(_SC_NGROUPS_MAX);
4719 assert(ngroups_max > 0);
4721 gids = alloca(sizeof(gid_t) * ngroups_max);
4723 r = getgroups(ngroups_max, gids);
4727 for (i = 0; i < r; i++)
4734 int in_group(const char *name) {
4738 r = get_group_creds(&name, &gid);
4745 int glob_exists(const char *path) {
4746 _cleanup_globfree_ glob_t g = {};
4752 k = glob(path, GLOB_NOSORT|GLOB_BRACE, NULL, &g);
4754 if (k == GLOB_NOMATCH)
4756 else if (k == GLOB_NOSPACE)
4759 return !strv_isempty(g.gl_pathv);
4761 return errno ? -errno : -EIO;
4764 int glob_extend(char ***strv, const char *path) {
4765 _cleanup_globfree_ glob_t g = {};
4770 k = glob(path, GLOB_NOSORT|GLOB_BRACE, NULL, &g);
4772 if (k == GLOB_NOMATCH)
4774 else if (k == GLOB_NOSPACE)
4776 else if (k != 0 || strv_isempty(g.gl_pathv))
4777 return errno ? -errno : -EIO;
4779 STRV_FOREACH(p, g.gl_pathv) {
4780 k = strv_extend(strv, *p);
4788 int dirent_ensure_type(DIR *d, struct dirent *de) {
4794 if (de->d_type != DT_UNKNOWN)
4797 if (fstatat(dirfd(d), de->d_name, &st, AT_SYMLINK_NOFOLLOW) < 0)
4801 S_ISREG(st.st_mode) ? DT_REG :
4802 S_ISDIR(st.st_mode) ? DT_DIR :
4803 S_ISLNK(st.st_mode) ? DT_LNK :
4804 S_ISFIFO(st.st_mode) ? DT_FIFO :
4805 S_ISSOCK(st.st_mode) ? DT_SOCK :
4806 S_ISCHR(st.st_mode) ? DT_CHR :
4807 S_ISBLK(st.st_mode) ? DT_BLK :
4813 int get_files_in_directory(const char *path, char ***list) {
4814 _cleanup_closedir_ DIR *d = NULL;
4815 size_t bufsize = 0, n = 0;
4816 _cleanup_strv_free_ char **l = NULL;
4820 /* Returns all files in a directory in *list, and the number
4821 * of files as return value. If list is NULL returns only the
4833 if (!de && errno != 0)
4838 dirent_ensure_type(d, de);
4840 if (!dirent_is_file(de))
4844 /* one extra slot is needed for the terminating NULL */
4845 if (!GREEDY_REALLOC(l, bufsize, n + 2))
4848 l[n] = strdup(de->d_name);
4859 l = NULL; /* avoid freeing */
4865 char *strjoin(const char *x, ...) {
4879 t = va_arg(ap, const char *);
4884 if (n > ((size_t) -1) - l) {
4908 t = va_arg(ap, const char *);
/* Determines whether the calling thread is the main thread by comparing
 * getpid() with gettid(). */
4922 bool is_main_thread(void) {
/* Per-thread cache: 0 = not determined yet, 1 = PID equals TID,
 * -1 = PID differs from TID. */
4923 static thread_local int cached = 0;
4925 if (_unlikely_(cached == 0))
4926 cached = getpid() == gettid() ? 1 : -1;
4931 int block_get_whole_disk(dev_t d, dev_t *ret) {
4938 /* If it has a queue this is good enough for us */
4939 if (asprintf(&p, "/sys/dev/block/%u:%u/queue", major(d), minor(d)) < 0)
4942 r = access(p, F_OK);
4950 /* If it is a partition find the originating device */
4951 if (asprintf(&p, "/sys/dev/block/%u:%u/partition", major(d), minor(d)) < 0)
4954 r = access(p, F_OK);
4960 /* Get parent dev_t */
4961 if (asprintf(&p, "/sys/dev/block/%u:%u/../dev", major(d), minor(d)) < 0)
4964 r = read_one_line_file(p, &s);
4970 r = sscanf(s, "%u:%u", &m, &n);
4976 /* Only return this if it is really good enough for us. */
4977 if (asprintf(&p, "/sys/dev/block/%u:%u/queue", m, n) < 0)
4980 r = access(p, F_OK);
4984 *ret = makedev(m, n);
4991 static const char *const ioprio_class_table[] = {
4992 [IOPRIO_CLASS_NONE] = "none",
4993 [IOPRIO_CLASS_RT] = "realtime",
4994 [IOPRIO_CLASS_BE] = "best-effort",
4995 [IOPRIO_CLASS_IDLE] = "idle"
4998 DEFINE_STRING_TABLE_LOOKUP_WITH_FALLBACK(ioprio_class, int, INT_MAX);
5000 static const char *const sigchld_code_table[] = {
5001 [CLD_EXITED] = "exited",
5002 [CLD_KILLED] = "killed",
5003 [CLD_DUMPED] = "dumped",
5004 [CLD_TRAPPED] = "trapped",
5005 [CLD_STOPPED] = "stopped",
5006 [CLD_CONTINUED] = "continued",
5009 DEFINE_STRING_TABLE_LOOKUP(sigchld_code, int);
/* Names of the syslog facilities. The table is indexed by LOG_FAC(), i.e. by
 * the facility number with the shift removed, and has LOG_NFACILITIES slots.
 * The lookup helpers are generated with LOG_FAC(~0) as the fallback bound. */
5011 static const char *const log_facility_unshifted_table[LOG_NFACILITIES] = {
5012 [LOG_FAC(LOG_KERN)] = "kern",
5013 [LOG_FAC(LOG_USER)] = "user",
5014 [LOG_FAC(LOG_MAIL)] = "mail",
5015 [LOG_FAC(LOG_DAEMON)] = "daemon",
5016 [LOG_FAC(LOG_AUTH)] = "auth",
5017 [LOG_FAC(LOG_SYSLOG)] = "syslog",
5018 [LOG_FAC(LOG_LPR)] = "lpr",
5019 [LOG_FAC(LOG_NEWS)] = "news",
5020 [LOG_FAC(LOG_UUCP)] = "uucp",
5021 [LOG_FAC(LOG_CRON)] = "cron",
5022 [LOG_FAC(LOG_AUTHPRIV)] = "authpriv",
5023 [LOG_FAC(LOG_FTP)] = "ftp",
5024 [LOG_FAC(LOG_LOCAL0)] = "local0",
5025 [LOG_FAC(LOG_LOCAL1)] = "local1",
5026 [LOG_FAC(LOG_LOCAL2)] = "local2",
5027 [LOG_FAC(LOG_LOCAL3)] = "local3",
5028 [LOG_FAC(LOG_LOCAL4)] = "local4",
5029 [LOG_FAC(LOG_LOCAL5)] = "local5",
5030 [LOG_FAC(LOG_LOCAL6)] = "local6",
5031 [LOG_FAC(LOG_LOCAL7)] = "local7"
5034 DEFINE_STRING_TABLE_LOOKUP_WITH_FALLBACK(log_facility_unshifted, int, LOG_FAC(~0));
/* Names of the syslog priority levels, indexed by the LOG_* level constants.
 * The lookup helpers are generated with LOG_DEBUG as the fallback bound. */
5036 static const char *const log_level_table[] = {
5037 [LOG_EMERG] = "emerg",
5038 [LOG_ALERT] = "alert",
5039 [LOG_CRIT] = "crit",
5041 [LOG_WARNING] = "warning",
5042 [LOG_NOTICE] = "notice",
5043 [LOG_INFO] = "info",
5044 [LOG_DEBUG] = "debug"
5047 DEFINE_STRING_TABLE_LOOKUP_WITH_FALLBACK(log_level, int, LOG_DEBUG);
/* Names of the SCHED_* CPU scheduling policies, indexed by policy constant,
 * plus the generated string lookup helpers (fallback bound INT_MAX). */
5049 static const char* const sched_policy_table[] = {
5050 [SCHED_OTHER] = "other",
5051 [SCHED_BATCH] = "batch",
5052 [SCHED_IDLE] = "idle",
5053 [SCHED_FIFO] = "fifo",
5057 DEFINE_STRING_TABLE_LOOKUP_WITH_FALLBACK(sched_policy, int, INT_MAX);
/* Maps each RLIMIT_* resource to its "Limit..." name. The table has
 * _RLIMIT_MAX slots; string lookup helpers are generated for the "rlimit"
 * prefix. */
5059 static const char* const rlimit_table[_RLIMIT_MAX] = {
5060 [RLIMIT_CPU] = "LimitCPU",
5061 [RLIMIT_FSIZE] = "LimitFSIZE",
5062 [RLIMIT_DATA] = "LimitDATA",
5063 [RLIMIT_STACK] = "LimitSTACK",
5064 [RLIMIT_CORE] = "LimitCORE",
5065 [RLIMIT_RSS] = "LimitRSS",
5066 [RLIMIT_NOFILE] = "LimitNOFILE",
5067 [RLIMIT_AS] = "LimitAS",
5068 [RLIMIT_NPROC] = "LimitNPROC",
5069 [RLIMIT_MEMLOCK] = "LimitMEMLOCK",
5070 [RLIMIT_LOCKS] = "LimitLOCKS",
5071 [RLIMIT_SIGPENDING] = "LimitSIGPENDING",
5072 [RLIMIT_MSGQUEUE] = "LimitMSGQUEUE",
5073 [RLIMIT_NICE] = "LimitNICE",
5074 [RLIMIT_RTPRIO] = "LimitRTPRIO",
5075 [RLIMIT_RTTIME] = "LimitRTTIME"
5078 DEFINE_STRING_TABLE_LOOKUP(rlimit, int);
/* Names of the IPTOS_* type-of-service values. The table is sparse, indexed
 * by the IPTOS_* constants themselves; lookup helpers are generated with
 * 0xff as the fallback bound. */
5080 static const char* const ip_tos_table[] = {
5081 [IPTOS_LOWDELAY] = "low-delay",
5082 [IPTOS_THROUGHPUT] = "throughput",
5083 [IPTOS_RELIABILITY] = "reliability",
5084 [IPTOS_LOWCOST] = "low-cost",
5087 DEFINE_STRING_TABLE_LOOKUP_WITH_FALLBACK(ip_tos, int, 0xff);
/* Signal names without the "SIG" prefix, indexed by signal number. The
 * file-private lookup helpers __signal_to_string()/__signal_from_string()
 * used further down are generated from this table. */
5089 static const char *const __signal_table[] = {
5106 [SIGSTKFLT] = "STKFLT", /* Linux on SPARC doesn't know SIGSTKFLT */
5117 [SIGVTALRM] = "VTALRM",
5119 [SIGWINCH] = "WINCH",
5125 DEFINE_PRIVATE_STRING_TABLE_LOOKUP(__signal, int);
/* Formats a signal number as a string: looks the number up via
 * __signal_to_string(), formats real-time signals in SIGRTMIN..SIGRTMAX as
 * "RTMIN+<offset>", and anything else as a plain decimal number. The
 * formatted forms are written into a static thread-local buffer, so they are
 * overwritten by the next call on the same thread. */
5127 const char *signal_to_string(int signo) {
5128 static thread_local char buf[sizeof("RTMIN+")-1 + DECIMAL_STR_MAX(int) + 1];
5131 name = __signal_to_string(signo);
5135 if (signo >= SIGRTMIN && signo <= SIGRTMAX)
5136 snprintf(buf, sizeof(buf), "RTMIN+%d", signo - SIGRTMIN);
5138 snprintf(buf, sizeof(buf), "%d", signo);
/* Parses a signal specification: tries the name table through
 * __signal_from_string() first and also recognizes an "RTMIN+" prefix. A
 * number parsed with safe_atou() is combined with `offset` and only
 * considered when the result lies strictly between 0 and _NSIG. */
5143 int signal_from_string(const char *s) {
5148 signo = __signal_from_string(s);
5152 if (startswith(s, "RTMIN+")) {
5156 if (safe_atou(s, &u) >= 0) {
5157 signo = (int) u + offset;
5158 if (signo > 0 && signo < _NSIG)
/* Reports whether a kexec kernel is loaded, based on the single line read
 * from /sys/kernel/kexec_loaded. The result defaults to false, which is kept
 * when the file cannot be read. */
5164 bool kexec_loaded(void) {
5165 bool loaded = false;
5168 if (read_one_line_file("/sys/kernel/kexec_loaded", &s) >= 0) {
/* Translates the access mode part (flags & O_ACCMODE) of open() flags into
 * the corresponding PROT_* memory protection bits, e.g.
 * PROT_READ|PROT_WRITE. */
5176 int prot_from_flags(int flags) {
5178 switch (flags & O_ACCMODE) {
5187 return PROT_READ|PROT_WRITE;
/* Formats the byte count t into buf (of size l) as a human-readable string
 * with binary (1024-based) units and one fractional digit, e.g. "1.5K" or
 * "4.0E"; values below 1024 are printed as "<n>B". Returns buf, or NULL if
 * t is (off_t) -1. The output is always NUL-terminated when l > 0. */
char *format_bytes(char *buf, size_t l, off_t t) {
        static const struct {
                const char *suffix;
                off_t factor;
        } table[] = {
                { "E", 1024ULL*1024ULL*1024ULL*1024ULL*1024ULL*1024ULL },
                { "P", 1024ULL*1024ULL*1024ULL*1024ULL*1024ULL },
                { "T", 1024ULL*1024ULL*1024ULL*1024ULL },
                { "G", 1024ULL*1024ULL*1024ULL },
                { "M", 1024ULL*1024ULL },
                { "K", 1024ULL },
        };
        size_t i;

        if (t == (off_t) -1)
                return NULL;

        for (i = 0; i < sizeof(table) / sizeof(table[0]); i++) {

                if (t >= table[i].factor) {
                        /* Derive the fractional digit from the remainder:
                         * t*10 wraps around 64 bits for values in the
                         * exabyte range and would yield a bogus digit. */
                        snprintf(buf, l,
                                 "%llu.%llu%s",
                                 (unsigned long long) (t / table[i].factor),
                                 (unsigned long long) (((t % table[i].factor) * 10ULL) / table[i].factor),
                                 table[i].suffix);

                        goto finish;
                }
        }

        snprintf(buf, l, "%lluB", (unsigned long long) t);

finish:
        /* Never index before the buffer if the caller passed l == 0 */
        if (l > 0)
                buf[l-1] = 0;

        return buf;
}
/* NOTE(review): only the signature survives in this excerpt. Judging by name
 * and parameters this presumably returns a newly allocated copy of the l
 * bytes at p - confirm against the body. */
5233 void* memdup(const void *p, size_t l) {
/* Tries to raise the send buffer size of socket fd to n. The current
 * SO_SNDBUF value is queried first and compared against n*2. Setting the new
 * size is attempted with SO_SNDBUFFORCE (which ignores the kernel limit if we
 * have the privileges) and falls back to plain SO_SNDBUF. */
5246 int fd_inc_sndbuf(int fd, size_t n) {
5248 socklen_t l = sizeof(value);
5250 r = getsockopt(fd, SOL_SOCKET, SO_SNDBUF, &value, &l);
5251 if (r >= 0 && l == sizeof(value) && (size_t) value >= n*2)
5254 /* If we have the privileges we will ignore the kernel limit. */
5257 if (setsockopt(fd, SOL_SOCKET, SO_SNDBUFFORCE, &value, sizeof(value)) < 0)
5258 if (setsockopt(fd, SOL_SOCKET, SO_SNDBUF, &value, sizeof(value)) < 0)
/* Tries to raise the receive buffer size of socket fd to n. The current
 * SO_RCVBUF value is queried first and compared against n*2. Setting the new
 * size is attempted with SO_RCVBUFFORCE (which ignores the kernel limit if we
 * have the privileges) and falls back to plain SO_RCVBUF. */
5264 int fd_inc_rcvbuf(int fd, size_t n) {
5266 socklen_t l = sizeof(value);
5268 r = getsockopt(fd, SOL_SOCKET, SO_RCVBUF, &value, &l);
5269 if (r >= 0 && l == sizeof(value) && (size_t) value >= n*2)
5272 /* If we have the privileges we will ignore the kernel limit. */
5275 if (setsockopt(fd, SOL_SOCKET, SO_RCVBUFFORCE, &value, sizeof(value)) < 0)
5276 if (setsockopt(fd, SOL_SOCKET, SO_RCVBUF, &value, sizeof(value)) < 0)
/* Spawns a helper ("agent") process running `path` with the variadic,
 * NULL-terminated argument list. All signals are blocked around the fork and
 * the previous mask is restored in the parent. The child arranges for SIGTERM
 * on parent death, resets signal handlers and mask, exits if the parent is
 * already gone, closes all fds except those listed in except[], and reopens
 * /dev/tty for stdout/stderr when either is not a tty. Every failure in the
 * child ends in _exit(EXIT_FAILURE). */
5281 int fork_agent(pid_t *pid, const int except[], unsigned n_except, const char *path, ...) {
5282 bool stdout_is_tty, stderr_is_tty;
5283 pid_t parent_pid, agent_pid;
5284 sigset_t ss, saved_ss;
5292 /* Spawns a temporary TTY agent, making sure it goes away when
5295 parent_pid = getpid();
5297 /* First we temporarily block all signals, so that the new
5298 * child has them blocked initially. This way, we can be sure
5299 * that SIGTERMs are not lost we might send to the agent. */
5300 assert_se(sigfillset(&ss) >= 0);
5301 assert_se(sigprocmask(SIG_SETMASK, &ss, &saved_ss) >= 0);
5304 if (agent_pid < 0) {
5305 assert_se(sigprocmask(SIG_SETMASK, &saved_ss, NULL) >= 0);
5309 if (agent_pid != 0) {
5310 assert_se(sigprocmask(SIG_SETMASK, &saved_ss, NULL) >= 0);
5317 * Make sure the agent goes away when the parent dies */
5318 if (prctl(PR_SET_PDEATHSIG, SIGTERM) < 0)
5319 _exit(EXIT_FAILURE);
5321 /* Make sure we actually can kill the agent, if we need to, in
5322 * case somebody invoked us from a shell script that trapped
5323 * SIGTERM or so... */
5324 reset_all_signal_handlers();
5325 reset_signal_mask();
5327 /* Check whether our parent died before we were able
5328 * to set the death signal and unblock the signals */
5329 if (getppid() != parent_pid)
5330 _exit(EXIT_SUCCESS);
5332 /* Don't leak fds to the agent */
5333 close_all_fds(except, n_except);
5335 stdout_is_tty = isatty(STDOUT_FILENO);
5336 stderr_is_tty = isatty(STDERR_FILENO);
5338 if (!stdout_is_tty || !stderr_is_tty) {
5341 /* Detach from stdout/stderr. and reopen
5342 * /dev/tty for them. This is important to
5343 * ensure that when systemctl is started via
5344 * popen() or a similar call that expects to
5345 * read EOF we actually do generate EOF and
5346 * not delay this indefinitely because we
5347 * keep an unused copy of stdin around. */
5348 fd = open("/dev/tty", O_WRONLY);
5350 log_error_errno(errno, "Failed to open /dev/tty: %m");
5351 _exit(EXIT_FAILURE);
5355 dup2(fd, STDOUT_FILENO);
5358 dup2(fd, STDERR_FILENO);
5364 /* Count arguments */
5366 for (n = 0; va_arg(ap, char*); n++)
5371 l = alloca(sizeof(char *) * (n + 1));
5373 /* Fill in arguments */
5375 for (i = 0; i <= n; i++)
5376 l[i] = va_arg(ap, char*);
5380 _exit(EXIT_FAILURE);
/* Sets a resource limit, falling back to the closest permitted value: if
 * setrlimit() with the requested values fails, both the soft and the hard
 * limit are clamped to the current hard limit (as reported by getrlimit())
 * and setrlimit() is retried with the clamped values. */
5383 int setrlimit_closest(int resource, const struct rlimit *rlim) {
5384 struct rlimit highest, fixed;
5388 if (setrlimit(resource, rlim) >= 0)
5394 /* So we failed to set the desired setrlimit, then let's try
5395 * to get as close as we can */
5396 assert_se(getrlimit(resource, &highest) == 0);
5398 fixed.rlim_cur = MIN(rlim->rlim_cur, highest.rlim_max);
5399 fixed.rlim_max = MIN(rlim->rlim_max, highest.rlim_max);
5401 if (setrlimit(resource, &fixed) < 0)
/* Looks up the environment variable `field` of process `pid` by scanning the
 * process's procfs "environ" file. Entries are collected into a LINE_MAX
 * sized buffer; an entry matches when it starts with `field` immediately
 * followed by '=', in which case the text after the '=' is strdup()ed. */
5407 int getenv_for_pid(pid_t pid, const char *field, char **_value) {
5408 _cleanup_fclose_ FILE *f = NULL;
5419 path = procfs_file_alloca(pid, "environ");
5421 f = fopen(path, "re");
5429 char line[LINE_MAX];
5432 for (i = 0; i < sizeof(line)-1; i++) {
5436 if (_unlikely_(c == EOF)) {
5446 if (memcmp(line, field, l) == 0 && line[l] == '=') {
5447 value = strdup(line + l + 1);
/* Checks whether url looks like an HTTP(S) URL: it is matched against the
 * "http://" and "https://" prefixes, and the remainder after the prefix has
 * to pass ascii_is_valid(). */
5461 bool http_url_is_valid(const char *url) {
5467 p = startswith(url, "http://");
5469 p = startswith(url, "https://");
5476 return ascii_is_valid(p);
/* Checks whether url is acceptable as a documentation reference: anything
 * http_url_is_valid() accepts, or a "file:/", "info:" or "man:" URL whose
 * remainder after the prefix passes ascii_is_valid(). */
5479 bool documentation_url_is_valid(const char *url) {
5485 if (http_url_is_valid(url))
5488 p = startswith(url, "file:/");
5490 p = startswith(url, "info:");
5492 p = startswith(url, "man:");
5497 return ascii_is_valid(p);
/* Reports whether we are running inside an initrd. The answer is computed
 * from the two checks described below and stored in the static `saved`
 * (-1 = not determined yet). */
5500 bool in_initrd(void) {
5501 static int saved = -1;
5507 /* We make two checks here:
5509 * 1. the flag file /etc/initrd-release must exist
5510 * 2. the root file system must be a memory file system
5512 * The second check is extra paranoia, since misdetecting an
5513 * initrd can have bad consequences due to the initrd
5514 * being emptied when transitioning to the main systemd.
5517 saved = access("/etc/initrd-release", F_OK) >= 0 &&
5518 statfs("/", &s) >= 0 &&
5519 is_temporary_fs(&s);
/* Plays a short warning tone sequence through /dev/console using the
 * KIOCSOUND ioctl: three tones of 125ms each (divisors 1193180/440,
 * 1193180/220, 1193180/220), then KIOCSOUND with 0. The usleep() calls make
 * this block the caller for the whole duration. */
5524 void warn_melody(void) {
5525 _cleanup_close_ int fd = -1;
5527 fd = open("/dev/console", O_WRONLY|O_CLOEXEC|O_NOCTTY);
5531 /* Yeah, this is synchronous. Kinda sucks. But well... */
5533 ioctl(fd, KIOCSOUND, (int)(1193180/440));
5534 usleep(125*USEC_PER_MSEC);
5536 ioctl(fd, KIOCSOUND, (int)(1193180/220));
5537 usleep(125*USEC_PER_MSEC);
5539 ioctl(fd, KIOCSOUND, (int)(1193180/220));
5540 usleep(125*USEC_PER_MSEC);
5542 ioctl(fd, KIOCSOUND, 0);
/* Acquires /dev/console via acquire_terminal() (waiting without timeout,
 * USEC_INFINITY) and duplicates it onto the standard streams. Both failure
 * paths log the error and return it through log_error_errno(). */
5545 int make_console_stdio(void) {
5548 /* Make /dev/console the controlling terminal and stdin/stdout/stderr */
5550 fd = acquire_terminal("/dev/console", false, true, true, USEC_INFINITY);
5552 return log_error_errno(fd, "Failed to acquire terminal: %m");
5556 return log_error_errno(r, "Failed to duplicate terminal fd: %m");
/* Determines the home directory of the calling user, in this order: an
 * absolute $HOME (read with secure_getenv()), the hardcoded "/root" for root,
 * and finally the pw_dir field of the user database entry, which must be an
 * absolute path. A failed database lookup yields -errno, or -ESRCH if errno
 * is not set. */
5561 int get_home_dir(char **_h) {
5569 /* Take the user specified one */
5570 e = secure_getenv("HOME");
5571 if (e && path_is_absolute(e)) {
5580 /* Hardcode home directory for root to avoid NSS */
5583 h = strdup("/root");
5591 /* Check the database... */
5595 return errno > 0 ? -errno : -ESRCH;
5597 if (!path_is_absolute(p->pw_dir))
5600 h = strdup(p->pw_dir);
/* Determines the shell of the calling user, in this order: $SHELL, the
 * hardcoded "/bin/sh" for root, and finally the pw_shell field of the user
 * database entry, which must be an absolute path. A failed database lookup
 * yields -errno, or -ESRCH if errno is not set. */
5608 int get_shell(char **_s) {
5616 /* Take the user specified one */
5617 e = getenv("SHELL");
5627 /* Hardcode shell for root to avoid NSS */
5630 s = strdup("/bin/sh");
5638 /* Check the database... */
5642 return errno > 0 ? -errno : -ESRCH;
5644 if (!path_is_absolute(p->pw_shell))
5647 s = strdup(p->pw_shell);
/* Validates a single file name; the one check visible here rejects names
 * longer than FILENAME_MAX.
 * NOTE(review): on glibc FILENAME_MAX equals PATH_MAX (4096), while a single
 * path component is limited to NAME_MAX (255) - confirm which limit is
 * intended here. */
5655 bool filename_is_valid(const char *p) {
5669 if (strlen(p) > FILENAME_MAX)
/* Checks whether a string is safe to embed verbatim, e.g. in quoted output.
 * Returns false for NULL, for any ASCII control character (0x01..0x1F), for
 * backslash, double quote and single quote, and for DEL (0x7F). Returns true
 * otherwise; bytes with the high bit set are accepted. */
bool string_is_safe(const char *p) {
        const char *t;

        if (!p)
                return false;

        for (t = p; *t; t++) {
                if (*t > 0 && *t < ' ')
                        return false;

                /* This must be "\x7f", not "\0x7f": the latter is a NUL
                 * byte followed by the letters "x7f", which ends the set
                 * early and lets DEL slip through. */
                if (strchr("\\\"\'\x7f", *t))
                        return false;
        }

        return true;
}
/* Scans p byte by byte. Characters contained in the optional `ok` string are
 * skipped; for the remaining ones the visible check tests for ASCII control
 * characters in the range 0x01..0x1F. */
5693 * Check if a string contains control characters. If 'ok' is non-NULL
5694 * it may be a string containing additional CCs to be considered OK.
5696 bool string_has_cc(const char *p, const char *ok) {
5701 for (t = p; *t; t++) {
5702 if (ok && strchr(ok, *t))
5705 if (*t > 0 && *t < ' ')
5715 bool path_is_safe(const char *p) {
5720 if (streq(p, "..") || startswith(p, "../") || endswith(p, "/..") || strstr(p, "/../"))
5723 if (strlen(p) > PATH_MAX)
5726 /* The following two checks are not really dangerous, but hey, they still are confusing */
5727 if (streq(p, ".") || startswith(p, "./") || endswith(p, "/.") || strstr(p, "/./"))
5730 if (strstr(p, "//"))
/* Search over the array `base` of `nmemb` elements of `size` bytes each,
 * using a comparison callback that receives the extra user pointer `arg`.
 * The element at index idx is compared against `key`, and the result of the
 * comparison steers the search. */
5736 /* hey glibc, APIs with callbacks without a user pointer are so useless */
5737 void *xbsearch_r(const void *key, const void *base, size_t nmemb, size_t size,
5738 int (*compar) (const void *, const void *, void *), void *arg) {
5747 p = (void *)(((const char *) base) + (idx * size));
5748 comparison = compar(key, p, arg);
5751 else if (comparison > 0)
/* Reports whether the process locale uses UTF-8. The answer is cached in the
 * static `cached_answer` (-1 = not determined yet). The visible branches set
 * the answer to true when setlocale(LC_ALL, "") fails and when the codeset
 * reported by nl_langinfo(CODESET) is "UTF-8"; the LC_CTYPE=="C" case is
 * handled as described in the comments below. */
5759 bool is_locale_utf8(void) {
5761 static int cached_answer = -1;
5763 if (cached_answer >= 0)
5766 if (!setlocale(LC_ALL, "")) {
5767 cached_answer = true;
5771 set = nl_langinfo(CODESET);
5773 cached_answer = true;
5777 if (streq(set, "UTF-8")) {
5778 cached_answer = true;
5782 /* For LC_CTYPE=="C" return true, because CTYPE is effectively
5783 * unset and everything can do UTF-8 nowadays. */
5784 set = setlocale(LC_CTYPE, NULL);
5786 cached_answer = true;
5790 /* Check result, but ignore the result if C was set
5794 !getenv("LC_ALL") &&
5795 !getenv("LC_CTYPE") &&
5799 return (bool) cached_answer;
/* Returns the string used to draw the special character `ch`. The table has
 * two rows: index 0 holds the UTF-8 encoded glyphs, index 1 the ASCII
 * fallback. The row is selected with !is_locale_utf8(), i.e. the UTF-8
 * glyphs are used when the locale is UTF-8. */
5802 const char *draw_special_char(DrawSpecialChar ch) {
5803 static const char *draw_table[2][_DRAW_SPECIAL_CHAR_MAX] = {
5806 [DRAW_TREE_VERTICAL] = "\342\224\202 ", /* │ */
5807 [DRAW_TREE_BRANCH] = "\342\224\234\342\224\200", /* ├─ */
5808 [DRAW_TREE_RIGHT] = "\342\224\224\342\224\200", /* └─ */
5809 [DRAW_TREE_SPACE] = " ", /* */
5810 [DRAW_TRIANGULAR_BULLET] = "\342\200\243", /* ‣ */
5811 [DRAW_BLACK_CIRCLE] = "\342\227\217", /* ● */
5812 [DRAW_ARROW] = "\342\206\222", /* → */
5813 [DRAW_DASH] = "\342\200\223", /* – */
5816 /* ASCII fallback */ {
5817 [DRAW_TREE_VERTICAL] = "| ",
5818 [DRAW_TREE_BRANCH] = "|-",
5819 [DRAW_TREE_RIGHT] = "`-",
5820 [DRAW_TREE_SPACE] = " ",
5821 [DRAW_TRIANGULAR_BULLET] = ">",
5822 [DRAW_BLACK_CIRCLE] = "*",
5823 [DRAW_ARROW] = "->",
5828 return draw_table[!is_locale_utf8()][ch];
/* Builds a copy of `text` in which occurrences of old_string are replaced by
 * new_string. At each position that starts with old_string the result buffer
 * is resized with realloc() to l - old_len + new_len + 1 bytes and new_string
 * is appended with stpcpy(). */
5831 char *strreplace(const char *text, const char *old_string, const char *new_string) {
5834 size_t l, old_len, new_len;
5840 old_len = strlen(old_string);
5841 new_len = strlen(new_string);
5854 if (!startswith(f, old_string)) {
5860 nl = l - old_len + new_len;
5861 a = realloc(r, nl + 1);
5869 t = stpcpy(t, new_string);
/* Filters the buffer *ibuf (length *_isz, or strlen(*ibuf) when _isz is
 * NULL) into a memory stream, stripping ANSI color sequences and expanding
 * TABs. A small state machine (STATE_OTHER -> STATE_ESCAPE on ESC ->
 * STATE_BRACKET on '[') tracks escape sequences; in bracket state only
 * digits, ';' and the terminating 'm' are accepted. The loop deliberately
 * runs one position past the end so that end-of-text is seen by every
 * state. */
5881 char *strip_tab_ansi(char **ibuf, size_t *_isz) {
5882 const char *i, *begin = NULL;
5887 } state = STATE_OTHER;
5889 size_t osz = 0, isz;
5895 /* Strips ANSI color and replaces TABs by 8 spaces */
5897 isz = _isz ? *_isz : strlen(*ibuf);
5899 f = open_memstream(&obuf, &osz);
5903 for (i = *ibuf; i < *ibuf + isz + 1; i++) {
5908 if (i >= *ibuf + isz) /* EOT */
5910 else if (*i == '\x1B')
5911 state = STATE_ESCAPE;
5912 else if (*i == '\t')
5919 if (i >= *ibuf + isz) { /* EOT */
5922 } else if (*i == '[') {
5923 state = STATE_BRACKET;
5928 state = STATE_OTHER;
5935 if (i >= *ibuf + isz || /* EOT */
5936 (!(*i >= '0' && *i <= '9') && *i != ';' && *i != 'm')) {
5939 state = STATE_OTHER;
5941 } else if (*i == 'm')
5942 state = STATE_OTHER;
/* Determines whether the system runs on AC power by walking
 * /sys/class/power_supply. For each non-hidden entry the "type" attribute
 * must read exactly "Mains\n"; its "online" attribute is then expected to be
 * a single character followed by a newline, '1' counting as online and '0'
 * as offline. The result is true if an online supply was found or if no
 * offline supply was found. */
5964 int on_ac_power(void) {
5965 bool found_offline = false, found_online = false;
5966 _cleanup_closedir_ DIR *d = NULL;
5968 d = opendir("/sys/class/power_supply");
5974 _cleanup_close_ int fd = -1, device = -1;
5980 if (!de && errno != 0)
5986 if (hidden_file(de->d_name))
5989 device = openat(dirfd(d), de->d_name, O_DIRECTORY|O_RDONLY|O_CLOEXEC|O_NOCTTY);
5991 if (errno == ENOENT || errno == ENOTDIR)
5997 fd = openat(device, "type", O_RDONLY|O_CLOEXEC|O_NOCTTY);
5999 if (errno == ENOENT)
6005 n = read(fd, contents, sizeof(contents));
6009 if (n != 6 || memcmp(contents, "Mains\n", 6))
6013 fd = openat(device, "online", O_RDONLY|O_CLOEXEC|O_NOCTTY);
6015 if (errno == ENOENT)
6021 n = read(fd, contents, sizeof(contents));
6025 if (n != 2 || contents[1] != '\n')
6028 if (contents[0] == '1') {
6029 found_online = true;
6031 } else if (contents[0] == '0')
6032 found_offline = true;
6037 return found_online || !found_offline;
/* Shared helper of the search_and_fopen*() functions. The search list is
 * first passed through path_strv_resolve_uniq() relative to `root`; then for
 * each directory the candidate "<root><dir>/<path>" (or "<dir>/<path>") is
 * built with strjoin(). The errno != ENOENT check distinguishes a merely
 * missing candidate from other errors. */
6040 static int search_and_fopen_internal(const char *path, const char *mode, const char *root, char **search, FILE **_f) {
6047 if (!path_strv_resolve_uniq(search, root))
6050 STRV_FOREACH(i, search) {
6051 _cleanup_free_ char *p = NULL;
6055 p = strjoin(root, *i, "/", path, NULL);
6057 p = strjoin(*i, "/", path, NULL);
6067 if (errno != ENOENT)
/* Opens `path` with fopen() mode `mode`. Absolute paths are opened directly;
 * otherwise a private copy of the string array `search` is made and handed
 * to search_and_fopen_internal(). */
6074 int search_and_fopen(const char *path, const char *mode, const char *root, const char **search, FILE **_f) {
6075 _cleanup_strv_free_ char **copy = NULL;
6081 if (path_is_absolute(path)) {
6084 f = fopen(path, mode);
6093 copy = strv_copy((char**) search);
6097 return search_and_fopen_internal(path, mode, root, copy, _f);
/* Same as search_and_fopen(), but takes the search path as a NUL-separated
 * string list, which is split with strv_split_nulstr() before being handed
 * to search_and_fopen_internal(). Absolute paths are opened directly. */
6100 int search_and_fopen_nulstr(const char *path, const char *mode, const char *root, const char *search, FILE **_f) {
6101 _cleanup_strv_free_ char **s = NULL;
6103 if (path_is_absolute(path)) {
6106 f = fopen(path, mode);
6115 s = strv_split_nulstr(search);
6119 return search_and_fopen_internal(path, mode, root, s, _f);
/* Appends a variadic list of strings to the heap string *x (which may be
 * NULL, treated as empty). The total length is accumulated with a size_t
 * overflow guard, the buffer is grown with realloc() to l+1 bytes, and the
 * arguments are then walked a second time. */
6122 char *strextend(char **x, ...) {
6129 l = f = *x ? strlen(*x) : 0;
6136 t = va_arg(ap, const char *);
6141 if (n > ((size_t) -1) - l) {
6150 r = realloc(*x, l+1);
6160 t = va_arg(ap, const char *);
/* Returns a newly allocated string consisting of s repeated n times (the
 * empty string for n == 0). Returns NULL if memory allocation fails or if
 * the resulting length would not fit into a size_t. The caller owns the
 * result and has to free() it. */
char *strrep(const char *s, unsigned n) {
        size_t l, total;
        char *r, *p;
        unsigned i;

        assert(s);

        l = strlen(s);

        /* Refuse requests where l * n + 1 would wrap around; otherwise we
         * would allocate too small a buffer and write past its end. */
        if (n > 0 && l > (((size_t) -1) - 1) / n)
                return NULL;

        total = l * n;

        p = r = malloc(total + 1);
        if (!r)
                return NULL;

        for (i = 0; i < n; i++) {
                memcpy(p, s, l);
                p += l;
        }

        *p = 0;
        return r;
}
/* Makes sure the array *p has room for at least `need` elements of `size`
 * bytes each. *allocated holds the current capacity in elements. If it is
 * already sufficient, *p is returned unchanged. Otherwise the array is
 * reallocated to twice the requested element count (but at least 64 bytes
 * worth of elements), and *p and *allocated are updated. Returns the (new)
 * array, or NULL on allocation failure, on arithmetic overflow or if size
 * is 0; in that case *p and *allocated are left untouched. */
void* greedy_realloc(void **p, size_t *allocated, size_t need, size_t size) {
        size_t bytes, newalloc;
        void *q;

        assert(p);
        assert(allocated);

        if (*allocated >= need)
                return *p;

        /* Avoid dividing by zero below */
        if (size == 0)
                return NULL;

        /* Doubling the element count must not wrap around */
        if (need > ((size_t) -1) / 2)
                return NULL;

        newalloc = need * 2;
        if (newalloc < 64u / size)
                newalloc = 64u / size;

        /* The byte count must not wrap around either. Comparing the wrapped
         * product against size * need is not sufficient, since that product
         * can wrap as well. */
        if (newalloc > ((size_t) -1) / size)
                return NULL;

        bytes = newalloc * size;

        q = realloc(*p, bytes);
        if (!q)
                return NULL;

        *p = q;
        *allocated = newalloc;
        return q;
}
/* Like greedy_realloc(), but zero-initializes newly gained space: when the
 * capacity grew beyond the previous value `prev`, the elements from index
 * prev up to the new *allocated are cleared with memzero(). */
6219 void* greedy_realloc0(void **p, size_t *allocated, size_t need, size_t size) {
6228 q = greedy_realloc(p, allocated, need, size);
6232 if (*allocated > prev)
6233 memzero(q + prev * size, (*allocated - prev) * size);
/* Returns true if c is an ASCII hexadecimal digit (0-9, a-f, A-F) */
static bool id128_char_is_hex(char c) {
        return (c >= '0' && c <= '9') ||
               (c >= 'a' && c <= 'f') ||
               (c >= 'A' && c <= 'F');
}

/* Validates the textual representation of a 128bit ID. Two forms are
 * accepted: a plain string of 32 hexadecimal digits, and the 36 character
 * UUID form with '-' at offsets 8, 13, 18 and 23 and hexadecimal digits
 * everywhere else. Returns false for anything else. */
bool id128_is_valid(const char *s) {
        size_t i, l;

        l = strlen(s);

        if (l == 32) {

                /* Simple formatted 128bit hex string */

                for (i = 0; i < l; i++)
                        if (!id128_char_is_hex(s[i]))
                                return false;

                return true;
        }

        if (l == 36) {

                /* Formatted UUID */

                for (i = 0; i < l; i++) {
                        if (i == 8 || i == 13 || i == 18 || i == 23) {
                                if (s[i] != '-')
                                        return false;
                        } else if (!id128_char_is_hex(s[i]))
                                return false;
                }

                return true;
        }

        return false;
}
/* Splits s at a separator position x into two newly allocated strings: the
 * part before x (strndup) and the part after the separator `sep` (strdup).
 * NOTE(review): how x is located, and the ownership of *l and *r on error,
 * are not visible in this excerpt. */
6279 int split_pair(const char *s, const char *sep, char **l, char **r) {
6294 a = strndup(s, x - s);
6298 b = strdup(x + strlen(sep));
/* Evaluates the kernel command line switch "systemd.restore_state=". Note
 * that the result is parse_boolean(value) != 0, i.e. a value that fails to
 * parse (negative result) counts as true just like an explicit "yes". */
6310 int shall_restore_state(void) {
6311 _cleanup_free_ char *value = NULL;
6314 r = get_proc_cmdline_key("systemd.restore_state=", &value);
6320 return parse_boolean(value) != 0;
/* Returns the "kernel command line" in *ret. Inside a container (per
 * detect_container()) the command line of PID 1 is used instead; otherwise
 * the single line of /proc/cmdline is read. */
6323 int proc_cmdline(char **ret) {
6326 if (detect_container(NULL) > 0)
6327 return get_process_cmdline(1, 0, false, ret);
6329 return read_one_line_file("/proc/cmdline", ret);
/* Iterates over the words of the kernel command line (split with
 * unquote_first_word()) and invokes parse_item() for each one. Words
 * starting with "rd." are filtered when not running in the initrd. A word is
 * split at its first '=' into key and value before the callback is
 * invoked. */
6332 int parse_proc_cmdline(int (*parse_item)(const char *key, const char *value)) {
6333 _cleanup_free_ char *line = NULL;
6339 r = proc_cmdline(&line);
6345 _cleanup_free_ char *word = NULL;
6348 r = unquote_first_word(&p, &word, true);
6354 /* Filter out arguments that are intended only for the
6356 if (!in_initrd() && startswith(word, "rd."))
6359 value = strchr(word, '=');
6363 r = parse_item(word, value);
/* Searches the kernel command line for `key`. Words starting with "rd." are
 * filtered when not running in the initrd. Two matching modes are visible:
 * a prefix match via startswith(), whose remainder is copied with
 * free_and_strdup() (callers in this file pass keys ending in '='), and an
 * exact match via streq(). */
6371 int get_proc_cmdline_key(const char *key, char **value) {
6372 _cleanup_free_ char *line = NULL, *ret = NULL;
6379 r = proc_cmdline(&line);
6385 _cleanup_free_ char *word = NULL;
6388 r = unquote_first_word(&p, &word, true);
6394 /* Filter out arguments that are intended only for the
6396 if (!in_initrd() && startswith(word, "rd."))
6400 e = startswith(word, key);
6404 r = free_and_strdup(&ret, e);
6410 if (streq(word, key))
/* Looks up the leader PID of the registered machine `machine` by parsing the
 * LEADER= and CLASS= fields of /run/systemd/machines/<machine>. The CLASS
 * field is compared against "container", and LEADER is parsed with
 * parse_pid(). */
6424 int container_get_leader(const char *machine, pid_t *pid) {
6425 _cleanup_free_ char *s = NULL, *class = NULL;
6433 p = strappenda("/run/systemd/machines/", machine);
6434 r = parse_env_file(p, NEWLINE, "LEADER", &s, "CLASS", &class, NULL);
6442 if (!streq_ptr(class, "container"))
6445 r = parse_pid(s, &leader);
/* Opens file descriptors for the mount, PID and network namespaces of
 * process `pid` (procfs ns/mnt, ns/pid, ns/net) as well as for its root
 * directory, and hands them out through the respective output pointers. The
 * local fds are reset to -1 at the end so that the _cleanup_close_ handlers
 * do not close what was handed out. */
6455 int namespace_open(pid_t pid, int *pidns_fd, int *mntns_fd, int *netns_fd, int *root_fd) {
6456 _cleanup_close_ int pidnsfd = -1, mntnsfd = -1, netnsfd = -1;
6464 mntns = procfs_file_alloca(pid, "ns/mnt");
6465 mntnsfd = open(mntns, O_RDONLY|O_NOCTTY|O_CLOEXEC);
6473 pidns = procfs_file_alloca(pid, "ns/pid");
6474 pidnsfd = open(pidns, O_RDONLY|O_NOCTTY|O_CLOEXEC);
6482 netns = procfs_file_alloca(pid, "ns/net");
6483 netnsfd = open(netns, O_RDONLY|O_NOCTTY|O_CLOEXEC);
6491 root = procfs_file_alloca(pid, "root");
6492 rfd = open(root, O_RDONLY|O_NOCTTY|O_CLOEXEC|O_DIRECTORY);
6498 *pidns_fd = pidnsfd;
6501 *mntns_fd = mntnsfd;
6504 *netns_fd = netnsfd;
6509 pidnsfd = mntnsfd = netnsfd = -1;
/* Enters the namespaces referenced by the passed fds with setns() (PID,
 * mount, network), changes into root_fd and chroot()s there, and finally
 * resets the credentials to root: setresgid(0, 0, 0), setgroups(0, NULL),
 * setresuid(0, 0, 0). */
6514 int namespace_enter(int pidns_fd, int mntns_fd, int netns_fd, int root_fd) {
6517 if (setns(pidns_fd, CLONE_NEWPID) < 0)
6521 if (setns(mntns_fd, CLONE_NEWNS) < 0)
6525 if (setns(netns_fd, CLONE_NEWNET) < 0)
6529 if (fchdir(root_fd) < 0)
6532 if (chroot(".") < 0)
6536 if (setresgid(0, 0, 0) < 0)
6539 if (setgroups(0, NULL) < 0)
6542 if (setresuid(0, 0, 0) < 0)
/* Probes the PID with kill(pid, 0). If the probe fails, the PID is still
 * considered existing unless errno is ESRCH (other errors such as a
 * permission problem imply that the process exists). */
6548 bool pid_is_unwaited(pid_t pid) {
6549 /* Checks whether a PID is still valid at all, including a zombie */
6554 if (kill(pid, 0) >= 0)
6557 return errno != ESRCH;
/* Uses get_process_state() to classify the PID; -ENOENT (no such process)
 * and the state 'Z' (zombie) are the two results singled out by the check
 * below. */
6560 bool pid_is_alive(pid_t pid) {
6563 /* Checks whether a PID is still valid and not a zombie */
6568 r = get_process_state(pid);
6569 if (r == -ENOENT || r == 'Z')
/* Queries the peer credentials of socket fd with SO_PEERCRED. The returned
 * length has to match sizeof(struct ucred) exactly, and the uid/gid fields
 * are checked against UID_INVALID/GID_INVALID since the kernel may suppress
 * the data due to namespacing. */
6575 int getpeercred(int fd, struct ucred *ucred) {
6576 socklen_t n = sizeof(struct ucred);
6583 r = getsockopt(fd, SOL_SOCKET, SO_PEERCRED, &u, &n);
6587 if (n != sizeof(struct ucred))
6590 /* Check if the data is actually useful and not suppressed due
6591 * to namespacing issues */
6594 if (u.uid == UID_INVALID)
6596 if (u.gid == GID_INVALID)
/* Queries the security label of the peer of socket fd with SO_PEERSEC. The
 * getsockopt() call is issued a second time after a failure with ERANGE,
 * which signals that the label did not fit into the buffer s of size n. */
6603 int getpeersec(int fd, char **ret) {
6615 r = getsockopt(fd, SOL_SOCKET, SO_PEERSEC, s, &n);
6619 if (errno != ERANGE)
6626 r = getsockopt(fd, SOL_SOCKET, SO_PEERSEC, s, &n);
/* Wrapper around mkostemp(pattern, flags). The _cleanup_umask_ variable
 * means the previous umask is restored automatically when the function
 * returns. */
6642 /* This is much like mkostemp() but is subject to umask(). */
6643 int mkostemp_safe(char *pattern, int flags) {
6644 _cleanup_umask_ mode_t u;
6651 fd = mkostemp(pattern, flags);
/* Opens an unnamed temporary file in directory `path`. O_TMPFILE (mode
 * S_IRUSR|S_IWUSR) is tried first; as a fallback a file named after the
 * template "<path>/systemd-tmp-XXXXXX" is created with mkostemp_safe() and
 * unlinked. */
6658 int open_tmpfile(const char *path, int flags) {
6665 /* Try O_TMPFILE first, if it is supported */
6666 fd = open(path, flags|O_TMPFILE, S_IRUSR|S_IWUSR);
6671 /* Fall back to unguessable name + unlinking */
6672 p = strappenda(path, "/systemd-tmp-XXXXXX");
6674 fd = mkostemp_safe(p, flags);
/* Inspects the access mode of the configuration file open on fd and logs
 * warnings about unusual permissions: any executable bit (0111), the
 * world-writable bit (0002) and - only when running as PID 1 - missing
 * group/world read bits (0044). `path` is only used for the messages. */
6682 int fd_warn_permissions(const char *path, int fd) {
6685 if (fstat(fd, &st) < 0)
6688 if (st.st_mode & 0111)
6689 log_warning("Configuration file %s is marked executable. Please remove executable permission bits. Proceeding anyway.", path);
6691 if (st.st_mode & 0002)
6692 log_warning("Configuration file %s is marked world-writable. Please remove world writability permission bits. Proceeding anyway.", path);
6694 if (getpid() == 1 && (st.st_mode & 0044) != 0044)
6695 log_warning("Configuration file %s is marked world-inaccessible. This has no effect as configuration data is accessible via APIs without restrictions. Proceeding anyway.", path);
/* Translates an ABI name into a personality value. The set of recognized
 * names depends on the architecture we are compiled for: "x86" and "x86-64"
 * on x86-64, "x86" on i386. Unrecognized names yield 0xffffffffUL as error
 * indicator. */
6700 unsigned long personality_from_string(const char *p) {
6702 /* Parse a personality specifier. We introduce our own
6703 * identifiers that indicate specific ABIs, rather than just
6704 * hints regarding the register size, since we want to keep
6705 * things open for multiple locally supported ABIs for the
6706 * same register size. We try to reuse the ABI identifiers
6707 * used by libseccomp. */
6709 #if defined(__x86_64__)
6711 if (streq(p, "x86"))
6714 if (streq(p, "x86-64"))
6717 #elif defined(__i386__)
6719 if (streq(p, "x86"))
6723 /* personality(7) documents that 0xffffffffUL is used for
6724 * querying the current personality, hence let's use that here
6725 * as error indicator. */
6726 return 0xffffffffUL;
/* Counterpart of personality_from_string(): maps a personality value (such
 * as PER_LINUX32) back to its ABI name, with per-architecture branches for
 * x86-64 and i386. */
6729 const char* personality_to_string(unsigned long p) {
6731 #if defined(__x86_64__)
6733 if (p == PER_LINUX32)
6739 #elif defined(__i386__)
/* Returns the amount of physical memory in bytes, computed as the number of
 * physical pages (sysconf(_SC_PHYS_PAGES)) multiplied by page_size(), with
 * both factors widened to uint64_t before the multiplication. */
6748 uint64_t physical_memory(void) {
6751 /* We return this as uint64_t in case we are running as 32bit
6752 * process on a 64bit kernel with huge amounts of memory */
6754 mem = sysconf(_SC_PHYS_PAGES);
6757 return (uint64_t) mem * (uint64_t) page_size();
/* Writes a hex dump of the s bytes at p to stream f. Output is organized in
 * rows of 16 bytes: a four digit hexadecimal offset, the bytes as two digit
 * hex values, and the same bytes as characters with non-printable ones
 * replaced by '.'. p may only be NULL if s is 0. */
6760 void hexdump(FILE *f, const void *p, size_t s) {
6761 const uint8_t *b = p;
6764 assert(s == 0 || b);
6769 fprintf(f, "%04x ", n);
6771 for (i = 0; i < 16; i++) {
6776 fprintf(f, "%02x ", b[i]);
6784 for (i = 0; i < 16; i++) {
6789 fputc(isprint(b[i]) ? (char) b[i] : '.', f);
/* Maintains REBOOT_PARAM_FILE: `param` is written with write_string_file()
 * and a failure is logged; the unlink() call removes the file.
 * NOTE(review): the condition selecting between writing and unlinking is not
 * visible in this excerpt - presumably whether param is set. */
6803 int update_reboot_param_file(const char *param) {
6808 r = write_string_file(REBOOT_PARAM_FILE, param);
6810 log_error("Failed to write reboot param to "
6811 REBOOT_PARAM_FILE": %s", strerror(-r));
6813 unlink(REBOOT_PARAM_FILE);
/* Unmounts everything mounted below `prefix`. /proc/self/mountinfo is parsed
 * with fscanf(), extracting only field (5), the mount point; the path is
 * unescaped with cunescape(), filtered with path_startswith() against prefix
 * and passed to umount2() with the given flags. */
6818 int umount_recursive(const char *prefix, int flags) {
6822 /* Try to umount everything recursively below a
6823 * directory. Also, take care of stacked mounts, and keep
6824 * unmounting them until they are gone. */
6827 _cleanup_fclose_ FILE *proc_self_mountinfo = NULL;
6832 proc_self_mountinfo = fopen("/proc/self/mountinfo", "re");
6833 if (!proc_self_mountinfo)
6837 _cleanup_free_ char *path = NULL, *p = NULL;
6840 k = fscanf(proc_self_mountinfo,
6841 "%*s " /* (1) mount id */
6842 "%*s " /* (2) parent id */
6843 "%*s " /* (3) major:minor */
6844 "%*s " /* (4) root */
6845 "%ms " /* (5) mount point */
6846 "%*s" /* (6) mount options */
6847 "%*[^-]" /* (7) optional fields */
6848 "- " /* (8) separator */
6849 "%*s " /* (9) file system type */
6850 "%*s" /* (10) mount source */
6851 "%*s" /* (11) mount options 2 */
6852 "%*[^\n]", /* some rubbish at the end */
6861 p = cunescape(path);
6865 if (!path_startswith(p, prefix))
6868 if (umount2(p, flags) < 0) {
/* Retrieves the mount flags of the file system containing `path` via
 * statvfs() and stores its f_flag field in *flags. */
6884 static int get_mount_flags(const char *path, unsigned long *flags) {
6887 if (statvfs(path, &buf) < 0)
6889 *flags = buf.f_flag;
/* Remounts `prefix` and all its submounts read-only (ro == true) or
 * read-write. Works on a copy of prefix normalized with path_kill_slashes()
 * ("cleaned"). Mount points already handled are tracked in the set `done`;
 * each pass re-reads /proc/self/mountinfo and collects the not yet handled
 * mount points below the prefix in `todo`, skipping autofs mounts.
 * NOTE(review): the first MS_REMOUNT call below passes the raw `prefix`
 * while the preceding bind mount uses `cleaned` - confirm that this is
 * intended. */
6893 int bind_remount_recursive(const char *prefix, bool ro) {
6894 _cleanup_set_free_free_ Set *done = NULL;
6895 _cleanup_free_ char *cleaned = NULL;
6898 /* Recursively remount a directory (and all its submounts)
6899 * read-only or read-write. If the directory is already
6900 * mounted, we reuse the mount and simply mark it
6901 * MS_BIND|MS_RDONLY (or remove the MS_RDONLY for read-write
6902 * operation). If it isn't we first make it one. Afterwards we
6903 * apply MS_BIND|MS_RDONLY (or remove MS_RDONLY) to all
6904 * submounts we can access, too. When mounts are stacked on
6905 * the same mount point we only care for each individual
6906 * "top-level" mount on each point, as we cannot
6907 * influence/access the underlying mounts anyway. We do not
6908 * have any effect on future submounts that might get
6909 * propagated, they might be writable. This includes future
6910 * submounts that have been triggered via autofs. */
6912 cleaned = strdup(prefix);
6916 path_kill_slashes(cleaned);
6918 done = set_new(&string_hash_ops);
6923 _cleanup_fclose_ FILE *proc_self_mountinfo = NULL;
6924 _cleanup_set_free_free_ Set *todo = NULL;
6925 bool top_autofs = false;
6927 unsigned long orig_flags;
6929 todo = set_new(&string_hash_ops);
6933 proc_self_mountinfo = fopen("/proc/self/mountinfo", "re");
6934 if (!proc_self_mountinfo)
6938 _cleanup_free_ char *path = NULL, *p = NULL, *type = NULL;
6941 k = fscanf(proc_self_mountinfo,
6942 "%*s " /* (1) mount id */
6943 "%*s " /* (2) parent id */
6944 "%*s " /* (3) major:minor */
6945 "%*s " /* (4) root */
6946 "%ms " /* (5) mount point */
6947 "%*s" /* (6) mount options (superblock) */
6948 "%*[^-]" /* (7) optional fields */
6949 "- " /* (8) separator */
6950 "%ms " /* (9) file system type */
6951 "%*s" /* (10) mount source */
6952 "%*s" /* (11) mount options (bind mount) */
6953 "%*[^\n]", /* some rubbish at the end */
6963 p = cunescape(path);
6967 /* Let's ignore autofs mounts. If they aren't
6968 * triggered yet, we want to avoid triggering
6969 * them, as we don't make any guarantees for
6970 * future submounts anyway. If they are
6971 * already triggered, then we will find
6972 * another entry for this. */
6973 if (streq(type, "autofs")) {
6974 top_autofs = top_autofs || path_equal(cleaned, p);
6978 if (path_startswith(p, cleaned) &&
6979 !set_contains(done, p)) {
6981 r = set_consume(todo, p);
6991 /* If we have no submounts to process anymore and if
6992 * the root is either already done, or an autofs, we
6994 if (set_isempty(todo) &&
6995 (top_autofs || set_contains(done, cleaned)))
6998 if (!set_contains(done, cleaned) &&
6999 !set_contains(todo, cleaned)) {
7000 /* The prefix directory itself is not yet a
7001 * mount, make it one. */
7002 if (mount(cleaned, cleaned, NULL, MS_BIND|MS_REC, NULL) < 0)
7006 (void) get_mount_flags(cleaned, &orig_flags);
7007 orig_flags &= ~MS_RDONLY;
7009 if (mount(NULL, prefix, NULL, orig_flags|MS_BIND|MS_REMOUNT|(ro ? MS_RDONLY : 0), NULL) < 0)
7012 x = strdup(cleaned);
7016 r = set_consume(done, x);
7021 while ((x = set_steal_first(todo))) {
7023 r = set_consume(done, x);
7029 /* Try to reuse the original flag set, but
7030 * don't care for errors, in case of
7031 * obstructed mounts */
7033 (void) get_mount_flags(x, &orig_flags);
7034 orig_flags &= ~MS_RDONLY;
7036 if (mount(NULL, x, NULL, orig_flags|MS_BIND|MS_REMOUNT|(ro ? MS_RDONLY : 0), NULL) < 0) {
7038 /* Deal with mount points that are
7039 * obstructed by a later mount */
7041 if (errno != ENOENT)
/* Flushes stream f and reports whether an error occurred on it. On failure
 * the result is -errno, or -EIO if errno is not set. */
7049 int fflush_and_check(FILE *f) {
7056 return errno ? -errno : -EIO;
/* Derives a temporary file name template from path p by inserting ".#"
 * before the last path component `fn` and appending "XXXXXX", e.g.
 * /foo/bar/waldo -> /foo/bar/.#waldoXXXXXX. The file name component has to
 * pass filename_is_valid(). The result is newly allocated, cleaned up with
 * path_kill_slashes() and stored in *ret. */
7061 int tempfn_xxxxxx(const char *p, char **ret) {
7073 * /foo/bar/.#waldoXXXXXX
7077 if (!filename_is_valid(fn))
7080 t = new(char, strlen(p) + 2 + 6 + 1);
7084 strcpy(stpcpy(stpcpy(mempcpy(t, p, fn - p), ".#"), fn), "XXXXXX");
7086 *ret = path_kill_slashes(t);
/* Derives a temporary file name from path p by inserting ".#" before the
 * last path component `fn` and appending 16 hexadecimal digits taken
 * nibble-wise from the value u, e.g. /foo/bar/waldo ->
 * /foo/bar/.#waldobaa2a261115984a9. The file name component has to pass
 * filename_is_valid(). The result is newly allocated and stored in *ret. */
7090 int tempfn_random(const char *p, char **ret) {
7104 * /foo/bar/.#waldobaa2a261115984a9
7108 if (!filename_is_valid(fn))
7111 t = new(char, strlen(p) + 2 + 16 + 1);
7115 x = stpcpy(stpcpy(mempcpy(t, p, fn - p), ".#"), fn);
7118 for (i = 0; i < 16; i++) {
7119 *(x++) = hexchar(u & 0xF);
7125 *ret = path_kill_slashes(t);
/* Builds the name of a temporary file located inside directory p: "/.#" plus
 * 16 hexadecimal digits taken nibble-wise from the value u are appended,
 * e.g. /foo/bar/waldo -> /foo/bar/waldo/.#3c2b6219aa75d7d0. The result is
 * newly allocated and stored in *ret. */
7129 int tempfn_random_child(const char *p, char **ret) {
7140 * /foo/bar/waldo/.#3c2b6219aa75d7d0
7143 t = new(char, strlen(p) + 3 + 16 + 1);
7147 x = stpcpy(stpcpy(t, p), "/.#");
7150 for (i = 0; i < 16; i++) {
7151 *(x++) = hexchar(u & 0xF);
7157 *ret = path_kill_slashes(t);
7161 /* Returns true if the hostname refers to the local host */
7162 bool is_localhost(const char *hostname) {
7165 /* This tries to identify local host and domain names
7166 * described in RFC6761 plus the redhatism of .localdomain */
7168 return streq(hostname, "localhost") ||
7169 streq(hostname, "localhost.") ||
7170 streq(hostname, "localdomain.") ||
7171 streq(hostname, "localdomain") ||
7172 endswith(hostname, ".localhost") ||
7173 endswith(hostname, ".localhost.") ||
7174 endswith(hostname, ".localdomain") ||
7175 endswith(hostname, ".localdomain.");
/* Takes the lock that protects the user database by opening (and creating
 * if necessary, mode 0600) the file etc/.pwd.lock below `root` - or
 * /etc/.pwd.lock - and acquiring a lock on it with fcntl(F_SETLKW), which
 * blocks until the lock is available. */
7178 int take_password_lock(const char *root) {
7180 struct flock flock = {
7182 .l_whence = SEEK_SET,
7190 /* This is roughly the same as lckpwdf(), but not as awful. We
7191 * don't want to use alarm() and signals, hence we implement
7192 * our own trivial version of this.
7194 * Note that shadow-utils also takes per-database locks in
7195 * addition to lckpwdf(). However, we don't, given that they
7196 * are redundant as they invoke lckpwdf() first and keep
7197 * it during everything they do. The per-database locks are
7198 * awfully racy, and thus we just won't do them. */
7201 path = strappenda(root, "/etc/.pwd.lock");
7203 path = "/etc/.pwd.lock";
7205 fd = open(path, O_WRONLY|O_CREAT|O_CLOEXEC|O_NOCTTY|O_NOFOLLOW, 0600);
7209 r = fcntl(fd, F_SETLKW, &flock);
/* Checks with lstat() whether `path` is a symbolic link. Returns 1 if it is
 * and 0 if it is not (the !! normalizes the S_ISLNK() result). */
7218 int is_symlink(const char *path) {
7221 if (lstat(path, &info) < 0)
7224 return !!S_ISLNK(info.st_mode);
/* Checks whether `path` is a directory, using either stat() or lstat().
 * Returns 1 if it is and 0 if it is not (the !! normalizes the S_ISDIR()
 * result).
 * NOTE(review): presumably `follow` selects stat() over lstat() - the
 * selecting condition is not visible in this excerpt. */
7227 int is_dir(const char* path, bool follow) {
7232 r = stat(path, &st);
7234 r = lstat(path, &st);
7238 return !!S_ISDIR(st.st_mode);
/* Extracts the first word from the string *p, removing quotes. Implemented
 * as a character-wise state machine with states for plain values, single and
 * double quoted sections and their respective escape states; WHITESPACE
 * characters separate words. The output string s is grown on demand with
 * GREEDY_REALLOC(), always reserving room for one more character plus the
 * terminating NUL (sz+2). */
7241 int unquote_first_word(const char **p, char **ret, bool relax) {
7242 _cleanup_free_ char *s = NULL;
7243 size_t allocated = 0, sz = 0;
7250 SINGLE_QUOTE_ESCAPE,
7252 DOUBLE_QUOTE_ESCAPE,
7260 /* Parses the first word of a string, and returns it in
7261 * *ret. Removes all quotes in the process. When parsing fails
7262 * (because of an uneven number of quotes or similar), leaves
7263 * the pointer *p at the first invalid character. */
7273 else if (strchr(WHITESPACE, c))
7283 state = SINGLE_QUOTE;
7285 state = VALUE_ESCAPE;
7287 state = DOUBLE_QUOTE;
7288 else if (strchr(WHITESPACE, c))
7291 if (!GREEDY_REALLOC(s, allocated, sz+2))
7306 if (!GREEDY_REALLOC(s, allocated, sz+2))
7319 } else if (c == '\'')
7322 state = SINGLE_QUOTE_ESCAPE;
7324 if (!GREEDY_REALLOC(s, allocated, sz+2))
7332 case SINGLE_QUOTE_ESCAPE:
7339 if (!GREEDY_REALLOC(s, allocated, sz+2))
7343 state = SINGLE_QUOTE;
7352 state = DOUBLE_QUOTE_ESCAPE;
7354 if (!GREEDY_REALLOC(s, allocated, sz+2))
7362 case DOUBLE_QUOTE_ESCAPE:
7369 if (!GREEDY_REALLOC(s, allocated, sz+2))
7373 state = DOUBLE_QUOTE;
7379 if (!strchr(WHITESPACE, c))
/* Variadic front-end for unquote_first_word(): the arguments after p are
 * `char **` output pointers, terminated by NULL. The expected words are
 * counted first, then parsed one by one (with relax == false) into a
 * temporary stack array allocated with newa0(), and only handed out to the
 * caller's pointers once parsing went through. */
7401 int unquote_many_words(const char **p, ...) {
7406 /* Parses a number of words from a string, stripping any
7407 * quotes if necessary. */
7411 /* Count how many words are expected */
7414 if (!va_arg(ap, char **))
7423 /* Read all words into a temporary array */
7424 l = newa0(char*, n);
7425 for (c = 0; c < n; c++) {
7427 r = unquote_first_word(p, &l[c], false);
7431 for (j = 0; j < c; j++)
7441 /* If we managed to parse all words, return them in the passed
7444 for (i = 0; i < n; i++) {
7447 v = va_arg(ap, char **);
/* p: address of the string pointer to update; s: the string to duplicate.
 * NOTE(review): behaviour for s == NULL and the return convention are not
 * visible here -- confirm before relying on them. */
7457 int free_and_strdup(char **p, const char *s) {
7462 /* Replaces a string pointer with an strdup()ed new string,
7463 * possibly freeing the old one. */
/* Sets the system hostname to s via sethostname(s, strlen(s)). The
 * current name is first read with gethostname() into buf, which is
 * zero-initialised and sized HOST_NAME_MAX + 1.
 * NOTE(review): going by the name, sethostname() is presumably skipped
 * when buf already equals s -- confirm against the comparison. */
7478 int sethostname_idempotent(const char *s) {
7480 char buf[HOST_NAME_MAX + 1] = {};
7484 r = gethostname(buf, sizeof(buf));
7491 r = sethostname(s, strlen(s));
/* Looks up the pts name for fd with ptsname_r() and passes it back
 * through *ret. ptsname_r() is called with buffer c of size l; a return
 * of 0 means the name fit, and an errno other than ERANGE is handled
 * separately from ERANGE.
 * NOTE(review): ERANGE presumably triggers a retry with a larger buffer,
 * and *ret presumably receives a heap-allocated string -- confirm. */
7498 int ptsname_malloc(int fd, char **ret) {
7511 if (ptsname_r(fd, c, l) == 0) {
7515 if (errno != ERANGE) {
/* Opens a pty master from inside the namespaces of process pid and hands
 * the resulting file descriptor back to the calling process.
 *
 * Outline, as far as the code at hand shows:
 *  - namespace_open() yields fds for pid's PID namespace, mount namespace
 *    and root directory;
 *  - an AF_UNIX/SOCK_DGRAM socketpair serves as the return channel;
 *  - the child side closes pair[0], enters the namespaces, calls
 *    posix_openpt(flags) and sends the master fd as SCM_RIGHTS ancillary
 *    data over pair[1]; a failure of any of these steps ends the child
 *    with EXIT_FAILURE;
 *  - the parent side closes pair[1], waits for the child, checks for a
 *    regular exit with EXIT_SUCCESS, then receives the message with
 *    MSG_CMSG_CLOEXEC and scans it for an SCM_RIGHTS control message.
 * The helper fds are declared _cleanup_close_ / _cleanup_close_pair_. */
7525 int openpt_in_namespace(pid_t pid, int flags) {
7526 _cleanup_close_ int pidnsfd = -1, mntnsfd = -1, rootfd = -1;
7527 _cleanup_close_pair_ int pair[2] = { -1, -1 };
7529 struct cmsghdr cmsghdr;
/* Control buffer sized for exactly one int (one file descriptor) */
7530 uint8_t buf[CMSG_SPACE(sizeof(int))];
7532 struct msghdr mh = {
7533 .msg_control = &control,
7534 .msg_controllen = sizeof(control),
7536 struct cmsghdr *cmsg;
7543 r = namespace_open(pid, &pidnsfd, &mntnsfd, NULL, &rootfd);
7547 if (socketpair(AF_UNIX, SOCK_DGRAM, 0, pair) < 0)
/* Child side: only the sending end pair[1] is needed from here on */
7557 pair[0] = safe_close(pair[0]);
7559 r = namespace_enter(pidnsfd, mntnsfd, -1, rootfd);
7561 _exit(EXIT_FAILURE);
7563 master = posix_openpt(flags);
7565 _exit(EXIT_FAILURE);
/* Package the master fd as a single SCM_RIGHTS control message */
7567 cmsg = CMSG_FIRSTHDR(&mh);
7568 cmsg->cmsg_level = SOL_SOCKET;
7569 cmsg->cmsg_type = SCM_RIGHTS;
7570 cmsg->cmsg_len = CMSG_LEN(sizeof(int));
7571 memcpy(CMSG_DATA(cmsg), &master, sizeof(int));
/* Shrink the advertised control length to the one header just filled in */
7573 mh.msg_controllen = cmsg->cmsg_len;
7575 if (sendmsg(pair[1], &mh, MSG_NOSIGNAL) < 0)
7576 _exit(EXIT_FAILURE);
7578 _exit(EXIT_SUCCESS);
/* Parent side: only the receiving end pair[0] is needed from here on */
7581 pair[1] = safe_close(pair[1]);
7583 r = wait_for_terminate(child, &si);
7586 if (si.si_code != CLD_EXITED || si.si_status != EXIT_SUCCESS)
7589 if (recvmsg(pair[0], &mh, MSG_NOSIGNAL|MSG_CMSG_CLOEXEC) < 0)
7592 for (cmsg = CMSG_FIRSTHDR(&mh); cmsg; cmsg = CMSG_NXTHDR(&mh, cmsg))
7593 if (cmsg->cmsg_level == SOL_SOCKET && cmsg->cmsg_type == SCM_RIGHTS) {
7597 fds = (int*) CMSG_DATA(cmsg);
/* Number of descriptors carried: payload bytes divided by sizeof(int) */
7598 n_fds = (cmsg->cmsg_len - CMSG_LEN(0)) / sizeof(int);
7601 close_many(fds, n_fds);
/* Reads extended attribute 'attribute' of the file 'filename', resolved
 * relative to directory fd 'dirfd', into the buffer value/size.
 *
 * The file is opened read-only with O_CLOEXEC|O_NOCTTY|O_NOATIME, plus
 * O_NOFOLLOW when 'flags' contains AT_SYMLINK_NOFOLLOW, and the attribute
 * is then fetched with fgetxattr() on that descriptor. The temporary fd
 * is declared _cleanup_close_. */
7611 ssize_t fgetxattrat_fake(int dirfd, const char *filename, const char *attribute, void *value, size_t size, int flags) {
7612 _cleanup_close_ int fd = -1;
7615 /* The kernel doesn't have a fgetxattrat() command, hence let's emulate one */
7617 fd = openat(dirfd, filename, O_RDONLY|O_CLOEXEC|O_NOCTTY|O_NOATIME|(flags & AT_SYMLINK_NOFOLLOW ? O_NOFOLLOW : 0));
7621 l = fgetxattr(fd, attribute, value, size);
/* Shared decoder for the crtime getters in this file, which pass it the
 * raw little-endian 64-bit value read from the "user.crtime_usec" xattr;
 * the result goes to *usec. The values 0 and (uint64_t) -1 are singled
 * out by the check below.
 * NOTE(review): those two values are presumably rejected as invalid --
 * confirm the error code returned. */
7628 static int parse_crtime(le64_t le, usec_t *usec) {
7634 if (u == 0 || u == (uint64_t) -1)
/* Reads the creation time of fd from its "user.crtime_usec" extended
 * attribute. The attribute must be exactly sizeof(le) bytes long; its
 * value is then decoded by parse_crtime() into *usec. */
7641 int fd_getcrtime(int fd, usec_t *usec) {
7648 /* Until Linux gets a real concept of birthtime/creation time,
7649 * let's fake one with xattrs */
7651 n = fgetxattr(fd, "user.crtime_usec", &le, sizeof(le));
7654 if (n != sizeof(le))
7657 return parse_crtime(le, usec);
/* Like fd_getcrtime(), but for the file 'name' relative to directory fd
 * 'dirfd': the "user.crtime_usec" attribute is fetched through
 * fgetxattrat_fake(), to which 'flags' is passed unchanged. The value
 * must be exactly sizeof(le) bytes and is decoded by parse_crtime(). */
7660 int fd_getcrtime_at(int dirfd, const char *name, usec_t *usec, int flags) {
7664 n = fgetxattrat_fake(dirfd, name, "user.crtime_usec", &le, sizeof(le), flags);
7667 if (n != sizeof(le))
7670 return parse_crtime(le, usec);
/* Path-based variant of fd_getcrtime(): reads "user.crtime_usec" from
 * path p with getxattr(), requires the value to be exactly sizeof(le)
 * bytes, and decodes it with parse_crtime() into *usec. */
7673 int path_getcrtime(const char *p, usec_t *usec) {
7680 n = getxattr(p, "user.crtime_usec", &le, sizeof(le));
7683 if (n != sizeof(le))
7686 return parse_crtime(le, usec);
/* Stores a creation time on fd: usec is converted to little-endian 64-bit
 * with htole64() and written to the "user.crtime_usec" extended attribute
 * via fsetxattr() with flags 0.
 * NOTE(review): usec is replaced by now(CLOCK_REALTIME) under a condition
 * not visible here -- presumably when the caller passes 0; confirm. */
7689 int fd_setcrtime(int fd, usec_t usec) {
7695 usec = now(CLOCK_REALTIME);
7697 le = htole64((uint64_t) usec);
7698 if (fsetxattr(fd, "user.crtime_usec", &le, sizeof(le), 0) < 0)
/* Decides whether file descriptors a and b refer to the same thing.
 *
 * kcmp(KCMP_FILE) on the calling process is tried first; errno values
 * other than ENOSYS are treated differently from ENOSYS, which leads to
 * the fstat()-based comparison: file type bits, a special case for
 * character and block devices, the (st_dev, st_ino) pair, and finally the
 * F_GETFL flags of both descriptors. */
7704 int same_fd(int a, int b) {
7705 struct stat sta, stb;
7712 /* Compares two file descriptors. Note that semantics are
7713 * quite different depending on whether we have kcmp() or we
7714 * don't. If we have kcmp() this will only return true for
7715 * dup()ed file descriptors, but not otherwise. If we don't
7716 * have kcmp() this will also return true for two fds of the same
7717 * file, created by separate open() calls. Since we use this
7718 * call mostly for filtering out duplicates in the fd store
7719 * this difference hopefully doesn't matter too much. */
7724 /* Try to use kcmp() if we have it. */
7726 r = kcmp(pid, pid, KCMP_FILE, a, b);
7731 if (errno != ENOSYS)
7734 /* We don't have kcmp(), use fstat() instead. */
7735 if (fstat(a, &sta) < 0)
7738 if (fstat(b, &stb) < 0)
7741 if ((sta.st_mode & S_IFMT) != (stb.st_mode & S_IFMT))
7744 /* We consider all device fds different, since two device fds
7745 * might refer to quite different device contexts even though
7746 * they share the same inode and backing dev_t. */
7748 if (S_ISCHR(sta.st_mode) || S_ISBLK(sta.st_mode))
7751 if (sta.st_dev != stb.st_dev || sta.st_ino != stb.st_ino)
7754 /* The fds refer to the same inode on disk, let's also check
7755 * if they have the same fd flags. This is useful to
7756 * distinguish the read and write side of a pipe created with
7758 fa = fcntl(a, F_GETFL);
7762 fb = fcntl(b, F_GETFL);
/* Sets or clears the file attribute bits given in mask on fd.
 *
 * The current flags are read with FS_IOC_GETFLAGS; the new value is
 * either old | mask or old & ~mask, and FS_IOC_SETFLAGS is issued only
 * when the value actually changes.
 * NOTE(review): b presumably selects "set" (true) versus "clear" (false)
 * -- confirm against the branch condition. */
7769 int chattr_fd(int fd, bool b, unsigned mask) {
7770 unsigned old_attr, new_attr;
7777 if (ioctl(fd, FS_IOC_GETFLAGS, &old_attr) < 0)
7781 new_attr = old_attr | mask;
7783 new_attr = old_attr & ~mask;
/* Nothing would change: the SETFLAGS ioctl below is not needed */
7785 if (new_attr == old_attr)
7788 if (ioctl(fd, FS_IOC_SETFLAGS, &new_attr) < 0)
/* Path-based wrapper around chattr_fd(): opens p read-only with
 * O_CLOEXEC|O_NOCTTY|O_NOFOLLOW and passes the descriptor, b and mask on.
 * The descriptor is declared _cleanup_close_. */
7794 int chattr_path(const char *p, bool b, unsigned mask) {
7795 _cleanup_close_ int fd = -1;
7802 fd = open(p, O_RDONLY|O_CLOEXEC|O_NOCTTY|O_NOFOLLOW);
7806 return chattr_fd(fd, b, mask);
/* Reads the file attribute flags of fd into *ret by issuing the
 * FS_IOC_GETFLAGS ioctl directly on the caller's pointer. */
7809 int read_attr_fd(int fd, unsigned *ret) {
7812 if (ioctl(fd, FS_IOC_GETFLAGS, ret) < 0)
/* Path-based wrapper around read_attr_fd(): opens p read-only with
 * O_CLOEXEC|O_NOCTTY|O_NOFOLLOW and reads the attribute flags of that
 * descriptor into *ret. The descriptor is declared _cleanup_close_. */
7818 int read_attr_path(const char *p, unsigned *ret) {
7819 _cleanup_close_ int fd = -1;
7824 fd = open(p, O_RDONLY|O_CLOEXEC|O_NOCTTY|O_NOFOLLOW);
7828 return read_attr_fd(fd, ret);
/* Creates (if necessary) and locks the lock file p, recording the result
 * in *ret.
 *
 * 'operation' uses the flock() vocabulary: LOCK_EX selects a write lock
 * (F_WRLCK) and anything else a read lock (F_RDLCK), while LOCK_NB
 * selects the non-blocking F_OFD_SETLK over the blocking F_OFD_SETLKW.
 * When fcntl() reports EINVAL, flock(fd, operation) is used instead.
 * EAGAIN is reported to the caller as -EBUSY, other errors as -errno.
 * The file is opened with O_CREAT|O_RDWR|O_NOFOLLOW|O_CLOEXEC|O_NOCTTY
 * and mode 0600. */
7831 int make_lock_file(const char *p, int operation, LockFile *ret) {
7832 _cleanup_close_ int fd = -1;
7833 _cleanup_free_ char *t = NULL;
7837 * We use UNPOSIX locks if they are available. They have nice
7838 * semantics, and are mostly compatible with NFS. However,
7839 * they are only available on new kernels. When we detect we
7840 * are running on an older kernel, then we fall back to good
7841 * old BSD locks. They also have nice semantics, but are
7842 * slightly problematic on NFS, where they are upgraded to
7843 * POSIX locks, even though locally they are orthogonal to
7853 .l_type = (operation & ~LOCK_NB) == LOCK_EX ? F_WRLCK : F_RDLCK,
7854 .l_whence = SEEK_SET,
7858 fd = open(p, O_CREAT|O_RDWR|O_NOFOLLOW|O_CLOEXEC|O_NOCTTY, 0600);
7862 r = fcntl(fd, (operation & LOCK_NB) ? F_OFD_SETLK : F_OFD_SETLKW, &fl);
7865 /* If the kernel is too old, use good old BSD locks */
7866 if (errno == EINVAL)
7867 r = flock(fd, operation);
7870 return errno == EAGAIN ? -EBUSY : -errno;
7873 /* If we acquired the lock, let's check if the file
7874 * still exists in the file system. If not, then the
7875 * previous exclusive owner removed it and then closed
7876 * it. In such a case our acquired lock is worthless,
7877 * hence try again. */
/* A link count above zero means the file is still present in the file system */
7882 if (st.st_nlink > 0)
7885 fd = safe_close(fd);
7890 ret->operation = operation;
/* Takes a lock on behalf of path p by locking a companion file whose name
 * is derived from p: the leading (fn - p) bytes of p, then ".#", then fn,
 * then ".lck". fn points into p and must pass filename_is_valid().
 * The buffer holds strlen(p) plus 2 bytes for ".#", 4 for ".lck" and 1
 * for the terminating NUL. The actual locking is done by make_lock_file().
 * NOTE(review): fn is presumably the last path component of p -- confirm. */
7898 int make_lock_file_for(const char *p, int operation, LockFile *ret) {
7906 if (!filename_is_valid(fn))
7909 t = newa(char, strlen(p) + 2 + 4 + 1);
7910 stpcpy(stpcpy(stpcpy(mempcpy(t, p, fn - p), ".#"), fn), ".lck");
7912 return make_lock_file(t, operation, ret);
/* Gives up the lock described by f and closes its file descriptor.
 *
 * A holder whose operation is LOCK_SH first attempts a non-blocking lock
 * change with F_OFD_SETLK, or flock(LOCK_EX|LOCK_NB) when fcntl() reports
 * EINVAL, and f->operation is then updated to LOCK_EX|LOCK_NB. If the
 * operation is LOCK_EX at that point, the lock file is removed with
 * unlink_noerrno(f->path). Finally f->fd is closed and reset through
 * safe_close().
 * NOTE(review): the update of f->operation is presumably conditional on
 * the upgrade having succeeded -- confirm. */
7915 void release_lock_file(LockFile *f) {
7923 /* If we are the exclusive owner we can safely delete
7924 * the lock file itself. If we are not the exclusive
7925 * owner, we can try becoming it. */
7928 (f->operation & ~LOCK_NB) == LOCK_SH) {
7929 static const struct flock fl = {
7931 .l_whence = SEEK_SET,
7934 r = fcntl(f->fd, F_OFD_SETLK, &fl);
7935 if (r < 0 && errno == EINVAL)
7936 r = flock(f->fd, LOCK_EX|LOCK_NB);
7939 f->operation = LOCK_EX|LOCK_NB;
7942 if ((f->operation & ~LOCK_NB) == LOCK_EX)
7943 unlink_noerrno(f->path);
7949 f->fd = safe_close(f->fd);
/* Helper for sparse_write(), which calls it as nul_length(q, e - q).
 * NOTE(review): presumably returns the number of consecutive NUL bytes at
 * the start of the sz-byte buffer p -- body not visible here, confirm. */
7953 static size_t nul_length(const uint8_t *p, size_t sz) {
/* Writes the sz bytes at p to fd, seeking over runs of NUL bytes with
 * lseek(SEEK_CUR) instead of writing them.
 *
 * run_length is the threshold above which a NUL run is skipped; NUL runs
 * at the very start or the very end of the buffer are skipped regardless
 * of their length. Pending data in [w, q) is flushed with write() before
 * a seek and once more after the scan. The final return statement yields
 * q - p, the number of input bytes consumed. */
7968 ssize_t sparse_write(int fd, const void *p, size_t sz, size_t run_length) {
7969 const uint8_t *q, *w, *e;
/* Length of the NUL run starting at q, bounded by the end of the buffer e */
7977 n = nul_length(q, e - q);
7979 /* If there are more than the specified run length of
7980 * NUL bytes, or if this is the beginning or the end
7981 * of the buffer, then seek instead of write */
7982 if ((n > run_length) ||
7983 (n > 0 && q == p) ||
7984 (n > 0 && q + n >= e)) {
7986 l = write(fd, w, q - w);
7993 if (lseek(fd, n, SEEK_CUR) == (off_t) -1)
8005 l = write(fd, w, q - w);
8012 return q - (const uint8_t*) p;
/* Sends SIGKILL to the process whose PID is stored in *pid and, if the
 * signal was delivered, waits for that process to terminate.
 *
 * kill() returns 0 on success and -1 on error -- it never returns a
 * positive value -- so success is tested with ">= 0". The result of
 * wait_for_terminate() is deliberately ignored (best effort). */
8015 void sigkill_wait(pid_t *pid) {
8021 if (kill(*pid, SIGKILL) >= 0)
8022 (void) wait_for_terminate(*pid, NULL);