1 /*-*- Mode: C; c-basic-offset: 8; indent-tabs-mode: nil -*-*/
4 This file is part of systemd.
6 Copyright 2010 Lennart Poettering
8 systemd is free software; you can redistribute it and/or modify it
9 under the terms of the GNU Lesser General Public License as published by
10 the Free Software Foundation; either version 2.1 of the License, or
11 (at your option) any later version.
13 systemd is distributed in the hope that it will be useful, but
14 WITHOUT ANY WARRANTY; without even the implied warranty of
15 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
16 Lesser General Public License for more details.
18 You should have received a copy of the GNU Lesser General Public License
19 along with systemd; If not, see <http://www.gnu.org/licenses/>.
31 #include <sys/resource.h>
32 #include <linux/sched.h>
33 #include <sys/types.h>
37 #include <sys/ioctl.h>
39 #include <linux/tiocl.h>
44 #include <sys/prctl.h>
45 #include <sys/utsname.h>
47 #include <netinet/ip.h>
56 #include <sys/mount.h>
57 #include <linux/magic.h>
61 #include <sys/personality.h>
62 #include <sys/xattr.h>
64 #include <sys/statvfs.h>
69 #ifdef HAVE_SYS_AUXV_H
81 #include "path-util.h"
82 #include "exit-status.h"
86 #include "device-nodes.h"
91 #include "sparse-endian.h"
/* Process argument vector as saved by the program; rename_process()
 * overwrites the strings it points to. */
94 char **saved_argv = NULL;
/* NOTE(review): presumably the cached terminal width/height, with 0
 * meaning "not determined yet" -- confirm against the code that reads
 * and resets these two values. */
96 static volatile unsigned cached_columns = 0;
97 static volatile unsigned cached_lines = 0;
/* Returns the system page size. The value queried with
 * sysconf(_SC_PAGESIZE) is kept in a thread-local static (pgsz); once
 * that is positive the fast path is taken and sysconf() is presumably
 * not called again. */
99 size_t page_size(void) {
100 static thread_local size_t pgsz = 0;
103 if (_likely_(pgsz > 0))
106 r = sysconf(_SC_PAGESIZE);
/* NULL-tolerant string equality test: same question as streq(), but
 * either argument may be a NULL pointer. */
113 bool streq_ptr(const char *a, const char *b) {
115 /* Like streq(), but tries to make sense of NULL pointers */
/* Checks whether s ends with postfix. The tail of s is compared with
 * memcmp(); on a match a pointer to the start of the postfix inside s
 * (s + sl - pl) is returned. The "s + sl" return is presumably the
 * empty-postfix case, which trivially matches at the end of s. The
 * const qualifier of s is cast away in the returned pointer. */
126 char* endswith(const char *s, const char *postfix) {
133 pl = strlen(postfix);
136 return (char*) s + sl;
141 if (memcmp(s + sl - pl, postfix, pl) != 0)
144 return (char*) s + sl - pl;
/* Tests whether s begins with word as a complete word. The prefix is
 * compared with memcmp(); the character right after it has to be NUL
 * or one of WHITESPACE, and the whitespace run that follows is skipped
 * with strspn() before the position is handed back. */
147 char* first_word(const char *s, const char *word) {
154 /* Checks if the string starts with the specified word, either
155 * followed by NUL or by whitespace. Returns a pointer to the
156 * NUL or the first character after the whitespace. */
167 if (memcmp(s, word, wl) != 0)
174 if (!strchr(WHITESPACE, *p))
177 p += strspn(p, WHITESPACE);
/* Writes the C-style escaped form of the single character c to buf and
 * returns the number of bytes written (buf - buf_old). No NUL
 * terminator is appended by the visible stores. Characters below ' '
 * or at/above 127 get three octal digits, taken from the value
 * converted to unsigned char so that negative chars encode sanely. */
181 static size_t cescape_char(char c, char *buf) {
182 char * buf_old = buf;
228 /* For special chars we prefer octal over
229 * hexadecimal encoding, simply because glib's
230 * g_strescape() does the same */
231 if ((c < ' ') || (c >= 127)) {
233 *(buf++) = octchar((unsigned char) c >> 6);
234 *(buf++) = octchar((unsigned char) c >> 3);
235 *(buf++) = octchar((unsigned char) c);
241 return buf - buf_old;
/* Closes fd without retrying on EINTR; the references below explain
 * why a retry loop would be wrong. Callers in this file compare the
 * result against negative errno-style values such as -EBADF. */
244 int close_nointr(int fd) {
251 * Just ignore EINTR; a retry loop is the wrong thing to do on
254 * http://lkml.indiana.edu/hypermail/linux/kernel/0509.1/0877.html
255 * https://bugzilla.gnome.org/show_bug.cgi?id=682819
256 * http://utcc.utoronto.ca/~cks/space/blog/unix/CloseEINTR
257 * https://sites.google.com/site/michaelsafyan/software-engineering/checkforeintrwheninvokingclosethinkagain
/* Closes fd through close_nointr() and treats only -EBADF as a
 * programming error (assert_se). The return value is designed for the
 * "fd = safe_close(fd);" idiom described below. */
265 int safe_close(int fd) {
268 * Like close_nointr() but cannot fail. Guarantees errno is
269 * unchanged. Is a NOP with negative fds passed, and returns
270 * -1, so that it can be used in this syntax:
272 * fd = safe_close(fd);
278 /* The kernel might return pretty much any error code
279 * via close(), but the fd will be closed anyway. The
280 * only condition we want to check for here is whether
281 * the fd was invalid at all... */
283 assert_se(close_nointr(fd) != -EBADF);
/* Walks the first n_fd entries of fds, presumably closing each one
 * (confirm against the loop body). fds may only be NULL when n_fd is
 * zero, which the assertion enforces. */
289 void close_many(const int fds[], unsigned n_fd) {
292 assert(fds || n_fd <= 0);
294 for (i = 0; i < n_fd; i++)
/* NOTE(review): judging by the name this is an unlink() variant that
 * leaves the caller's errno untouched -- confirm against the body. */
298 int unlink_noerrno(const char *path) {
/* Parses a boolean word. "1" and, case-insensitively, yes/y/true/t/on
 * form the true group; "0" and no/n/false/f/off form the false group.
 * The numeric forms are compared case-sensitively with streq().
 * NOTE(review): the return codes (presumably 1, 0 and a negative errno
 * for anything else) should be confirmed against the full body. */
309 int parse_boolean(const char *v) {
312 if (streq(v, "1") || strcaseeq(v, "yes") || strcaseeq(v, "y") || strcaseeq(v, "true") || strcaseeq(v, "t") || strcaseeq(v, "on"))
314 else if (streq(v, "0") || strcaseeq(v, "no") || strcaseeq(v, "n") || strcaseeq(v, "false") || strcaseeq(v, "f") || strcaseeq(v, "off"))
/* Parses s as a process ID. The text is converted with safe_atolu()
 * and the value is then round-tripped through pid_t: if the cast back
 * to unsigned long differs, the number does not fit and is rejected. */
320 int parse_pid(const char *s, pid_t* ret_pid) {
321 unsigned long ul = 0;
328 r = safe_atolu(s, &ul);
334 if ((unsigned long) pid != ul)
/* Parses s as a user ID. The text is converted with safe_atolu() and
 * round-tripped through uid_t to detect values that do not fit. The
 * two "minus one" values 0xFFFFFFFF and 0xFFFF get special treatment
 * (presumably rejection -- confirm), see the comments below. */
344 int parse_uid(const char *s, uid_t* ret_uid) {
345 unsigned long ul = 0;
352 r = safe_atolu(s, &ul);
358 if ((unsigned long) uid != ul)
361 /* Some libc APIs use UID_INVALID as special placeholder */
362 if (uid == (uid_t) 0xFFFFFFFF)
365 /* A long time ago UIDs were 16bit, hence explicitly avoid the 16bit -1 too */
366 if (uid == (uid_t) 0xFFFF)
/* Parses s as an unsigned int using strtoul() with base 0, so decimal,
 * 0x-prefixed hex and 0-prefixed octal are all accepted. Empty input,
 * trailing garbage and strtoul() errors yield -errno or -EINVAL. A
 * value that does not survive the round trip through unsigned is out
 * of range. On success the value is stored in *ret_u.
 * NOTE(review): strtoul() itself accepts leading whitespace and a minus
 * sign; where unsigned long and unsigned have the same width "-1"
 * would pass the range check visible here -- confirm whether that is
 * acceptable for callers. */
373 int safe_atou(const char *s, unsigned *ret_u) {
381 l = strtoul(s, &x, 0);
383 if (!x || x == s || *x || errno)
384 return errno > 0 ? -errno : -EINVAL;
386 if ((unsigned long) (unsigned) l != l)
389 *ret_u = (unsigned) l;
/* Parses s as an int using strtol() with base 0. Empty input, trailing
 * garbage and strtol() errors yield -errno or -EINVAL; a value that
 * changes when narrowed to int and widened back is out of range. */
393 int safe_atoi(const char *s, int *ret_i) {
401 l = strtol(s, &x, 0);
403 if (!x || x == s || *x || errno)
404 return errno > 0 ? -errno : -EINVAL;
406 if ((long) (int) l != l)
/* Parses s as a uint8_t using strtoul() with base 0. Same validation
 * as safe_atou(), with the range check done by a round trip through
 * uint8_t. */
413 int safe_atou8(const char *s, uint8_t *ret) {
421 l = strtoul(s, &x, 0);
423 if (!x || x == s || *x || errno)
424 return errno > 0 ? -errno : -EINVAL;
426 if ((unsigned long) (uint8_t) l != l)
/* Parses s as a uint16_t using strtoul() with base 0. Same validation
 * as safe_atou(), with the range check done by a round trip through
 * uint16_t. */
433 int safe_atou16(const char *s, uint16_t *ret) {
441 l = strtoul(s, &x, 0);
443 if (!x || x == s || *x || errno)
444 return errno > 0 ? -errno : -EINVAL;
446 if ((unsigned long) (uint16_t) l != l)
/* Parses s as an int16_t using strtol() with base 0. Same validation
 * as safe_atoi(), with the range check done by a round trip through
 * int16_t. */
453 int safe_atoi16(const char *s, int16_t *ret) {
461 l = strtol(s, &x, 0);
463 if (!x || x == s || *x || errno)
464 return errno > 0 ? -errno : -EINVAL;
466 if ((long) (int16_t) l != l)
/* Parses s as an unsigned long long using strtoull() with base 0.
 * Empty input, trailing garbage and strtoull() errors yield -errno or
 * -EINVAL. No narrowing check is needed since the target type is the
 * one strtoull() returns. */
473 int safe_atollu(const char *s, long long unsigned *ret_llu) {
475 unsigned long long l;
481 l = strtoull(s, &x, 0);
483 if (!x || x == s || *x || errno)
484 return errno ? -errno : -EINVAL;
/* Parses s as a long long using strtoll() with base 0. Empty input,
 * trailing garbage and strtoll() errors yield -errno or -EINVAL. */
490 int safe_atolli(const char *s, long long int *ret_lli) {
498 l = strtoll(s, &x, 0);
500 if (!x || x == s || *x || errno)
501 return errno ? -errno : -EINVAL;
/* Parses s as a double independently of the process locale: a
 * temporary "C" LC_NUMERIC locale object is created with newlocale()
 * and handed to strtod_l(). Empty input, trailing garbage and
 * conversion errors yield -errno or -EINVAL. */
507 int safe_atod(const char *s, double *ret_d) {
515 loc = newlocale(LC_NUMERIC_MASK, "C", (locale_t) 0);
516 if (loc == (locale_t) 0)
520 d = strtod_l(s, &x, loc);
522 if (!x || x == s || *x || errno) {
524 return errno ? -errno : -EINVAL;
/* strcspn() variant that understands backslash escapes: scans s until
 * a character from reject is found, tracking in "escaped" whether the
 * previous character was a backslash (presumably so that an escaped
 * reject character does not end the scan -- confirm). */
532 static size_t strcspn_escaped(const char *s, const char *reject) {
533 bool escaped = false;
536 for (n=0; s[n]; n++) {
539 else if (s[n] == '\\')
541 else if (strchr(reject, s[n]))
545 /* if s ends in \, return index of previous char */
/* Split a string into words. */
/* Iterator-style tokenizer: *state holds the scan position and is
 * advanced past the returned word, *l receives the word length.
 * Leading separator characters are skipped first. With quoted set, a
 * word starting with ' or " runs to the matching quote (found with
 * strcspn_escaped()) and must be followed by NUL or a separator;
 * unquoted words then end at the first unescaped separator. Without
 * quoted, plain strcspn() is used. */
550 const char* split(const char **state, size_t *l, const char *separator, bool quoted) {
556 assert(**state == '\0');
560 current += strspn(current, separator);
566 if (quoted && strchr("\'\"", *current)) {
567 char quotechars[2] = {*current, '\0'};
569 *l = strcspn_escaped(current + 1, quotechars);
570 if (current[*l + 1] == '\0' ||
571 (current[*l + 2] && !strchr(separator, current[*l + 2]))) {
572 /* right quote missing or garbage at the end */
576 assert(current[*l + 1] == quotechars[0]);
577 *state = current++ + *l + 2;
579 *l = strcspn_escaped(current, separator);
580 if (current[*l] && !strchr(separator, current[*l])) {
581 /* unfinished escape */
585 *state = current + *l;
587 *l = strcspn(current, separator);
588 *state = current + *l;
/* Determines the parent PID of pid from the process' procfs "stat"
 * file. The single line is read with read_one_line_file(), the comm
 * field is skipped by searching for the last ')', and the parsed value
 * is range-checked by a round trip through pid_t before it is stored
 * in *_ppid. */
594 int get_parent_of_pid(pid_t pid, pid_t *_ppid) {
596 _cleanup_free_ char *line = NULL;
608 p = procfs_file_alloca(pid, "stat");
609 r = read_one_line_file(p, &line);
613 /* Let's skip the pid and comm fields. The latter is enclosed
614 * in () but does not escape any () in its value, so let's
615 * skip over it manually */
617 p = strrchr(line, ')');
629 if ((long unsigned) (pid_t) ppid != ppid)
632 *_ppid = (pid_t) ppid;
/* fchmod() that honours a umask value u: the bits set in u are cleared
 * from m before the mode is applied. Yields -errno on failure, 0 on
 * success. NOTE(review): how u is obtained (and restored) should be
 * confirmed against the full body. */
637 int fchmod_umask(int fd, mode_t m) {
642 r = fchmod(fd, m & (~u)) < 0 ? -errno : 0;
/* Cuts s, in place, at the first character contained in NEWLINE. */
648 char *truncate_nl(char *s) {
651 s[strcspn(s, NEWLINE)] = 0;
/* Returns the state character of pid as found in its procfs "stat"
 * file: the first non-blank character after the last ')' (i.e. after
 * the comm field), converted to unsigned char so that the result is
 * non-negative. */
655 int get_process_state(pid_t pid) {
659 _cleanup_free_ char *line = NULL;
663 p = procfs_file_alloca(pid, "stat");
664 r = read_one_line_file(p, &line);
668 p = strrchr(line, ')');
674 if (sscanf(p, " %c", &state) != 1)
677 return (unsigned char) state;
/* Reads the single line of the process' procfs "comm" file into a
 * newly allocated string stored in *name. */
680 int get_process_comm(pid_t pid, char **name) {
687 p = procfs_file_alloca(pid, "comm");
689 r = read_one_line_file(p, name);
/* Builds a printable command line for pid from its procfs "cmdline"
 * file. With max_length == 0 the whole file is consumed into a buffer
 * grown with GREEDY_REALLOC(), replacing non-printable bytes with a
 * space; otherwise a buffer of max_length bytes is used and the output
 * is presumably truncated (see the MIN(left-1, 3U) computation --
 * confirm). For processes without argv[] the comm name wrapped in
 * square brackets can be produced instead; this is presumably gated by
 * comm_fallback -- confirm. */
696 int get_process_cmdline(pid_t pid, size_t max_length, bool comm_fallback, char **line) {
697 _cleanup_fclose_ FILE *f = NULL;
705 p = procfs_file_alloca(pid, "cmdline");
711 if (max_length == 0) {
712 size_t len = 0, allocated = 0;
714 while ((c = getc(f)) != EOF) {
716 if (!GREEDY_REALLOC(r, allocated, len+2)) {
721 r[len++] = isprint(c) ? c : ' ';
731 r = new(char, max_length);
737 while ((c = getc(f)) != EOF) {
759 size_t n = MIN(left-1, 3U);
766 /* Kernel threads have no argv[] */
768 _cleanup_free_ char *t = NULL;
776 h = get_process_comm(pid, &t);
780 r = strjoin("[", t, "]", NULL);
/* Detects kernel threads by trying to read a single byte from the
 * process' procfs "cmdline" file: hitting EOF right away means the
 * cmdline is empty and 1 is returned, a read error gives -errno. */
789 int is_kernel_thread(pid_t pid) {
801 p = procfs_file_alloca(pid, "cmdline");
806 count = fread(&c, 1, 1, f);
810 /* Kernel threads have an empty cmdline */
813 return eof ? 1 : -errno;
/* Looks up the "CapEff:" field in the process' procfs "status" file
 * via get_status_field() and stores the result in *capeff. */
818 int get_process_capeff(pid_t pid, char **capeff) {
824 p = procfs_file_alloca(pid, "status");
826 return get_status_field(p, "\nCapEff:", capeff);
/* Reads the target of the procfs symlink proc_file into *name. A
 * missing link (-ENOENT) is reported as -ESRCH, i.e. "no such
 * process"; every other result of readlink_malloc() passes through. */
829 static int get_process_link_contents(const char *proc_file, char **name) {
835 r = readlink_malloc(proc_file, name);
837 return r == -ENOENT ? -ESRCH : r;
/* Resolves the process' procfs "exe" link into *name. The result is
 * then checked for a trailing " (deleted)" marker, which is presumably
 * cut off -- confirm against the full body. */
842 int get_process_exe(pid_t pid, char **name) {
849 p = procfs_file_alloca(pid, "exe");
850 r = get_process_link_contents(p, name);
854 d = endswith(*name, " (deleted)");
/* Shared worker for get_process_uid()/get_process_gid(): scans the
 * process' procfs "status" file line by line for one starting with
 * field, isolates the first whitespace-delimited token after it and
 * parses that with parse_uid(). A read error while iterating returns
 * -errno. */
861 static int get_process_id(pid_t pid, const char *field, uid_t *uid) {
862 _cleanup_fclose_ FILE *f = NULL;
872 p = procfs_file_alloca(pid, "status");
877 FOREACH_LINE(line, f, return -errno) {
882 if (startswith(l, field)) {
884 l += strspn(l, WHITESPACE);
886 l[strcspn(l, WHITESPACE)] = 0;
888 return parse_uid(l, uid);
/* Stores the first value of the "Uid:" status line of pid in *uid. */
895 int get_process_uid(pid_t pid, uid_t *uid) {
896 return get_process_id(pid, "Uid:", uid);
/* Stores the first value of the "Gid:" status line of pid in *gid.
 * The uid_t based helper is reused, which is only valid because both
 * types have the same size (checked at compile time). */
899 int get_process_gid(pid_t pid, gid_t *gid) {
900 assert_cc(sizeof(uid_t) == sizeof(gid_t));
901 return get_process_id(pid, "Gid:", gid);
/* Resolves the process' procfs "cwd" link into *cwd; a vanished
 * process is reported as -ESRCH by the helper. */
904 int get_process_cwd(pid_t pid, char **cwd) {
909 p = procfs_file_alloca(pid, "cwd");
911 return get_process_link_contents(p, cwd);
/* Resolves the process' procfs "root" link into *root; a vanished
 * process is reported as -ESRCH by the helper. */
914 int get_process_root(pid_t pid, char **root) {
919 p = procfs_file_alloca(pid, "root");
921 return get_process_link_contents(p, root);
/* Reads the process' procfs "environ" file byte by byte into a growing
 * buffer. Some bytes are turned into a newline (presumably the NUL
 * separators between entries -- confirm); the others are written in
 * C-escaped form through cescape_char(). The "sz + 5" reservation
 * covers one escaped character (up to four bytes) plus a terminator. */
924 int get_process_environ(pid_t pid, char **env) {
925 _cleanup_fclose_ FILE *f = NULL;
926 _cleanup_free_ char *outcome = NULL;
929 size_t allocated = 0, sz = 0;
934 p = procfs_file_alloca(pid, "environ");
940 while ((c = fgetc(f)) != EOF) {
941 if (!GREEDY_REALLOC(outcome, allocated, sz + 5))
945 outcome[sz++] = '\n';
947 sz += cescape_char(c, outcome + sz);
/* Returns a newly allocated string made of s followed by the first b
 * bytes of suffix. One path simply returns strndup(suffix, b)
 * (presumably when s is NULL -- confirm). The length sum is checked
 * against size_t overflow before a+b+1 bytes are allocated. */
957 char *strnappend(const char *s, const char *suffix, size_t b) {
965 return strndup(suffix, b);
974 if (b > ((size_t) -1) - a)
977 r = new(char, a+b+1);
982 memcpy(r+a, suffix, b);
/* Concatenates s and the whole of suffix into a new string via
 * strnappend(); a NULL suffix is treated as having length 0. */
988 char *strappend(const char *s, const char *suffix) {
989 return strnappend(s, suffix, suffix ? strlen(suffix) : 0);
/* readlinkat() into a heap buffer. The call is made with a limit of
 * l-1 bytes; a result shorter than that means the target fit into the
 * buffer. NOTE(review): presumably the buffer is enlarged and the call
 * repeated otherwise -- confirm against the full body. */
992 int readlinkat_malloc(int fd, const char *p, char **ret) {
1007 n = readlinkat(fd, p, c, l-1);
1014 if ((size_t) n < l-1) {
/* readlinkat_malloc() relative to the current working directory. */
1025 int readlink_malloc(const char *p, char **ret) {
1026 return readlinkat_malloc(AT_FDCWD, p, ret);
/* Reads the symlink p and hands back a copy of only the last path
 * component (basename) of its target. The full target is freed
 * automatically when the function returns. */
1029 int readlink_value(const char *p, char **ret) {
1030 _cleanup_free_ char *link = NULL;
1034 r = readlink_malloc(p, &link);
1038 value = basename(link);
1042 value = strdup(value);
/* Reads the symlink p and interprets its target relative to the
 * directory p lives in, using file_in_same_dir(). */
1051 int readlink_and_make_absolute(const char *p, char **r) {
1052 _cleanup_free_ char *target = NULL;
1059 j = readlink_malloc(p, &target);
1063 k = file_in_same_dir(p, target);
/* Like readlink_and_make_absolute(), but additionally runs the result
 * through canonicalize_file_name() and removes redundant slashes from
 * *r with path_kill_slashes(). */
1071 int readlink_and_canonicalize(const char *p, char **r) {
1078 j = readlink_and_make_absolute(p, &t);
1082 s = canonicalize_file_name(t);
1089 path_kill_slashes(*r);
/* Installs the default disposition (SIG_DFL with SA_RESTART) for every
 * signal from 1 up to _NSIG-1, leaving out SIGKILL and SIGSTOP. EINVAL
 * from sigaction() is tolerated; of the remaining failures only the
 * first one is recorded (the "r == 0" guard). */
1094 int reset_all_signal_handlers(void) {
1097 for (sig = 1; sig < _NSIG; sig++) {
1098 struct sigaction sa = {
1099 .sa_handler = SIG_DFL,
1100 .sa_flags = SA_RESTART,
1103 /* These two cannot be caught... */
1104 if (sig == SIGKILL || sig == SIGSTOP)
1107 /* On Linux the first two RT signals are reserved by
1108 * glibc, and sigaction() will return EINVAL for them. */
1109 if ((sigaction(sig, &sa, NULL) < 0))
1110 if (errno != EINVAL && r == 0)
/* Unblocks all signals for the caller by installing an empty signal
 * set with sigprocmask(SIG_SETMASK). */
1117 int reset_signal_mask(void) {
1120 if (sigemptyset(&ss) < 0)
1123 if (sigprocmask(SIG_SETMASK, &ss, NULL) < 0)
/* Strips whitespace from both ends of s. Leading whitespace is skipped
 * by advancing the pointer, so the returned pointer may differ from s;
 * callers that need to free() the buffer must keep the original. */
1129 char *strstrip(char *s) {
1132 /* Skips leading and drops trailing whitespace. Modifies the
1133 * string in place. Returns pointer to first non-space character */
1135 s += strspn(s, WHITESPACE);
1137 for (e = strchr(s, 0); e > s; e --)
1138 if (!strchr(WHITESPACE, e[-1]))
/* Removes from s, in place, every character that occurs in bad. Uses
 * a read cursor (f) and a write cursor (t) over the same buffer. */
1146 char *delete_chars(char *s, const char *bad) {
1149 /* Drops all characters listed in bad, regardless where in the string */
1151 for (f = s, t = s; *f; f++) {
1152 if (strchr(bad, *f))
/* Returns a newly allocated path naming filename inside the directory
 * of path. An absolute filename is duplicated unchanged; the second
 * strdup(filename) is presumably the case where path contains no '/'
 * (confirm). Otherwise everything of path up to and including its
 * last '/' is copied and filename, with its NUL, is appended. */
1163 char *file_in_same_dir(const char *path, const char *filename) {
1170 /* This removes the last component of path and appends
1171 * filename, unless the latter is absolute anyway or the
1174 if (path_is_absolute(filename))
1175 return strdup(filename);
1177 e = strrchr(path, '/');
1179 return strdup(filename);
1181 k = strlen(filename);
1182 ret = new(char, (e + 1 - path) + k + 1);
1186 memcpy(mempcpy(ret, path, e + 1 - path), filename, k + 1);
/* Walks up the directory hierarchy of path one component at a time:
 * trailing slashes and the last component are stripped, the shortened
 * prefix is duplicated, and the walk ends once stop starts with that
 * prefix. NOTE(review): each prefix is presumably removed with rmdir()
 * and ENOENT tolerated -- confirm against the full body. */
1190 int rmdir_parents(const char *path, const char *stop) {
1199 /* Skip trailing slashes */
1200 while (l > 0 && path[l-1] == '/')
1206 /* Skip last component */
1207 while (l > 0 && path[l-1] != '/')
1210 /* Skip trailing slashes */
1211 while (l > 0 && path[l-1] == '/')
1217 if (!(t = strndup(path, l)))
1220 if (path_startswith(stop, t)) {
1229 if (errno != ENOENT)
/* Maps the low four bits of x to the matching lowercase hex digit. */
1236 char hexchar(int x) {
1237 static const char table[16] = "0123456789abcdef";
1239 return table[x & 15];
/* Converts one hex digit (either case) to its value 0..15. Callers in
 * this file treat a negative result as "not a hex digit". */
1242 int unhexchar(char c) {
1244 if (c >= '0' && c <= '9')
1247 if (c >= 'a' && c <= 'f')
1248 return c - 'a' + 10;
1250 if (c >= 'A' && c <= 'F')
1251 return c - 'A' + 10;
/* Formats the l bytes at p as lowercase hex, two digits per byte (high
 * nibble first), into a malloc()ed buffer of l * 2 + 1 bytes. */
1256 char *hexmem(const void *p, size_t l) {
1260 z = r = malloc(l * 2 + 1);
1264 for (x = p; x < (const uint8_t*) p + l; x++) {
1265 *(z++) = hexchar(*x >> 4);
1266 *(z++) = hexchar(*x & 15);
/* Decodes l hex characters at p into bytes, consuming two characters
 * per output byte (high nibble first). The buffer is sized for
 * (l + 1) / 2 bytes plus one extra.
 * NOTE(review): how an odd l and non-hex characters (negative
 * unhexchar() results) are handled should be confirmed against the
 * full body. */
1273 void *unhexmem(const char *p, size_t l) {
1279 z = r = malloc((l + 1) / 2 + 1);
1283 for (x = p; x < p + l; x += 2) {
1286 a = unhexchar(x[0]);
1288 b = unhexchar(x[1]);
1292 *(z++) = (uint8_t) a << 4 | (uint8_t) b;
/* Maps the low three bits of x to the matching octal digit. */
1299 char octchar(int x) {
1300 return '0' + (x & 7);
/* Converts one octal digit '0'..'7' to its value. Callers in this file
 * treat a negative result as "not an octal digit". */
1303 int unoctchar(char c) {
1305 if (c >= '0' && c <= '7')
/* Maps x modulo 10 to the matching decimal digit; intended for
 * non-negative x. */
1311 char decchar(int x) {
1312 return '0' + (x % 10);
/* Converts one decimal digit '0'..'9' to its value; other characters
 * are presumably reported with a negative result -- confirm. */
1315 int undecchar(char c) {
1317 if (c >= '0' && c <= '9')
/* Returns a newly allocated, C-escaped copy of s. The buffer is sized
 * for the worst case of four output bytes per input byte plus a
 * terminator; each character is converted by cescape_char(). */
1323 char *cescape(const char *s) {
1329 /* Does C style string escaping. */
1331 r = new(char, strlen(s)*4 + 1);
1335 for (f = s, t = r; *f; f++)
1336 t += cescape_char(*f, t);
/* Decodes C-style escapes in the first length bytes of s into a newly
 * allocated string, optionally starting the result with prefix. The
 * buffer holds pl + length + 1 bytes, enough because decoding never
 * grows the text. Escapes that are invalid, or that would decode to a
 * NUL byte, are kept literally, as is a trailing lone backslash.
 * NOTE(review): for octal escapes the first digit may be as large as
 * 7, so (a << 6) | (b << 3) | c can exceed 8 bits and is silently
 * truncated by the cast to char -- confirm whether such input should
 * be rejected instead. */
1343 char *cunescape_length_with_prefix(const char *s, size_t length, const char *prefix) {
1350 /* Undoes C style string escaping, and optionally prefixes it. */
1352 pl = prefix ? strlen(prefix) : 0;
1354 r = new(char, pl+length+1);
1359 memcpy(r, prefix, pl);
1361 for (f = s, t = r + pl; f < s + length; f++) {
1362 size_t remaining = s + length - f;
1363 assert(remaining > 0);
1365 if (*f != '\\') { /* a literal character */
1370 if (--remaining == 0) { /* copy trailing backslash verbatim */
1411 /* This is an extension of the XDG syntax files */
1416 /* hexadecimal encoding */
1419 if (remaining >= 2) {
1420 a = unhexchar(f[1]);
1421 b = unhexchar(f[2]);
1424 if (a < 0 || b < 0 || (a == 0 && b == 0)) {
1425 /* Invalid escape code, let's take it literal then */
1429 *(t++) = (char) ((a << 4) | b);
1444 /* octal encoding */
1445 int a = -1, b = -1, c = -1;
1447 if (remaining >= 3) {
1448 a = unoctchar(f[0]);
1449 b = unoctchar(f[1]);
1450 c = unoctchar(f[2]);
1453 if (a < 0 || b < 0 || c < 0 || (a == 0 && b == 0 && c == 0)) {
1454 /* Invalid escape code, let's take it literal then */
1458 *(t++) = (char) ((a << 6) | (b << 3) | c);
1466 /* Invalid escape code, let's take it literal then */
/* cunescape_length_with_prefix() without a prefix. */
1477 char *cunescape_length(const char *s, size_t length) {
1478 return cunescape_length_with_prefix(s, length, NULL);
/* Decodes C-style escapes in the whole NUL-terminated string s. */
1481 char *cunescape(const char *s) {
1484 return cunescape_length(s, strlen(s));
/* Returns a newly allocated copy of s in which control characters,
 * characters at/above 127, backslashes and everything listed in bad
 * are replaced by a hex escape. The buffer is sized for four output
 * bytes per input byte plus a terminator; hexchar() masks its argument
 * to four bits, so passing *f unshifted yields the low nibble. */
1487 char *xescape(const char *s, const char *bad) {
1491 /* Escapes all chars in bad, in addition to \ and all special
1492 * chars, in \xFF style escaping. May be reversed with
1495 r = new(char, strlen(s) * 4 + 1);
1499 for (f = s, t = r; *f; f++) {
1501 if ((*f < ' ') || (*f >= 127) ||
1502 (*f == '\\') || strchr(bad, *f)) {
1505 *(t++) = hexchar(*f >> 4);
1506 *(t++) = hexchar(*f);
/* Lowercases the ASCII letters A-Z of t in place, independent of the
 * locale; all other bytes are left untouched. */
1516 char *ascii_strlower(char *t) {
1521 for (p = t; *p; p++)
1522 if (*p >= 'A' && *p <= 'Z')
1523 *p = *p - 'A' + 'a';
/* Decides whether filename should be ignored when enumerating
 * directories: dot files, lost+found, quota files, package manager
 * leftovers (.rpm*, .dpkg-*) and editor swap files (.swp). Names
 * ending in "~" are not covered here, see hidden_file(). */
1528 _pure_ static bool hidden_file_allow_backup(const char *filename) {
1532 filename[0] == '.' ||
1533 streq(filename, "lost+found") ||
1534 streq(filename, "aquota.user") ||
1535 streq(filename, "aquota.group") ||
1536 endswith(filename, ".rpmnew") ||
1537 endswith(filename, ".rpmsave") ||
1538 endswith(filename, ".rpmorig") ||
1539 endswith(filename, ".dpkg-old") ||
1540 endswith(filename, ".dpkg-new") ||
1541 endswith(filename, ".dpkg-tmp") ||
1542 endswith(filename, ".dpkg-dist") ||
1543 endswith(filename, ".dpkg-bak") ||
1544 endswith(filename, ".dpkg-backup") ||
1545 endswith(filename, ".dpkg-remove") ||
1546 endswith(filename, ".swp");
/* Like hidden_file_allow_backup(), but names ending in "~" (editor
 * backup files) are checked first and handled separately. */
1549 bool hidden_file(const char *filename) {
1552 if (endswith(filename, "~"))
1555 return hidden_file_allow_backup(filename);
/* Sets or clears O_NONBLOCK on fd. The current status flags are read
 * with F_GETFL and the F_SETFL call is skipped when the flag already
 * has the requested state. */
1558 int fd_nonblock(int fd, bool nonblock) {
1563 flags = fcntl(fd, F_GETFL, 0);
1568 nflags = flags | O_NONBLOCK;
1570 nflags = flags & ~O_NONBLOCK;
1572 if (nflags == flags)
1575 if (fcntl(fd, F_SETFL, nflags) < 0)
/* Sets or clears FD_CLOEXEC on fd. The current descriptor flags are
 * read with F_GETFD and the F_SETFD call is skipped when the flag
 * already has the requested state. */
1581 int fd_cloexec(int fd, bool cloexec) {
1586 flags = fcntl(fd, F_GETFD, 0);
1591 nflags = flags | FD_CLOEXEC;
1593 nflags = flags & ~FD_CLOEXEC;
1595 if (nflags == flags)
1598 if (fcntl(fd, F_SETFD, nflags) < 0)
/* Linear search for fd among the n_fdset entries of fdset. fdset may
 * be NULL only when n_fdset is 0. */
1604 _pure_ static bool fd_in_set(int fd, const int fdset[], unsigned n_fdset) {
1607 assert(n_fdset == 0 || fdset);
1609 for (i = 0; i < n_fdset; i++)
/* Closes every file descriptor from 3 upwards except those listed in
 * except[]. The open descriptors are normally enumerated through
 * /proc/self/fd; entries whose name is hidden or not a number are
 * ignored. When that directory cannot be opened, all numbers below
 * the RLIMIT_NOFILE hard limit are tried instead. EBADF from
 * close_nointr() is tolerated and only the first other error is
 * remembered (the "r == 0" guard).
 * NOTE(review): in the fallback loop rl.rlim_max is cast to int; if
 * the limit is RLIM_INFINITY or exceeds INT_MAX the result of the cast
 * may be negative and the loop would not run at all -- confirm. */
1616 int close_all_fds(const int except[], unsigned n_except) {
1617 _cleanup_closedir_ DIR *d = NULL;
1621 assert(n_except == 0 || except);
1623 d = opendir("/proc/self/fd");
1628 /* When /proc isn't available (for example in chroots)
1629 * the fallback is brute forcing through the fd
1632 assert_se(getrlimit(RLIMIT_NOFILE, &rl) >= 0);
1633 for (fd = 3; fd < (int) rl.rlim_max; fd ++) {
1635 if (fd_in_set(fd, except, n_except))
1638 if (close_nointr(fd) < 0)
1639 if (errno != EBADF && r == 0)
1646 while ((de = readdir(d))) {
1649 if (hidden_file(de->d_name))
1652 if (safe_atoi(de->d_name, &fd) < 0)
1653 /* Let's better ignore this, just in case */
1662 if (fd_in_set(fd, except, n_except))
1665 if (close_nointr(fd) < 0) {
1666 /* Valgrind has its own FD and doesn't want to have it closed */
1667 if (errno != EBADF && r == 0)
/* Tests whether the strings a and b share at least one character, by
 * walking a character by character. */
1675 bool chars_intersect(const char *a, const char *b) {
1678 /* Returns true if any of the chars in a are in b. */
1679 for (p = a; *p; p++)
/* Tells whether fstype names a network file system by looking it up
 * in a static NUL-separated table. A "fuse." prefix is detected first
 * and presumably skipped so that the sub-type is looked up -- confirm. */
1686 bool fstype_is_network(const char *fstype) {
1687 static const char table[] =
1701 x = startswith(fstype, "fuse.");
1705 return nulstr_contains(table, fstype);
1709 _cleanup_close_ int fd;
1711 fd = open_terminal("/dev/tty0", O_RDWR|O_NOCTTY|O_CLOEXEC);
1717 TIOCL_GETKMSGREDIRECT,
1721 if (ioctl(fd, TIOCLINUX, tiocl) < 0)
1724 vt = tiocl[0] <= 0 ? 1 : tiocl[0];
1727 if (ioctl(fd, VT_ACTIVATE, vt) < 0)
/* Reads a single character from f, waiting at most t (USEC_INFINITY
 * disables the timeout). If f is a terminal it is temporarily switched
 * out of canonical mode (VMIN=1, VTIME=0) so that one key press is
 * enough; the old settings are restored afterwards and *need_nl tells
 * whether the character read was something other than a newline. If
 * the terminal setup is not possible, a whole line is read with
 * fgets() and its length is checked against a single character. */
1733 int read_one_char(FILE *f, char *ret, usec_t t, bool *need_nl) {
1734 struct termios old_termios, new_termios;
1735 char c, line[LINE_MAX];
1740 if (tcgetattr(fileno(f), &old_termios) >= 0) {
1741 new_termios = old_termios;
1743 new_termios.c_lflag &= ~ICANON;
1744 new_termios.c_cc[VMIN] = 1;
1745 new_termios.c_cc[VTIME] = 0;
1747 if (tcsetattr(fileno(f), TCSADRAIN, &new_termios) >= 0) {
1750 if (t != USEC_INFINITY) {
1751 if (fd_wait_for_event(fileno(f), POLLIN, t) <= 0) {
1752 tcsetattr(fileno(f), TCSADRAIN, &old_termios);
1757 k = fread(&c, 1, 1, f);
1759 tcsetattr(fileno(f), TCSADRAIN, &old_termios);
1765 *need_nl = c != '\n';
1772 if (t != USEC_INFINITY) {
1773 if (fd_wait_for_event(fileno(f), POLLIN, t) <= 0)
1778 if (!fgets(line, sizeof(line), f))
1779 return errno ? -errno : -EIO;
1783 if (strlen(line) != 1)
/* Interactive prompt for a single character. The highlighted prompt
 * built from text is printed to stdout and one character is read from
 * stdin without timeout. -EBADMSG from read_one_char() and characters
 * not contained in replies produce an error message; the prompt is
 * presumably repeated until an accepted reply arrives -- confirm. */
1793 int ask_char(char *ret, const char *replies, const char *text, ...) {
1803 bool need_nl = true;
1806 fputs(ANSI_HIGHLIGHT_ON, stdout);
1813 fputs(ANSI_HIGHLIGHT_OFF, stdout);
1817 r = read_one_char(stdin, &c, USEC_INFINITY, &need_nl);
1820 if (r == -EBADMSG) {
1821 puts("Bad input, please try again.");
1832 if (strchr(replies, c)) {
1837 puts("Read unexpected character, please try again.");
/* Interactive prompt for a line of text. The highlighted prompt built
 * from text is printed to stdout and one line of at most LINE_MAX
 * bytes is read from stdin; a failed read returns -errno or -EIO. The
 * line is then checked for its terminating newline. */
1841 int ask_string(char **ret, const char *text, ...) {
1846 char line[LINE_MAX];
1850 fputs(ANSI_HIGHLIGHT_ON, stdout);
1857 fputs(ANSI_HIGHLIGHT_OFF, stdout);
1862 if (!fgets(line, sizeof(line), stdin))
1863 return errno ? -errno : -EIO;
1865 if (!endswith(line, "\n"))
/* Brings the terminal referred to by fd back to sane settings:
 * exclusive mode is switched off, the console is put into text mode
 * (presumably only when switch_to_text is set -- confirm) and unicode
 * keyboard mode, the input/output/local flags and the control
 * characters are reset, and pending input and output are discarded.
 * The ioctl() results are deliberately not checked. */
1884 int reset_terminal_fd(int fd, bool switch_to_text) {
1885 struct termios termios;
1888 /* Set terminal to some sane defaults */
1892 /* We leave locked terminal attributes untouched, so that
1893 * Plymouth may set whatever it wants to set, and we don't
1894 * interfere with that. */
1896 /* Disable exclusive mode, just in case */
1897 ioctl(fd, TIOCNXCL);
1899 /* Switch to text mode */
1901 ioctl(fd, KDSETMODE, KD_TEXT);
1903 /* Enable console unicode mode */
1904 ioctl(fd, KDSKBMODE, K_UNICODE);
1906 if (tcgetattr(fd, &termios) < 0) {
1911 /* We only reset the stuff that matters to the software. How
1912 * hardware is set up we don't touch assuming that somebody
1913 * else will do that for us */
1915 termios.c_iflag &= ~(IGNBRK | BRKINT | ISTRIP | INLCR | IGNCR | IUCLC);
1916 termios.c_iflag |= ICRNL | IMAXBEL | IUTF8;
1917 termios.c_oflag |= ONLCR;
1918 termios.c_cflag |= CREAD;
1919 termios.c_lflag = ISIG | ICANON | IEXTEN | ECHO | ECHOE | ECHOK | ECHOCTL | ECHOPRT | ECHOKE;
1921 termios.c_cc[VINTR] = 03; /* ^C */
1922 termios.c_cc[VQUIT] = 034; /* ^\ */
1923 termios.c_cc[VERASE] = 0177;
1924 termios.c_cc[VKILL] = 025; /* ^U */
1925 termios.c_cc[VEOF] = 04; /* ^D */
1926 termios.c_cc[VSTART] = 021; /* ^Q */
1927 termios.c_cc[VSTOP] = 023; /* ^S */
1928 termios.c_cc[VSUSP] = 032; /* ^Z */
1929 termios.c_cc[VLNEXT] = 026; /* ^V */
1930 termios.c_cc[VWERASE] = 027; /* ^W */
1931 termios.c_cc[VREPRINT] = 022; /* ^R */
1932 termios.c_cc[VEOL] = 0;
1933 termios.c_cc[VEOL2] = 0;
1935 termios.c_cc[VTIME] = 0;
1936 termios.c_cc[VMIN] = 1;
1938 if (tcsetattr(fd, TCSANOW, &termios) < 0)
1942 /* Just in case, flush all crap out */
1943 tcflush(fd, TCIOFLUSH);
/* Opens the terminal called name (without making it the controlling
 * terminal) and resets it with reset_terminal_fd(), including the
 * switch to text mode. The descriptor is closed automatically. */
1948 int reset_terminal(const char *name) {
1949 _cleanup_close_ int fd = -1;
1951 fd = open_terminal(name, O_RDWR|O_NOCTTY|O_CLOEXEC);
1955 return reset_terminal_fd(fd, true);
/* open() wrapper for terminal devices that works around spurious
 * failures while a TTY is being closed: the call is repeated with
 * 50ms pauses, for about one second in total. O_CREAT is not allowed
 * in mode. */
1958 int open_terminal(const char *name, int mode) {
1963 * If a TTY is in the process of being closed opening it might
1964 * cause EIO. This is horribly awful, but unlikely to be
1965 * changed in the kernel. Hence we work around this problem by
1966 * retrying a couple of times.
1968 * https://bugs.launchpad.net/ubuntu/+source/linux/+bug/554172/comments/245
1971 assert(!(mode & O_CREAT));
1974 fd = open(name, mode, 0);
1981 /* Max 1s in total */
1985 usleep(50 * USEC_PER_MSEC);
/* Drains fd: poll() is called with a zero timeout so that it never
 * blocks, and pending data is read into a scratch buffer. EAGAIN from
 * read() is checked for explicitly and presumably ends the draining
 * -- confirm. */
2003 int flush_fd(int fd) {
2004 struct pollfd pollfd = {
2014 r = poll(&pollfd, 1, 0);
2024 l = read(fd, buf, sizeof(buf));
2030 if (errno == EAGAIN)
/* Opens the terminal and tries to make it the controlling terminal of
 * the calling process with TIOCSCTTY. Unless fail or force is set, an
 * inotify watch for IN_CLOSE on the device is created first, so that
 * the function can sleep until the current owner closes the terminal
 * and then try again, bounded by timeout unless that is USEC_INFINITY.
 * SIGHUP is ignored around the ioctl. Once the terminal is acquired
 * it is reset with reset_terminal_fd(); a failure there is only
 * logged. */
2039 int acquire_terminal(
2043 bool ignore_tiocstty_eperm,
2046 int fd = -1, notify = -1, r = 0, wd = -1;
2051 /* We use inotify to be notified when the tty is closed. We
2052 * create the watch before checking if we can actually acquire
2053 * it, so that we don't lose any event.
2055 * Note: strictly speaking this actually watches for the
2056 * device being closed, it does *not* really watch whether a
2057 * tty loses its controlling process. However, unless some
2058 * rogue process uses TIOCNOTTY on /dev/tty *after* closing
2059 * its tty otherwise this will not become a problem. As long
2060 * as the administrator makes sure not to configure any service
2061 * on the same tty as an untrusted user this should not be a
2062 * problem. (Which he probably should not do anyway.) */
2064 if (timeout != USEC_INFINITY)
2065 ts = now(CLOCK_MONOTONIC);
2067 if (!fail && !force) {
2068 notify = inotify_init1(IN_CLOEXEC | (timeout != USEC_INFINITY ? IN_NONBLOCK : 0));
2074 wd = inotify_add_watch(notify, name, IN_CLOSE);
2082 struct sigaction sa_old, sa_new = {
2083 .sa_handler = SIG_IGN,
2084 .sa_flags = SA_RESTART,
2088 r = flush_fd(notify);
2093 /* We pass here O_NOCTTY only so that we can check the return
2094 * value TIOCSCTTY and have a reliable way to figure out if we
2095 * successfully became the controlling process of the tty */
2096 fd = open_terminal(name, O_RDWR|O_NOCTTY|O_CLOEXEC);
2100 /* Temporarily ignore SIGHUP, so that we don't get SIGHUP'ed
2101 * if we already own the tty. */
2102 assert_se(sigaction(SIGHUP, &sa_new, &sa_old) == 0);
2104 /* First, try to get the tty */
2105 if (ioctl(fd, TIOCSCTTY, force) < 0)
2108 assert_se(sigaction(SIGHUP, &sa_old, NULL) == 0);
2110 /* Sometimes it makes sense to ignore TIOCSCTTY
2111 * returning EPERM, i.e. when very likely we already
2112 * have this controlling terminal. */
2113 if (r < 0 && r == -EPERM && ignore_tiocstty_eperm)
2116 if (r < 0 && (force || fail || r != -EPERM)) {
2125 assert(notify >= 0);
2128 union inotify_event_buffer buffer;
2129 struct inotify_event *e;
2132 if (timeout != USEC_INFINITY) {
2135 n = now(CLOCK_MONOTONIC);
2136 if (ts + timeout < n) {
2141 /* NOTE(review): this waits for input on the tty fd, while the
 * read() that follows consumes events from the inotify fd
 * (notify). Waiting on notify looks like what is intended here
 * -- confirm. */
r = fd_wait_for_event(fd, POLLIN, ts + timeout - n);
2151 l = read(notify, &buffer, sizeof(buffer));
2153 if (errno == EINTR || errno == EAGAIN)
2160 FOREACH_INOTIFY_EVENT(e, buffer, l) {
2161 if (e->wd != wd || !(e->mask & IN_CLOSE)) {
2170 /* We close the tty fd here since if the old session
2171 * ended our handle will be dead. It's important that
2172 * we do this after sleeping, so that we don't enter
2173 * an endless loop. */
2174 fd = safe_close(fd);
2179 r = reset_terminal_fd(fd, true);
2181 log_warning_errno(r, "Failed to reset terminal: %m");
/* Gives up the controlling terminal of the calling process: /dev/tty
 * is opened and TIOCNOTTY issued on it, with SIGHUP ignored for the
 * duration so that the process does not hang itself up. The previous
 * SIGHUP disposition is restored afterwards and the descriptor is
 * closed automatically. */
2192 int release_terminal(void) {
2193 static const struct sigaction sa_new = {
2194 .sa_handler = SIG_IGN,
2195 .sa_flags = SA_RESTART,
2198 _cleanup_close_ int fd = -1;
2199 struct sigaction sa_old;
2202 fd = open("/dev/tty", O_RDWR|O_NOCTTY|O_NDELAY|O_CLOEXEC);
2206 /* Temporarily ignore SIGHUP, so that we don't get SIGHUP'ed
2207 * by our own TIOCNOTTY */
2208 assert_se(sigaction(SIGHUP, &sa_new, &sa_old) == 0);
2210 if (ioctl(fd, TIOCNOTTY) < 0)
2213 assert_se(sigaction(SIGHUP, &sa_old, NULL) == 0);
/* Applies the action *sa to every signal number passed in the variadic
 * list. The list must be terminated by a value <= 0. */
2218 int sigaction_many(const struct sigaction *sa, ...) {
2223 while ((sig = va_arg(ap, int)) > 0)
2224 if (sigaction(sig, sa, NULL) < 0)
/* Sets the disposition of sig and of every further signal in the
 * variadic list to SIG_IGN (with SA_RESTART). The list must be
 * terminated by a value <= 0. */
2231 int ignore_signals(int sig, ...) {
2232 struct sigaction sa = {
2233 .sa_handler = SIG_IGN,
2234 .sa_flags = SA_RESTART,
2239 if (sigaction(sig, &sa, NULL) < 0)
2243 while ((sig = va_arg(ap, int)) > 0)
2244 if (sigaction(sig, &sa, NULL) < 0)
/* Sets the disposition of sig and of every further signal in the
 * variadic list to SIG_DFL (with SA_RESTART). The list must be
 * terminated by a value <= 0. */
2251 int default_signals(int sig, ...) {
2252 struct sigaction sa = {
2253 .sa_handler = SIG_DFL,
2254 .sa_flags = SA_RESTART,
2259 if (sigaction(sig, &sa, NULL) < 0)
2263 while ((sig = va_arg(ap, int)) > 0)
2264 if (sigaction(sig, &sa, NULL) < 0)
/* Closes both descriptors of the pair p with safe_close() and stores
 * the results back into p[0] and p[1]. When both slots refer to the
 * same descriptor it is closed only once. */
2271 void safe_close_pair(int p[]) {
2275 /* Special case pairs which use the same fd in both
2277 p[0] = p[1] = safe_close(p[0]);
2281 p[0] = safe_close(p[0]);
2282 p[1] = safe_close(p[1]);
/* Reads from fd into buf until nbytes have been read, looping over
 * short reads. On EAGAIN, and only if do_poll is set, the function
 * waits for the descriptor to become readable and tries again. On an
 * error the number of bytes read so far is returned if that is
 * positive, otherwise -errno. */
2285 ssize_t loop_read(int fd, void *buf, size_t nbytes, bool do_poll) {
2292 while (nbytes > 0) {
2295 k = read(fd, p, nbytes);
2300 if (errno == EAGAIN && do_poll) {
2302 /* We knowingly ignore any return value here,
2303 * and expect that any error/EOF is reported
2306 fd_wait_for_event(fd, POLLIN, USEC_INFINITY);
2310 return n > 0 ? n : -errno;
/* Writes nbytes from buf to fd, looping over short writes. On EAGAIN,
 * and only if do_poll is set, the function waits for the descriptor to
 * become writable and tries again. A write() that reports zero bytes
 * is handled as a special case. */
2324 int loop_write(int fd, const void *buf, size_t nbytes, bool do_poll) {
2325 const uint8_t *p = buf;
2332 while (nbytes > 0) {
2335 k = write(fd, p, nbytes);
2340 if (errno == EAGAIN && do_poll) {
2341 /* We knowingly ignore any return value here,
2342 * and expect that any error/EOF is reported
2345 fd_wait_for_event(fd, POLLOUT, USEC_INFINITY);
2352 if (k == 0) /* Can't really happen */
/* Parses a size specification such as "10M" or "1.5G" from t. base
 * selects the multiplier table and must be 1000 (SI) or 1024 (IEC).
 * The integer part is read with strtoll(), an optional fractional
 * part (digits after the integer part) with strtoull(), and the
 * suffix is looked up in the table from start_pos on. Every term is
 * checked against unsigned long long overflow before it is added to
 * the running total r, and the total must fit into off_t. Parsing
 * continues behind the matched suffix, so several terms can follow
 * each other. */
2362 int parse_size(const char *t, off_t base, off_t *size) {
2364 /* Soo, sometimes we want to parse IEC binary suffixes, and
2365 * sometimes SI decimal suffixes. This function can parse
2366 * both. Which one is the right way depends on the
2367 * context. Wikipedia suggests that SI is customary for
2368 * hardware metrics and network speeds, while IEC is
2369 * customary for most data sizes used by software and volatile
2370 * (RAM) memory. Hence be careful which one you pick!
2372 * In either case we use just K, M, G as suffix, and not Ki,
2373 * Mi, Gi or so (as IEC would suggest). That's because that's
2374 * frickin' ugly. But this means you really need to make sure
2375 * to document which base you are parsing when you use this
2380 unsigned long long factor;
2383 static const struct table iec[] = {
2384 { "E", 1024ULL*1024ULL*1024ULL*1024ULL*1024ULL*1024ULL },
2385 { "P", 1024ULL*1024ULL*1024ULL*1024ULL*1024ULL },
2386 { "T", 1024ULL*1024ULL*1024ULL*1024ULL },
2387 { "G", 1024ULL*1024ULL*1024ULL },
2388 { "M", 1024ULL*1024ULL },
2394 static const struct table si[] = {
2395 { "E", 1000ULL*1000ULL*1000ULL*1000ULL*1000ULL*1000ULL },
2396 { "P", 1000ULL*1000ULL*1000ULL*1000ULL*1000ULL },
2397 { "T", 1000ULL*1000ULL*1000ULL*1000ULL },
2398 { "G", 1000ULL*1000ULL*1000ULL },
2399 { "M", 1000ULL*1000ULL },
2405 const struct table *table;
2407 unsigned long long r = 0;
2408 unsigned n_entries, start_pos = 0;
2411 assert(base == 1000 || base == 1024);
2416 n_entries = ELEMENTSOF(si);
2419 n_entries = ELEMENTSOF(iec);
2425 unsigned long long l2;
2431 l = strtoll(p, &e, 10);
2444 if (*e >= '0' && *e <= '9') {
2447 /* strtoull itself would accept space/+/- */
2448 l2 = strtoull(e, &e2, 10);
2450 if (errno == ERANGE)
2453 /* Ignore failure. E.g. 10.M is valid */
2460 e += strspn(e, WHITESPACE);
2462 for (i = start_pos; i < n_entries; i++)
2463 if (startswith(e, table[i].suffix)) {
2464 unsigned long long tmp;
2465 if ((unsigned long long) l + (frac > 0) > ULLONG_MAX / table[i].factor)
2467 tmp = l * table[i].factor + (unsigned long long) (frac * table[i].factor);
2468 if (tmp > ULLONG_MAX - r)
2472 if ((unsigned long long) (off_t) r != r)
2475 p = e + strlen(table[i].suffix);
/* Makes fd the standard input, output and error of the process by
 * duplicating it onto descriptors 0, 1 and 2. All three dup2() calls
 * are issued before their results are examined. Afterwards the
 * close-on-exec flag is cleared on the three standard descriptors. */
2491 int make_stdio(int fd) {
2496 r = dup2(fd, STDIN_FILENO);
2497 s = dup2(fd, STDOUT_FILENO);
2498 t = dup2(fd, STDERR_FILENO);
2503 if (r < 0 || s < 0 || t < 0)
2506 /* Explicitly unset O_CLOEXEC, since if fd was < 3, then
2507 * dup2() was a NOP and the bit hence possibly set. */
2508 fd_cloexec(STDIN_FILENO, false);
2509 fd_cloexec(STDOUT_FILENO, false);
2510 fd_cloexec(STDERR_FILENO, false);
/* Connects standard input, output and error to /dev/null by opening
 * it read-write and passing the descriptor to make_stdio(). */
2515 int make_null_stdio(void) {
2518 null_fd = open("/dev/null", O_RDWR|O_NOCTTY);
2522 return make_stdio(null_fd);
/* Purely lexical check: true if path lies below /dev/ or /sys/. The
 * file system is not consulted. */
2525 bool is_device_path(const char *path) {
2527 /* Returns true on paths that refer to a device, either in
2528 * sysfs or in /dev */
2531 path_startswith(path, "/dev/") ||
2532 path_startswith(path, "/sys/");
/* Checks whether the directory path contains any entry that is not
 * hidden according to hidden_file(). A NULL entry together with a
 * non-zero errno is treated as a read error rather than as the end of
 * the directory. */
2535 int dir_is_empty(const char *path) {
2536 _cleanup_closedir_ DIR *d;
2547 if (!de && errno != 0)
2553 if (!hidden_file(de->d_name))
/* NOTE(review): judging by the name, returns the directory part of
 * path as a newly allocated string -- confirm against the body. */
2558 char* dirname_malloc(const char *path) {
2559 char *d, *dir, *dir2;
/* Fills the n bytes at p with random data from the kernel without ever
 * blocking. getrandom() with GRND_NONBLOCK is tried first; whether the
 * syscall exists is remembered in the static have_syscall (-1 means
 * unknown). If the syscall is missing (ENOSYS) or the pool is not
 * ready (EAGAIN), the data is read from /dev/urandom instead. A
 * missing device node is reported as -ENOSYS. */
2576 int dev_urandom(void *p, size_t n) {
2577 static int have_syscall = -1;
2581 /* Gathers some randomness from the kernel. This call will
2582 * never block, and will always return some data from the
2583 * kernel, regardless if the random pool is fully initialized
2584 * or not. It thus makes no guarantee for the quality of the
2585 * returned entropy, but is good enough for our usual usecases
2586 * of seeding the hash functions for hashtable */
2588 /* Use the getrandom() syscall unless we know we don't have
2589 * it, or when the requested size is too large for it. */
/* NOTE(review): the condition below does not match the comment above.
 * As written it also enters the getrandom() branch when n does not fit
 * into an int -- even if have_syscall is already known to be 0 -- and
 * the result is then compared against the truncated (int) n. The
 * comment suggests
 * "have_syscall != 0 && (size_t) (int) n == n" -- confirm. */
2590 if (have_syscall != 0 || (size_t) (int) n != n) {
2591 r = getrandom(p, n, GRND_NONBLOCK);
2593 have_syscall = true;
2598 if (errno == ENOSYS)
2599 /* we lack the syscall, continue with
2600 * reading from /dev/urandom */
2601 have_syscall = false;
2602 else if (errno == EAGAIN)
2603 /* not enough entropy for now. Let's
2604 * remember to use the syscall the
2605 * next time, again, but also read
2606 * from /dev/urandom for now, which
2607 * doesn't care about the current
2608 * amount of entropy. */
2609 have_syscall = true;
2613 /* too short read? */
2617 fd = open("/dev/urandom", O_RDONLY|O_CLOEXEC|O_NOCTTY);
2619 return errno == ENOENT ? -ENOSYS : -errno;
2621 k = loop_read(fd, p, n, true);
2626 if ((size_t) k != n)
/* Builds a seed value x by XOR-ing together, when HAVE_SYS_AUXV_H is
 * defined, the first unsigned word behind the AT_RANDOM auxv pointer,
 * plus the CLOCK_REALTIME timestamp and the thread id; srand_called
 * records that this has been done.
 * NOTE(review): the early-exit check on srand_called and the actual
 * seeding call are on lines not visible in this excerpt. */
2632 void initialize_srand(void) {
2633 static bool srand_called = false;
2635 #ifdef HAVE_SYS_AUXV_H
2644 #ifdef HAVE_SYS_AUXV_H
2645 /* The kernel provides us with a bit of entropy in auxv, so
2646 * let's try to make use of that to seed the pseudo-random
2647 * generator. It's better than nothing... */
2649 auxv = (void*) getauxval(AT_RANDOM);
2651 x ^= *(unsigned*) auxv;
2654 x ^= (unsigned) now(CLOCK_REALTIME);
2655 x ^= (unsigned) gettid();
2658 srand_called = true;
/* Fills p with n bytes. dev_urandom() is tried first; the loop at the end
 * walks the buffer one byte at a time for the fallback path.
 * NOTE(review): the check of r and the per-byte assignment are on lines
 * not visible in this excerpt. */
2661 void random_bytes(void *p, size_t n) {
2665 r = dev_urandom(p, n);
2669 /* If some idiot made /dev/urandom unavailable to us, he'll
2670 * get a PRNG instead. */
2674 for (q = p; q < (uint8_t*) p + n; q ++)
/* Renames the calling process: sets the name via prctl(PR_SET_NAME),
 * overwrites program_invocation_name and saved_argv[0] in place (each copy
 * is bounded by the current length of the destination string), and zeroes
 * the contents of the remaining saved_argv[] entries. */
2678 void rename_process(const char name[8]) {
2681 /* This is a like a poor man's setproctitle(). It changes the
2682 * comm field, argv[0], and also the glibc's internally used
2683 * name of the process. For the first one a limit of 16 chars
2684 * applies, to the second one usually one of 10 (i.e. length
2685 * of "/sbin/init"), to the third one one of 7 (i.e. length of
2686 * "systemd"). If you pass a longer string it will be
2689 prctl(PR_SET_NAME, name);
2691 if (program_invocation_name)
2692 strncpy(program_invocation_name, name, strlen(program_invocation_name));
2694 if (saved_argc > 0) {
2698 strncpy(saved_argv[0], name, strlen(saved_argv[0]));
2700 for (i = 1; i < saved_argc; i++) {
2704 memzero(saved_argv[i], strlen(saved_argv[i]));
/* Adds every signal number from the variadic argument list to *ss. The
 * list ends at the first argument that is <= 0; a failing sigaddset()
 * trips assert_se(). */
2709 void sigset_add_many(sigset_t *ss, ...) {
2716 while ((sig = va_arg(ap, int)) > 0)
2717 assert_se(sigaddset(ss, sig) == 0);
/* Builds a signal set from the variadic argument list (terminated by the
 * first value <= 0) and applies it with sigprocmask(how, ...); the old
 * mask is not retrieved. */
2721 int sigprocmask_many(int how, ...) {
2726 assert_se(sigemptyset(&ss) == 0);
2729 while ((sig = va_arg(ap, int)) > 0)
2730 assert_se(sigaddset(&ss, sig) == 0);
2733 if (sigprocmask(how, &ss, NULL) < 0)
/* Returns a strdup()'ed copy of the uname() nodename, or of the uname()
 * sysname when the nodename is empty or the literal "(none)". The result
 * is NULL if strdup() fails. */
2739 char* gethostname_malloc(void) {
2742 assert_se(uname(&u) >= 0);
2744 if (!isempty(u.nodename) && !streq(u.nodename, "(none)"))
2745 return strdup(u.nodename);
2747 return strdup(u.sysname);
/* True when the uname() nodename is neither empty nor the literal
 * "(none)". */
2750 bool hostname_is_set(void) {
2753 assert_se(uname(&u) >= 0);
2755 return !isempty(u.nodename) && !streq(u.nodename, "(none)");
/* Returns a newly allocated user name for uid: "root" on the shortcut
 * path, otherwise pw_name as reported by getpwuid_r(), otherwise the
 * number itself formatted with UID_FMT.
 * NOTE(review): the condition guarding the "root" shortcut and the
 * handling of the sysconf()/malloc() results are on lines not visible. */
2758 char *lookup_uid(uid_t uid) {
2761 _cleanup_free_ char *buf = NULL;
2762 struct passwd pwbuf, *pw = NULL;
2764 /* Shortcut things to avoid NSS lookups */
2766 return strdup("root");
2768 bufsize = sysconf(_SC_GETPW_R_SIZE_MAX);
2772 buf = malloc(bufsize);
2776 if (getpwuid_r(uid, &pwbuf, buf, bufsize, &pw) == 0 && pw)
2777 return strdup(pw->pw_name);
2779 if (asprintf(&name, UID_FMT, uid) < 0)
/* Resolves a user name through lookup_uid(). When stdin is a tty and
 * fstat() on it succeeds, the stat result takes part in choosing the uid.
 * NOTE(review): the lines that assign uid are not visible here. */
2785 char* getlogname_malloc(void) {
2789 if (isatty(STDIN_FILENO) && fstat(STDIN_FILENO, &st) >= 0)
2794 return lookup_uid(uid);
/* Falls back to lookup_uid() on the real uid of the process.
 * NOTE(review): the statements preceding this return are not visible in
 * this excerpt. */
2797 char *getusername_malloc(void) {
2804 return lookup_uid(getuid());
/* Queries the tty name of fd with ttyname_r() and duplicates it with a
 * leading "/dev/" removed when present.
 * NOTE(review): error handling and the store into *ret are on lines not
 * visible here. */
2807 int getttyname_malloc(int fd, char **ret) {
2817 r = ttyname_r(fd, path, sizeof(path));
2822 p = startswith(path, "/dev/");
2823 c = strdup(p ?: path);
/* Like getttyname_malloc(), but when the resulting name is the generic
 * "tty" it defers to get_ctty(0, NULL, r) instead. */
2840 int getttyname_harder(int fd, char **r) {
2844 k = getttyname_malloc(fd, &s);
2848 if (streq(s, "tty")) {
2850 return get_ctty(0, NULL, r);
/* Reads the procfs "stat" file of pid as a single line, locates the last
 * ')' in it and parses a tty device number (ttynr) from the fields that
 * follow. A ttynr whose major and minor are both 0 is special-cased.
 * NOTE(review): the sscanf() call, the returned codes and the store into
 * *d are on lines not visible in this excerpt. */
2857 int get_ctty_devnr(pid_t pid, dev_t *d) {
2859 _cleanup_free_ char *line = NULL;
2861 unsigned long ttynr;
2865 p = procfs_file_alloca(pid, "stat");
2866 r = read_one_line_file(p, &line);
2870 p = strrchr(line, ')');
2880 "%*d " /* session */
2885 if (major(ttynr) == 0 && minor(ttynr) == 0)
/* Determines the controlling tty of pid: fetches its device number with
 * get_ctty_devnr(), formats "/dev/char/<major>:<minor>" into fn and reads
 * that symlink. Major 136 gets a synthesized "pts/<minor>" name; symlink
 * targets starting with "/dev/" or "../" are handled separately.
 * NOTE(review): the conditions around readlink_malloc() failure and the
 * stores into *r and *_devnr are on lines not visible here. */
2894 int get_ctty(pid_t pid, dev_t *_devnr, char **r) {
2895 char fn[sizeof("/dev/char/")-1 + 2*DECIMAL_STR_MAX(unsigned) + 1 + 1], *b = NULL;
2896 _cleanup_free_ char *s = NULL;
2903 k = get_ctty_devnr(pid, &devnr);
2907 sprintf(fn, "/dev/char/%u:%u", major(devnr), minor(devnr));
2909 k = readlink_malloc(fn, &s);
2915 /* This is an ugly hack */
2916 if (major(devnr) == 136) {
/* NOTE(review): the asprintf() return value is ignored on this line;
 * confirm that b is validated before use on the lines not shown. */
2917 asprintf(&b, "pts/%u", minor(devnr));
2921 /* Probably something like the ptys which have no
2922 * symlink in /dev/char. Let's return something
2923 * vaguely useful. */
2929 if (startswith(s, "/dev/"))
2931 else if (startswith(s, "../"))
/* Recursively removes the entries below the directory referred to by fd.
 *
 * "." and ".." are skipped. An entry is stat'ed (without following
 * symlinks) when its d_type is unknown or when it is a directory and
 * root_dev is set; otherwise d_type alone decides is_dir and keep_around
 * is false. Directories are opened with openat(), recursed into and then
 * removed with unlinkat(AT_REMOVEDIR); other entries are unlinked only
 * when only_dirs is false and keep_around is false. ENOENT from the
 * individual calls is not recorded as an error, and only the first error
 * is kept in ret.
 * NOTE(review): the remaining operand(s) of the stat condition and of the
 * keep_around expression are on lines not visible in this excerpt. */
2949 int rm_rf_children_dangerous(int fd, bool only_dirs, bool honour_sticky, struct stat *root_dev) {
2950 _cleanup_closedir_ DIR *d = NULL;
2955 /* This returns the first error we run into, but nevertheless
2956 * tries to go on. This closes the passed fd. */
2962 return errno == ENOENT ? 0 : -errno;
2967 bool is_dir, keep_around;
2974 if (errno != 0 && ret == 0)
2979 if (streq(de->d_name, ".") || streq(de->d_name, ".."))
2982 if (de->d_type == DT_UNKNOWN ||
2984 (de->d_type == DT_DIR && root_dev)) {
2985 if (fstatat(fd, de->d_name, &st, AT_SYMLINK_NOFOLLOW) < 0) {
2986 if (ret == 0 && errno != ENOENT)
2991 is_dir = S_ISDIR(st.st_mode);
2994 (st.st_uid == 0 || st.st_uid == getuid()) &&
2995 (st.st_mode & S_ISVTX);
2997 is_dir = de->d_type == DT_DIR;
2998 keep_around = false;
3004 /* if root_dev is set, remove subdirectories only, if device is same as dir */
3005 if (root_dev && st.st_dev != root_dev->st_dev)
3008 subdir_fd = openat(fd, de->d_name,
3009 O_RDONLY|O_NONBLOCK|O_DIRECTORY|O_CLOEXEC|O_NOFOLLOW|O_NOATIME);
3010 if (subdir_fd < 0) {
3011 if (ret == 0 && errno != ENOENT)
3016 r = rm_rf_children_dangerous(subdir_fd, only_dirs, honour_sticky, root_dev);
3017 if (r < 0 && ret == 0)
3021 if (unlinkat(fd, de->d_name, AT_REMOVEDIR) < 0) {
3022 if (ret == 0 && errno != ENOENT)
3026 } else if (!only_dirs && !keep_around) {
3028 if (unlinkat(fd, de->d_name, 0) < 0) {
3029 if (ret == 0 && errno != ENOENT)
/* Non-zero when the file system type in *s is tmpfs or ramfs. */
3036 _pure_ static int is_temporary_fs(struct statfs *s) {
3039 return F_TYPE_EQUAL(s->f_type, TMPFS_MAGIC) ||
3040 F_TYPE_EQUAL(s->f_type, RAMFS_MAGIC);
/* Runs fstatfs() on fd and reports via is_temporary_fs() whether the
 * backing file system is tmpfs or ramfs. The value returned when
 * fstatfs() fails is on a line not visible here. */
3043 int is_fd_on_temporary_fs(int fd) {
3046 if (fstatfs(fd, &s) < 0)
3049 return is_temporary_fs(&s);
/* Guarded front end for rm_rf_children_dangerous(): the file system behind
 * fd is checked with fstatfs() and is_temporary_fs() first, and an error
 * is logged when it is not tmpfs/ramfs. The return codes of the refusal
 * paths are on lines not visible in this excerpt. */
3052 int rm_rf_children(int fd, bool only_dirs, bool honour_sticky, struct stat *root_dev) {
3057 if (fstatfs(fd, &s) < 0) {
3062 /* We refuse to clean disk file systems with this call. This
3063 * is extra paranoia just to be sure we never ever remove
3065 if (!is_temporary_fs(&s)) {
3066 log_error("Attempted to remove disk file system, and we can't allow that.");
3071 return rm_rf_children_dangerous(fd, only_dirs, honour_sticky, root_dev);
/* lstat()s p and tests whether it is owned by uid 0 or by the calling
 * user and has the sticky bit (S_ISVTX) set.
 * NOTE(review): the first operand of the returned expression and the
 * lstat() failure code are on lines not visible here. */
3074 static int file_is_priv_sticky(const char *p) {
3079 if (lstat(p, &st) < 0)
3083 (st.st_uid == 0 || st.st_uid == getuid()) &&
3084 (st.st_mode & S_ISVTX);
/* Shared implementation behind rm_rf() and rm_rf_dangerous().
 *
 * Refuses to operate on "/". The path is first opened as a directory
 * without following symlinks. If that fails, ENOTDIR and ELOOP are
 * singled out from other errors and, with delete_root set and only_dirs
 * unset, the path itself is unlink()ed. If it succeeds, the children are
 * removed through rm_rf_children_dangerous() and, unless honour_sticky
 * applies and file_is_priv_sticky() reports the directory as protected,
 * the directory itself is removed with rmdir().
 * NOTE(review): the visible lines do not show where `dangerous` is
 * consulted; presumably it gates the is_temporary_fs() checks -- confirm
 * against the full body. */
3087 static int rm_rf_internal(const char *path, bool only_dirs, bool delete_root, bool honour_sticky, bool dangerous) {
3093 /* We refuse to clean the root file system with this
3094 * call. This is extra paranoia to never cause a really
3095 * seriously broken system. */
3096 if (path_equal(path, "/")) {
3097 log_error("Attempted to remove entire root file system, and we can't allow that.");
3101 fd = open(path, O_RDONLY|O_NONBLOCK|O_DIRECTORY|O_CLOEXEC|O_NOFOLLOW|O_NOATIME);
3104 if (errno != ENOTDIR && errno != ELOOP)
3108 if (statfs(path, &s) < 0)
3111 if (!is_temporary_fs(&s)) {
3112 log_error("Attempted to remove disk file system, and we can't allow that.");
3117 if (delete_root && !only_dirs)
3118 if (unlink(path) < 0 && errno != ENOENT)
3125 if (fstatfs(fd, &s) < 0) {
3130 if (!is_temporary_fs(&s)) {
3131 log_error("Attempted to remove disk file system, and we can't allow that.");
3137 r = rm_rf_children_dangerous(fd, only_dirs, honour_sticky, NULL);
3140 if (honour_sticky && file_is_priv_sticky(path) > 0)
3143 if (rmdir(path) < 0 && errno != ENOENT) {
/* Calls rm_rf_internal() with dangerous = false. */
3152 int rm_rf(const char *path, bool only_dirs, bool delete_root, bool honour_sticky) {
3153 return rm_rf_internal(path, only_dirs, delete_root, honour_sticky, false);
/* Calls rm_rf_internal() with dangerous = true. */
3156 int rm_rf_dangerous(const char *path, bool only_dirs, bool delete_root, bool honour_sticky) {
3157 return rm_rf_internal(path, only_dirs, delete_root, honour_sticky, true);
/* Applies mode and then ownership to path. chmod() is skipped when mode is
 * MODE_INVALID; chown() is skipped when both uid and gid are the
 * respective *_INVALID values. The error codes returned on failure are on
 * lines not visible in this excerpt. */
3160 int chmod_and_chown(const char *path, mode_t mode, uid_t uid, gid_t gid) {
3163 /* Under the assumption that we are running privileged we
3164 * first change the access mode and only then hand out
3165 * ownership to avoid a window where access is too open. */
3167 if (mode != MODE_INVALID)
3168 if (chmod(path, mode) < 0)
3171 if (uid != UID_INVALID || gid != GID_INVALID)
3172 if (chown(path, uid, gid) < 0)
/* File-descriptor variant of chmod_and_chown(): fchmod() is skipped when
 * mode is MODE_INVALID, fchown() when both uid and gid are the respective
 * *_INVALID values. The error codes returned on failure are on lines not
 * visible in this excerpt. */
3178 int fchmod_and_fchown(int fd, mode_t mode, uid_t uid, gid_t gid) {
3181 /* Under the assumption that we are running privileged we
3182 * first change the access mode and only then hand out
3183 * ownership to avoid a window where access is too open. */
3185 if (mode != MODE_INVALID)
3186 if (fchmod(fd, mode) < 0)
3189 if (uid != UID_INVALID || gid != GID_INVALID)
3190 if (fchown(fd, uid, gid) < 0)
/* Allocates a CPU set for n CPUs with CPU_ALLOC() and uses
 * sched_getaffinity() to probe whether that size is accepted; once it is,
 * the set is cleared with CPU_ZERO_S(). An errno other than EINVAL from
 * the probe is handled differently from EINVAL.
 * NOTE(review): how n is chosen and grown, and what is stored in *ncpus,
 * are on lines not visible in this excerpt. */
3196 cpu_set_t* cpu_set_malloc(unsigned *ncpus) {
3200 /* Allocates the cpuset in the right size */
3203 if (!(r = CPU_ALLOC(n)))
3206 if (sched_getaffinity(0, CPU_ALLOC_SIZE(n), r) >= 0) {
3207 CPU_ZERO_S(CPU_ALLOC_SIZE(n), r);
3217 if (errno != EINVAL)
/* Formats a status message and writes it to /dev/console with a single
 * writev().
 *
 * The iovec is assembled in order: an optional "\r" plus erase-to-end-of-
 * line sequence, then either "[" status "] " or the status_indent filler,
 * then the formatted message, then a newline. prev_ephemeral remembers the
 * `ephemeral` flag of the call that last updated it.
 * NOTE(review): the conditions that select ellipsizing, the erase
 * sequence and the trailing newline are on lines not visible here. */
3224 int status_vprintf(const char *status, bool ellipse, bool ephemeral, const char *format, va_list ap) {
3225 static const char status_indent[] = " "; /* "[" STATUS "] " */
3226 _cleanup_free_ char *s = NULL;
3227 _cleanup_close_ int fd = -1;
3228 struct iovec iovec[6] = {};
3230 static bool prev_ephemeral;
3234 /* This is independent of logging, as status messages are
3235 * optional and go exclusively to the console. */
3237 if (vasprintf(&s, format, ap) < 0)
3240 fd = open_terminal("/dev/console", O_WRONLY|O_NOCTTY|O_CLOEXEC);
3253 sl = status ? sizeof(status_indent)-1 : 0;
3259 e = ellipsize(s, emax, 50);
3267 IOVEC_SET_STRING(iovec[n++], "\r" ANSI_ERASE_TO_END_OF_LINE);
3268 prev_ephemeral = ephemeral;
3271 if (!isempty(status)) {
3272 IOVEC_SET_STRING(iovec[n++], "[");
3273 IOVEC_SET_STRING(iovec[n++], status);
3274 IOVEC_SET_STRING(iovec[n++], "] ");
3276 IOVEC_SET_STRING(iovec[n++], status_indent);
3279 IOVEC_SET_STRING(iovec[n++], s);
3281 IOVEC_SET_STRING(iovec[n++], "\n");
3283 if (writev(fd, iovec, n) < 0)
/* Variadic wrapper that forwards its arguments to status_vprintf(). */
3289 int status_printf(const char *status, bool ellipse, bool ephemeral, const char *format, ...) {
3295 va_start(ap, format);
3296 r = status_vprintf(status, ellipse, ephemeral, format, ap);
/* Scans format character by character and builds a new string r by
 * appending literal stretches (strnappend) and, for variable references,
 * the value looked up in env with strv_env_get_n() (an unset variable
 * contributes the empty string via strempty()).
 * NOTE(review): the state machine that recognizes the reference syntax is
 * on lines not visible in this excerpt; the word+2 / e-word-2 offsets
 * suggest a two-character opener such as "${" -- confirm. */
3302 char *replace_env(const char *format, char **env) {
3309 const char *e, *word = format;
3314 for (e = format; *e; e ++) {
3325 k = strnappend(r, word, e-word-1);
3335 } else if (*e == '$') {
3336 k = strnappend(r, word, e-word);
3353 t = strempty(strv_env_get_n(env, word+2, e-word-2));
3355 k = strappend(r, t);
3369 k = strnappend(r, word, e-word);
/* Produces a new argument vector from argv with environment references
 * expanded. An argument that starts with '$' not followed by '{' is looked
 * up in env, split with strv_split_quoted() and spliced into the result
 * (the array is reallocated to make room); every other argument goes
 * through replace_env().
 * NOTE(review): failure handling and the bookkeeping of k, l and q are on
 * lines not visible in this excerpt. */
3381 char **replace_env_argv(char **argv, char **env) {
3383 unsigned k = 0, l = 0;
3385 l = strv_length(argv);
3387 ret = new(char*, l+1);
3391 STRV_FOREACH(i, argv) {
3393 /* If $FOO appears as single word, replace it by the split up variable */
3394 if ((*i)[0] == '$' && (*i)[1] != '{') {
3399 e = strv_env_get(env, *i+1);
3403 r = strv_split_quoted(&m, e, true);
3415 w = realloc(ret, sizeof(char*) * (l+1));
3425 memcpy(ret + k, m, q * sizeof(char*));
3433 /* If ${FOO} appears as part of a word, replace it by the variable as-is */
3434 ret[k] = replace_env(*i, env);
/* Queries the window size of fd with the TIOCGWINSZ ioctl into a
 * zero-initialized struct winsize. The returned values are on lines not
 * visible in this excerpt. */
3446 int fd_columns(int fd) {
3447 struct winsize ws = {};
3449 if (ioctl(fd, TIOCGWINSZ, &ws) < 0)
/* Returns the cached terminal width. On a cache miss the value is taken
 * from the COLUMNS environment variable (parsed with safe_atoi(), whose
 * result code is deliberately ignored) or from fd_columns() on stdout.
 * NOTE(review): the conditions choosing between the two sources and the
 * default used when both fail are on lines not visible here. */
3458 unsigned columns(void) {
3462 if (_likely_(cached_columns > 0))
3463 return cached_columns;
3466 e = getenv("COLUMNS");
3468 (void) safe_atoi(e, &c);
3471 c = fd_columns(STDOUT_FILENO);
3477 return cached_columns;
/* Queries the window size of fd with the TIOCGWINSZ ioctl into a
 * zero-initialized struct winsize. The returned values are on lines not
 * visible in this excerpt. */
3480 int fd_lines(int fd) {
3481 struct winsize ws = {};
3483 if (ioctl(fd, TIOCGWINSZ, &ws) < 0)
/* Returns the cached terminal height. On a cache miss the value is taken
 * from the LINES environment variable (parsed with safe_atoi(), whose
 * result code is deliberately ignored) or from fd_lines() on stdout.
 * NOTE(review): the conditions choosing between the two sources and the
 * default used when both fail are on lines not visible here. */
3492 unsigned lines(void) {
3496 if (_likely_(cached_lines > 0))
3497 return cached_lines;
3500 e = getenv("LINES");
3502 (void) safe_atoi(e, &l);
3505 l = fd_lines(STDOUT_FILENO);
3511 return cached_lines;
/* NOTE(review): the body is not visible in this excerpt; going by the
 * name it presumably clears cached_columns and cached_lines -- confirm. */
3514 /* intended to be used as a SIGWINCH sighandler */
3515 void columns_lines_cache_reset(int signum) {
/* NOTE(review): the signature line of this function is not visible in
 * this excerpt (presumably on_tty()). The body computes once, and then
 * returns from cache, whether isatty(STDOUT_FILENO) is positive. */
3521 static int cached_on_tty = -1;
3523 if (_unlikely_(cached_on_tty < 0))
3524 cached_on_tty = isatty(STDOUT_FILENO) > 0;
3526 return cached_on_tty;
/* stat()s both paths (following symlinks) and returns non-zero when they
 * share device and inode number. The codes returned on stat() failure are
 * on lines not visible in this excerpt. */
3529 int files_same(const char *filea, const char *fileb) {
3532 if (stat(filea, &a) < 0)
3535 if (stat(fileb, &b) < 0)
3538 return a.st_dev == b.st_dev &&
3539 a.st_ino == b.st_ino;
/* Compares "/proc/1/root" with "/" using files_same(). How ret is turned
 * into the return value is on lines not visible in this excerpt. */
3542 int running_in_chroot(void) {
3545 ret = files_same("/proc/1/root", "/");
/* Byte-wise shortening of s (old_length bytes) to new_length bytes.
 *
 * Inputs of at most 3 bytes, or already no longer than new_length, are
 * returned as a plain strndup() copy. Otherwise a zeroed buffer of
 * new_length+1 bytes is allocated; x = new_length * percent / 100 bytes
 * are reserved for the head (clamped in relation to new_length - 3) and
 * the final new_length - x - 3 bytes of s form the tail.
 * NOTE(review): the copy of the head and the three filler bytes are on
 * lines not visible in this excerpt. */
3552 static char *ascii_ellipsize_mem(const char *s, size_t old_length, size_t new_length, unsigned percent) {
3557 assert(percent <= 100);
3558 assert(new_length >= 3);
3560 if (old_length <= 3 || old_length <= new_length)
3561 return strndup(s, old_length);
3563 r = new0(char, new_length+1);
3567 x = (new_length * percent) / 100;
3569 if (x > new_length - 3)
3577 s + old_length - (new_length - x - 3),
3578 new_length - x - 3);
/* Shortens s (old_length bytes) to about new_length display columns,
 * keeping roughly `percent` percent of the budget at the front.
 *
 * Strings accepted by ascii_is_valid() are delegated to
 * ascii_ellipsize_mem(). Otherwise the string is walked forward one UTF-8
 * character at a time until x columns are used (wide characters count as
 * two), then backward from the end until new_length columns are used. The
 * result is the head, a three-byte sequence starting with 0xe2 (the
 * ellipsis character), and the tail including its terminating NUL. */
3583 char *ellipsize_mem(const char *s, size_t old_length, size_t new_length, unsigned percent) {
3587 unsigned k, len, len2;
3590 assert(percent <= 100);
3591 assert(new_length >= 3);
3593 /* if no multibyte characters use ascii_ellipsize_mem for speed */
3594 if (ascii_is_valid(s))
3595 return ascii_ellipsize_mem(s, old_length, new_length, percent);
3597 if (old_length <= 3 || old_length <= new_length)
3598 return strndup(s, old_length);
3600 x = (new_length * percent) / 100;
3602 if (x > new_length - 3)
3606 for (i = s; k < x && i < s + old_length; i = utf8_next_char(i)) {
3609 c = utf8_encoded_to_unichar(i);
3612 k += unichar_iswide(c) ? 2 : 1;
3615 if (k > x) /* last character was wide and went over quota */
3618 for (j = s + old_length; k < new_length && j > i; ) {
3621 j = utf8_prev_char(j);
3622 c = utf8_encoded_to_unichar(j);
3625 k += unichar_iswide(c) ? 2 : 1;
3629 /* we don't actually need to ellipsize */
3631 return memdup(s, old_length + 1);
3633 /* make space for ellipsis */
3634 j = utf8_next_char(j);
3637 len2 = s + old_length - j;
3638 e = new(char, len + 3 + len2 + 1);
/* NOTE(review): the printf below looks like leftover debug output; confirm
 * whether it sits inside a commented-out region whose delimiters are on
 * lines not visible in this excerpt. */
3643 printf("old_length=%zu new_length=%zu x=%zu len=%u len2=%u k=%u\n",
3644 old_length, new_length, x, len, len2, k);
3648 e[len] = 0xe2; /* tri-dot ellipsis: … */
3652 memcpy(e + len + 3, j, len2 + 1);
/* Convenience wrapper: ellipsize_mem() on the whole NUL-terminated string
 * s. */
3657 char *ellipsize(const char *s, size_t length, unsigned percent) {
3658 return ellipsize_mem(s, strlen(s), length, percent);
/* Creates path if needed (write-only open with O_CREAT, using mode when it
 * is > 0 and 0644 otherwise) and then adjusts it through the descriptor:
 * fchmod(), fchown() when uid or gid is not the *_INVALID value, and
 * futimens() with either the given stamp or, when stamp is USEC_INFINITY,
 * a NULL timestamp array.
 * NOTE(review): the conditions guarding mkdir_parents() and fchmod(), the
 * initialization of ts[1] and all error returns are on lines not visible
 * in this excerpt. */
3661 int touch_file(const char *path, bool parents, usec_t stamp, uid_t uid, gid_t gid, mode_t mode) {
3662 _cleanup_close_ int fd;
3668 mkdir_parents(path, 0755);
3670 fd = open(path, O_WRONLY|O_CREAT|O_CLOEXEC|O_NOCTTY, mode > 0 ? mode : 0644);
3675 r = fchmod(fd, mode);
3680 if (uid != UID_INVALID || gid != GID_INVALID) {
3681 r = fchown(fd, uid, gid);
3686 if (stamp != USEC_INFINITY) {
3687 struct timespec ts[2];
3689 timespec_store(&ts[0], stamp);
3691 r = futimens(fd, ts);
3693 r = futimens(fd, NULL);
/* touch_file() with parents = false, no explicit timestamp
 * (USEC_INFINITY), no ownership change and mode 0. */
3700 int touch(const char *path) {
3701 return touch_file(path, false, USEC_INFINITY, UID_INVALID, GID_INVALID, 0);
/* When the first character of s is one of `quotes` and the last character
 * equals the first, returns a newly allocated copy of s without those two
 * characters. The result for all other inputs is on lines not visible in
 * this excerpt. */
3704 char *unquote(const char *s, const char* quotes) {
3708 /* This is rather stupid, simply removes the heading and
3709 * trailing quotes if there is one. Doesn't care about
3710 * escaping or anything. We should make this smarter one
3717 if (strchr(quotes, s[0]) && s[l-1] == s[0])
3718 return strndup(s+1, l-2);
/* Normalizes a "NAME=VALUE" string: splits at the first '=', strips
 * whitespace from both sides with strstrip(), removes one level of quotes
 * from the value with unquote(..., QUOTES) and joins the pieces back
 * together as a newly allocated "NAME=VALUE".
 * NOTE(review): the branch taken when s has no '=' (the memmove() line)
 * is only partly visible in this excerpt. */
3723 char *normalize_env_assignment(const char *s) {
3724 _cleanup_free_ char *value = NULL;
3728 eq = strchr(s, '=');
3738 memmove(r, t, strlen(t) + 1);
3743 name = strndupa(s, eq - s);
3744 p = strdupa(eq + 1);
3746 value = unquote(strstrip(p), QUOTES);
3750 return strjoin(strstrip(name), "=", value, NULL);
/* Waits with waitid(P_PID, ..., WEXITED) for pid to terminate, filling
 * *status. The handling of a failing waitid() (and any retry loop) is on
 * lines not visible in this excerpt. */
3753 int wait_for_terminate(pid_t pid, siginfo_t *status) {
3764 if (waitid(P_PID, pid, status, WEXITED) < 0) {
3778 * < 0 : wait_for_terminate() failed to get the state of the
3779 * process, the process was terminated by a signal, or
3780 * failed for an unknown reason.
3781 * >=0 : The process terminated normally, and its exit code is
3784 * That is, success is indicated by a return value of zero, and an
3785 * error is indicated by a non-zero value.
3787 * A warning is emitted if the process terminates abnormally,
3788 * and also if it returns non-zero and check_exit_code is true.
/* Waits for pid via wait_for_terminate() and logs the outcome under the
 * label `name`. A normal exit returns the exit status; a non-zero status
 * is logged at LOG_WARNING when check_exit_code is true and at LOG_DEBUG
 * otherwise. Termination by signal (killed or core-dumped) and any other
 * si_code are logged as warnings; the values returned for those two cases
 * are on lines not visible in this excerpt. */
3790 int wait_for_terminate_and_warn(const char *name, pid_t pid, bool check_exit_code) {
3797 r = wait_for_terminate(pid, &status);
3799 return log_warning_errno(r, "Failed to wait for %s: %m", name);
3801 if (status.si_code == CLD_EXITED) {
3802 if (status.si_status != 0)
3803 log_full(check_exit_code ? LOG_WARNING : LOG_DEBUG,
3804 "%s failed with error code %i.", name, status.si_status);
3806 log_debug("%s succeeded.", name);
3808 return status.si_status;
3809 } else if (status.si_code == CLD_KILLED ||
3810 status.si_code == CLD_DUMPED) {
3812 log_warning("%s terminated by signal %s.", name, signal_to_string(status.si_status));
3816 log_warning("%s failed due to unknown reason.", name);
/* Never returns. Closes every file descriptor first (no exceptions are
 * passed to close_all_fds()); the remainder of the body is on lines not
 * visible in this excerpt. */
3820 noreturn void freeze(void) {
3822 /* Make sure nobody waits for us on a socket anymore */
3823 close_all_fds(NULL, 0);
/* Classifies *st: one test covers regular files whose size is <= 0, the
 * other covers character and block devices. The values returned for each
 * case are on lines not visible in this excerpt. */
3831 bool null_or_empty(struct stat *st) {
3834 if (S_ISREG(st->st_mode) && st->st_size <= 0)
3837 if (S_ISCHR(st->st_mode) || S_ISBLK(st->st_mode))
/* stat()s fn (following symlinks) and applies null_or_empty() to the
 * result. The code returned when stat() fails is on a line not visible
 * here. */
3843 int null_or_empty_path(const char *fn) {
3848 if (stat(fn, &st) < 0)
3851 return null_or_empty(&st);
/* fstat()s fd and applies null_or_empty() to the result. The code
 * returned when fstat() fails is on a line not visible here. */
3854 int null_or_empty_fd(int fd) {
3859 if (fstat(fd, &st) < 0)
3862 return null_or_empty(&st);
/* Opens the directory `name` relative to fd with openat(); the caller's
 * flags are OR-ed onto O_RDONLY|O_NONBLOCK|O_DIRECTORY|O_CLOEXEC and must
 * not contain O_CREAT. The conversion of nfd into a DIR* is on lines not
 * visible in this excerpt. */
3865 DIR *xopendirat(int fd, const char *name, int flags) {
3869 assert(!(flags & O_CREAT));
3871 nfd = openat(fd, name, O_RDONLY|O_NONBLOCK|O_DIRECTORY|O_CLOEXEC|flags, 0);
/* Parses a signal name with signal_from_string() and additionally accepts
 * a "SIG" prefix by retrying on the text after it. The condition under
 * which the retry is attempted is on a line not visible here. */
3884 int signal_from_string_try_harder(const char *s) {
3888 signo = signal_from_string(s);
3890 if (startswith(s, "SIG"))
3891 return signal_from_string(s+3);
/* Builds "/dev/disk/by-<by>/<encoded tag>" for a tag value: quotes are
 * removed with unquote(), and the value is encoded with
 * encode_devnode_name() into a buffer sized at four bytes per input
 * character plus the terminator. */
3896 static char *tag_to_udev_node(const char *tagvalue, const char *by) {
3897 _cleanup_free_ char *t = NULL, *u = NULL;
3900 u = unquote(tagvalue, "\"\'");
3904 enc_len = strlen(u) * 4 + 1;
3905 t = new(char, enc_len);
3909 if (encode_devnode_name(u, t, enc_len) < 0)
3912 return strjoin("/dev/disk/by-", by, "/", t, NULL);
/* Maps fstab-style LABEL=, UUID=, PARTUUID= and PARTLABEL= specifiers to
 * the matching /dev/disk/by-* path via tag_to_udev_node(). The result for
 * any other input is on a line not visible in this excerpt. */
3915 char *fstab_node_to_udev_node(const char *p) {
3918 if (startswith(p, "LABEL="))
3919 return tag_to_udev_node(p+6, "label");
3921 if (startswith(p, "UUID="))
3922 return tag_to_udev_node(p+5, "uuid");
3924 if (startswith(p, "PARTUUID="))
3925 return tag_to_udev_node(p+9, "partuuid");
3927 if (startswith(p, "PARTLABEL="))
3928 return tag_to_udev_node(p+10, "partlabel");
/* True when vtnr_from_tty() yields a non-negative number for tty. */
3933 bool tty_is_vc(const char *tty) {
3936 return vtnr_from_tty(tty) >= 0;
/* True when tty names "console"; a leading "/dev/" is recognized first
 * (the statement that skips it is on a line not visible here). */
3939 bool tty_is_console(const char *tty) {
3942 if (startswith(tty, "/dev/"))
3945 return streq(tty, "console");
/* Extracts the number from a "ttyN" name (a leading "/dev/" is recognized
 * first). The name must start with "tty" followed by a digit, and the
 * value parsed with safe_atoi() is checked against the range 0..63. The
 * codes returned on rejection are on lines not visible in this excerpt. */
3948 int vtnr_from_tty(const char *tty) {
3953 if (startswith(tty, "/dev/"))
3956 if (!startswith(tty, "tty") )
3959 if (tty[3] < '0' || tty[3] > '9')
3962 r = safe_atoi(tty+3, &i);
3966 if (i < 0 || i > 63)
/* Reads /sys/class/tty/console/active into *active and picks the last
 * space-separated entry as the console tty. If that entry is "tty0" the
 * currently active VC is read from /sys/class/tty/tty0/active and
 * substituted, replacing *active. Nothing is resolved when /sys is on a
 * read-only file system.
 * NOTE(review): the returned values and the release of the previous
 * *active buffer are on lines not visible in this excerpt. */
3972 char *resolve_dev_console(char **active) {
3975 /* Resolve where /dev/console is pointing to, if /sys is actually ours
3976 * (i.e. not read-only-mounted which is a sign for container setups) */
3978 if (path_is_read_only_fs("/sys") > 0)
3981 if (read_one_line_file("/sys/class/tty/console/active", active) < 0)
3984 /* If multiple log outputs are configured the last one is what
3985 * /dev/console points to */
3986 tty = strrchr(*active, ' ');
3992 if (streq(tty, "tty0")) {
3995 /* Get the active VC (e.g. tty1) */
3996 if (read_one_line_file("/sys/class/tty/tty0/active", &tmp) >= 0) {
3998 tty = *active = tmp;
/* Like tty_is_vc(), but a tty named "console" is first resolved to the
 * underlying device with resolve_dev_console(). A leading "/dev/" is
 * recognized first (the statement that skips it is on a line not visible
 * here). */
4005 bool tty_is_vc_resolve(const char *tty) {
4006 _cleanup_free_ char *active = NULL;
4010 if (startswith(tty, "/dev/"))
4013 if (streq(tty, "console")) {
4014 tty = resolve_dev_console(&active);
4019 return tty_is_vc(tty);
/* Returns the static string "TERM=linux" when tty_is_vc_resolve() accepts
 * tty, and "TERM=vt220" otherwise. */
4022 const char *default_term_for_tty(const char *tty) {
4025 return tty_is_vc_resolve(tty) ? "TERM=linux" : "TERM=vt220";
/* Filters a directory entry: tests hidden_file() on the name and whether
 * d_type is something other than DT_REG, DT_LNK or DT_UNKNOWN. The values
 * returned for each test are on lines not visible in this excerpt. */
4028 bool dirent_is_file(const struct dirent *de) {
4031 if (hidden_file(de->d_name))
4034 if (de->d_type != DT_REG &&
4035 de->d_type != DT_LNK &&
4036 de->d_type != DT_UNKNOWN)
/* Variant of dirent_is_file() that additionally requires the name to end
 * in suffix. Note that the hidden-name test here uses
 * hidden_file_allow_backup() rather than hidden_file(). The values
 * returned by the two early tests are on lines not visible here. */
4042 bool dirent_is_file_with_suffix(const struct dirent *de, const char *suffix) {
4045 if (de->d_type != DT_REG &&
4046 de->d_type != DT_LNK &&
4047 de->d_type != DT_UNKNOWN)
4050 if (hidden_file_allow_backup(de->d_name))
4053 return endswith(de->d_name, suffix);
/* Child-side worker of execute_directories().
 *
 * Resets signal handlers and mask, asks for SIGTERM on parent death, then
 * walks the directories in order. For every entry accepted by
 * dirent_is_file() whose name has not been seen in an earlier directory
 * and which is not masked (null_or_empty_path()), a process is spawned and
 * recorded in `pids` keyed by pid, with the path as value. Afterwards an
 * alarm() is armed unless timeout is USEC_INFINITY (the timeout is rounded
 * up to whole seconds), and the spawned processes are reaped one by one
 * with wait_for_terminate_and_warn().
 * NOTE(review): the fork()/exec lines themselves and most error returns
 * are on lines not visible in this excerpt. */
4056 static int do_execute(char **directories, usec_t timeout, char *argv[]) {
4057 _cleanup_hashmap_free_free_ Hashmap *pids = NULL;
4058 _cleanup_set_free_free_ Set *seen = NULL;
4061 /* We fork this all off from a child process so that we can
4062 * somewhat cleanly make use of SIGALRM to set a time limit */
4064 reset_all_signal_handlers();
4065 reset_signal_mask();
4067 assert_se(prctl(PR_SET_PDEATHSIG, SIGTERM) == 0);
4069 pids = hashmap_new(NULL);
4073 seen = set_new(&string_hash_ops);
4077 STRV_FOREACH(directory, directories) {
4078 _cleanup_closedir_ DIR *d;
4081 d = opendir(*directory);
4083 if (errno == ENOENT)
4086 return log_error_errno(errno, "Failed to open directory %s: %m", *directory);
4089 FOREACH_DIRENT(de, d, break) {
4090 _cleanup_free_ char *path = NULL;
4094 if (!dirent_is_file(de))
4097 if (set_contains(seen, de->d_name)) {
4098 log_debug("%1$s/%2$s skipped (%2$s was already seen).", *directory, de->d_name);
4102 r = set_put_strdup(seen, de->d_name);
4106 path = strjoin(*directory, "/", de->d_name, NULL);
4110 if (null_or_empty_path(path)) {
4111 log_debug("%s is empty (a mask).", path);
4114 log_debug("%s will be executed.", path);
4118 log_error_errno(errno, "Failed to fork: %m");
4120 } else if (pid == 0) {
4123 assert_se(prctl(PR_SET_PDEATHSIG, SIGTERM) == 0);
4133 return log_error_errno(errno, "Failed to execute %s: %m", path);
4136 log_debug("Spawned %s as " PID_FMT ".", path, pid);
4138 r = hashmap_put(pids, UINT_TO_PTR(pid), path);
4145 /* Abort execution of this process after the timeout. We simply
4146 * rely on SIGALRM as default action terminating the process,
4147 * and turn on alarm(). */
4149 if (timeout != USEC_INFINITY)
4150 alarm((timeout + USEC_PER_SEC - 1) / USEC_PER_SEC);
4152 while (!hashmap_isempty(pids)) {
4153 _cleanup_free_ char *path = NULL;
4156 pid = PTR_TO_UINT(hashmap_first_key(pids));
4159 path = hashmap_remove(pids, UINT_TO_PTR(pid));
4162 wait_for_terminate_and_warn(path, pid, true);
/* Forks an executor child that runs do_execute() over `directories` and
 * exits with EXIT_FAILURE when do_execute() returns a negative value and
 * EXIT_SUCCESS otherwise; the parent waits for that child with
 * wait_for_terminate_and_warn(), labelled with the basename of the first
 * directory. `directories` must be a non-empty string vector. */
4168 void execute_directories(const char* const* directories, usec_t timeout, char *argv[]) {
4172 char **dirs = (char**) directories;
4174 assert(!strv_isempty(dirs));
4176 name = basename(dirs[0]);
4177 assert(!isempty(name));
4179 /* Executes all binaries in the directories in parallel and waits
4180 * for them to finish. Optionally a timeout is applied. If a file
4181 * with the same name exists in more than one directory, the
4182 * earliest one wins. */
4184 executor_pid = fork();
4185 if (executor_pid < 0) {
4186 log_error_errno(errno, "Failed to fork: %m");
4189 } else if (executor_pid == 0) {
4190 r = do_execute(dirs, timeout, argv);
4191 _exit(r < 0 ? EXIT_FAILURE : EXIT_SUCCESS);
4194 wait_for_terminate_and_warn(name, executor_pid, true);
/* Sends sig to pid; r becomes 0 on success or -errno on failure.
 * NOTE(review): the rest of the body is not visible in this excerpt; going
 * by the name a SIGCONT presumably follows -- confirm. */
4197 int kill_and_sigcont(pid_t pid, int sig) {
4200 r = kill(pid, sig) < 0 ? -errno : 0;
/* Iterates the entries of nulstr with NULSTR_FOREACH and compares each
 * with needle using streq(). The returned values are on lines not visible
 * in this excerpt. */
4208 bool nulstr_contains(const char*nulstr, const char *needle) {
4214 NULSTR_FOREACH(i, nulstr)
4215 if (streq(i, needle))
/* True when /run/plymouth/pid exists (access() with F_OK succeeds). */
4221 bool plymouth_running(void) {
4222 return access("/run/plymouth/pid", F_OK) >= 0;
/* NOTE(review): only the signature is visible in this excerpt; presumably
 * truncates s in place to at most l characters and returns s -- confirm
 * against the full body. */
4225 char* strshorten(char *s, size_t l) {
/* Character class used by the hostname helpers: ASCII letters and digits
 * are accepted; any further accepted characters are listed on lines not
 * visible in this excerpt. */
4234 static bool hostname_valid_char(char c) {
4236 (c >= 'a' && c <= 'z') ||
4237 (c >= 'A' && c <= 'Z') ||
4238 (c >= '0' && c <= '9') ||
/* Validates s as a hostname by scanning it once: every character has to
 * pass hostname_valid_char() (dots are tracked through the `dot` flag on
 * lines not visible here) and the total length is compared against
 * HOST_NAME_MAX. */
4244 bool hostname_is_valid(const char *s) {
4251 /* Doesn't accept empty hostnames, hostnames with trailing or
4252 * leading dots, and hostnames with multiple dots in a
4253 * sequence. Also ensures that the length stays below
4256 for (p = s, dot = true; *p; p++) {
4263 if (!hostname_valid_char(*p))
4273 if (p-s > HOST_NAME_MAX)
/* In-place filter for s: characters accepted by hostname_valid_char() are
 * copied toward the front (lower-cased when `lowercase` is set) and the
 * result is cut to HOST_NAME_MAX with strshorten().
 * NOTE(review): the treatment of '.' and the final termination/return are
 * on lines not visible in this excerpt. */
4279 char* hostname_cleanup(char *s, bool lowercase) {
4283 for (p = s, d = s, dot = true; *p; p++) {
4290 } else if (hostname_valid_char(*p)) {
4291 *(d++) = lowercase ? tolower(*p) : *p;
4302 strshorten(s, HOST_NAME_MAX);
/* A machine name must first pass hostname_is_valid(); the additional
 * length restriction mentioned below is enforced on lines not visible in
 * this excerpt. */
4307 bool machine_name_is_valid(const char *s) {
4309 if (!hostname_is_valid(s))
4312 /* Machine names should be useful hostnames, but also be
4313 * useful in unit names, hence we enforce a stricter length
/* Polls fd once with a zero timeout for POLLIN|POLLHUP and returns the
 * POLLHUP bit of the reported events (non-zero means the other end hung
 * up). The handling of poll() returning <= 0 is on lines not visible in
 * this excerpt. */
4322 int pipe_eof(int fd) {
4323 struct pollfd pollfd = {
4325 .events = POLLIN|POLLHUP,
4330 r = poll(&pollfd, 1, 0);
4337 return pollfd.revents & POLLHUP;
/* Waits with ppoll() on a single descriptor and returns the reported
 * revents. t is the timeout; USEC_INFINITY means wait without a timeout
 * (NULL timespec). The handling of ppoll() returning <= 0 is on lines not
 * visible in this excerpt. */
4340 int fd_wait_for_event(int fd, int event, usec_t t) {
4342 struct pollfd pollfd = {
4350 r = ppoll(&pollfd, 1, t == USEC_INFINITY ? NULL : timespec_store(&ts, t), NULL);
4357 return pollfd.revents;
/* Creates a temporary file next to path: a template name is derived with
 * tempfn_xxxxxx(), the file is created write-only with mkostemp_safe() and
 * wrapped in a FILE* opened with mode "we".
 * NOTE(review): cleanup on failure and the stores into *_f and
 * *_temp_path are on lines not visible in this excerpt. */
4360 int fopen_temporary(const char *path, FILE **_f, char **_temp_path) {
4369 r = tempfn_xxxxxx(path, &t);
4373 fd = mkostemp_safe(t, O_WRONLY|O_CLOEXEC);
4379 f = fdopen(fd, "we");
/* Issues the TIOCVHANGUP ioctl on fd. The returned codes are on lines not
 * visible in this excerpt. */
4392 int terminal_vhangup_fd(int fd) {
4395 if (ioctl(fd, TIOCVHANGUP) < 0)
/* Opens the terminal `name` read-write (without making it the controlling
 * tty) and calls terminal_vhangup_fd() on it; the descriptor is closed
 * automatically on return through _cleanup_close_. */
4401 int terminal_vhangup(const char *name) {
4402 _cleanup_close_ int fd;
4404 fd = open_terminal(name, O_RDWR|O_NOCTTY|O_CLOEXEC);
4408 return terminal_vhangup_fd(fd);
/* Releases or clears the terminal `name`, which must start with "/dev/".
 *
 * A terminal that is not a VC is opened and sent the escape sequences for
 * resetting the scroll region, homing the cursor and clearing the screen.
 * For "/dev/ttyN" the VT number is parsed and VT_DISALLOCATE is issued on
 * /dev/tty0; when that does not succeed the terminal itself is opened and
 * cleared with the sequence that also erases the scrollback.
 * NOTE(review): the write calls and all error returns are on lines not
 * visible in this excerpt. */
4411 int vt_disallocate(const char *name) {
4415 /* Deallocate the VT if possible. If not possible
4416 * (i.e. because it is the active one), at least clear it
4417 * entirely (including the scrollback buffer) */
4419 if (!startswith(name, "/dev/"))
4422 if (!tty_is_vc(name)) {
4423 /* So this is not a VT. I guess we cannot deallocate
4424 * it then. But let's at least clear the screen */
4426 fd = open_terminal(name, O_RDWR|O_NOCTTY|O_CLOEXEC);
4431 "\033[r" /* clear scrolling region */
4432 "\033[H" /* move home */
4433 "\033[2J", /* clear screen */
4440 if (!startswith(name, "/dev/tty"))
4443 r = safe_atou(name+8, &u);
4450 /* Try to deallocate */
4451 fd = open_terminal("/dev/tty0", O_RDWR|O_NOCTTY|O_CLOEXEC);
4455 r = ioctl(fd, VT_DISALLOCATE, u);
4464 /* Couldn't deallocate, so let's clear it fully with
4466 fd = open_terminal(name, O_RDWR|O_NOCTTY|O_CLOEXEC);
4471 "\033[r" /* clear scrolling region */
4472 "\033[H" /* move home */
4473 "\033[3J", /* clear screen including scrollback, requires Linux 2.6.40 */
/* Creates the symlink `to` -> `from` atomically: the link is first made
 * under a temporary name derived from `to` with tempfn_random() and then
 * rename()d into place. Cleanup after a failed rename and the error
 * returns are on lines not visible in this excerpt. */
4480 int symlink_atomic(const char *from, const char *to) {
4481 _cleanup_free_ char *t = NULL;
4487 r = tempfn_random(to, &t);
4491 if (symlink(from, t) < 0)
4494 if (rename(t, to) < 0) {
/* Creates a device node at path atomically: mknod() under a temporary
 * name derived with tempfn_random(), then rename() into place. Cleanup
 * after a failed rename and the error returns are on lines not visible in
 * this excerpt. */
4502 int mknod_atomic(const char *path, mode_t mode, dev_t dev) {
4503 _cleanup_free_ char *t = NULL;
4508 r = tempfn_random(path, &t);
4512 if (mknod(t, mode, dev) < 0)
4515 if (rename(t, path) < 0) {
/* Creates a FIFO at path atomically: mkfifo() under a temporary name
 * derived with tempfn_random(), then rename() into place. Cleanup after a
 * failed rename and the error returns are on lines not visible in this
 * excerpt. */
4523 int mkfifo_atomic(const char *path, mode_t mode) {
4524 _cleanup_free_ char *t = NULL;
4529 r = tempfn_random(path, &t);
4533 if (mkfifo(t, mode) < 0)
4536 if (rename(t, path) < 0) {
/* Tests whether display has the form ":<digit>...": the first character
 * must be ':' and the second at least '0'. The upper bound of the digit
 * test is on a line not visible in this excerpt. */
4544 bool display_is_local(const char *display) {
4548 display[0] == ':' &&
4549 display[1] >= '0' &&
/* For a local display string (see display_is_local()) builds the socket
 * path "/tmp/.X11-unix/X" followed by the run of decimal digits that
 * comes after the leading ':'.
 * NOTE(review): NUL termination, the store into *path and the error
 * returns are on lines not visible in this excerpt. */
4553 int socket_from_display(const char *display, char **path) {
4560 if (!display_is_local(display))
4563 k = strspn(display+1, "0123456789");
4565 f = new(char, strlen("/tmp/.X11-unix/X") + k + 1);
4569 c = stpcpy(f, "/tmp/.X11-unix/X");
4570 memcpy(c, display+1, k);
/* NOTE(review): the line carrying the function name is not visible in this
 * excerpt (presumably get_user_creds()).
 *
 * Resolves *username to credentials. "root" and "0" take a hard-coded
 * path; a numeric name accepted by parse_uid() is looked up by id and
 * *username is replaced by the database name; anything else is looked up
 * with getpwnam(). A failed lookup yields -errno, or -ESRCH when errno is
 * not set. *shell receives pw_shell of the entry. */
4579 const char **username,
4580 uid_t *uid, gid_t *gid,
4582 const char **shell) {
4590 /* We enforce some special rules for uid=0: in order to avoid
4591 * NSS lookups for root we hardcode its data. */
4593 if (streq(*username, "root") || streq(*username, "0")) {
4611 if (parse_uid(*username, &u) >= 0) {
4615 /* If there are multiple users with the same id, make
4616 * sure to leave $USER to the configured value instead
4617 * of the first occurrence in the database. However if
4618 * the uid was configured by a numeric uid, then let's
4619 * pick the real username from /etc/passwd. */
4621 *username = p->pw_name;
4624 p = getpwnam(*username);
4628 return errno > 0 ? -errno : -ESRCH;
4640 *shell = p->pw_shell;
/* Returns a newly allocated name for uid: "root" on the shortcut path,
 * pw_name of the passwd entry when one was found, otherwise the number
 * formatted with UID_FMT. The shortcut condition and the lookup call are
 * on lines not visible in this excerpt. */
4645 char* uid_to_name(uid_t uid) {
4650 return strdup("root");
4654 return strdup(p->pw_name);
4656 if (asprintf(&r, UID_FMT, uid) < 0)
/* Returns a newly allocated name for gid: "root" on the shortcut path,
 * gr_name of the group entry when one was found, otherwise the number
 * formatted with GID_FMT. The shortcut condition and the lookup call are
 * on lines not visible in this excerpt. */
4662 char* gid_to_name(gid_t gid) {
4667 return strdup("root");
4671 return strdup(p->gr_name);
4673 if (asprintf(&r, GID_FMT, gid) < 0)
/* Resolves *groupname to a gid. "root" and "0" take a hard-coded path
 * that also normalizes *groupname to "root"; a numeric name accepted by
 * parse_gid() is looked up by id and *groupname is replaced by the
 * database name; anything else is looked up with getgrnam(). A failed
 * lookup yields -errno, or -ESRCH when errno is not set. */
4679 int get_group_creds(const char **groupname, gid_t *gid) {
4685 /* We enforce some special rules for gid=0: in order to avoid
4686 * NSS lookups for root we hardcode its data. */
4688 if (streq(*groupname, "root") || streq(*groupname, "0")) {
4689 *groupname = "root";
4697 if (parse_gid(*groupname, &id) >= 0) {
4702 *groupname = g->gr_name;
4705 g = getgrnam(*groupname);
4709 return errno > 0 ? -errno : -ESRCH;
/* Checks whether the calling process belongs to gid: compares against the
 * real and effective gid first, then scans the supplementary groups
 * returned by getgroups(). The group array is stack-allocated with
 * alloca(), sized by sysconf(_SC_NGROUPS_MAX). The returned values are on
 * lines not visible in this excerpt. */
4717 int in_gid(gid_t gid) {
4719 int ngroups_max, r, i;
4721 if (getgid() == gid)
4724 if (getegid() == gid)
4727 ngroups_max = sysconf(_SC_NGROUPS_MAX);
4728 assert(ngroups_max > 0);
4730 gids = alloca(sizeof(gid_t) * ngroups_max);
4732 r = getgroups(ngroups_max, gids);
4736 for (i = 0; i < r; i++)
/* Resolves the group `name` to a gid with get_group_creds(). The use of
 * that gid (presumably a call to in_gid() -- confirm) is on lines not
 * visible in this excerpt. */
4743 int in_group(const char *name) {
4747 r = get_group_creds(&name, &gid);
/* Runs glob() on path with GLOB_NOSORT|GLOB_BRACE. GLOB_NOMATCH and
 * GLOB_NOSPACE are handled separately; on the path that returns the match
 * state the result is whether the match vector is non-empty; any other
 * outcome yields -errno, or -EIO when errno is 0. */
4754 int glob_exists(const char *path) {
4755 _cleanup_globfree_ glob_t g = {};
4761 k = glob(path, GLOB_NOSORT|GLOB_BRACE, NULL, &g);
4763 if (k == GLOB_NOMATCH)
4765 else if (k == GLOB_NOSPACE)
4768 return !strv_isempty(g.gl_pathv);
4770 return errno ? -errno : -EIO;
/* Runs glob() on path with GLOB_NOSORT|GLOB_BRACE and appends every match
 * to *strv with strv_extend(). GLOB_NOMATCH and GLOB_NOSPACE are handled
 * separately; any other failure, or an empty match vector, yields -errno,
 * or -EIO when errno is 0. */
4773 int glob_extend(char ***strv, const char *path) {
4774 _cleanup_globfree_ glob_t g = {};
4779 k = glob(path, GLOB_NOSORT|GLOB_BRACE, NULL, &g);
4781 if (k == GLOB_NOMATCH)
4783 else if (k == GLOB_NOSPACE)
4785 else if (k != 0 || strv_isempty(g.gl_pathv))
4786 return errno ? -errno : -EIO;
4788 STRV_FOREACH(p, g.gl_pathv) {
4789 k = strv_extend(strv, *p);
/* Fills in de->d_type when the directory reader left it as DT_UNKNOWN:
 * the entry is stat'ed relative to the directory (without following
 * symlinks) and the file mode is mapped to the matching DT_* constant.
 * The fallback of the mapping chain and the returned codes are on lines
 * not visible in this excerpt. */
4797 int dirent_ensure_type(DIR *d, struct dirent *de) {
4803 if (de->d_type != DT_UNKNOWN)
4806 if (fstatat(dirfd(d), de->d_name, &st, AT_SYMLINK_NOFOLLOW) < 0)
4810 S_ISREG(st.st_mode) ? DT_REG :
4811 S_ISDIR(st.st_mode) ? DT_DIR :
4812 S_ISLNK(st.st_mode) ? DT_LNK :
4813 S_ISFIFO(st.st_mode) ? DT_FIFO :
4814 S_ISSOCK(st.st_mode) ? DT_SOCK :
4815 S_ISCHR(st.st_mode) ? DT_CHR :
4816 S_ISBLK(st.st_mode) ? DT_BLK :
/* Enumerates the entries of the directory at path that pass
 * dirent_is_file() (after dirent_ensure_type() has resolved unknown
 * types). Names are duplicated into a string vector grown with
 * GREEDY_REALLOC; setting l to NULL at the end keeps the automatic
 * cleanup from freeing the vector.
 * NOTE(review): the branch for list == NULL, the hand-over of the vector
 * to *list and the return value are on lines not visible here. */
4822 int get_files_in_directory(const char *path, char ***list) {
4823 _cleanup_closedir_ DIR *d = NULL;
4824 size_t bufsize = 0, n = 0;
4825 _cleanup_strv_free_ char **l = NULL;
4829 /* Returns all files in a directory in *list, and the number
4830 * of files as return value. If list is NULL returns only the
4842 if (!de && errno != 0)
4847 dirent_ensure_type(d, de);
4849 if (!dirent_is_file(de))
4853 /* one extra slot is needed for the terminating NULL */
4854 if (!GREEDY_REALLOC(l, bufsize, n + 2))
4857 l[n] = strdup(de->d_name);
4868 l = NULL; /* avoid freeing */
/* Variadic string concatenation starting with x. The argument list is
 * read as const char* values in two places, and the running length is
 * guarded against size_t overflow before a new piece is added.
 * NOTE(review): the list terminator (callers in this file pass a trailing
 * NULL), the allocation and the copy loop are on lines not visible in
 * this excerpt. */
4874 char *strjoin(const char *x, ...) {
4888 t = va_arg(ap, const char *);
4893 if (n > ((size_t) -1) - l) {
4917 t = va_arg(ap, const char *);
/* Per-thread cached test of whether the calling thread is the main thread
 * (process id equals thread id). cached is 0 while unknown, 1 for the main
 * thread and -1 otherwise; the return statement is on a line not visible
 * in this excerpt. */
4931 bool is_main_thread(void) {
4932 static thread_local int cached = 0;
4934 if (_unlikely_(cached == 0))
4935 cached = getpid() == gettid() ? 1 : -1;
/* Maps block device d to its whole-disk device using sysfs.
 *
 * A device that has a "queue" directory under /sys/dev/block/<maj>:<min>
 * is tested first; otherwise, for a device with a "partition" attribute,
 * the parent's "dev" file is read and parsed as "<major>:<minor>", and the
 * parent is stored in *ret once it too is confirmed to have a "queue"
 * directory.
 * NOTE(review): the returned codes and the release of the asprintf()
 * buffers are on lines not visible in this excerpt. */
4940 int block_get_whole_disk(dev_t d, dev_t *ret) {
4947 /* If it has a queue this is good enough for us */
4948 if (asprintf(&p, "/sys/dev/block/%u:%u/queue", major(d), minor(d)) < 0)
4951 r = access(p, F_OK);
4959 /* If it is a partition find the originating device */
4960 if (asprintf(&p, "/sys/dev/block/%u:%u/partition", major(d), minor(d)) < 0)
4963 r = access(p, F_OK);
4969 /* Get parent dev_t */
4970 if (asprintf(&p, "/sys/dev/block/%u:%u/../dev", major(d), minor(d)) < 0)
4973 r = read_one_line_file(p, &s);
4979 r = sscanf(s, "%u:%u", &m, &n);
4985 /* Only return this if it is really good enough for us. */
4986 if (asprintf(&p, "/sys/dev/block/%u:%u/queue", m, n) < 0)
4989 r = access(p, F_OK);
4993 *ret = makedev(m, n);
/* String names for the IOPRIO_CLASS_* values, indexed by the constant.
 * The macro after the table presumably generates the string<->int lookup
 * helpers for "ioprio_class"; INT_MAX is passed as its last argument. */
5000 static const char *const ioprio_class_table[] = {
5001 [IOPRIO_CLASS_NONE] = "none",
5002 [IOPRIO_CLASS_RT] = "realtime",
5003 [IOPRIO_CLASS_BE] = "best-effort",
5004 [IOPRIO_CLASS_IDLE] = "idle"
5007 DEFINE_STRING_TABLE_LOOKUP_WITH_FALLBACK(ioprio_class, int, INT_MAX);
/* String names for the CLD_* si_code values delivered with SIGCHLD,
 * indexed by the constant. The macro after the table presumably generates
 * the string<->int lookup helpers for "sigchld_code". */
5009 static const char *const sigchld_code_table[] = {
5010 [CLD_EXITED] = "exited",
5011 [CLD_KILLED] = "killed",
5012 [CLD_DUMPED] = "dumped",
5013 [CLD_TRAPPED] = "trapped",
5014 [CLD_STOPPED] = "stopped",
5015 [CLD_CONTINUED] = "continued",
5018 DEFINE_STRING_TABLE_LOOKUP(sigchld_code, int);
/* Names of the syslog facilities. The index is the facility number as
 * produced by LOG_FAC(), i.e. without the shift that is applied when a
 * facility is combined with a priority; the table has LOG_NFACILITIES
 * slots. */
5020 static const char *const log_facility_unshifted_table[LOG_NFACILITIES] = {
5021 [LOG_FAC(LOG_KERN)] = "kern",
5022 [LOG_FAC(LOG_USER)] = "user",
5023 [LOG_FAC(LOG_MAIL)] = "mail",
5024 [LOG_FAC(LOG_DAEMON)] = "daemon",
5025 [LOG_FAC(LOG_AUTH)] = "auth",
5026 [LOG_FAC(LOG_SYSLOG)] = "syslog",
5027 [LOG_FAC(LOG_LPR)] = "lpr",
5028 [LOG_FAC(LOG_NEWS)] = "news",
5029 [LOG_FAC(LOG_UUCP)] = "uucp",
5030 [LOG_FAC(LOG_CRON)] = "cron",
5031 [LOG_FAC(LOG_AUTHPRIV)] = "authpriv",
5032 [LOG_FAC(LOG_FTP)] = "ftp",
5033 [LOG_FAC(LOG_LOCAL0)] = "local0",
5034 [LOG_FAC(LOG_LOCAL1)] = "local1",
5035 [LOG_FAC(LOG_LOCAL2)] = "local2",
5036 [LOG_FAC(LOG_LOCAL3)] = "local3",
5037 [LOG_FAC(LOG_LOCAL4)] = "local4",
5038 [LOG_FAC(LOG_LOCAL5)] = "local5",
5039 [LOG_FAC(LOG_LOCAL6)] = "local6",
5040 [LOG_FAC(LOG_LOCAL7)] = "local7"
5043 DEFINE_STRING_TABLE_LOOKUP_WITH_FALLBACK(log_facility_unshifted, int, LOG_FAC(~0));
/* Names of the syslog priority levels, indexed by LOG_* level. LOG_DEBUG
 * is passed as the fallback argument of the lookup macro below. */
5045 static const char *const log_level_table[] = {
5046 [LOG_EMERG] = "emerg",
5047 [LOG_ALERT] = "alert",
5048 [LOG_CRIT] = "crit",
5050 [LOG_WARNING] = "warning",
5051 [LOG_NOTICE] = "notice",
5052 [LOG_INFO] = "info",
5053 [LOG_DEBUG] = "debug"
5056 DEFINE_STRING_TABLE_LOOKUP_WITH_FALLBACK(log_level, int, LOG_DEBUG);
/* Names of the CPU scheduling policies, indexed by SCHED_* value.
 * INT_MAX is passed as the fallback argument of the lookup macro. */
5058 static const char* const sched_policy_table[] = {
5059 [SCHED_OTHER] = "other",
5060 [SCHED_BATCH] = "batch",
5061 [SCHED_IDLE] = "idle",
5062 [SCHED_FIFO] = "fifo",
5066 DEFINE_STRING_TABLE_LOOKUP_WITH_FALLBACK(sched_policy, int, INT_MAX);
/* Maps each RLIMIT_* resource to a "Limit<NAME>" string; the table is
 * sized with _RLIMIT_MAX. */
5068 static const char* const rlimit_table[_RLIMIT_MAX] = {
5069 [RLIMIT_CPU] = "LimitCPU",
5070 [RLIMIT_FSIZE] = "LimitFSIZE",
5071 [RLIMIT_DATA] = "LimitDATA",
5072 [RLIMIT_STACK] = "LimitSTACK",
5073 [RLIMIT_CORE] = "LimitCORE",
5074 [RLIMIT_RSS] = "LimitRSS",
5075 [RLIMIT_NOFILE] = "LimitNOFILE",
5076 [RLIMIT_AS] = "LimitAS",
5077 [RLIMIT_NPROC] = "LimitNPROC",
5078 [RLIMIT_MEMLOCK] = "LimitMEMLOCK",
5079 [RLIMIT_LOCKS] = "LimitLOCKS",
5080 [RLIMIT_SIGPENDING] = "LimitSIGPENDING",
5081 [RLIMIT_MSGQUEUE] = "LimitMSGQUEUE",
5082 [RLIMIT_NICE] = "LimitNICE",
5083 [RLIMIT_RTPRIO] = "LimitRTPRIO",
5084 [RLIMIT_RTTIME] = "LimitRTTIME"
5087 DEFINE_STRING_TABLE_LOOKUP(rlimit, int);
/* Names for the IPTOS_* type-of-service values, indexed by the value
 * itself. 0xff is passed as the fallback argument of the lookup macro. */
5089 static const char* const ip_tos_table[] = {
5090 [IPTOS_LOWDELAY] = "low-delay",
5091 [IPTOS_THROUGHPUT] = "throughput",
5092 [IPTOS_RELIABILITY] = "reliability",
5093 [IPTOS_LOWCOST] = "low-cost",
5096 DEFINE_STRING_TABLE_LOOKUP_WITH_FALLBACK(ip_tos, int, 0xff);
/* Signal names without the "SIG" prefix, indexed by signal number. The
 * private lookup helpers built from this table are what
 * signal_to_string() and signal_from_string() call as
 * __signal_to_string() and __signal_from_string(). */
5098 static const char *const __signal_table[] = {
5115 [SIGSTKFLT] = "STKFLT", /* Linux on SPARC doesn't know SIGSTKFLT */
5126 [SIGVTALRM] = "VTALRM",
5128 [SIGWINCH] = "WINCH",
5134 DEFINE_PRIVATE_STRING_TABLE_LOOKUP(__signal, int);
/* Converts a signal number to a string. The table lookup is performed
 * first; the formatting calls below cover numbers in the
 * SIGRTMIN..SIGRTMAX range ("RTMIN+<n>") and plain decimal output. The
 * formatted text lives in a thread-local buffer, so it is overwritten by
 * the next such call in the same thread. */
5136 const char *signal_to_string(int signo) {
5137 static thread_local char buf[sizeof("RTMIN+")-1 + DECIMAL_STR_MAX(int) + 1];
5140 name = __signal_to_string(signo);
5144 if (signo >= SIGRTMIN && signo <= SIGRTMAX)
5145 snprintf(buf, sizeof(buf), "RTMIN+%d", signo - SIGRTMIN);
5147 snprintf(buf, sizeof(buf), "%d", signo);
/* Parses a signal specification. Besides the table lookup, an "RTMIN+"
 * prefix is recognized; a number parsed with safe_atou() gets `offset`
 * added and is then checked to lie strictly between 0 and _NSIG. */
5152 int signal_from_string(const char *s) {
5157 signo = __signal_from_string(s);
5161 if (startswith(s, "RTMIN+")) {
5165 if (safe_atou(s, &u) >= 0) {
5166 signo = (int) u + offset;
5167 if (signo > 0 && signo < _NSIG)
/* Reads the one-line file /sys/kernel/kexec_loaded; `loaded` starts out
 * false, so a failed read leaves it at false. */
5173 bool kexec_loaded(void) {
5174 bool loaded = false;
5177 if (read_one_line_file("/sys/kernel/kexec_loaded", &s) >= 0) {
/* Derives PROT_* bits from the access mode (flags & O_ACCMODE) of a set
 * of open() flags; PROT_READ|PROT_WRITE is one of the possible results. */
5185 int prot_from_flags(int flags) {
5187 switch (flags & O_ACCMODE) {
5196 return PROT_READ|PROT_WRITE;
/* Formats the byte count `t` into `buf` (capacity `l`). The table holds
 * 1024-based unit factors in descending order; for the first factor
 * that `t` reaches, the integer part and one decimal digit are computed.
 * The final snprintf() prints the plain number with a "B" suffix.
 * (off_t) -1 is special-cased up front. */
5203 char *format_bytes(char *buf, size_t l, off_t t) {
5206 static const struct {
5210 { "E", 1024ULL*1024ULL*1024ULL*1024ULL*1024ULL*1024ULL },
5211 { "P", 1024ULL*1024ULL*1024ULL*1024ULL*1024ULL },
5212 { "T", 1024ULL*1024ULL*1024ULL*1024ULL },
5213 { "G", 1024ULL*1024ULL*1024ULL },
5214 { "M", 1024ULL*1024ULL },
5218 if (t == (off_t) -1)
5221 for (i = 0; i < ELEMENTSOF(table); i++) {
5223 if (t >= table[i].factor) {
5226 (unsigned long long) (t / table[i].factor),
5227 (unsigned long long) (((t*10ULL) / table[i].factor) % 10ULL),
5234 snprintf(buf, l, "%lluB", (unsigned long long) t);
/* NOTE(review): only the signature is visible in this listing. Judging
 * by name and parameters this returns a copy of the `l` bytes at `p` --
 * confirm against the body. */
5242 void* memdup(const void *p, size_t l) {
/* Tries to raise the send buffer size of socket `fd`. The current
 * SO_SNDBUF value is queried first and compared against n*2.
 * SO_SNDBUFFORCE is attempted before plain SO_SNDBUF, which is only
 * tried when the forced variant fails. */
5255 int fd_inc_sndbuf(int fd, size_t n) {
5257 socklen_t l = sizeof(value);
5259 r = getsockopt(fd, SOL_SOCKET, SO_SNDBUF, &value, &l);
5260 if (r >= 0 && l == sizeof(value) && (size_t) value >= n*2)
5263 /* If we have the privileges we will ignore the kernel limit. */
5266 if (setsockopt(fd, SOL_SOCKET, SO_SNDBUFFORCE, &value, sizeof(value)) < 0)
5267 if (setsockopt(fd, SOL_SOCKET, SO_SNDBUF, &value, sizeof(value)) < 0)
/* Receive-side counterpart of fd_inc_sndbuf(): queries SO_RCVBUF,
 * compares it against n*2, then tries SO_RCVBUFFORCE and, if that fails,
 * plain SO_RCVBUF. */
5273 int fd_inc_rcvbuf(int fd, size_t n) {
5275 socklen_t l = sizeof(value);
5277 r = getsockopt(fd, SOL_SOCKET, SO_RCVBUF, &value, &l);
5278 if (r >= 0 && l == sizeof(value) && (size_t) value >= n*2)
5281 /* If we have the privileges we will ignore the kernel limit. */
5284 if (setsockopt(fd, SOL_SOCKET, SO_RCVBUFFORCE, &value, sizeof(value)) < 0)
5285 if (setsockopt(fd, SOL_SOCKET, SO_RCVBUF, &value, sizeof(value)) < 0)
/* Forks a helper ("agent") process. All signals are blocked around the
 * fork and the saved mask is restored in the parent. The child asks for
 * SIGTERM on parent death, resets signal handlers and mask, exits if
 * the parent is already gone, closes every fd not listed in `except`,
 * points stdout/stderr at /dev/tty when they are not terminals, and
 * collects the variadic arguments (terminated by a NULL pointer) into an
 * alloca()ed vector.
 * NOTE(review): the fork and exec calls themselves are not visible in
 * this listing. */
5290 int fork_agent(pid_t *pid, const int except[], unsigned n_except, const char *path, ...) {
5291 bool stdout_is_tty, stderr_is_tty;
5292 pid_t parent_pid, agent_pid;
5293 sigset_t ss, saved_ss;
5301 /* Spawns a temporary TTY agent, making sure it goes away when
5304 parent_pid = getpid();
5306 /* First we temporarily block all signals, so that the new
5307 * child has them blocked initially. This way, we can be sure
5308 * that SIGTERMs are not lost we might send to the agent. */
5309 assert_se(sigfillset(&ss) >= 0);
5310 assert_se(sigprocmask(SIG_SETMASK, &ss, &saved_ss) >= 0);
5313 if (agent_pid < 0) {
5314 assert_se(sigprocmask(SIG_SETMASK, &saved_ss, NULL) >= 0);
5318 if (agent_pid != 0) {
5319 assert_se(sigprocmask(SIG_SETMASK, &saved_ss, NULL) >= 0);
5326 * Make sure the agent goes away when the parent dies */
5327 if (prctl(PR_SET_PDEATHSIG, SIGTERM) < 0)
5328 _exit(EXIT_FAILURE);
5330 /* Make sure we actually can kill the agent, if we need to, in
5331 * case somebody invoked us from a shell script that trapped
5332 * SIGTERM or so... */
5333 reset_all_signal_handlers();
5334 reset_signal_mask();
5336 /* Check whether our parent died before we were able
5337 * to set the death signal and unblock the signals */
5338 if (getppid() != parent_pid)
5339 _exit(EXIT_SUCCESS);
5341 /* Don't leak fds to the agent */
5342 close_all_fds(except, n_except);
5344 stdout_is_tty = isatty(STDOUT_FILENO);
5345 stderr_is_tty = isatty(STDERR_FILENO);
5347 if (!stdout_is_tty || !stderr_is_tty) {
5350 /* Detach from stdout/stderr and reopen
5351 * /dev/tty for them. This is important to
5352 * ensure that when systemctl is started via
5353 * popen() or a similar call that expects to
5354 * read EOF we actually do generate EOF and
5355 * not delay this indefinitely because we
5356 * keep an unused copy of stdin around. */
5357 fd = open("/dev/tty", O_WRONLY);
5359 log_error_errno(errno, "Failed to open /dev/tty: %m");
5360 _exit(EXIT_FAILURE);
5364 dup2(fd, STDOUT_FILENO);
5367 dup2(fd, STDERR_FILENO);
5373 /* Count arguments */
5375 for (n = 0; va_arg(ap, char*); n++)
5380 l = alloca(sizeof(char *) * (n + 1));
5382 /* Fill in arguments */
5384 for (i = 0; i <= n; i++)
5385 l[i] = va_arg(ap, char*);
5389 _exit(EXIT_FAILURE);
/* Applies `rlim` to `resource`. If the plain setrlimit() does not
 * succeed, the current limits are fetched and the call is repeated with
 * both the soft and the hard limit clamped to the current hard limit
 * (highest.rlim_max). */
5392 int setrlimit_closest(int resource, const struct rlimit *rlim) {
5393 struct rlimit highest, fixed;
5397 if (setrlimit(resource, rlim) >= 0)
5403 /* So we failed to set the desired setrlimit, then let's try
5404 * to get as close as we can */
5405 assert_se(getrlimit(resource, &highest) == 0);
5407 fixed.rlim_cur = MIN(rlim->rlim_cur, highest.rlim_max);
5408 fixed.rlim_max = MIN(rlim->rlim_max, highest.rlim_max);
5410 if (setrlimit(resource, &fixed) < 0)
/* Looks up the environment variable `field` of process `pid` by reading
 * the process's "environ" file in procfs. Entries are collected into a
 * LINE_MAX sized buffer; an entry matches when it starts with `field`
 * (of length `l`) followed by '=', and the text after the '=' is then
 * duplicated with strdup(). */
5416 int getenv_for_pid(pid_t pid, const char *field, char **_value) {
5417 _cleanup_fclose_ FILE *f = NULL;
5428 path = procfs_file_alloca(pid, "environ");
5430 f = fopen(path, "re");
5438 char line[LINE_MAX];
5441 for (i = 0; i < sizeof(line)-1; i++) {
5445 if (_unlikely_(c == EOF)) {
5455 if (memcmp(line, field, l) == 0 && line[l] == '=') {
5456 value = strdup(line + l + 1);
/* Syntactic check of an HTTP ETag value: the checks below test that it
 * ends in a double quote and begins with either a double quote or the
 * weak-validator prefix W/" . */
5470 bool http_etag_is_valid(const char *etag) {
5474 if (!endswith(etag, "\""))
5477 if (!startswith(etag, "\"") && !startswith(etag, "W/\""))
/* Checks for an "http://" or "https://" prefix; the remainder after the
 * prefix is validated with ascii_is_valid(). */
5483 bool http_url_is_valid(const char *url) {
5489 p = startswith(url, "http://");
5491 p = startswith(url, "https://");
5498 return ascii_is_valid(p);
/* Validates a documentation URL: http_url_is_valid() is consulted first,
 * then the prefixes "file:/", "info:" and "man:" are tried; the remainder
 * after such a prefix is validated with ascii_is_valid(). */
5501 bool documentation_url_is_valid(const char *url) {
5507 if (http_url_is_valid(url))
5510 p = startswith(url, "file:/");
5512 p = startswith(url, "info:");
5514 p = startswith(url, "man:");
5519 return ascii_is_valid(p);
/* Determines whether we are running in an initrd. The answer is kept in
 * the static `saved`, which starts out as -1. */
5522 bool in_initrd(void) {
5523 static int saved = -1;
5529 /* We make two checks here:
5531 * 1. the flag file /etc/initrd-release must exist
5532 * 2. the root file system must be a memory file system
5534 * The second check is extra paranoia, since misdetecting an
5535 * initrd can have very bad consequences due to the initrd
5536 * emptying when transitioning to the main systemd.
5539 saved = access("/etc/initrd-release", F_OK) >= 0 &&
5540 statfs("/", &s) >= 0 &&
5541 is_temporary_fs(&s);
/* Plays a short three-tone sequence on /dev/console using the KIOCSOUND
 * ioctl: 1193180/440 once, then 1193180/220 twice, each held for 125ms,
 * followed by KIOCSOUND with 0. The ioctl return values are not
 * checked. */
5546 void warn_melody(void) {
5547 _cleanup_close_ int fd = -1;
5549 fd = open("/dev/console", O_WRONLY|O_CLOEXEC|O_NOCTTY);
5553 /* Yeah, this is synchronous. Kinda sucks. But well... */
5555 ioctl(fd, KIOCSOUND, (int)(1193180/440));
5556 usleep(125*USEC_PER_MSEC);
5558 ioctl(fd, KIOCSOUND, (int)(1193180/220));
5559 usleep(125*USEC_PER_MSEC);
5561 ioctl(fd, KIOCSOUND, (int)(1193180/220));
5562 usleep(125*USEC_PER_MSEC);
5564 ioctl(fd, KIOCSOUND, 0);
/* Acquires /dev/console through acquire_terminal() with an infinite
 * timeout. A failure to acquire the terminal, or to duplicate its fd,
 * is logged and the result of the logging call is returned. */
5567 int make_console_stdio(void) {
5570 /* Make /dev/console the controlling terminal and stdin/stdout/stderr */
5572 fd = acquire_terminal("/dev/console", false, true, true, USEC_INFINITY);
5574 return log_error_errno(fd, "Failed to acquire terminal: %m");
5578 return log_error_errno(r, "Failed to duplicate terminal fd: %m");
/* Determines a home directory from up to three sources: $HOME (read via
 * secure_getenv() and only used when it is an absolute path), a
 * hardcoded "/root", and the pw_dir field of a passwd entry (which must
 * be absolute as well). A failed passwd lookup yields -errno, or -ESRCH
 * if errno is not set. */
5583 int get_home_dir(char **_h) {
5591 /* Take the user specified one */
5592 e = secure_getenv("HOME");
5593 if (e && path_is_absolute(e)) {
5602 /* Hardcode home directory for root to avoid NSS */
5605 h = strdup("/root");
5613 /* Check the database... */
5617 return errno > 0 ? -errno : -ESRCH;
5619 if (!path_is_absolute(p->pw_dir))
5622 h = strdup(p->pw_dir);
/* Determines a login shell from up to three sources: $SHELL, a hardcoded
 * "/bin/sh", and the pw_shell field of a passwd entry (which must be an
 * absolute path). A failed passwd lookup yields -errno, or -ESRCH if
 * errno is not set.
 * NOTE(review): get_home_dir() reads its variable with secure_getenv()
 * while this uses plain getenv() -- confirm the difference is intended. */
5630 int get_shell(char **_s) {
5638 /* Take the user specified one */
5639 e = getenv("SHELL");
5649 /* Hardcode shell for root to avoid NSS */
5652 s = strdup("/bin/sh");
5660 /* Check the database... */
5664 return errno > 0 ? -errno : -ESRCH;
5666 if (!path_is_absolute(p->pw_shell))
5669 s = strdup(p->pw_shell);
/* Validity check for a single file name. The one test visible in this
 * listing compares the length of `p` against FILENAME_MAX. */
5677 bool filename_is_valid(const char *p) {
5691 if (strlen(p) > FILENAME_MAX)
/* Checks whether a string is "safe", i.e. free of characters that tend
 * to cause trouble when the string is quoted or printed.
 *
 * Returns false for a NULL pointer and for any string containing an
 * ASCII control character (1..31), a backslash, a single or double
 * quote, or DEL (0x7f). Returns true otherwise, including for the empty
 * string. */
bool string_is_safe(const char *p) {
        const char *t;

        if (!p)
                return false;

        for (t = p; *t; t++) {
                if (*t > 0 && *t < ' ')
                        return false;

                /* The set used to be spelled "\0x7f" at its end, which is
                 * a NUL byte followed by the literal text "x7f": the NUL
                 * terminated the set early, so DEL was never matched. */
                if (strchr("\\\"\'\x7f", *t))
                        return false;
        }

        return true;
}
5715 * Check if a string contains control characters. If 'ok' is non-NULL
5716 * it may be a string containing additional CCs to be considered OK.
/* Walks `p` byte by byte. Characters that occur in `ok` (when `ok` is
 * non-NULL) are tested for first; the control-character test itself is
 * *t > 0 && *t < ' ', i.e. the byte values 1..31. */
5718 bool string_has_cc(const char *p, const char *ok) {
5723 for (t = p; *t; t++) {
5724 if (ok && strchr(ok, *t))
5727 if (*t > 0 && *t < ' ')
/* Safety check for a path. The tests cover: ".." as a path component
 * (alone, leading, trailing or embedded), a length above PATH_MAX, "."
 * as a path component, and doubled slashes. */
5737 bool path_is_safe(const char *p) {
5742 if (streq(p, "..") || startswith(p, "../") || endswith(p, "/..") || strstr(p, "/../"))
5745 if (strlen(p) > PATH_MAX)
5748 /* The following two checks are not really dangerous, but hey, they still are confusing */
5749 if (streq(p, ".") || startswith(p, "./") || endswith(p, "/.") || strstr(p, "/./"))
5752 if (strstr(p, "//"))
5758 /* hey glibc, APIs with callbacks without a user pointer are so useless */
/* Search over the array `base` (`nmemb` elements of `size` bytes each)
 * using a comparator that receives the extra user pointer `arg` as its
 * third argument. The element probed is base + idx * size, and the sign
 * of compar(key, element, arg) steers the search. */
5759 void *xbsearch_r(const void *key, const void *base, size_t nmemb, size_t size,
5760 int (*compar) (const void *, const void *, void *), void *arg) {
5769 p = (void *)(((const char *) base) + (idx * size));
5770 comparison = compar(key, p, arg);
5773 else if (comparison > 0)
/* Reports whether the locale uses UTF-8. The answer is cached in the
 * static `cached_answer` (-1 = not determined yet). Note that several
 * paths set the answer to true: when setlocale(LC_ALL, "") fails, and
 * when the codeset reported by nl_langinfo() is "UTF-8". */
5781 bool is_locale_utf8(void) {
5783 static int cached_answer = -1;
5785 if (cached_answer >= 0)
5788 if (!setlocale(LC_ALL, "")) {
5789 cached_answer = true;
5793 set = nl_langinfo(CODESET);
5795 cached_answer = true;
5799 if (streq(set, "UTF-8")) {
5800 cached_answer = true;
5804 /* For LC_CTYPE=="C" return true, because CTYPE is effectively
5805 * unset and everything can do UTF-8 nowadays. */
5806 set = setlocale(LC_CTYPE, NULL);
5808 cached_answer = true;
5812 /* Check result, but ignore the result if C was set
5816 !getenv("LC_ALL") &&
5817 !getenv("LC_CTYPE") &&
5821 return (bool) cached_answer;
/* Returns the string used to draw `ch`. The table has two rows: row 0
 * holds UTF-8 byte sequences (written as octal escapes), row 1 the ASCII
 * fallbacks. The row index is !is_locale_utf8(), so row 0 is used in
 * UTF-8 locales. */
5824 const char *draw_special_char(DrawSpecialChar ch) {
5825 static const char *draw_table[2][_DRAW_SPECIAL_CHAR_MAX] = {
5828 [DRAW_TREE_VERTICAL] = "\342\224\202 ", /* │ */
5829 [DRAW_TREE_BRANCH] = "\342\224\234\342\224\200", /* ├─ */
5830 [DRAW_TREE_RIGHT] = "\342\224\224\342\224\200", /* └─ */
5831 [DRAW_TREE_SPACE] = " ", /* */
5832 [DRAW_TRIANGULAR_BULLET] = "\342\200\243", /* ‣ */
5833 [DRAW_BLACK_CIRCLE] = "\342\227\217", /* ● */
5834 [DRAW_ARROW] = "\342\206\222", /* → */
5835 [DRAW_DASH] = "\342\200\223", /* – */
5838 /* ASCII fallback */ {
5839 [DRAW_TREE_VERTICAL] = "| ",
5840 [DRAW_TREE_BRANCH] = "|-",
5841 [DRAW_TREE_RIGHT] = "`-",
5842 [DRAW_TREE_SPACE] = " ",
5843 [DRAW_TRIANGULAR_BULLET] = ">",
5844 [DRAW_BLACK_CIRCLE] = "*",
5845 [DRAW_ARROW] = "->",
5850 return draw_table[!is_locale_utf8()][ch];
/* Builds a new string from `text` in which occurrences of `old_string`
 * are substituted by `new_string`. Positions are tested with
 * startswith(); on a match the result buffer is resized with realloc()
 * to l - old_len + new_len (+1 for the terminator) and `new_string` is
 * copied in with stpcpy(). */
5853 char *strreplace(const char *text, const char *old_string, const char *new_string) {
5856 size_t l, old_len, new_len;
5862 old_len = strlen(old_string);
5863 new_len = strlen(new_string);
5876 if (!startswith(f, old_string)) {
5882 nl = l - old_len + new_len;
5883 a = realloc(r, nl + 1);
5891 t = stpcpy(t, new_string);
/* Filters the buffer *ibuf (length *_isz, or strlen(*ibuf) when _isz is
 * NULL) through a small state machine, writing the result to a memory
 * stream. ESC switches from STATE_OTHER to STATE_ESCAPE, a following '['
 * to STATE_BRACKET, where digits, ';' and a final 'm' are accepted. The
 * loop runs one position past the end of the input so that each state
 * gets to handle end-of-text (marked EOT below). */
5903 char *strip_tab_ansi(char **ibuf, size_t *_isz) {
5904 const char *i, *begin = NULL;
5909 } state = STATE_OTHER;
5911 size_t osz = 0, isz;
5917 /* Strips ANSI color and replaces TABs by 8 spaces */
5919 isz = _isz ? *_isz : strlen(*ibuf);
5921 f = open_memstream(&obuf, &osz);
5925 for (i = *ibuf; i < *ibuf + isz + 1; i++) {
5930 if (i >= *ibuf + isz) /* EOT */
5932 else if (*i == '\x1B')
5933 state = STATE_ESCAPE;
5934 else if (*i == '\t')
5941 if (i >= *ibuf + isz) { /* EOT */
5944 } else if (*i == '[') {
5945 state = STATE_BRACKET;
5950 state = STATE_OTHER;
5957 if (i >= *ibuf + isz || /* EOT */
5958 (!(*i >= '0' && *i <= '9') && *i != ';' && *i != 'm')) {
5961 state = STATE_OTHER;
5963 } else if (*i == 'm')
5964 state = STATE_OTHER;
/* Scans /sys/class/power_supply. For each non-hidden entry the "type"
 * file is read and only entries reading exactly "Mains\n" are considered
 * further; their "online" file must hold a single character plus
 * newline, where '1' records an online supply and '0' an offline one.
 * The final result is found_online || !found_offline, so a system where
 * no mains supply reports offline counts as being on AC power. */
5986 int on_ac_power(void) {
5987 bool found_offline = false, found_online = false;
5988 _cleanup_closedir_ DIR *d = NULL;
5990 d = opendir("/sys/class/power_supply");
5996 _cleanup_close_ int fd = -1, device = -1;
6002 if (!de && errno != 0)
6008 if (hidden_file(de->d_name))
6011 device = openat(dirfd(d), de->d_name, O_DIRECTORY|O_RDONLY|O_CLOEXEC|O_NOCTTY);
6013 if (errno == ENOENT || errno == ENOTDIR)
6019 fd = openat(device, "type", O_RDONLY|O_CLOEXEC|O_NOCTTY);
6021 if (errno == ENOENT)
6027 n = read(fd, contents, sizeof(contents));
6031 if (n != 6 || memcmp(contents, "Mains\n", 6))
6035 fd = openat(device, "online", O_RDONLY|O_CLOEXEC|O_NOCTTY);
6037 if (errno == ENOENT)
6043 n = read(fd, contents, sizeof(contents));
6047 if (n != 2 || contents[1] != '\n')
6050 if (contents[0] == '1') {
6051 found_online = true;
6053 } else if (contents[0] == '0')
6054 found_offline = true;
6059 return found_online || !found_offline;
/* Shared worker of the search_and_fopen*() functions. The search list is
 * first passed through path_strv_resolve_uniq(); then, for each
 * directory, a candidate path is built with strjoin() from the directory,
 * "/" and `path`, with `root` prepended in one of the two variants.
 * ENOENT is tested for separately from other errno values. */
6062 static int search_and_fopen_internal(const char *path, const char *mode, const char *root, char **search, FILE **_f) {
6069 if (!path_strv_resolve_uniq(search, root))
6072 STRV_FOREACH(i, search) {
6073 _cleanup_free_ char *p = NULL;
6077 p = strjoin(root, *i, "/", path, NULL);
6079 p = strjoin(*i, "/", path, NULL);
6089 if (errno != ENOENT)
/* Opens `path` with fopen() directly when it is absolute; otherwise the
 * string vector `search` is copied with strv_copy() (the worker gets a
 * mutable copy) and handed to search_and_fopen_internal(). */
6096 int search_and_fopen(const char *path, const char *mode, const char *root, const char **search, FILE **_f) {
6097 _cleanup_strv_free_ char **copy = NULL;
6103 if (path_is_absolute(path)) {
6106 f = fopen(path, mode);
6115 copy = strv_copy((char**) search);
6119 return search_and_fopen_internal(path, mode, root, copy, _f);
/* Same as search_and_fopen(), except that the search list is given as a
 * single `search` string that is split with strv_split_nulstr(). */
6122 int search_and_fopen_nulstr(const char *path, const char *mode, const char *root, const char *search, FILE **_f) {
6123 _cleanup_strv_free_ char **s = NULL;
6125 if (path_is_absolute(path)) {
6128 f = fopen(path, mode);
6137 s = strv_split_nulstr(search);
6141 return search_and_fopen_internal(path, mode, root, s, _f);
/* Extends the string *x (which may be NULL, counting as length 0) with
 * the variadic `const char *` arguments. The total length is summed up
 * with an overflow guard, *x is resized with realloc() to l+1 bytes, and
 * the arguments are walked a second time. */
6144 char *strextend(char **x, ...) {
6151 l = f = *x ? strlen(*x) : 0;
6158 t = va_arg(ap, const char *);
6163 if (n > ((size_t) -1) - l) {
6172 r = realloc(*x, l+1);
6182 t = va_arg(ap, const char *);
/* Allocates l * n + 1 bytes and fills them in a loop that runs `n`
 * times.
 * NOTE(review): no overflow check on l * n + 1 is visible in this
 * listing -- confirm whether callers bound `n`. */
6196 char *strrep(const char *s, unsigned n) {
6204 p = r = malloc(l * n + 1);
6208 for (i = 0; i < n; i++)
/* Grows the array *p so that it can hold at least `need` elements of
 * `size` bytes each; *allocated tracks the capacity in elements. When
 * the capacity is insufficient the new element count is
 * MAX(need * 2, 64u / size), and the resulting byte count is checked
 * against size * need to catch overflow. */
6215 void* greedy_realloc(void **p, size_t *allocated, size_t need, size_t size) {
6222 if (*allocated >= need)
6225 newalloc = MAX(need * 2, 64u / size);
6226 a = newalloc * size;
6228 /* check for overflows */
6229 if (a < size * need)
6237 *allocated = newalloc;
/* Wrapper around greedy_realloc() that zero-fills the newly gained part
 * of the array: when *allocated ends up larger than its previous value
 * `prev`, the elements from index `prev` onwards are cleared. */
6241 void* greedy_realloc0(void **p, size_t *allocated, size_t need, size_t size) {
6250 q = greedy_realloc(p, allocated, need, size);
6254 if (*allocated > prev)
6255 memzero(q + prev * size, (*allocated - prev) * size);
/* Checks whether `s` is a well-formed textual 128bit ID. Two notations
 * are accepted:
 *
 *   - 32 hexadecimal digits
 *   - the 36 character UUID notation, i.e. hexadecimal digits with '-'
 *     at offsets 8, 13, 18 and 23
 *
 * Upper and lower case hex digits are both fine. `s` must not be NULL.
 * Returns true if the string is valid, false otherwise. */
bool id128_is_valid(const char *s) {
        size_t i, l;

        l = strlen(s);
        if (l == 32) {

                /* Simple formatted 128bit hex string */

                for (i = 0; i < l; i++) {
                        char c = s[i];

                        /* Only a-f/A-F are hex digits; this used to let
                         * the whole alphabet through. */
                        if (!(c >= '0' && c <= '9') &&
                            !(c >= 'a' && c <= 'f') &&
                            !(c >= 'A' && c <= 'F'))
                                return false;
                }

        } else if (l == 36) {

                /* Formatted UUID */

                for (i = 0; i < l; i++) {
                        char c = s[i];

                        if ((i == 8 || i == 13 || i == 18 || i == 23)) {
                                if (c != '-')
                                        return false;
                        } else {
                                if (!(c >= '0' && c <= '9') &&
                                    !(c >= 'a' && c <= 'f') &&
                                    !(c >= 'A' && c <= 'F'))
                                        return false;
                        }
                }

        } else
                return false;

        return true;
}
/* Splits `s` at the separator `sep`, with `x` pointing at the separator
 * inside `s`: the left part is the text before `x` (duplicated with
 * strndup()), the right part the text following the separator
 * (duplicated with strdup()). */
6301 int split_pair(const char *s, const char *sep, char **l, char **r) {
6316 a = strndup(s, x - s);
6320 b = strdup(x + strlen(sep));
/* Looks up "systemd.restore_state=" on the kernel command line and
 * returns parse_boolean(value) != 0. Because of the != 0 comparison,
 * every non-zero parse result yields 1, not only a positive one. */
6332 int shall_restore_state(void) {
6333 _cleanup_free_ char *value = NULL;
6336 r = get_proc_cmdline_key("systemd.restore_state=", &value);
6342 return parse_boolean(value) != 0;
/* Returns the command line to be parsed for options in *ret: inside a
 * container (detect_container() > 0) this is the command line of PID 1,
 * otherwise the first line of /proc/cmdline. */
6345 int proc_cmdline(char **ret) {
6348 if (detect_container(NULL) > 0)
6349 return get_process_cmdline(1, 0, false, ret);
6351 return read_one_line_file("/proc/cmdline", ret);
/* Splits the string returned by proc_cmdline() into words with
 * unquote_first_word() and feeds them to the callback `parse_item` as
 * (key, value), where the value is located via the first '=' in the
 * word. Words starting with "rd." are tested for when not running in
 * the initrd. */
6354 int parse_proc_cmdline(int (*parse_item)(const char *key, const char *value)) {
6355 _cleanup_free_ char *line = NULL;
6361 r = proc_cmdline(&line);
6367 _cleanup_free_ char *word = NULL;
6370 r = unquote_first_word(&p, &word, true);
6376 /* Filter out arguments that are intended only for the
6378 if (!in_initrd() && startswith(word, "rd."))
6381 value = strchr(word, '=');
6385 r = parse_item(word, value);
/* Searches the string returned by proc_cmdline() for `key`. Words are
 * extracted with unquote_first_word(); two kinds of match appear below:
 * a word that starts with `key`, in which case the remainder is copied
 * into `ret` with free_and_strdup(), and a word equal to `key`. Words
 * starting with "rd." are tested for when not running in the initrd. */
6393 int get_proc_cmdline_key(const char *key, char **value) {
6394 _cleanup_free_ char *line = NULL, *ret = NULL;
6401 r = proc_cmdline(&line);
6407 _cleanup_free_ char *word = NULL;
6410 r = unquote_first_word(&p, &word, true);
6416 /* Filter out arguments that are intended only for the
6418 if (!in_initrd() && startswith(word, "rd."))
6422 e = startswith(word, key);
6426 r = free_and_strdup(&ret, e);
6432 if (streq(word, key))
/* Reads the LEADER and CLASS fields from /run/systemd/machines/<machine>
 * with parse_env_file(). CLASS is compared against "container" and
 * LEADER is parsed as a PID with parse_pid(). */
6446 int container_get_leader(const char *machine, pid_t *pid) {
6447 _cleanup_free_ char *s = NULL, *class = NULL;
6455 p = strjoina("/run/systemd/machines/", machine);
6456 r = parse_env_file(p, NEWLINE, "LEADER", &s, "CLASS", &class, NULL);
6464 if (!streq_ptr(class, "container"))
6467 r = parse_pid(s, &leader);
/* Opens file descriptors for the mount, PID and network namespaces
 * ("ns/mnt", "ns/pid", "ns/net") and for the root directory ("root") of
 * process `pid` via its procfs directory, and hands them out through
 * the output parameters. Once handed out, the local namespace fd
 * variables are reset to -1 (presumably so the _cleanup_close_ handling
 * leaves the returned descriptors open -- confirm against the macro). */
6477 int namespace_open(pid_t pid, int *pidns_fd, int *mntns_fd, int *netns_fd, int *root_fd) {
6478 _cleanup_close_ int pidnsfd = -1, mntnsfd = -1, netnsfd = -1;
6486 mntns = procfs_file_alloca(pid, "ns/mnt");
6487 mntnsfd = open(mntns, O_RDONLY|O_NOCTTY|O_CLOEXEC);
6495 pidns = procfs_file_alloca(pid, "ns/pid");
6496 pidnsfd = open(pidns, O_RDONLY|O_NOCTTY|O_CLOEXEC);
6504 netns = procfs_file_alloca(pid, "ns/net");
6505 netnsfd = open(netns, O_RDONLY|O_NOCTTY|O_CLOEXEC);
6513 root = procfs_file_alloca(pid, "root");
6514 rfd = open(root, O_RDONLY|O_NOCTTY|O_CLOEXEC|O_DIRECTORY);
6520 *pidns_fd = pidnsfd;
6523 *mntns_fd = mntnsfd;
6526 *netns_fd = netnsfd;
6531 pidnsfd = mntnsfd = netnsfd = -1;
/* Enters the namespaces referred to by the given fds, in this order:
 * PID, mount, network (each with setns()). Then changes into `root_fd`
 * and chroot()s to it, and finally sets GID, supplementary groups and
 * UID to root (setresgid(), setgroups(0, NULL), setresuid()). */
6536 int namespace_enter(int pidns_fd, int mntns_fd, int netns_fd, int root_fd) {
6539 if (setns(pidns_fd, CLONE_NEWPID) < 0)
6543 if (setns(mntns_fd, CLONE_NEWNS) < 0)
6547 if (setns(netns_fd, CLONE_NEWNET) < 0)
6551 if (fchdir(root_fd) < 0)
6554 if (chroot(".") < 0)
6558 if (setresgid(0, 0, 0) < 0)
6561 if (setgroups(0, NULL) < 0)
6564 if (setresuid(0, 0, 0) < 0)
/* Probes `pid` with kill(pid, 0). If the probe fails, the result is
 * errno != ESRCH, i.e. any failure other than "no such process" (for
 * instance a permission error) still counts as the PID being present. */
6570 bool pid_is_unwaited(pid_t pid) {
6571 /* Checks whether a PID is still valid at all, including a zombie */
6576 if (kill(pid, 0) >= 0)
6579 return errno != ESRCH;
/* Queries the process state with get_process_state(); a missing process
 * (-ENOENT) and the zombie state 'Z' are handled by the same branch. */
6582 bool pid_is_alive(pid_t pid) {
6585 /* Checks whether a PID is still valid and not a zombie */
6590 r = get_process_state(pid);
6591 if (r == -ENOENT || r == 'Z')
/* Retrieves the peer credentials of socket `fd` with SO_PEERCRED into
 * a local struct ucred. The returned length must equal
 * sizeof(struct ucred), and the uid and gid fields are compared against
 * UID_INVALID and GID_INVALID. */
6597 int getpeercred(int fd, struct ucred *ucred) {
6598 socklen_t n = sizeof(struct ucred);
6605 r = getsockopt(fd, SOL_SOCKET, SO_PEERCRED, &u, &n);
6609 if (n != sizeof(struct ucred))
6612 /* Check if the data is actually useful and not suppressed due
6613 * to namespacing issues */
6616 if (u.uid == UID_INVALID)
6618 if (u.gid == GID_INVALID)
/* Retrieves the peer security label of socket `fd` with SO_PEERSEC.
 * ERANGE is the one errno value singled out after the first call, and a
 * second getsockopt() call follows (presumably with a buffer resized to
 * the length reported in `n` -- the resize is not visible here). */
6625 int getpeersec(int fd, char **ret) {
6637 r = getsockopt(fd, SOL_SOCKET, SO_PEERSEC, s, &n);
6641 if (errno != ERANGE)
6648 r = getsockopt(fd, SOL_SOCKET, SO_PEERSEC, s, &n);
6664 /* This is much like mkostemp() but is subject to umask(). */
/* `pattern` and `flags` are passed on to mkostemp() unchanged; `u` is
 * declared with the _cleanup_umask_ attribute. */
6665 int mkostemp_safe(char *pattern, int flags) {
6666 _cleanup_umask_ mode_t u;
6673 fd = mkostemp(pattern, flags);
/* Opens a temporary file in the directory `path`. First choice is
 * open() with O_TMPFILE and mode 0600 (S_IRUSR|S_IWUSR); the fallback
 * creates a file from the template "<path>/systemd-tmp-XXXXXX" with
 * mkostemp_safe(). */
6680 int open_tmpfile(const char *path, int flags) {
6687 /* Try O_TMPFILE first, if it is supported */
6688 fd = open(path, flags|O_TMPFILE, S_IRUSR|S_IWUSR);
6693 /* Fall back to unguessable name + unlinking */
6694 p = strjoina(path, "/systemd-tmp-XXXXXX");
6696 fd = mkostemp_safe(p, flags);
/* Logs warnings about unusual permission bits on the configuration file
 * open as `fd`; `path` is only used in the messages. Checked are: any
 * execute bit (0111), the world-writable bit (0002) and, only when
 * running as PID 1, a file that is not readable by both group and
 * others (0044). */
6704 int fd_warn_permissions(const char *path, int fd) {
6707 if (fstat(fd, &st) < 0)
6710 if (st.st_mode & 0111)
6711 log_warning("Configuration file %s is marked executable. Please remove executable permission bits. Proceeding anyway.", path);
6713 if (st.st_mode & 0002)
6714 log_warning("Configuration file %s is marked world-writable. Please remove world writability permission bits. Proceeding anyway.", path);
6716 if (getpid() == 1 && (st.st_mode & 0044) != 0044)
6717 log_warning("Configuration file %s is marked world-inaccessible. This has no effect as configuration data is accessible via APIs without restrictions. Proceeding anyway.", path);
/* Maps an ABI name to a personality value. Which names are recognized
 * depends on the build architecture: "x86" and "x86-64" on x86-64, only
 * "x86" on i386. Unrecognized input yields 0xffffffffUL. */
6722 unsigned long personality_from_string(const char *p) {
6724 /* Parse a personality specifier. We introduce our own
6725 * identifiers that indicate specific ABIs, rather than just
6726 * hints regarding the register size, since we want to keep
6727 * things open for multiple locally supported ABIs for the
6728 * same register size. We try to reuse the ABI identifiers
6729 * used by libseccomp. */
6731 #if defined(__x86_64__)
6733 if (streq(p, "x86"))
6736 if (streq(p, "x86-64"))
6739 #elif defined(__i386__)
6741 if (streq(p, "x86"))
6745 /* personality(7) documents that 0xffffffffUL is used for
6746 * querying the current personality, hence let's use that here
6747 * as error indicator. */
6748 return 0xffffffffUL;
/* Reverse of personality_from_string(), with the same split by build
 * architecture; on x86-64 the value PER_LINUX32 is one of the cases
 * tested. */
6751 const char* personality_to_string(unsigned long p) {
6753 #if defined(__x86_64__)
6755 if (p == PER_LINUX32)
6761 #elif defined(__i386__)
/* Returns the amount of physical memory in bytes, computed as the page
 * count from sysconf(_SC_PHYS_PAGES) multiplied by page_size(), with
 * both factors widened to uint64_t before the multiplication. */
6770 uint64_t physical_memory(void) {
6773 /* We return this as uint64_t in case we are running as 32bit
6774 * process on a 64bit kernel with huge amounts of memory */
6776 mem = sysconf(_SC_PHYS_PAGES);
6779 return (uint64_t) mem * (uint64_t) page_size();
/* Writes a hex dump of the `s` bytes at `p` to the stream `f`. `p` may
 * only be NULL when `s` is 0. Each row starts with the offset printed as
 * "%04x", followed by up to 16 bytes as two-digit hex values and then
 * the same bytes as characters, with '.' standing in for anything that
 * isprint() rejects. */
6782 void hexdump(FILE *f, const void *p, size_t s) {
6783 const uint8_t *b = p;
6786 assert(s == 0 || b);
6791 fprintf(f, "%04x ", n);
6793 for (i = 0; i < 16; i++) {
6798 fprintf(f, "%02x ", b[i]);
6806 for (i = 0; i < 16; i++) {
6811 fputc(isprint(b[i]) ? (char) b[i] : '.', f);
/* Maintains REBOOT_PARAM_FILE: `param` is written with
 * write_string_file() and a failure is logged; an unlink() of the file
 * is also part of this function (presumably for an unset `param` -- the
 * condition is not visible here). */
6825 int update_reboot_param_file(const char *param) {
6830 r = write_string_file(REBOOT_PARAM_FILE, param);
6832 log_error("Failed to write reboot param to "
6833 REBOOT_PARAM_FILE": %s", strerror(-r));
6835 unlink(REBOOT_PARAM_FILE);
/* Unmounts mount points found in /proc/self/mountinfo that lie at or
 * below `prefix`. Only the mount point field (5) of each line is
 * captured by the fscanf() pattern; it is unescaped with cunescape()
 * and matched with path_startswith() before umount2() is called with
 * `flags`. */
6840 int umount_recursive(const char *prefix, int flags) {
6844 /* Try to umount everything recursively below a
6845 * directory. Also, take care of stacked mounts, and keep
6846 * unmounting them until they are gone. */
6849 _cleanup_fclose_ FILE *proc_self_mountinfo = NULL;
6854 proc_self_mountinfo = fopen("/proc/self/mountinfo", "re");
6855 if (!proc_self_mountinfo)
6859 _cleanup_free_ char *path = NULL, *p = NULL;
6862 k = fscanf(proc_self_mountinfo,
6863 "%*s " /* (1) mount id */
6864 "%*s " /* (2) parent id */
6865 "%*s " /* (3) major:minor */
6866 "%*s " /* (4) root */
6867 "%ms " /* (5) mount point */
6868 "%*s" /* (6) mount options */
6869 "%*[^-]" /* (7) optional fields */
6870 "- " /* (8) separator */
6871 "%*s " /* (9) file system type */
6872 "%*s" /* (10) mount source */
6873 "%*s" /* (11) mount options 2 */
6874 "%*[^\n]", /* some rubbish at the end */
6883 p = cunescape(path);
6887 if (!path_startswith(p, prefix))
6890 if (umount2(p, flags) < 0) {
/* Stores the mount flags of the file system containing `path` in *flags,
 * taken from the f_flag field filled in by statvfs(). */
6906 static int get_mount_flags(const char *path, unsigned long *flags) {
6909 if (statvfs(path, &buf) < 0)
6911 *flags = buf.f_flag;
/* Remounts `prefix` and the mounts below it read-only (`ro` true) or
 * read-write. Works on `cleaned`, a copy of `prefix` normalized with
 * path_kill_slashes(), and keeps two string sets: `done` for mount
 * points already handled and `todo` for those found in the current pass
 * over /proc/self/mountinfo. */
6915 int bind_remount_recursive(const char *prefix, bool ro) {
6916 _cleanup_set_free_free_ Set *done = NULL;
6917 _cleanup_free_ char *cleaned = NULL;
6920 /* Recursively remount a directory (and all its submounts)
6921 * read-only or read-write. If the directory is already
6922 * mounted, we reuse the mount and simply mark it
6923 * MS_BIND|MS_RDONLY (or remove the MS_RDONLY for read-write
6924 * operation). If it isn't we first make it one. Afterwards we
6925 * apply MS_BIND|MS_RDONLY (or remove MS_RDONLY) to all
6926 * submounts we can access, too. When mounts are stacked on
6927 * the same mount point we only care for each individual
6928 * "top-level" mount on each point, as we cannot
6929 * influence/access the underlying mounts anyway. We do not
6930 * have any effect on future submounts that might get
6931 * propagated, they might be writable. This includes future
6932 * submounts that have been triggered via autofs. */
6934 cleaned = strdup(prefix);
6938 path_kill_slashes(cleaned);
6940 done = set_new(&string_hash_ops);
6945 _cleanup_fclose_ FILE *proc_self_mountinfo = NULL;
6946 _cleanup_set_free_free_ Set *todo = NULL;
6947 bool top_autofs = false;
6949 unsigned long orig_flags;
6951 todo = set_new(&string_hash_ops);
6955 proc_self_mountinfo = fopen("/proc/self/mountinfo", "re");
6956 if (!proc_self_mountinfo)
6960 _cleanup_free_ char *path = NULL, *p = NULL, *type = NULL;
6963 k = fscanf(proc_self_mountinfo,
6964 "%*s " /* (1) mount id */
6965 "%*s " /* (2) parent id */
6966 "%*s " /* (3) major:minor */
6967 "%*s " /* (4) root */
6968 "%ms " /* (5) mount point */
6969 "%*s" /* (6) mount options (superblock) */
6970 "%*[^-]" /* (7) optional fields */
6971 "- " /* (8) separator */
6972 "%ms " /* (9) file system type */
6973 "%*s" /* (10) mount source */
6974 "%*s" /* (11) mount options (bind mount) */
6975 "%*[^\n]", /* some rubbish at the end */
6985 p = cunescape(path);
6989 /* Let's ignore autofs mounts. If they aren't
6990 * triggered yet, we want to avoid triggering
6991 * them, as we don't make any guarantees for
6992 * future submounts anyway. If they are
6993 * already triggered, then we will find
6994 * another entry for this. */
6995 if (streq(type, "autofs")) {
6996 top_autofs = top_autofs || path_equal(cleaned, p);
7000 if (path_startswith(p, cleaned) &&
7001 !set_contains(done, p)) {
7003 r = set_consume(todo, p);
7013 /* If we have no submounts to process anymore and if
7014 * the root is either already done, or an autofs, we
7016 if (set_isempty(todo) &&
7017 (top_autofs || set_contains(done, cleaned)))
7020 if (!set_contains(done, cleaned) &&
7021 !set_contains(todo, cleaned)) {
7022 /* The prefix directory itself is not yet a
7023 * mount, make it one. */
7024 if (mount(cleaned, cleaned, NULL, MS_BIND|MS_REC, NULL) < 0)
7028 (void) get_mount_flags(cleaned, &orig_flags);
7029 orig_flags &= ~MS_RDONLY;
/* NOTE(review): the remount below targets `prefix`, while the bind
 * mount, the flag query and the set bookkeeping around it all use the
 * normalized `cleaned` -- confirm whether `cleaned` was intended. */
7031 if (mount(NULL, prefix, NULL, orig_flags|MS_BIND|MS_REMOUNT|(ro ? MS_RDONLY : 0), NULL) < 0)
7034 x = strdup(cleaned);
7038 r = set_consume(done, x);
7043 while ((x = set_steal_first(todo))) {
7045 r = set_consume(done, x);
7051 /* Try to reuse the original flag set, but
7052 * don't care for errors, in case of
7053 * obstructed mounts */
7055 (void) get_mount_flags(x, &orig_flags);
7056 orig_flags &= ~MS_RDONLY;
7058 if (mount(NULL, x, NULL, orig_flags|MS_BIND|MS_REMOUNT|(ro ? MS_RDONLY : 0), NULL) < 0) {
7060 /* Deal with mount points that are
7061 * obstructed by a later mount */
7063 if (errno != ENOENT)
/* On its error path this returns -errno when errno is set, and -EIO
 * otherwise. NOTE(review): the flush and the error test themselves are
 * not visible in this listing. */
7071 int fflush_and_check(FILE *f) {
7078 return errno ? -errno : -EIO;
/* Derives a temporary file name template from the path `p`: the part of
 * `p` before the file name `fn` is kept, then ".#", the file name and
 * "XXXXXX" are appended. `fn` has to pass filename_is_valid(). The
 * result is normalized with path_kill_slashes() and stored in *ret. */
7083 int tempfn_xxxxxx(const char *p, char **ret) {
7095 * /foo/bar/.#waldoXXXXXX
7099 if (!filename_is_valid(fn))
7102 t = new(char, strlen(p) + 2 + 6 + 1);
7106 strcpy(stpcpy(stpcpy(mempcpy(t, p, fn - p), ".#"), fn), "XXXXXX");
7108 *ret = path_kill_slashes(t);
/* Like tempfn_xxxxxx(), but instead of the "XXXXXX" placeholder the name
 * is completed with 16 hex digits, each produced from the low four bits
 * of `u` via hexchar(). The result is normalized with
 * path_kill_slashes() and stored in *ret. */
7112 int tempfn_random(const char *p, char **ret) {
7126 * /foo/bar/.#waldobaa2a261115984a9
7130 if (!filename_is_valid(fn))
7133 t = new(char, strlen(p) + 2 + 16 + 1);
7137 x = stpcpy(stpcpy(mempcpy(t, p, fn - p), ".#"), fn);
7140 for (i = 0; i < 16; i++) {
7141 *(x++) = hexchar(u & 0xF);
7147 *ret = path_kill_slashes(t);
/* Builds the name of a temporary file inside the directory `p`: `p`
 * followed by "/.#" and 16 hex digits, each produced from the low four
 * bits of `u` via hexchar(). The result is normalized with
 * path_kill_slashes() and stored in *ret. */
7151 int tempfn_random_child(const char *p, char **ret) {
7162 * /foo/bar/waldo/.#3c2b6219aa75d7d0
7165 t = new(char, strlen(p) + 3 + 16 + 1);
7169 x = stpcpy(stpcpy(t, p), "/.#");
7172 for (i = 0; i < 16; i++) {
7173 *(x++) = hexchar(u & 0xF);
7179 *ret = path_kill_slashes(t);
7183 /* Returns true if the hostname refers to the local host */
7184 bool is_localhost(const char *hostname) {
7187 /* This tries to identify local host and domain names
7188 * described in RFC6761 plus the redhatism of .localdomain */
/* Matched are "localhost" and "localdomain" themselves as well as any
 * name ending in ".localhost" or ".localdomain", each with or without
 * a trailing dot. The comparison is case-sensitive. */
7190 return streq(hostname, "localhost") ||
7191 streq(hostname, "localhost.") ||
7192 streq(hostname, "localdomain.") ||
7193 streq(hostname, "localdomain") ||
7194 endswith(hostname, ".localhost") ||
7195 endswith(hostname, ".localhost.") ||
7196 endswith(hostname, ".localdomain") ||
7197 endswith(hostname, ".localdomain.");
/* Takes the lock on the user database lock file, which is
 * "/etc/.pwd.lock", with `root` prepended in one of the two path
 * variants. The file is opened write-only (created with mode 0600 if
 * missing, O_NOFOLLOW) and locked with fcntl(F_SETLKW), which waits
 * until the lock can be obtained. */
7200 int take_password_lock(const char *root) {
7202 struct flock flock = {
7204 .l_whence = SEEK_SET,
7212 /* This is roughly the same as lckpwdf(), but not as awful. We
7213 * don't want to use alarm() and signals, hence we implement
7214 * our own trivial version of this.
7216 * Note that shadow-utils also takes per-database locks in
7217 * addition to lckpwdf(). However, we don't, given that they
7218 * are redundant as they invoke lckpwdf() first and keep
7219 * it during everything they do. The per-database locks are
7220 * awfully racy, and thus we just won't do them. */
7223 path = strjoina(root, "/etc/.pwd.lock");
7225 path = "/etc/.pwd.lock";
7227 fd = open(path, O_WRONLY|O_CREAT|O_CLOEXEC|O_NOCTTY|O_NOFOLLOW, 0600);
7231 r = fcntl(fd, F_SETLKW, &flock);
/* Uses lstat() (which does not follow a final symlink) on `path` and
 * returns 1 if it is a symbolic link, 0 if it is not; the !! normalizes
 * the S_ISLNK() result to exactly 0 or 1. */
7240 int is_symlink(const char *path) {
7243 if (lstat(path, &info) < 0)
7246 return !!S_ISLNK(info.st_mode);
/* Returns 1 if `path` is a directory and 0 if it is not; the !!
 * normalizes the S_ISDIR() result. Both a stat() and an lstat() variant
 * exist (presumably selected by `follow` -- the condition is not visible
 * here). */
7249 int is_dir(const char* path, bool follow) {
7254 r = stat(path, &st);
7256 r = lstat(path, &st);
7260 return !!S_ISDIR(st.st_mode);
/* State-machine parser that extracts the first word from *p into *ret.
 * The result buffer `s` is grown with GREEDY_REALLOC() to sz+2 bytes
 * before a character is stored. States visible below include
 * VALUE_ESCAPE, SINGLE_QUOTE, DOUBLE_QUOTE and their *_ESCAPE variants;
 * characters from WHITESPACE act as separators. */
7263 int unquote_first_word(const char **p, char **ret, bool relax) {
7264 _cleanup_free_ char *s = NULL;
7265 size_t allocated = 0, sz = 0;
7272 SINGLE_QUOTE_ESCAPE,
7274 DOUBLE_QUOTE_ESCAPE,
7282 /* Parses the first word of a string, and returns it in
7283 * *ret. Removes all quotes in the process. When parsing fails
7284 * (because of an uneven number of quotes or similar), leaves
7285 * the pointer *p at the first invalid character. */
7295 else if (strchr(WHITESPACE, c))
7305 state = SINGLE_QUOTE;
7307 state = VALUE_ESCAPE;
7309 state = DOUBLE_QUOTE;
7310 else if (strchr(WHITESPACE, c))
7313 if (!GREEDY_REALLOC(s, allocated, sz+2))
7328 if (!GREEDY_REALLOC(s, allocated, sz+2))
7341 } else if (c == '\'')
7344 state = SINGLE_QUOTE_ESCAPE;
7346 if (!GREEDY_REALLOC(s, allocated, sz+2))
7354 case SINGLE_QUOTE_ESCAPE:
7361 if (!GREEDY_REALLOC(s, allocated, sz+2))
7365 state = SINGLE_QUOTE;
7374 state = DOUBLE_QUOTE_ESCAPE;
7376 if (!GREEDY_REALLOC(s, allocated, sz+2))
7384 case DOUBLE_QUOTE_ESCAPE:
7391 if (!GREEDY_REALLOC(s, allocated, sz+2))
7395 state = DOUBLE_QUOTE;
7401 if (!strchr(WHITESPACE, c))
/* Variadic front-end for unquote_first_word().
 *
 * p:   in/out cursor into the input string, handed on to
 *      unquote_first_word().
 * ...: a list of "char **" destinations; the counting pass stops at the first
 *      NULL entry, so the list has to be NULL-terminated.
 *
 * The words are first parsed (with relax=false) into a zero-initialized
 * temporary array obtained from newa0() and are handed out to the caller's
 * destinations in a second pass over the argument list.
 *
 * NOTE(review): the error cleanup inside the "j" loop and the return values
 * are not visible here. */
7423 int unquote_many_words(const char **p, ...) {
7428 /* Parses a number of words from a string, stripping any
7429 * quotes if necessary. */
7433 /* Count how many words are expected */
7436 if (!va_arg(ap, char **))
7445 /* Read all words into a temporary array */
7446 l = newa0(char*, n);
7447 for (c = 0; c < n; c++) {
7449 r = unquote_first_word(p, &l[c], false);
7453 for (j = 0; j < c; j++)
7463 /* If we managed to parse all words, return them in the passed
7466 for (i = 0; i < n; i++) {
7469 v = va_arg(ap, char **);
/* p: address of the string pointer to update.
 * s: string whose copy is to be stored in *p.
 * NOTE(review): the body is not visible here; how a NULL "s" is treated and
 * what is returned need to be confirmed against the implementation. */
7479 int free_and_strdup(char **p, const char *s) {
7484 /* Replaces a string pointer with an strdup()ed new string,
7485 * possibly freeing the old one. */
/* Sets the hostname to s via sethostname(s, strlen(s)). Before that the
 * current hostname is read with gethostname() into a zero-initialized buffer
 * of HOST_NAME_MAX + 1 bytes.
 * NOTE(review): the comparison between the two names is not visible here;
 * going by the function name the set call is presumably skipped when the
 * hostname already matches -- TODO confirm, including the return values. */
7500 int sethostname_idempotent(const char *s) {
7502 char buf[HOST_NAME_MAX + 1] = {};
7506 r = gethostname(buf, sizeof(buf));
7513 r = sethostname(s, strlen(s));
/* Queries the slave pty name of the master fd with ptsname_r() into the
 * buffer "c" of size "l". ERANGE is treated differently from all other errors.
 * NOTE(review): buffer allocation, the handling after ERANGE (presumably a
 * retry with a larger buffer) and the hand-over through "ret" are not visible
 * here -- TODO confirm. */
7520 int ptsname_malloc(int fd, char **ret) {
7533 if (ptsname_r(fd, c, l) == 0) {
7537 if (errno != ERANGE) {
/* Opens a pty master from within the namespaces of the process "pid".
 *
 * Visible steps:
 *  - namespace_open() fetches fds for the PID namespace, the mount namespace
 *    and the root directory of "pid".
 *  - An AF_UNIX/SOCK_DGRAM socketpair is created as the transport.
 *  - One side (it terminates with _exit(), so presumably a forked child; the
 *    fork itself is not visible here) closes pair[0], enters the namespaces
 *    with namespace_enter(), calls posix_openpt(flags) and sends the
 *    resulting fd as an SCM_RIGHTS control message over pair[1]. Any failure
 *    ends it with EXIT_FAILURE.
 *  - The other side closes pair[1], waits for "child" with
 *    wait_for_terminate(), requires a clean exit with EXIT_SUCCESS, receives
 *    the message with MSG_CMSG_CLOEXEC and walks the control messages looking
 *    for SOL_SOCKET/SCM_RIGHTS.
 *
 * flags: passed unchanged to posix_openpt().
 *
 * NOTE(review): the condition guarding close_many(fds, n_fds) and the return
 * values are not visible here; presumably exactly one fd is expected and it
 * is returned on success -- TODO confirm. */
7547 int openpt_in_namespace(pid_t pid, int flags) {
7548 _cleanup_close_ int pidnsfd = -1, mntnsfd = -1, rootfd = -1;
7549 _cleanup_close_pair_ int pair[2] = { -1, -1 };
7551 struct cmsghdr cmsghdr;
7552 uint8_t buf[CMSG_SPACE(sizeof(int))];
7554 struct msghdr mh = {
7555 .msg_control = &control,
7556 .msg_controllen = sizeof(control),
7558 struct cmsghdr *cmsg;
7565 r = namespace_open(pid, &pidnsfd, &mntnsfd, NULL, &rootfd);
7569 if (socketpair(AF_UNIX, SOCK_DGRAM, 0, pair) < 0)
7579 pair[0] = safe_close(pair[0]);
7581 r = namespace_enter(pidnsfd, mntnsfd, -1, rootfd);
7583 _exit(EXIT_FAILURE);
7585 master = posix_openpt(flags);
7587 _exit(EXIT_FAILURE);
7589 cmsg = CMSG_FIRSTHDR(&mh);
7590 cmsg->cmsg_level = SOL_SOCKET;
7591 cmsg->cmsg_type = SCM_RIGHTS;
7592 cmsg->cmsg_len = CMSG_LEN(sizeof(int));
7593 memcpy(CMSG_DATA(cmsg), &master, sizeof(int));
7595 mh.msg_controllen = cmsg->cmsg_len;
7597 if (sendmsg(pair[1], &mh, MSG_NOSIGNAL) < 0)
7598 _exit(EXIT_FAILURE);
7600 _exit(EXIT_SUCCESS);
7603 pair[1] = safe_close(pair[1]);
7605 r = wait_for_terminate(child, &si);
7608 if (si.si_code != CLD_EXITED || si.si_status != EXIT_SUCCESS)
7611 if (recvmsg(pair[0], &mh, MSG_NOSIGNAL|MSG_CMSG_CLOEXEC) < 0)
7614 for (cmsg = CMSG_FIRSTHDR(&mh); cmsg; cmsg = CMSG_NXTHDR(&mh, cmsg))
7615 if (cmsg->cmsg_level == SOL_SOCKET && cmsg->cmsg_type == SCM_RIGHTS) {
7619 fds = (int*) CMSG_DATA(cmsg);
7620 n_fds = (cmsg->cmsg_len - CMSG_LEN(0)) / sizeof(int);
7623 close_many(fds, n_fds);
/* Reads the extended attribute "attribute" of the file "filename", looked up
 * relative to the directory fd "dirfd", into "value" (at most "size" bytes).
 *
 * The file is opened read-only with O_NOATIME; O_NOFOLLOW is added when
 * "flags" contains AT_SYMLINK_NOFOLLOW. The attribute is then read from the
 * opened fd with fgetxattr().
 *
 * NOTE(review): the error branches and the return statement are not visible
 * here; presumably the fgetxattr() result is returned on success and a
 * negative errno on failure. */
7633 ssize_t fgetxattrat_fake(int dirfd, const char *filename, const char *attribute, void *value, size_t size, int flags) {
7634 _cleanup_close_ int fd = -1;
7637 /* The kernel doesn't have a fgetxattrat() command, hence let's emulate one */
7639 fd = openat(dirfd, filename, O_RDONLY|O_CLOEXEC|O_NOCTTY|O_NOATIME|(flags & AT_SYMLINK_NOFOLLOW ? O_NOFOLLOW : 0));
7643 l = fgetxattr(fd, attribute, value, size);
/* Converts the little-endian 64-bit creation timestamp "le" and hands it out
 * through "usec". The values 0 and (uint64_t) -1 are singled out.
 * NOTE(review): the conversion and the result of that check are not visible
 * here; presumably both values are rejected as invalid -- TODO confirm. */
7650 static int parse_crtime(le64_t le, usec_t *usec) {
7656 if (u == 0 || u == (uint64_t) -1)
/* Reads the creation time of the file behind "fd" from its
 * "user.crtime_usec" extended attribute. The attribute must be exactly
 * sizeof(le) bytes long; its value is then decoded by parse_crtime(), whose
 * result is returned.
 * NOTE(review): the error codes for a failed fgetxattr() and for a size
 * mismatch are not visible here. */
7663 int fd_getcrtime(int fd, usec_t *usec) {
7670 /* Until Linux gets a real concept of birthtime/creation time,
7671 * let's fake one with xattrs */
7673 n = fgetxattr(fd, "user.crtime_usec", &le, sizeof(le));
7676 if (n != sizeof(le))
7679 return parse_crtime(le, usec);
/* Like fd_getcrtime(), but for the file "name" relative to the directory fd
 * "dirfd": the "user.crtime_usec" extended attribute is fetched with
 * fgetxattrat_fake() (which receives "flags"), must be exactly sizeof(le)
 * bytes long, and is decoded by parse_crtime(), whose result is returned.
 * NOTE(review): the error codes for a failed read and for a size mismatch are
 * not visible here. */
7682 int fd_getcrtime_at(int dirfd, const char *name, usec_t *usec, int flags) {
7686 n = fgetxattrat_fake(dirfd, name, "user.crtime_usec", &le, sizeof(le), flags);
7689 if (n != sizeof(le))
7692 return parse_crtime(le, usec);
/* Reads the creation time of the file at path "p" from its
 * "user.crtime_usec" extended attribute using getxattr(). The attribute must
 * be exactly sizeof(le) bytes long; its value is decoded by parse_crtime(),
 * whose result is returned.
 * NOTE(review): the error codes for a failed getxattr() and for a size
 * mismatch are not visible here. */
7695 int path_getcrtime(const char *p, usec_t *usec) {
7702 n = getxattr(p, "user.crtime_usec", &le, sizeof(le));
7705 if (n != sizeof(le))
7708 return parse_crtime(le, usec);
/* Stores "usec" as a little-endian 64-bit value in the "user.crtime_usec"
 * extended attribute of "fd" (fsetxattr() with flags 0).
 * NOTE(review): the condition under which "usec" is replaced by
 * now(CLOCK_REALTIME) is not visible here; presumably that happens when the
 * caller passes 0 -- TODO confirm, together with the return values. */
7711 int fd_setcrtime(int fd, usec_t usec) {
7717 usec = now(CLOCK_REALTIME);
7719 le = htole64((uint64_t) usec);
7720 if (fsetxattr(fd, "user.crtime_usec", &le, sizeof(le), 0) < 0)
/* Checks whether the file descriptors "a" and "b" refer to the same file.
 *
 * kcmp(KCMP_FILE) is tried first; only ENOSYS leads to the fstat()-based
 * fallback, which compares file type, st_dev/st_ino and finally the
 * F_GETFL flags of both fds.
 *
 * NOTE(review): the individual return statements are not visible here. */
7726 int same_fd(int a, int b) {
7727 struct stat sta, stb;
7734 /* Compares two file descriptors. Note that semantics are
7735 * quite different depending on whether we have kcmp() or we
7736 * don't. If we have kcmp() this will only return true for
7737 * dup()ed file descriptors, but not otherwise. If we don't
7738 * have kcmp() this will also return true for two fds of the same
7739 * file, created by separate open() calls. Since we use this
7740 * call mostly for filtering out duplicates in the fd store
7741 * this difference hopefully doesn't matter too much. */
7746 /* Try to use kcmp() if we have it. */
7748 r = kcmp(pid, pid, KCMP_FILE, a, b);
7753 if (errno != ENOSYS)
7756 /* We don't have kcmp(), use fstat() instead. */
7757 if (fstat(a, &sta) < 0)
7760 if (fstat(b, &stb) < 0)
7763 if ((sta.st_mode & S_IFMT) != (stb.st_mode & S_IFMT))
7766 /* We consider all device fds different, since two device fds
7767 * might refer to quite different device contexts even though
7768 * they share the same inode and backing dev_t. */
7770 if (S_ISCHR(sta.st_mode) || S_ISBLK(sta.st_mode))
7773 if (sta.st_dev != stb.st_dev || sta.st_ino != stb.st_ino)
7776 /* The fds refer to the same inode on disk, let's also check
7777 * if they have the same fd flags. This is useful to
7778 * distinguish the read and write side of a pipe created with
7780 fa = fcntl(a, F_GETFL);
7784 fb = fcntl(b, F_GETFL);
/* Changes the file attribute flags of "fd" for the bits in "mask".
 *
 * The current flags are read with FS_IOC_GETFLAGS; the new value is either
 * "old | mask" or "old & ~mask" (presumably chosen by "b": true sets, false
 * clears -- the selecting condition is not visible here). FS_IOC_SETFLAGS is
 * only issued when the value actually changes.
 *
 * NOTE(review): the return values are not visible here. */
7791 int chattr_fd(int fd, bool b, unsigned mask) {
7792 unsigned old_attr, new_attr;
7799 if (ioctl(fd, FS_IOC_GETFLAGS, &old_attr) < 0)
7803 new_attr = old_attr | mask;
7805 new_attr = old_attr & ~mask;
7807 if (new_attr == old_attr)
7810 if (ioctl(fd, FS_IOC_SETFLAGS, &new_attr) < 0)
/* Path-based front-end for chattr_fd(): opens "p" read-only without
 * following a final symlink (O_NOFOLLOW) and returns the result of
 * chattr_fd(fd, b, mask).
 * NOTE(review): the handling of a failed open() is not visible here. */
7816 int chattr_path(const char *p, bool b, unsigned mask) {
7817 _cleanup_close_ int fd = -1;
7824 fd = open(p, O_RDONLY|O_CLOEXEC|O_NOCTTY|O_NOFOLLOW);
7828 return chattr_fd(fd, b, mask);
/* Reads the file attribute flags of "fd" with FS_IOC_GETFLAGS directly into
 * "*ret".
 * NOTE(review): the return values are not visible here. */
7831 int read_attr_fd(int fd, unsigned *ret) {
7834 if (ioctl(fd, FS_IOC_GETFLAGS, ret) < 0)
/* Path-based front-end for read_attr_fd(): opens "p" read-only without
 * following a final symlink (O_NOFOLLOW) and returns the result of
 * read_attr_fd(fd, ret).
 * NOTE(review): the handling of a failed open() is not visible here. */
7840 int read_attr_path(const char *p, unsigned *ret) {
7841 _cleanup_close_ int fd = -1;
7846 fd = open(p, O_RDONLY|O_CLOEXEC|O_NOCTTY|O_NOFOLLOW);
7850 return read_attr_fd(fd, ret);
/* Creates (if necessary, mode 0600) and locks the lock file "p".
 *
 * operation: flock()-style operation. LOCK_EX (ignoring LOCK_NB) is mapped to
 *            a write lock (F_WRLCK), anything else to a read lock (F_RDLCK).
 *            With LOCK_NB the non-waiting F_OFD_SETLK is used, otherwise
 *            F_OFD_SETLKW.
 * ret:       lock handle filled in on success; the visible code stores
 *            "operation" in it.
 *
 * When the fcntl() call fails with EINVAL, flock(fd, operation) is used
 * instead. A lock failure with EAGAIN is reported as -EBUSY, any other one as
 * -errno. After locking, the link count of the file is checked; if the file
 * is no longer linked the fd is closed (presumably followed by another
 * attempt -- the loop itself is not visible here).
 *
 * NOTE(review): the success return value and the remaining fields of "ret"
 * are not visible here. */
7853 int make_lock_file(const char *p, int operation, LockFile *ret) {
7854 _cleanup_close_ int fd = -1;
7855 _cleanup_free_ char *t = NULL;
7859 * We use UNPOSIX locks if they are available. They have nice
7860 * semantics, and are mostly compatible with NFS. However,
7861 * they are only available on new kernels. When we detect we
7862 * are running on an older kernel, then we fall back to good
7863 * old BSD locks. They also have nice semantics, but are
7864 * slightly problematic on NFS, where they are upgraded to
7865 * POSIX locks, even though locally they are orthogonal to
7875 .l_type = (operation & ~LOCK_NB) == LOCK_EX ? F_WRLCK : F_RDLCK,
7876 .l_whence = SEEK_SET,
7880 fd = open(p, O_CREAT|O_RDWR|O_NOFOLLOW|O_CLOEXEC|O_NOCTTY, 0600);
7884 r = fcntl(fd, (operation & LOCK_NB) ? F_OFD_SETLK : F_OFD_SETLKW, &fl);
7887 /* If the kernel is too old, use good old BSD locks */
7888 if (errno == EINVAL)
7889 r = flock(fd, operation);
7892 return errno == EAGAIN ? -EBUSY : -errno;
7895 /* If we acquired the lock, let's check if the file
7896 * still exists in the file system. If not, then the
7897 * previous exclusive owner removed it and then closed
7898 * it. In such a case our acquired lock is worthless,
7899 * hence try again. */
7904 if (st.st_nlink > 0)
7907 fd = safe_close(fd);
7912 ret->operation = operation;
/* Takes a lock for the file system object "p" through a separate lock file
 * placed next to it, and returns the result of make_lock_file().
 *
 * The lock file name is built on the stack: the part of "p" in front of "fn",
 * then ".#", then "fn", then ".lck". The buffer size strlen(p) + 2 + 4 + 1
 * covers the path, ".#", ".lck" and the trailing NUL. "fn" has to pass
 * filename_is_valid().
 *
 * NOTE(review): how "fn" is derived from "p" is not visible here (presumably
 * it points at the last path component), nor is the error code returned for
 * an invalid name. */
7920 int make_lock_file_for(const char *p, int operation, LockFile *ret) {
7928 if (!filename_is_valid(fn))
7931 t = newa(char, strlen(p) + 2 + 4 + 1);
7932 stpcpy(stpcpy(stpcpy(mempcpy(t, p, fn - p), ".#"), fn), ".lck");
7934 return make_lock_file(t, operation, ret);
/* Releases the lock described by "f".
 *
 * If the lock is held in shared mode (LOCK_SH, ignoring LOCK_NB) a
 * non-waiting upgrade to an exclusive lock is attempted with F_OFD_SETLK,
 * falling back to flock(LOCK_EX|LOCK_NB) when fcntl() reports EINVAL; on
 * success f->operation is updated accordingly. When the lock is exclusive the
 * lock file f->path is unlinked. Finally f->fd is closed.
 *
 * NOTE(review): the first half of the condition that guards the upgrade
 * attempt, and what else is reset in "f", are not visible here. */
7937 void release_lock_file(LockFile *f) {
7945 /* If we are the exclusive owner we can safely delete
7946 * the lock file itself. If we are not the exclusive
7947 * owner, we can try becoming it. */
7950 (f->operation & ~LOCK_NB) == LOCK_SH) {
7951 static const struct flock fl = {
7953 .l_whence = SEEK_SET,
7956 r = fcntl(f->fd, F_OFD_SETLK, &fl);
7957 if (r < 0 && errno == EINVAL)
7958 r = flock(f->fd, LOCK_EX|LOCK_NB);
7961 f->operation = LOCK_EX|LOCK_NB;
7964 if ((f->operation & ~LOCK_NB) == LOCK_EX)
7965 unlink_noerrno(f->path);
7971 f->fd = safe_close(f->fd);
/* Helper of sparse_write(), which calls it with the current position and the
 * number of bytes left in the buffer.
 * NOTE(review): the body is not visible here; presumably it returns the
 * number of consecutive NUL bytes at the start of "p", looking at no more
 * than "sz" bytes -- TODO confirm. */
7975 static size_t nul_length(const uint8_t *p, size_t sz) {
/* Writes the buffer "p" of "sz" bytes to "fd", skipping over runs of NUL
 * bytes with lseek(SEEK_CUR) instead of writing them.
 *
 * run_length: a NUL run is skipped when it is longer than this value; runs at
 *             the very beginning or reaching the end of the buffer are
 *             skipped regardless of their length.
 *
 * "w" marks the start of the data not yet written and "q" the current scan
 * position; pending data is flushed with write(fd, w, q - w). The success
 * return value is the distance of "q" from the start of the buffer.
 *
 * NOTE(review): the handling of failed or short write() calls and of a failed
 * lseek() is not visible here. */
7990 ssize_t sparse_write(int fd, const void *p, size_t sz, size_t run_length) {
7991 const uint8_t *q, *w, *e;
7999 n = nul_length(q, e - q);
8001 /* If there are more than the specified run length of
8002 * NUL bytes, or if this is the beginning or the end
8003 * of the buffer, then seek instead of write */
8004 if ((n > run_length) ||
8005 (n > 0 && q == p) ||
8006 (n > 0 && q + n >= e)) {
8008 l = write(fd, w, q - w);
8015 if (lseek(fd, n, SEEK_CUR) == (off_t) -1)
8027 l = write(fd, w, q - w);
8034 return q - (const uint8_t*) p;
/* Sends SIGKILL to the process "*pid" and, if the signal could be sent, waits
 * for that process to terminate with wait_for_terminate().
 *
 * kill() returns 0 on success and -1 on failure, never a positive value, so
 * success has to be tested with ">= 0". The previous "> 0" test was never
 * true, which meant the killed process was never waited for.
 *
 * NOTE(review): the guards on "pid" in front of the kill() call are not
 * visible here and are left untouched. */
8037 void sigkill_wait(pid_t *pid) {
8043 if (kill(*pid, SIGKILL) >= 0)
8044 (void) wait_for_terminate(*pid, NULL);
8047 int syslog_parse_priority(const char **p, int *priority, bool with_facility) {
8048 int a = 0, b = 0, c = 0;
8058 if (!strchr(*p, '>'))
8061 if ((*p)[2] == '>') {
8062 c = undecchar((*p)[1]);
8064 } else if ((*p)[3] == '>') {
8065 b = undecchar((*p)[1]);
8066 c = undecchar((*p)[2]);
8068 } else if ((*p)[4] == '>') {
8069 a = undecchar((*p)[1]);
8070 b = undecchar((*p)[2]);
8071 c = undecchar((*p)[3]);
8076 if (a < 0 || b < 0 || c < 0 ||
8077 (!with_facility && (a || b || c > 7)))
8081 *priority = a*100 + b*10 + c;
8083 *priority = (*priority & LOG_FACMASK) | c;