1 /*-*- Mode: C; c-basic-offset: 8; indent-tabs-mode: nil -*-*/
4 This file is part of systemd.
6 Copyright 2010 Lennart Poettering
8 systemd is free software; you can redistribute it and/or modify it
9 under the terms of the GNU Lesser General Public License as published by
10 the Free Software Foundation; either version 2.1 of the License, or
11 (at your option) any later version.
13 systemd is distributed in the hope that it will be useful, but
14 WITHOUT ANY WARRANTY; without even the implied warranty of
15 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
16 Lesser General Public License for more details.
18 You should have received a copy of the GNU Lesser General Public License
19 along with systemd; If not, see <http://www.gnu.org/licenses/>.
31 #include <sys/resource.h>
32 #include <linux/sched.h>
33 #include <sys/types.h>
37 #include <sys/ioctl.h>
39 #include <linux/tiocl.h>
44 #include <sys/prctl.h>
45 #include <sys/utsname.h>
47 #include <netinet/ip.h>
56 #include <sys/mount.h>
57 #include <linux/magic.h>
61 #include <sys/personality.h>
62 #include <sys/xattr.h>
64 #include <sys/statvfs.h>
69 #ifdef HAVE_SYS_AUXV_H
81 #include "path-util.h"
82 #include "exit-status.h"
86 #include "device-nodes.h"
91 #include "sparse-endian.h"
94 char **saved_argv = NULL;
96 static volatile unsigned cached_columns = 0;
97 static volatile unsigned cached_lines = 0;
99 size_t page_size(void) {
100 static thread_local size_t pgsz = 0;
103 if (_likely_(pgsz > 0))
106 r = sysconf(_SC_PAGESIZE);
113 bool streq_ptr(const char *a, const char *b) {
115 /* Like streq(), but tries to make sense of NULL pointers */
126 char* endswith(const char *s, const char *postfix) {
133 pl = strlen(postfix);
136 return (char*) s + sl;
141 if (memcmp(s + sl - pl, postfix, pl) != 0)
144 return (char*) s + sl - pl;
147 char* first_word(const char *s, const char *word) {
154 /* Checks if the string starts with the specified word, either
155 * followed by NUL or by whitespace. Returns a pointer to the
156 * NUL or the first character after the whitespace. */
167 if (memcmp(s, word, wl) != 0)
174 if (!strchr(WHITESPACE, *p))
177 p += strspn(p, WHITESPACE);
181 static size_t cescape_char(char c, char *buf) {
182 char * buf_old = buf;
228 /* For special chars we prefer octal over
229 * hexadecimal encoding, simply because glib's
230 * g_strescape() does the same */
231 if ((c < ' ') || (c >= 127)) {
233 *(buf++) = octchar((unsigned char) c >> 6);
234 *(buf++) = octchar((unsigned char) c >> 3);
235 *(buf++) = octchar((unsigned char) c);
241 return buf - buf_old;
244 int close_nointr(int fd) {
251 * Just ignore EINTR; a retry loop is the wrong thing to do on
254 * http://lkml.indiana.edu/hypermail/linux/kernel/0509.1/0877.html
255 * https://bugzilla.gnome.org/show_bug.cgi?id=682819
256 * http://utcc.utoronto.ca/~cks/space/blog/unix/CloseEINTR
257 * https://sites.google.com/site/michaelsafyan/software-engineering/checkforeintrwheninvokingclosethinkagain
265 int safe_close(int fd) {
268 * Like close_nointr() but cannot fail. Guarantees errno is
269 * unchanged. Is a NOP with negative fds passed, and returns
270 * -1, so that it can be used in this syntax:
272 * fd = safe_close(fd);
278 /* The kernel might return pretty much any error code
279 * via close(), but the fd will be closed anyway. The
280 * only condition we want to check for here is whether
281 * the fd was invalid at all... */
283 assert_se(close_nointr(fd) != -EBADF);
289 void close_many(const int fds[], unsigned n_fd) {
292 assert(fds || n_fd <= 0);
294 for (i = 0; i < n_fd; i++)
298 int unlink_noerrno(const char *path) {
309 int parse_boolean(const char *v) {
312 if (streq(v, "1") || strcaseeq(v, "yes") || strcaseeq(v, "y") || strcaseeq(v, "true") || strcaseeq(v, "t") || strcaseeq(v, "on"))
314 else if (streq(v, "0") || strcaseeq(v, "no") || strcaseeq(v, "n") || strcaseeq(v, "false") || strcaseeq(v, "f") || strcaseeq(v, "off"))
320 int parse_pid(const char *s, pid_t* ret_pid) {
321 unsigned long ul = 0;
328 r = safe_atolu(s, &ul);
334 if ((unsigned long) pid != ul)
344 int parse_uid(const char *s, uid_t* ret_uid) {
345 unsigned long ul = 0;
352 r = safe_atolu(s, &ul);
358 if ((unsigned long) uid != ul)
361 /* Some libc APIs use UID_INVALID as special placeholder */
362 if (uid == (uid_t) 0xFFFFFFFF)
365 /* A long time ago UIDs were 16bit, hence explicitly avoid the 16bit -1 too */
366 if (uid == (uid_t) 0xFFFF)
373 int safe_atou(const char *s, unsigned *ret_u) {
381 l = strtoul(s, &x, 0);
383 if (!x || x == s || *x || errno)
384 return errno > 0 ? -errno : -EINVAL;
386 if ((unsigned long) (unsigned) l != l)
389 *ret_u = (unsigned) l;
393 int safe_atoi(const char *s, int *ret_i) {
401 l = strtol(s, &x, 0);
403 if (!x || x == s || *x || errno)
404 return errno > 0 ? -errno : -EINVAL;
406 if ((long) (int) l != l)
413 int safe_atou8(const char *s, uint8_t *ret) {
421 l = strtoul(s, &x, 0);
423 if (!x || x == s || *x || errno)
424 return errno > 0 ? -errno : -EINVAL;
426 if ((unsigned long) (uint8_t) l != l)
433 int safe_atou16(const char *s, uint16_t *ret) {
441 l = strtoul(s, &x, 0);
443 if (!x || x == s || *x || errno)
444 return errno > 0 ? -errno : -EINVAL;
446 if ((unsigned long) (uint16_t) l != l)
453 int safe_atoi16(const char *s, int16_t *ret) {
461 l = strtol(s, &x, 0);
463 if (!x || x == s || *x || errno)
464 return errno > 0 ? -errno : -EINVAL;
466 if ((long) (int16_t) l != l)
473 int safe_atollu(const char *s, long long unsigned *ret_llu) {
475 unsigned long long l;
481 l = strtoull(s, &x, 0);
483 if (!x || x == s || *x || errno)
484 return errno ? -errno : -EINVAL;
490 int safe_atolli(const char *s, long long int *ret_lli) {
498 l = strtoll(s, &x, 0);
500 if (!x || x == s || *x || errno)
501 return errno ? -errno : -EINVAL;
507 int safe_atod(const char *s, double *ret_d) {
514 RUN_WITH_LOCALE(LC_NUMERIC_MASK, "C") {
519 if (!x || x == s || *x || errno)
520 return errno ? -errno : -EINVAL;
526 static size_t strcspn_escaped(const char *s, const char *reject) {
527 bool escaped = false;
530 for (n=0; s[n]; n++) {
533 else if (s[n] == '\\')
535 else if (strchr(reject, s[n]))
539 /* if s ends in \, return index of previous char */
543 /* Split a string into words. */
544 const char* split(const char **state, size_t *l, const char *separator, bool quoted) {
550 assert(**state == '\0');
554 current += strspn(current, separator);
560 if (quoted && strchr("\'\"", *current)) {
561 char quotechars[2] = {*current, '\0'};
563 *l = strcspn_escaped(current + 1, quotechars);
564 if (current[*l + 1] == '\0' ||
565 (current[*l + 2] && !strchr(separator, current[*l + 2]))) {
566 /* right quote missing or garbage at the end */
570 assert(current[*l + 1] == quotechars[0]);
571 *state = current++ + *l + 2;
573 *l = strcspn_escaped(current, separator);
574 if (current[*l] && !strchr(separator, current[*l])) {
575 /* unfinished escape */
579 *state = current + *l;
581 *l = strcspn(current, separator);
582 *state = current + *l;
588 int get_parent_of_pid(pid_t pid, pid_t *_ppid) {
590 _cleanup_free_ char *line = NULL;
602 p = procfs_file_alloca(pid, "stat");
603 r = read_one_line_file(p, &line);
607 /* Let's skip the pid and comm fields. The latter is enclosed
608 * in () but does not escape any () in its value, so let's
609 * skip over it manually */
611 p = strrchr(line, ')');
623 if ((long unsigned) (pid_t) ppid != ppid)
626 *_ppid = (pid_t) ppid;
631 int fchmod_umask(int fd, mode_t m) {
636 r = fchmod(fd, m & (~u)) < 0 ? -errno : 0;
642 char *truncate_nl(char *s) {
645 s[strcspn(s, NEWLINE)] = 0;
649 int get_process_state(pid_t pid) {
653 _cleanup_free_ char *line = NULL;
657 p = procfs_file_alloca(pid, "stat");
658 r = read_one_line_file(p, &line);
662 p = strrchr(line, ')');
668 if (sscanf(p, " %c", &state) != 1)
671 return (unsigned char) state;
674 int get_process_comm(pid_t pid, char **name) {
681 p = procfs_file_alloca(pid, "comm");
683 r = read_one_line_file(p, name);
690 int get_process_cmdline(pid_t pid, size_t max_length, bool comm_fallback, char **line) {
691 _cleanup_fclose_ FILE *f = NULL;
699 p = procfs_file_alloca(pid, "cmdline");
705 if (max_length == 0) {
706 size_t len = 0, allocated = 0;
708 while ((c = getc(f)) != EOF) {
710 if (!GREEDY_REALLOC(r, allocated, len+2)) {
715 r[len++] = isprint(c) ? c : ' ';
725 r = new(char, max_length);
731 while ((c = getc(f)) != EOF) {
753 size_t n = MIN(left-1, 3U);
760 /* Kernel threads have no argv[] */
762 _cleanup_free_ char *t = NULL;
770 h = get_process_comm(pid, &t);
774 r = strjoin("[", t, "]", NULL);
783 int is_kernel_thread(pid_t pid) {
795 p = procfs_file_alloca(pid, "cmdline");
800 count = fread(&c, 1, 1, f);
804 /* Kernel threads have an empty cmdline */
807 return eof ? 1 : -errno;
812 int get_process_capeff(pid_t pid, char **capeff) {
818 p = procfs_file_alloca(pid, "status");
820 return get_status_field(p, "\nCapEff:", capeff);
823 static int get_process_link_contents(const char *proc_file, char **name) {
829 r = readlink_malloc(proc_file, name);
831 return r == -ENOENT ? -ESRCH : r;
836 int get_process_exe(pid_t pid, char **name) {
843 p = procfs_file_alloca(pid, "exe");
844 r = get_process_link_contents(p, name);
848 d = endswith(*name, " (deleted)");
855 static int get_process_id(pid_t pid, const char *field, uid_t *uid) {
856 _cleanup_fclose_ FILE *f = NULL;
866 p = procfs_file_alloca(pid, "status");
871 FOREACH_LINE(line, f, return -errno) {
876 if (startswith(l, field)) {
878 l += strspn(l, WHITESPACE);
880 l[strcspn(l, WHITESPACE)] = 0;
882 return parse_uid(l, uid);
/* Looks up the "Uid:" field for process pid via get_process_id() and
 * stores the parsed value in *uid. The return value is passed through
 * unchanged from get_process_id(). */
889 int get_process_uid(pid_t pid, uid_t *uid) {
890 return get_process_id(pid, "Uid:", uid);
/* Looks up the "Gid:" field for process pid via get_process_id() and
 * stores the parsed value in *gid. The return value is passed through
 * unchanged from get_process_id(). */
893 int get_process_gid(pid_t pid, gid_t *gid) {
/* get_process_id() takes a uid_t pointer; the compile-time check makes
 * sure a gid_t has the same size before gid is handed to it. */
894 assert_cc(sizeof(uid_t) == sizeof(gid_t));
895 return get_process_id(pid, "Gid:", gid);
898 int get_process_cwd(pid_t pid, char **cwd) {
903 p = procfs_file_alloca(pid, "cwd");
905 return get_process_link_contents(p, cwd);
908 int get_process_root(pid_t pid, char **root) {
913 p = procfs_file_alloca(pid, "root");
915 return get_process_link_contents(p, root);
918 int get_process_environ(pid_t pid, char **env) {
919 _cleanup_fclose_ FILE *f = NULL;
920 _cleanup_free_ char *outcome = NULL;
923 size_t allocated = 0, sz = 0;
928 p = procfs_file_alloca(pid, "environ");
934 while ((c = fgetc(f)) != EOF) {
935 if (!GREEDY_REALLOC(outcome, allocated, sz + 5))
939 outcome[sz++] = '\n';
941 sz += cescape_char(c, outcome + sz);
951 char *strnappend(const char *s, const char *suffix, size_t b) {
959 return strndup(suffix, b);
968 if (b > ((size_t) -1) - a)
971 r = new(char, a+b+1);
976 memcpy(r+a, suffix, b);
/* Convenience wrapper around strnappend() that appends all of suffix to
 * s. A NULL suffix is passed on with a length of 0 instead of being
 * handed to strlen(). Returns whatever strnappend() returns. */
982 char *strappend(const char *s, const char *suffix) {
983 return strnappend(s, suffix, suffix ? strlen(suffix) : 0);
986 int readlinkat_malloc(int fd, const char *p, char **ret) {
1001 n = readlinkat(fd, p, c, l-1);
1008 if ((size_t) n < l-1) {
/* Same as readlinkat_malloc(), with AT_FDCWD as the directory fd, so a
 * relative p is resolved against the current working directory. The
 * result is stored in *ret and the return value is passed through. */
1019 int readlink_malloc(const char *p, char **ret) {
1020 return readlinkat_malloc(AT_FDCWD, p, ret);
1023 int readlink_value(const char *p, char **ret) {
1024 _cleanup_free_ char *link = NULL;
1028 r = readlink_malloc(p, &link);
1032 value = basename(link);
1036 value = strdup(value);
1045 int readlink_and_make_absolute(const char *p, char **r) {
1046 _cleanup_free_ char *target = NULL;
1053 j = readlink_malloc(p, &target);
1057 k = file_in_same_dir(p, target);
1065 int readlink_and_canonicalize(const char *p, char **r) {
1072 j = readlink_and_make_absolute(p, &t);
1076 s = canonicalize_file_name(t);
1083 path_kill_slashes(*r);
1088 int reset_all_signal_handlers(void) {
1091 for (sig = 1; sig < _NSIG; sig++) {
1092 struct sigaction sa = {
1093 .sa_handler = SIG_DFL,
1094 .sa_flags = SA_RESTART,
1097 /* These two cannot be caught... */
1098 if (sig == SIGKILL || sig == SIGSTOP)
1101 /* On Linux the first two RT signals are reserved by
1102 * glibc, and sigaction() will return EINVAL for them. */
1103 if ((sigaction(sig, &sa, NULL) < 0))
1104 if (errno != EINVAL && r == 0)
1111 int reset_signal_mask(void) {
1114 if (sigemptyset(&ss) < 0)
1117 if (sigprocmask(SIG_SETMASK, &ss, NULL) < 0)
1123 char *strstrip(char *s) {
1126 /* Drops leading and trailing whitespace. Modifies the string in
1127 * place. Returns pointer to first non-space character */
1129 s += strspn(s, WHITESPACE);
1131 for (e = strchr(s, 0); e > s; e --)
1132 if (!strchr(WHITESPACE, e[-1]))
1140 char *delete_chars(char *s, const char *bad) {
1143 /* Drops all characters listed in bad, regardless of where in the string they occur */
1145 for (f = s, t = s; *f; f++) {
1146 if (strchr(bad, *f))
1157 char *file_in_same_dir(const char *path, const char *filename) {
1164 /* This removes the last component of path and appends
1165 * filename, unless the latter is absolute anyway or the
1168 if (path_is_absolute(filename))
1169 return strdup(filename);
1171 e = strrchr(path, '/');
1173 return strdup(filename);
1175 k = strlen(filename);
1176 ret = new(char, (e + 1 - path) + k + 1);
1180 memcpy(mempcpy(ret, path, e + 1 - path), filename, k + 1);
1184 int rmdir_parents(const char *path, const char *stop) {
1193 /* Skip trailing slashes */
1194 while (l > 0 && path[l-1] == '/')
1200 /* Skip last component */
1201 while (l > 0 && path[l-1] != '/')
1204 /* Skip trailing slashes */
1205 while (l > 0 && path[l-1] == '/')
1211 if (!(t = strndup(path, l)))
1214 if (path_startswith(stop, t)) {
1223 if (errno != ENOENT)
/* Returns the lower-case hexadecimal digit for the low four bits of x;
 * all higher bits are ignored. */
1230 char hexchar(int x) {
/* Exactly 16 characters: the array has no room for a trailing NUL and
 * is only ever indexed, never used as a string. */
1231 static const char table[16] = "0123456789abcdef";
1233 return table[x & 15];
1236 int unhexchar(char c) {
1238 if (c >= '0' && c <= '9')
1241 if (c >= 'a' && c <= 'f')
1242 return c - 'a' + 10;
1244 if (c >= 'A' && c <= 'F')
1245 return c - 'A' + 10;
1250 char *hexmem(const void *p, size_t l) {
1254 z = r = malloc(l * 2 + 1);
1258 for (x = p; x < (const uint8_t*) p + l; x++) {
1259 *(z++) = hexchar(*x >> 4);
1260 *(z++) = hexchar(*x & 15);
1267 void *unhexmem(const char *p, size_t l) {
1273 z = r = malloc((l + 1) / 2 + 1);
1277 for (x = p; x < p + l; x += 2) {
1280 a = unhexchar(x[0]);
1282 b = unhexchar(x[1]);
1286 *(z++) = (uint8_t) a << 4 | (uint8_t) b;
/* Returns the octal digit character ('0'..'7') for the low three bits
 * of x; all higher bits are ignored. */
1293 char octchar(int x) {
1294 return '0' + (x & 7);
1297 int unoctchar(char c) {
1299 if (c >= '0' && c <= '7')
/* Returns the decimal digit character for x modulo 10. For negative x
 * the C remainder is zero or negative, so the result is only a digit
 * when x is non-negative (or a multiple of 10). */
1305 char decchar(int x) {
1306 return '0' + (x % 10);
1309 int undecchar(char c) {
1311 if (c >= '0' && c <= '9')
1317 char *cescape(const char *s) {
1323 /* Does C style string escaping. */
1325 r = new(char, strlen(s)*4 + 1);
1329 for (f = s, t = r; *f; f++)
1330 t += cescape_char(*f, t);
1337 char *cunescape_length_with_prefix(const char *s, size_t length, const char *prefix) {
1344 /* Undoes C style string escaping, and optionally prefixes it. */
1346 pl = prefix ? strlen(prefix) : 0;
1348 r = new(char, pl+length+1);
1353 memcpy(r, prefix, pl);
1355 for (f = s, t = r + pl; f < s + length; f++) {
1356 size_t remaining = s + length - f;
1357 assert(remaining > 0);
1359 if (*f != '\\') { /* a literal literal */
1364 if (--remaining == 0) { /* copy trailing backslash verbatim */
1405 /* This is an extension of the XDG syntax files */
1410 /* hexadecimal encoding */
1413 if (remaining >= 2) {
1414 a = unhexchar(f[1]);
1415 b = unhexchar(f[2]);
1418 if (a < 0 || b < 0 || (a == 0 && b == 0)) {
1419 /* Invalid escape code, let's take it literal then */
1423 *(t++) = (char) ((a << 4) | b);
1438 /* octal encoding */
1439 int a = -1, b = -1, c = -1;
1441 if (remaining >= 3) {
1442 a = unoctchar(f[0]);
1443 b = unoctchar(f[1]);
1444 c = unoctchar(f[2]);
1447 if (a < 0 || b < 0 || c < 0 || (a == 0 && b == 0 && c == 0)) {
1448 /* Invalid escape code, let's take it literal then */
1452 *(t++) = (char) ((a << 6) | (b << 3) | c);
1460 /* Invalid escape code, let's take it literal then */
/* Undoes C style escaping on the first length bytes of s, without
 * prepending anything: forwards to cunescape_length_with_prefix() with
 * a NULL prefix and returns its result. */
1471 char *cunescape_length(const char *s, size_t length) {
1472 return cunescape_length_with_prefix(s, length, NULL);
1475 char *cunescape(const char *s) {
1478 return cunescape_length(s, strlen(s));
1481 char *xescape(const char *s, const char *bad) {
1485 /* Escapes all chars in bad, in addition to \ and all special
1486 * chars, in \xFF style escaping. May be reversed with
1489 r = new(char, strlen(s) * 4 + 1);
1493 for (f = s, t = r; *f; f++) {
1495 if ((*f < ' ') || (*f >= 127) ||
1496 (*f == '\\') || strchr(bad, *f)) {
1499 *(t++) = hexchar(*f >> 4);
1500 *(t++) = hexchar(*f);
1510 char *ascii_strlower(char *t) {
1515 for (p = t; *p; p++)
1516 if (*p >= 'A' && *p <= 'Z')
1517 *p = *p - 'A' + 'a';
1522 _pure_ static bool hidden_file_allow_backup(const char *filename) {
1526 filename[0] == '.' ||
1527 streq(filename, "lost+found") ||
1528 streq(filename, "aquota.user") ||
1529 streq(filename, "aquota.group") ||
1530 endswith(filename, ".rpmnew") ||
1531 endswith(filename, ".rpmsave") ||
1532 endswith(filename, ".rpmorig") ||
1533 endswith(filename, ".dpkg-old") ||
1534 endswith(filename, ".dpkg-new") ||
1535 endswith(filename, ".dpkg-tmp") ||
1536 endswith(filename, ".swp");
1539 bool hidden_file(const char *filename) {
1542 if (endswith(filename, "~"))
1545 return hidden_file_allow_backup(filename);
1548 int fd_nonblock(int fd, bool nonblock) {
1553 flags = fcntl(fd, F_GETFL, 0);
1558 nflags = flags | O_NONBLOCK;
1560 nflags = flags & ~O_NONBLOCK;
1562 if (nflags == flags)
1565 if (fcntl(fd, F_SETFL, nflags) < 0)
1571 int fd_cloexec(int fd, bool cloexec) {
1576 flags = fcntl(fd, F_GETFD, 0);
1581 nflags = flags | FD_CLOEXEC;
1583 nflags = flags & ~FD_CLOEXEC;
1585 if (nflags == flags)
1588 if (fcntl(fd, F_SETFD, nflags) < 0)
1594 _pure_ static bool fd_in_set(int fd, const int fdset[], unsigned n_fdset) {
1597 assert(n_fdset == 0 || fdset);
1599 for (i = 0; i < n_fdset; i++)
1606 int close_all_fds(const int except[], unsigned n_except) {
1607 _cleanup_closedir_ DIR *d = NULL;
1611 assert(n_except == 0 || except);
1613 d = opendir("/proc/self/fd");
1618 /* When /proc isn't available (for example in chroots)
1619 * the fallback is brute forcing through the fd
1622 assert_se(getrlimit(RLIMIT_NOFILE, &rl) >= 0);
1623 for (fd = 3; fd < (int) rl.rlim_max; fd ++) {
1625 if (fd_in_set(fd, except, n_except))
1628 if (close_nointr(fd) < 0)
1629 if (errno != EBADF && r == 0)
1636 while ((de = readdir(d))) {
1639 if (hidden_file(de->d_name))
1642 if (safe_atoi(de->d_name, &fd) < 0)
1643 /* Let's better ignore this, just in case */
1652 if (fd_in_set(fd, except, n_except))
1655 if (close_nointr(fd) < 0) {
1656 /* Valgrind has its own FD and doesn't want to have it closed */
1657 if (errno != EBADF && r == 0)
1665 bool chars_intersect(const char *a, const char *b) {
1668 /* Returns true if any of the chars in a are in b. */
1669 for (p = a; *p; p++)
1676 bool fstype_is_network(const char *fstype) {
1677 static const char table[] =
1691 x = startswith(fstype, "fuse.");
1695 return nulstr_contains(table, fstype);
1699 _cleanup_close_ int fd;
1701 fd = open_terminal("/dev/tty0", O_RDWR|O_NOCTTY|O_CLOEXEC);
1707 TIOCL_GETKMSGREDIRECT,
1711 if (ioctl(fd, TIOCLINUX, tiocl) < 0)
1714 vt = tiocl[0] <= 0 ? 1 : tiocl[0];
1717 if (ioctl(fd, VT_ACTIVATE, vt) < 0)
1723 int read_one_char(FILE *f, char *ret, usec_t t, bool *need_nl) {
1724 struct termios old_termios, new_termios;
1725 char c, line[LINE_MAX];
1730 if (tcgetattr(fileno(f), &old_termios) >= 0) {
1731 new_termios = old_termios;
1733 new_termios.c_lflag &= ~ICANON;
1734 new_termios.c_cc[VMIN] = 1;
1735 new_termios.c_cc[VTIME] = 0;
1737 if (tcsetattr(fileno(f), TCSADRAIN, &new_termios) >= 0) {
1740 if (t != USEC_INFINITY) {
1741 if (fd_wait_for_event(fileno(f), POLLIN, t) <= 0) {
1742 tcsetattr(fileno(f), TCSADRAIN, &old_termios);
1747 k = fread(&c, 1, 1, f);
1749 tcsetattr(fileno(f), TCSADRAIN, &old_termios);
1755 *need_nl = c != '\n';
1762 if (t != USEC_INFINITY) {
1763 if (fd_wait_for_event(fileno(f), POLLIN, t) <= 0)
1768 if (!fgets(line, sizeof(line), f))
1769 return errno ? -errno : -EIO;
1773 if (strlen(line) != 1)
1783 int ask_char(char *ret, const char *replies, const char *text, ...) {
1793 bool need_nl = true;
1796 fputs(ANSI_HIGHLIGHT_ON, stdout);
1803 fputs(ANSI_HIGHLIGHT_OFF, stdout);
1807 r = read_one_char(stdin, &c, USEC_INFINITY, &need_nl);
1810 if (r == -EBADMSG) {
1811 puts("Bad input, please try again.");
1822 if (strchr(replies, c)) {
1827 puts("Read unexpected character, please try again.");
1831 int ask_string(char **ret, const char *text, ...) {
1836 char line[LINE_MAX];
1840 fputs(ANSI_HIGHLIGHT_ON, stdout);
1847 fputs(ANSI_HIGHLIGHT_OFF, stdout);
1852 if (!fgets(line, sizeof(line), stdin))
1853 return errno ? -errno : -EIO;
1855 if (!endswith(line, "\n"))
/* Brings the terminal referred to by fd into a known state: issues the
 * TIOCNXCL, KDSETMODE (KD_TEXT) and KDSKBMODE (K_UNICODE) ioctls without
 * checking their results, then reads the current termios settings,
 * rewrites the input/output/control/local flags and the control
 * characters, applies them with tcsetattr(TCSANOW) and finally discards
 * pending input and output with tcflush().
 *
 * NOTE(review): the statement that makes the KDSETMODE call conditional
 * on switch_to_text and the error-return paths are not visible in this
 * excerpt -- confirm against the full function. */
1874 int reset_terminal_fd(int fd, bool switch_to_text) {
1875 struct termios termios;
1878 /* Set terminal to some sane defaults */
1882 /* We leave locked terminal attributes untouched, so that
1883 * Plymouth may set whatever it wants to set, and we don't
1884 * interfere with that. */
1886 /* Disable exclusive mode, just in case */
1887 ioctl(fd, TIOCNXCL);
1889 /* Switch to text mode */
1891 ioctl(fd, KDSETMODE, KD_TEXT);
1893 /* Enable console unicode mode */
1894 ioctl(fd, KDSKBMODE, K_UNICODE);
1896 if (tcgetattr(fd, &termios) < 0) {
1901 /* We only reset the stuff that matters to the software. How
1902 * hardware is set up we don't touch assuming that somebody
1903 * else will do that for us */
1905 termios.c_iflag &= ~(IGNBRK | BRKINT | ISTRIP | INLCR | IGNCR | IUCLC);
1906 termios.c_iflag |= ICRNL | IMAXBEL | IUTF8;
1907 termios.c_oflag |= ONLCR;
1908 termios.c_cflag |= CREAD;
1909 termios.c_lflag = ISIG | ICANON | IEXTEN | ECHO | ECHOE | ECHOK | ECHOCTL | ECHOPRT | ECHOKE;
1911 termios.c_cc[VINTR] = 03; /* ^C */
1912 termios.c_cc[VQUIT] = 034; /* ^\ */
1913 termios.c_cc[VERASE] = 0177; /* ^? (DEL) */
1914 termios.c_cc[VKILL] = 025; /* ^U */
1915 termios.c_cc[VEOF] = 04; /* ^D */
1916 termios.c_cc[VSTART] = 021; /* ^Q */
1917 termios.c_cc[VSTOP] = 023; /* ^S */
1918 termios.c_cc[VSUSP] = 032; /* ^Z */
1919 termios.c_cc[VLNEXT] = 026; /* ^V */
1920 termios.c_cc[VWERASE] = 027; /* ^W */
1921 termios.c_cc[VREPRINT] = 022; /* ^R */
1922 termios.c_cc[VEOL] = 0;
1923 termios.c_cc[VEOL2] = 0;
1925 termios.c_cc[VTIME] = 0;
1926 termios.c_cc[VMIN] = 1;
1928 if (tcsetattr(fd, TCSANOW, &termios) < 0)
1932 /* Just in case, flush all crap out */
1933 tcflush(fd, TCIOFLUSH);
1938 int reset_terminal(const char *name) {
1939 _cleanup_close_ int fd = -1;
1941 fd = open_terminal(name, O_RDWR|O_NOCTTY|O_CLOEXEC);
1945 return reset_terminal_fd(fd, true);
1948 int open_terminal(const char *name, int mode) {
1953 * If a TTY is in the process of being closed opening it might
1954 * cause EIO. This is horribly awful, but unlikely to be
1955 * changed in the kernel. Hence we work around this problem by
1956 * retrying a couple of times.
1958 * https://bugs.launchpad.net/ubuntu/+source/linux/+bug/554172/comments/245
1961 assert(!(mode & O_CREAT));
1964 fd = open(name, mode, 0);
1971 /* Max 1s in total */
1975 usleep(50 * USEC_PER_MSEC);
1993 int flush_fd(int fd) {
1994 struct pollfd pollfd = {
2004 r = poll(&pollfd, 1, 0);
2014 l = read(fd, buf, sizeof(buf));
2020 if (errno == EAGAIN)
2029 int acquire_terminal(
2033 bool ignore_tiocstty_eperm,
2036 int fd = -1, notify = -1, r = 0, wd = -1;
2041 /* We use inotify to be notified when the tty is closed. We
2042 * create the watch before checking if we can actually acquire
2043 * it, so that we don't lose any event.
2045 * Note: strictly speaking this actually watches for the
2046 * device being closed, it does *not* really watch whether a
2047 * tty loses its controlling process. However, unless some
2048 * rogue process uses TIOCNOTTY on /dev/tty *after* closing
2049 * its tty otherwise this will not become a problem. As long
2050 * as the administrator makes sure not to configure any service
2051 * on the same tty as an untrusted user this should not be a
2052 * problem. (Which he probably should not do anyway.) */
2054 if (timeout != USEC_INFINITY)
2055 ts = now(CLOCK_MONOTONIC);
2057 if (!fail && !force) {
2058 notify = inotify_init1(IN_CLOEXEC | (timeout != USEC_INFINITY ? IN_NONBLOCK : 0));
2064 wd = inotify_add_watch(notify, name, IN_CLOSE);
2072 struct sigaction sa_old, sa_new = {
2073 .sa_handler = SIG_IGN,
2074 .sa_flags = SA_RESTART,
2078 r = flush_fd(notify);
2083 /* We pass here O_NOCTTY only so that we can check the return
2084 * value TIOCSCTTY and have a reliable way to figure out if we
2085 * successfully became the controlling process of the tty */
2086 fd = open_terminal(name, O_RDWR|O_NOCTTY|O_CLOEXEC);
2090 /* Temporarily ignore SIGHUP, so that we don't get SIGHUP'ed
2091 * if we already own the tty. */
2092 assert_se(sigaction(SIGHUP, &sa_new, &sa_old) == 0);
2094 /* First, try to get the tty */
2095 if (ioctl(fd, TIOCSCTTY, force) < 0)
2098 assert_se(sigaction(SIGHUP, &sa_old, NULL) == 0);
2100 /* Sometimes it makes sense to ignore TIOCSCTTY
2101 * returning EPERM, i.e. when very likely we already
2102 * have this controlling terminal. */
2103 if (r < 0 && r == -EPERM && ignore_tiocstty_eperm)
2106 if (r < 0 && (force || fail || r != -EPERM)) {
2115 assert(notify >= 0);
2118 union inotify_event_buffer buffer;
2119 struct inotify_event *e;
2122 if (timeout != USEC_INFINITY) {
2125 n = now(CLOCK_MONOTONIC);
2126 if (ts + timeout < n) {
2131 r = fd_wait_for_event(fd, POLLIN, ts + timeout - n);
2141 l = read(notify, &buffer, sizeof(buffer));
2143 if (errno == EINTR || errno == EAGAIN)
2150 FOREACH_INOTIFY_EVENT(e, buffer, l) {
2151 if (e->wd != wd || !(e->mask & IN_CLOSE)) {
2160 /* We close the tty fd here since if the old session
2161 * ended our handle will be dead. It's important that
2162 * we do this after sleeping, so that we don't enter
2163 * an endless loop. */
2164 fd = safe_close(fd);
2169 r = reset_terminal_fd(fd, true);
2171 log_warning_errno(r, "Failed to reset terminal: %m");
2182 int release_terminal(void) {
2183 static const struct sigaction sa_new = {
2184 .sa_handler = SIG_IGN,
2185 .sa_flags = SA_RESTART,
2188 _cleanup_close_ int fd = -1;
2189 struct sigaction sa_old;
2192 fd = open("/dev/tty", O_RDWR|O_NOCTTY|O_NDELAY|O_CLOEXEC);
2196 /* Temporarily ignore SIGHUP, so that we don't get SIGHUP'ed
2197 * by our own TIOCNOTTY */
2198 assert_se(sigaction(SIGHUP, &sa_new, &sa_old) == 0);
2200 if (ioctl(fd, TIOCNOTTY) < 0)
2203 assert_se(sigaction(SIGHUP, &sa_old, NULL) == 0);
2208 int sigaction_many(const struct sigaction *sa, ...) {
2213 while ((sig = va_arg(ap, int)) > 0)
2214 if (sigaction(sig, sa, NULL) < 0)
2221 int ignore_signals(int sig, ...) {
2222 struct sigaction sa = {
2223 .sa_handler = SIG_IGN,
2224 .sa_flags = SA_RESTART,
2229 if (sigaction(sig, &sa, NULL) < 0)
2233 while ((sig = va_arg(ap, int)) > 0)
2234 if (sigaction(sig, &sa, NULL) < 0)
2241 int default_signals(int sig, ...) {
2242 struct sigaction sa = {
2243 .sa_handler = SIG_DFL,
2244 .sa_flags = SA_RESTART,
2249 if (sigaction(sig, &sa, NULL) < 0)
2253 while ((sig = va_arg(ap, int)) > 0)
2254 if (sigaction(sig, &sa, NULL) < 0)
2261 void safe_close_pair(int p[]) {
2265 /* Special case pairs which use the same fd in both
2267 p[0] = p[1] = safe_close(p[0]);
2271 p[0] = safe_close(p[0]);
2272 p[1] = safe_close(p[1]);
2275 ssize_t loop_read(int fd, void *buf, size_t nbytes, bool do_poll) {
2282 while (nbytes > 0) {
2285 k = read(fd, p, nbytes);
2290 if (errno == EAGAIN && do_poll) {
2292 /* We knowingly ignore any return value here,
2293 * and expect that any error/EOF is reported
2296 fd_wait_for_event(fd, POLLIN, USEC_INFINITY);
2300 return n > 0 ? n : -errno;
2314 int loop_write(int fd, const void *buf, size_t nbytes, bool do_poll) {
2315 const uint8_t *p = buf;
2322 while (nbytes > 0) {
2325 k = write(fd, p, nbytes);
2330 if (errno == EAGAIN && do_poll) {
2331 /* We knowingly ignore any return value here,
2332 * and expect that any error/EOF is reported
2335 fd_wait_for_event(fd, POLLOUT, USEC_INFINITY);
2342 if (k == 0) /* Can't really happen */
2352 int parse_size(const char *t, off_t base, off_t *size) {
2354 /* So, sometimes we want to parse IEC binary suffixes, and
2355 * sometimes SI decimal suffixes. This function can parse
2356 * both. Which one is the right way depends on the
2357 * context. Wikipedia suggests that SI is customary for
2358 * hardware metrics and network speeds, while IEC is
2359 * customary for most data sizes used by software and volatile
2360 * (RAM) memory. Hence be careful which one you pick!
2362 * In either case we use just K, M, G as suffix, and not Ki,
2363 * Mi, Gi or so (as IEC would suggest). That's because that's
2364 * frickin' ugly. But this means you really need to make sure
2365 * to document which base you are parsing when you use this
2370 unsigned long long factor;
2373 static const struct table iec[] = {
2374 { "E", 1024ULL*1024ULL*1024ULL*1024ULL*1024ULL*1024ULL },
2375 { "P", 1024ULL*1024ULL*1024ULL*1024ULL*1024ULL },
2376 { "T", 1024ULL*1024ULL*1024ULL*1024ULL },
2377 { "G", 1024ULL*1024ULL*1024ULL },
2378 { "M", 1024ULL*1024ULL },
2384 static const struct table si[] = {
2385 { "E", 1000ULL*1000ULL*1000ULL*1000ULL*1000ULL*1000ULL },
2386 { "P", 1000ULL*1000ULL*1000ULL*1000ULL*1000ULL },
2387 { "T", 1000ULL*1000ULL*1000ULL*1000ULL },
2388 { "G", 1000ULL*1000ULL*1000ULL },
2389 { "M", 1000ULL*1000ULL },
2395 const struct table *table;
2397 unsigned long long r = 0;
2398 unsigned n_entries, start_pos = 0;
2401 assert(base == 1000 || base == 1024);
2406 n_entries = ELEMENTSOF(si);
2409 n_entries = ELEMENTSOF(iec);
2415 unsigned long long l2;
2421 l = strtoll(p, &e, 10);
2434 if (*e >= '0' && *e <= '9') {
2437 /* strtoull itself would accept space/+/- */
2438 l2 = strtoull(e, &e2, 10);
2440 if (errno == ERANGE)
2443 /* Ignore failure. E.g. 10.M is valid */
2450 e += strspn(e, WHITESPACE);
2452 for (i = start_pos; i < n_entries; i++)
2453 if (startswith(e, table[i].suffix)) {
2454 unsigned long long tmp;
2455 if ((unsigned long long) l + (frac > 0) > ULLONG_MAX / table[i].factor)
2457 tmp = l * table[i].factor + (unsigned long long) (frac * table[i].factor);
2458 if (tmp > ULLONG_MAX - r)
2462 if ((unsigned long long) (off_t) r != r)
2465 p = e + strlen(table[i].suffix);
2481 int make_stdio(int fd) {
2486 r = dup2(fd, STDIN_FILENO);
2487 s = dup2(fd, STDOUT_FILENO);
2488 t = dup2(fd, STDERR_FILENO);
2493 if (r < 0 || s < 0 || t < 0)
2496 /* Explicitly unset O_CLOEXEC, since if fd was < 3, then
2497 * dup2() was a NOP and the bit hence possibly set. */
2498 fd_cloexec(STDIN_FILENO, false);
2499 fd_cloexec(STDOUT_FILENO, false);
2500 fd_cloexec(STDERR_FILENO, false);
2505 int make_null_stdio(void) {
2508 null_fd = open("/dev/null", O_RDWR|O_NOCTTY);
2512 return make_stdio(null_fd);
2515 bool is_device_path(const char *path) {
2517 /* Returns true on paths that refer to a device, either in
2518 * sysfs or in /dev */
2521 path_startswith(path, "/dev/") ||
2522 path_startswith(path, "/sys/");
2525 int dir_is_empty(const char *path) {
2526 _cleanup_closedir_ DIR *d;
2537 if (!de && errno != 0)
2543 if (!hidden_file(de->d_name))
2548 char* dirname_malloc(const char *path) {
2549 char *d, *dir, *dir2;
2566 int dev_urandom(void *p, size_t n) {
2567 static int have_syscall = -1;
2571 /* Gathers some randomness from the kernel. This call will
2572 * never block, and will always return some data from the
2573 * kernel, regardless if the random pool is fully initialized
2574 * or not. It thus makes no guarantee for the quality of the
2575 * returned entropy, but is good enough for our usual use cases
2576 * of seeding the hash functions for hashtable */
2578 /* Use the getrandom() syscall unless we know we don't have
2579 * it, or when the requested size is too large for it. */
2580 if (have_syscall != 0 || (size_t) (int) n != n) {
2581 r = getrandom(p, n, GRND_NONBLOCK);
2583 have_syscall = true;
2588 if (errno == ENOSYS)
2589 /* we lack the syscall, continue with
2590 * reading from /dev/urandom */
2591 have_syscall = false;
2592 else if (errno == EAGAIN)
2593 /* not enough entropy for now. Let's
2594 * remember to use the syscall the
2595 * next time, again, but also read
2596 * from /dev/urandom for now, which
2597 * doesn't care about the current
2598 * amount of entropy. */
2599 have_syscall = true;
2603 /* too short read? */
2607 fd = open("/dev/urandom", O_RDONLY|O_CLOEXEC|O_NOCTTY);
2609 return errno == ENOENT ? -ENOSYS : -errno;
2611 k = loop_read(fd, p, n, true);
2616 if ((size_t) k != n)
2622 void initialize_srand(void) {
2623 static bool srand_called = false;
2625 #ifdef HAVE_SYS_AUXV_H
2634 #ifdef HAVE_SYS_AUXV_H
2635 /* The kernel provides us with a bit of entropy in auxv, so
2636 * let's try to make use of that to seed the pseudo-random
2637 * generator. It's better than nothing... */
2639 auxv = (void*) getauxval(AT_RANDOM);
2641 x ^= *(unsigned*) auxv;
2644 x ^= (unsigned) now(CLOCK_REALTIME);
2645 x ^= (unsigned) gettid();
2648 srand_called = true;
2651 void random_bytes(void *p, size_t n) {
2655 r = dev_urandom(p, n);
2659 /* If /dev/urandom has been made unavailable to us, fall
2660 * back to a PRNG instead. */
2664 for (q = p; q < (uint8_t*) p + n; q ++)
2668 void rename_process(const char name[8]) {
2671 /* This is like a poor man's setproctitle(). It changes the
2672 * comm field, argv[0], and also the glibc's internally used
2673 * name of the process. For the first one a limit of 16 chars
2674 * applies, to the second one usually one of 10 (i.e. length
2675 * of "/sbin/init"), to the third one one of 7 (i.e. length of
2676 * "systemd"). If you pass a longer string it will be
2679 prctl(PR_SET_NAME, name);
2681 if (program_invocation_name)
2682 strncpy(program_invocation_name, name, strlen(program_invocation_name));
2684 if (saved_argc > 0) {
2688 strncpy(saved_argv[0], name, strlen(saved_argv[0]));
2690 for (i = 1; i < saved_argc; i++) {
2694 memzero(saved_argv[i], strlen(saved_argv[i]));
2699 void sigset_add_many(sigset_t *ss, ...) {
2706 while ((sig = va_arg(ap, int)) > 0)
2707 assert_se(sigaddset(ss, sig) == 0);
2711 int sigprocmask_many(int how, ...) {
2716 assert_se(sigemptyset(&ss) == 0);
2719 while ((sig = va_arg(ap, int)) > 0)
2720 assert_se(sigaddset(&ss, sig) == 0);
2723 if (sigprocmask(how, &ss, NULL) < 0)
/* Returns a newly allocated copy (strdup()) of the node name reported
 * by uname(). If the node name is empty or the literal "(none)", a
 * copy of the uname() sysname field is returned instead. */
2729 char* gethostname_malloc(void) {
2732 assert_se(uname(&u) >= 0);
2734 if (!isempty(u.nodename) && !streq(u.nodename, "(none)"))
2735 return strdup(u.nodename);
2737 return strdup(u.sysname);
/* Returns true if the node name reported by uname() is non-empty and
 * is not the literal string "(none)". */
2740 bool hostname_is_set(void) {
2743 assert_se(uname(&u) >= 0);
2745 return !isempty(u.nodename) && !streq(u.nodename, "(none)");
2748 char *lookup_uid(uid_t uid) {
2751 _cleanup_free_ char *buf = NULL;
2752 struct passwd pwbuf, *pw = NULL;
2754 /* Shortcut things to avoid NSS lookups */
2756 return strdup("root");
2758 bufsize = sysconf(_SC_GETPW_R_SIZE_MAX);
2762 buf = malloc(bufsize);
2766 if (getpwuid_r(uid, &pwbuf, buf, bufsize, &pw) == 0 && pw)
2767 return strdup(pw->pw_name);
2769 if (asprintf(&name, UID_FMT, uid) < 0)
2775 char* getlogname_malloc(void) {
2779 if (isatty(STDIN_FILENO) && fstat(STDIN_FILENO, &st) >= 0)
2784 return lookup_uid(uid);
2787 char *getusername_malloc(void) {
2794 return lookup_uid(getuid());
2797 int getttyname_malloc(int fd, char **ret) {
2807 r = ttyname_r(fd, path, sizeof(path));
2812 p = startswith(path, "/dev/");
2813 c = strdup(p ?: path);
2830 int getttyname_harder(int fd, char **r) {
2834 k = getttyname_malloc(fd, &s);
2838 if (streq(s, "tty")) {
2840 return get_ctty(0, NULL, r);
2847 int get_ctty_devnr(pid_t pid, dev_t *d) {
2849 _cleanup_free_ char *line = NULL;
2851 unsigned long ttynr;
2855 p = procfs_file_alloca(pid, "stat");
2856 r = read_one_line_file(p, &line);
2860 p = strrchr(line, ')');
2870 "%*d " /* session */
2875 if (major(ttynr) == 0 && minor(ttynr) == 0)
2884 int get_ctty(pid_t pid, dev_t *_devnr, char **r) {
2885 char fn[sizeof("/dev/char/")-1 + 2*DECIMAL_STR_MAX(unsigned) + 1 + 1], *b = NULL;
2886 _cleanup_free_ char *s = NULL;
2893 k = get_ctty_devnr(pid, &devnr);
2897 sprintf(fn, "/dev/char/%u:%u", major(devnr), minor(devnr));
2899 k = readlink_malloc(fn, &s);
2905 /* This is an ugly hack */
2906 if (major(devnr) == 136) {
2907 asprintf(&b, "pts/%u", minor(devnr));
2911 /* Probably something like the ptys which have no
2912 * symlink in /dev/char. Let's return something
2913 * vaguely useful. */
2919 if (startswith(s, "/dev/"))
2921 else if (startswith(s, "../"))
2939 int rm_rf_children_dangerous(int fd, bool only_dirs, bool honour_sticky, struct stat *root_dev) {
2940 _cleanup_closedir_ DIR *d = NULL;
2945 /* This returns the first error we run into, but nevertheless
2946 * tries to go on. This closes the passed fd. */
2952 return errno == ENOENT ? 0 : -errno;
2957 bool is_dir, keep_around;
2964 if (errno != 0 && ret == 0)
2969 if (streq(de->d_name, ".") || streq(de->d_name, ".."))
2972 if (de->d_type == DT_UNKNOWN ||
2974 (de->d_type == DT_DIR && root_dev)) {
2975 if (fstatat(fd, de->d_name, &st, AT_SYMLINK_NOFOLLOW) < 0) {
2976 if (ret == 0 && errno != ENOENT)
2981 is_dir = S_ISDIR(st.st_mode);
2984 (st.st_uid == 0 || st.st_uid == getuid()) &&
2985 (st.st_mode & S_ISVTX);
2987 is_dir = de->d_type == DT_DIR;
2988 keep_around = false;
2994 /* if root_dev is set, remove subdirectories only, if device is same as dir */
2995 if (root_dev && st.st_dev != root_dev->st_dev)
2998 subdir_fd = openat(fd, de->d_name,
2999 O_RDONLY|O_NONBLOCK|O_DIRECTORY|O_CLOEXEC|O_NOFOLLOW|O_NOATIME);
3000 if (subdir_fd < 0) {
3001 if (ret == 0 && errno != ENOENT)
3006 r = rm_rf_children_dangerous(subdir_fd, only_dirs, honour_sticky, root_dev);
3007 if (r < 0 && ret == 0)
3011 if (unlinkat(fd, de->d_name, AT_REMOVEDIR) < 0) {
3012 if (ret == 0 && errno != ENOENT)
3016 } else if (!only_dirs && !keep_around) {
3018 if (unlinkat(fd, de->d_name, 0) < 0) {
3019 if (ret == 0 && errno != ENOENT)
/* Returns non-zero if the file system type recorded in *s is tmpfs
 * (TMPFS_MAGIC) or ramfs (RAMFS_MAGIC). */
3026 _pure_ static int is_temporary_fs(struct statfs *s) {
3029 return F_TYPE_EQUAL(s->f_type, TMPFS_MAGIC) ||
3030 F_TYPE_EQUAL(s->f_type, RAMFS_MAGIC);
/* Queries the file system backing fd with fstatfs() and reports via
 * is_temporary_fs() whether it is tmpfs or ramfs. */
3033 int is_fd_on_temporary_fs(int fd) {
3036 if (fstatfs(fd, &s) < 0)
3039 return is_temporary_fs(&s);
3042 int rm_rf_children(int fd, bool only_dirs, bool honour_sticky, struct stat *root_dev) {
3047 if (fstatfs(fd, &s) < 0) {
3052 /* We refuse to clean disk file systems with this call. This
3053 * is extra paranoia just to be sure we never ever remove
3055 if (!is_temporary_fs(&s)) {
3056 log_error("Attempted to remove disk file system, and we can't allow that.");
3061 return rm_rf_children_dangerous(fd, only_dirs, honour_sticky, root_dev);
3064 static int file_is_priv_sticky(const char *p) {
3069 if (lstat(p, &st) < 0)
3073 (st.st_uid == 0 || st.st_uid == getuid()) &&
3074 (st.st_mode & S_ISVTX);
3077 static int rm_rf_internal(const char *path, bool only_dirs, bool delete_root, bool honour_sticky, bool dangerous) {
3083 /* We refuse to clean the root file system with this
3084 * call. This is extra paranoia to never cause a really
3085 * seriously broken system. */
3086 if (path_equal(path, "/")) {
3087 log_error("Attempted to remove entire root file system, and we can't allow that.");
3091 fd = open(path, O_RDONLY|O_NONBLOCK|O_DIRECTORY|O_CLOEXEC|O_NOFOLLOW|O_NOATIME);
3094 if (errno != ENOTDIR && errno != ELOOP)
3098 if (statfs(path, &s) < 0)
3101 if (!is_temporary_fs(&s)) {
3102 log_error("Attempted to remove disk file system, and we can't allow that.");
3107 if (delete_root && !only_dirs)
3108 if (unlink(path) < 0 && errno != ENOENT)
3115 if (fstatfs(fd, &s) < 0) {
3120 if (!is_temporary_fs(&s)) {
3121 log_error("Attempted to remove disk file system, and we can't allow that.");
3127 r = rm_rf_children_dangerous(fd, only_dirs, honour_sticky, NULL);
3130 if (honour_sticky && file_is_priv_sticky(path) > 0)
3133 if (rmdir(path) < 0 && errno != ENOENT) {
/* Thin wrapper: forwards all arguments to rm_rf_internal() with its
 * final "dangerous" parameter set to false. */
3142 int rm_rf(const char *path, bool only_dirs, bool delete_root, bool honour_sticky) {
3143 return rm_rf_internal(path, only_dirs, delete_root, honour_sticky, false);
/* Thin wrapper: forwards all arguments to rm_rf_internal() with its
 * final "dangerous" parameter set to true. */
3146 int rm_rf_dangerous(const char *path, bool only_dirs, bool delete_root, bool honour_sticky) {
3147 return rm_rf_internal(path, only_dirs, delete_root, honour_sticky, true);
3150 int chmod_and_chown(const char *path, mode_t mode, uid_t uid, gid_t gid) {
3153 /* Under the assumption that we are running privileged we
3154 * first change the access mode and only then hand out
3155 * ownership to avoid a window where access is too open. */
3157 if (mode != MODE_INVALID)
3158 if (chmod(path, mode) < 0)
3161 if (uid != UID_INVALID || gid != GID_INVALID)
3162 if (chown(path, uid, gid) < 0)
3168 int fchmod_and_fchown(int fd, mode_t mode, uid_t uid, gid_t gid) {
3171 /* Under the assumption that we are running privileged we
3172 * first change the access mode and only then hand out
3173 * ownership to avoid a window where access is too open. */
3175 if (mode != MODE_INVALID)
3176 if (fchmod(fd, mode) < 0)
3179 if (uid != UID_INVALID || gid != GID_INVALID)
3180 if (fchown(fd, uid, gid) < 0)
3186 cpu_set_t* cpu_set_malloc(unsigned *ncpus) {
3190 /* Allocates the cpuset in the right size */
3193 if (!(r = CPU_ALLOC(n)))
3196 if (sched_getaffinity(0, CPU_ALLOC_SIZE(n), r) >= 0) {
3197 CPU_ZERO_S(CPU_ALLOC_SIZE(n), r);
3207 if (errno != EINVAL)
3214 int status_vprintf(const char *status, bool ellipse, bool ephemeral, const char *format, va_list ap) {
3215 static const char status_indent[] = " "; /* "[" STATUS "] " */
3216 _cleanup_free_ char *s = NULL;
3217 _cleanup_close_ int fd = -1;
3218 struct iovec iovec[6] = {};
3220 static bool prev_ephemeral;
3224 /* This is independent of logging, as status messages are
3225 * optional and go exclusively to the console. */
3227 if (vasprintf(&s, format, ap) < 0)
3230 fd = open_terminal("/dev/console", O_WRONLY|O_NOCTTY|O_CLOEXEC);
3243 sl = status ? sizeof(status_indent)-1 : 0;
3249 e = ellipsize(s, emax, 50);
3257 IOVEC_SET_STRING(iovec[n++], "\r" ANSI_ERASE_TO_END_OF_LINE);
3258 prev_ephemeral = ephemeral;
3261 if (!isempty(status)) {
3262 IOVEC_SET_STRING(iovec[n++], "[");
3263 IOVEC_SET_STRING(iovec[n++], status);
3264 IOVEC_SET_STRING(iovec[n++], "] ");
3266 IOVEC_SET_STRING(iovec[n++], status_indent);
3269 IOVEC_SET_STRING(iovec[n++], s);
3271 IOVEC_SET_STRING(iovec[n++], "\n");
3273 if (writev(fd, iovec, n) < 0)
3279 int status_printf(const char *status, bool ellipse, bool ephemeral, const char *format, ...) {
3285 va_start(ap, format);
3286 r = status_vprintf(status, ellipse, ephemeral, format, ap);
3292 char *replace_env(const char *format, char **env) {
3299 const char *e, *word = format;
3304 for (e = format; *e; e ++) {
3315 k = strnappend(r, word, e-word-1);
3325 } else if (*e == '$') {
3326 k = strnappend(r, word, e-word);
3343 t = strempty(strv_env_get_n(env, word+2, e-word-2));
3345 k = strappend(r, t);
3359 k = strnappend(r, word, e-word);
3371 char **replace_env_argv(char **argv, char **env) {
3373 unsigned k = 0, l = 0;
3375 l = strv_length(argv);
3377 ret = new(char*, l+1);
3381 STRV_FOREACH(i, argv) {
3383 /* If $FOO appears as single word, replace it by the split up variable */
3384 if ((*i)[0] == '$' && (*i)[1] != '{') {
3389 e = strv_env_get(env, *i+1);
3393 r = strv_split_quoted(&m, e, true);
3405 w = realloc(ret, sizeof(char*) * (l+1));
3415 memcpy(ret + k, m, q * sizeof(char*));
3423 /* If ${FOO} appears as part of a word, replace it by the variable as-is */
3424 ret[k] = replace_env(*i, env);
3436 int fd_columns(int fd) {
3437 struct winsize ws = {};
3439 if (ioctl(fd, TIOCGWINSZ, &ws) < 0)
3448 unsigned columns(void) {
3452 if (_likely_(cached_columns > 0))
3453 return cached_columns;
3456 e = getenv("COLUMNS");
3458 (void) safe_atoi(e, &c);
3461 c = fd_columns(STDOUT_FILENO);
3467 return cached_columns;
3470 int fd_lines(int fd) {
3471 struct winsize ws = {};
3473 if (ioctl(fd, TIOCGWINSZ, &ws) < 0)
3482 unsigned lines(void) {
3486 if (_likely_(cached_lines > 0))
3487 return cached_lines;
3490 e = getenv("LINES");
3492 (void) safe_atoi(e, &l);
3495 l = fd_lines(STDOUT_FILENO);
3501 return cached_lines;
3504 /* intended to be used as a SIGWINCH sighandler */
3505 void columns_lines_cache_reset(int signum) {
3511 static int cached_on_tty = -1;
3513 if (_unlikely_(cached_on_tty < 0))
3514 cached_on_tty = isatty(STDOUT_FILENO) > 0;
3516 return cached_on_tty;
/* stat()s both paths (so symlinks are followed) and reports whether
 * they refer to the same object, i.e. whether both the device number
 * and the inode number match. */
3519 int files_same(const char *filea, const char *fileb) {
3522 if (stat(filea, &a) < 0)
3525 if (stat(fileb, &b) < 0)
3528 return a.st_dev == b.st_dev &&
3529 a.st_ino == b.st_ino;
/* Bases its answer on whether "/proc/1/root" and "/" are the same
 * file, as determined by files_same(). */
3532 int running_in_chroot(void) {
3535 ret = files_same("/proc/1/root", "/");
3542 static char *ascii_ellipsize_mem(const char *s, size_t old_length, size_t new_length, unsigned percent) {
3547 assert(percent <= 100);
3548 assert(new_length >= 3);
3550 if (old_length <= 3 || old_length <= new_length)
3551 return strndup(s, old_length);
3553 r = new0(char, new_length+1);
3557 x = (new_length * percent) / 100;
3559 if (x > new_length - 3)
3567 s + old_length - (new_length - x - 3),
3568 new_length - x - 3);
3573 char *ellipsize_mem(const char *s, size_t old_length, size_t new_length, unsigned percent) {
3577 unsigned k, len, len2;
3580 assert(percent <= 100);
3581 assert(new_length >= 3);
3583 /* if no multibyte characters use ascii_ellipsize_mem for speed */
3584 if (ascii_is_valid(s))
3585 return ascii_ellipsize_mem(s, old_length, new_length, percent);
3587 if (old_length <= 3 || old_length <= new_length)
3588 return strndup(s, old_length);
3590 x = (new_length * percent) / 100;
3592 if (x > new_length - 3)
3596 for (i = s; k < x && i < s + old_length; i = utf8_next_char(i)) {
3599 c = utf8_encoded_to_unichar(i);
3602 k += unichar_iswide(c) ? 2 : 1;
3605 if (k > x) /* last character was wide and went over quota */
3608 for (j = s + old_length; k < new_length && j > i; ) {
3611 j = utf8_prev_char(j);
3612 c = utf8_encoded_to_unichar(j);
3615 k += unichar_iswide(c) ? 2 : 1;
3619 /* we don't actually need to ellipsize */
3621 return memdup(s, old_length + 1);
3623 /* make space for ellipsis */
3624 j = utf8_next_char(j);
3627 len2 = s + old_length - j;
3628 e = new(char, len + 3 + len2 + 1);
3633 printf("old_length=%zu new_length=%zu x=%zu len=%u len2=%u k=%u\n",
3634 old_length, new_length, x, len, len2, k);
3638 e[len] = 0xe2; /* tri-dot ellipsis: … */
3642 memcpy(e + len + 3, j, len2 + 1);
/* Convenience wrapper for NUL-terminated strings: calls
 * ellipsize_mem() with strlen(s) as the old length and passes length
 * and percent through unchanged. */
3647 char *ellipsize(const char *s, size_t length, unsigned percent) {
3648 return ellipsize_mem(s, strlen(s), length, percent);
3651 int touch_file(const char *path, bool parents, usec_t stamp, uid_t uid, gid_t gid, mode_t mode) {
3652 _cleanup_close_ int fd;
3658 mkdir_parents(path, 0755);
3660 fd = open(path, O_WRONLY|O_CREAT|O_CLOEXEC|O_NOCTTY, mode > 0 ? mode : 0644);
3665 r = fchmod(fd, mode);
3670 if (uid != UID_INVALID || gid != GID_INVALID) {
3671 r = fchown(fd, uid, gid);
3676 if (stamp != USEC_INFINITY) {
3677 struct timespec ts[2];
3679 timespec_store(&ts[0], stamp);
3681 r = futimens(fd, ts);
3683 r = futimens(fd, NULL);
/* Convenience wrapper around touch_file(): parents is false, the
 * timestamp is USEC_INFINITY, uid/gid are UID_INVALID/GID_INVALID and
 * mode is 0. */
3690 int touch(const char *path) {
3691 return touch_file(path, false, USEC_INFINITY, UID_INVALID, GID_INVALID, 0);
3694 char *unquote(const char *s, const char* quotes) {
3698 /* This is rather simplistic: it simply removes the leading and
3699 * trailing quotes if there are any. Doesn't care about
3700 * escaping or anything. We should make this smarter one
3707 if (strchr(quotes, s[0]) && s[l-1] == s[0])
3708 return strndup(s+1, l-2);
3713 char *normalize_env_assignment(const char *s) {
3714 _cleanup_free_ char *value = NULL;
3718 eq = strchr(s, '=');
3728 memmove(r, t, strlen(t) + 1);
3733 name = strndupa(s, eq - s);
3734 p = strdupa(eq + 1);
3736 value = unquote(strstrip(p), QUOTES);
3740 return strjoin(strstrip(name), "=", value, NULL);
3743 int wait_for_terminate(pid_t pid, siginfo_t *status) {
3754 if (waitid(P_PID, pid, status, WEXITED) < 0) {
3768 * < 0 : wait_for_terminate() failed to get the state of the
3769 * process, the process was terminated by a signal, or
3770 * failed for an unknown reason.
3771 * >=0 : The process terminated normally, and its exit code is
3774 * That is, success is indicated by a return value of zero, and an
3775 * error is indicated by a non-zero value.
3777 * A warning is emitted if the process terminates abnormally,
3778 * and also if it returns non-zero and check_exit_code is true (otherwise that is only logged at debug level).
3780 int wait_for_terminate_and_warn(const char *name, pid_t pid, bool check_exit_code) {
3787 r = wait_for_terminate(pid, &status);
3789 return log_warning_errno(r, "Failed to wait for %s: %m", name);
3791 if (status.si_code == CLD_EXITED) {
3792 if (status.si_status != 0)
3793 log_full(check_exit_code ? LOG_WARNING : LOG_DEBUG,
3794 "%s failed with error code %i.", name, status.si_status);
3796 log_debug("%s succeeded.", name);
3798 return status.si_status;
3799 } else if (status.si_code == CLD_KILLED ||
3800 status.si_code == CLD_DUMPED) {
3802 log_warning("%s terminated by signal %s.", name, signal_to_string(status.si_status));
3806 log_warning("%s failed due to unknown reason.", name);
3810 noreturn void freeze(void) {
3812 /* Make sure nobody waits for us on a socket anymore */
3813 close_all_fds(NULL, 0);
3821 bool null_or_empty(struct stat *st) {
3824 if (S_ISREG(st->st_mode) && st->st_size <= 0)
3827 if (S_ISCHR(st->st_mode) || S_ISBLK(st->st_mode))
/* stat()s fn (following symlinks) and returns the verdict of
 * null_or_empty() on the resulting struct stat. */
3833 int null_or_empty_path(const char *fn) {
3838 if (stat(fn, &st) < 0)
3841 return null_or_empty(&st);
/* Same check as null_or_empty_path(), but for an already open file
 * descriptor: fstat()s fd and returns the verdict of null_or_empty(). */
3844 int null_or_empty_fd(int fd) {
3849 if (fstat(fd, &st) < 0)
3852 return null_or_empty(&st);
3855 DIR *xopendirat(int fd, const char *name, int flags) {
3859 assert(!(flags & O_CREAT));
3861 nfd = openat(fd, name, O_RDONLY|O_NONBLOCK|O_DIRECTORY|O_CLOEXEC|flags, 0);
3874 int signal_from_string_try_harder(const char *s) {
3878 signo = signal_from_string(s);
3880 if (startswith(s, "SIG"))
3881 return signal_from_string(s+3);
3886 static char *tag_to_udev_node(const char *tagvalue, const char *by) {
3887 _cleanup_free_ char *t = NULL, *u = NULL;
3890 u = unquote(tagvalue, "\"\'");
3894 enc_len = strlen(u) * 4 + 1;
3895 t = new(char, enc_len);
3899 if (encode_devnode_name(u, t, enc_len) < 0)
3902 return strjoin("/dev/disk/by-", by, "/", t, NULL);
/* Translates fstab-style tag specifications into udev device node
 * paths. For the prefixes LABEL=, UUID=, PARTUUID= and PARTLABEL= the
 * text after the prefix is passed to tag_to_udev_node() together with
 * the matching "by-" directory name ("label", "uuid", "partuuid",
 * "partlabel"); the numeric offsets skip exactly the prefix. */
3905 char *fstab_node_to_udev_node(const char *p) {
3908 if (startswith(p, "LABEL="))
3909 return tag_to_udev_node(p+6, "label");
3911 if (startswith(p, "UUID="))
3912 return tag_to_udev_node(p+5, "uuid");
3914 if (startswith(p, "PARTUUID="))
3915 return tag_to_udev_node(p+9, "partuuid");
3917 if (startswith(p, "PARTLABEL="))
3918 return tag_to_udev_node(p+10, "partlabel");
/* A tty counts as a virtual console if vtnr_from_tty() returns a
 * non-negative value for it. */
3923 bool tty_is_vc(const char *tty) {
3926 return vtnr_from_tty(tty) >= 0;
3929 bool tty_is_console(const char *tty) {
3932 if (startswith(tty, "/dev/"))
3935 return streq(tty, "console");
3938 int vtnr_from_tty(const char *tty) {
3943 if (startswith(tty, "/dev/"))
3946 if (!startswith(tty, "tty") )
3949 if (tty[3] < '0' || tty[3] > '9')
3952 r = safe_atoi(tty+3, &i);
3956 if (i < 0 || i > 63)
3962 char *resolve_dev_console(char **active) {
3965 /* Resolve where /dev/console is pointing to, if /sys is actually ours
3966 * (i.e. not read-only-mounted which is a sign for container setups) */
3968 if (path_is_read_only_fs("/sys") > 0)
3971 if (read_one_line_file("/sys/class/tty/console/active", active) < 0)
3974 /* If multiple log outputs are configured the last one is what
3975 * /dev/console points to */
3976 tty = strrchr(*active, ' ');
3982 if (streq(tty, "tty0")) {
3985 /* Get the active VC (e.g. tty1) */
3986 if (read_one_line_file("/sys/class/tty/tty0/active", &tmp) >= 0) {
3988 tty = *active = tmp;
3995 bool tty_is_vc_resolve(const char *tty) {
3996 _cleanup_free_ char *active = NULL;
4000 if (startswith(tty, "/dev/"))
4003 if (streq(tty, "console")) {
4004 tty = resolve_dev_console(&active);
4009 return tty_is_vc(tty);
/* Returns a constant "TERM=..." assignment for the tty: "TERM=linux"
 * if tty_is_vc_resolve() says it is a virtual console, "TERM=vt220"
 * otherwise. The returned string is a literal and must not be freed. */
4012 const char *default_term_for_tty(const char *tty) {
4015 return tty_is_vc_resolve(tty) ? "TERM=linux" : "TERM=vt220";
4018 bool dirent_is_file(const struct dirent *de) {
4021 if (hidden_file(de->d_name))
4024 if (de->d_type != DT_REG &&
4025 de->d_type != DT_LNK &&
4026 de->d_type != DT_UNKNOWN)
4032 bool dirent_is_file_with_suffix(const struct dirent *de, const char *suffix) {
4035 if (de->d_type != DT_REG &&
4036 de->d_type != DT_LNK &&
4037 de->d_type != DT_UNKNOWN)
4040 if (hidden_file_allow_backup(de->d_name))
4043 return endswith(de->d_name, suffix);
4046 static int do_execute(char **directories, usec_t timeout, char *argv[]) {
4047 _cleanup_hashmap_free_free_ Hashmap *pids = NULL;
4048 _cleanup_set_free_free_ Set *seen = NULL;
4051 /* We fork this all off from a child process so that we can
4052 * somewhat cleanly make use of SIGALRM to set a time limit */
4054 reset_all_signal_handlers();
4055 reset_signal_mask();
4057 assert_se(prctl(PR_SET_PDEATHSIG, SIGTERM) == 0);
4059 pids = hashmap_new(NULL);
4063 seen = set_new(&string_hash_ops);
4067 STRV_FOREACH(directory, directories) {
4068 _cleanup_closedir_ DIR *d;
4071 d = opendir(*directory);
4073 if (errno == ENOENT)
4076 return log_error_errno(errno, "Failed to open directory %s: %m", *directory);
4079 FOREACH_DIRENT(de, d, break) {
4080 _cleanup_free_ char *path = NULL;
4084 if (!dirent_is_file(de))
4087 if (set_contains(seen, de->d_name)) {
4088 log_debug("%1$s/%2$s skipped (%2$s was already seen).", *directory, de->d_name);
4092 r = set_put_strdup(seen, de->d_name);
4096 path = strjoin(*directory, "/", de->d_name, NULL);
4100 if (null_or_empty_path(path)) {
4101 log_debug("%s is empty (a mask).", path);
4104 log_debug("%s will be executed.", path);
4108 log_error_errno(errno, "Failed to fork: %m");
4110 } else if (pid == 0) {
4113 assert_se(prctl(PR_SET_PDEATHSIG, SIGTERM) == 0);
4123 return log_error_errno(errno, "Failed to execute %s: %m", path);
4126 log_debug("Spawned %s as " PID_FMT ".", path, pid);
4128 r = hashmap_put(pids, UINT_TO_PTR(pid), path);
4135 /* Abort execution of this process after the timeout. We simply
4136 * rely on SIGALRM as default action terminating the process,
4137 * and turn on alarm(). */
4139 if (timeout != USEC_INFINITY)
4140 alarm((timeout + USEC_PER_SEC - 1) / USEC_PER_SEC);
4142 while (!hashmap_isempty(pids)) {
4143 _cleanup_free_ char *path = NULL;
4146 pid = PTR_TO_UINT(hashmap_first_key(pids));
4149 path = hashmap_remove(pids, UINT_TO_PTR(pid));
4152 wait_for_terminate_and_warn(path, pid, true);
4158 void execute_directories(const char* const* directories, usec_t timeout, char *argv[]) {
4162 char **dirs = (char**) directories;
4164 assert(!strv_isempty(dirs));
4166 name = basename(dirs[0]);
4167 assert(!isempty(name));
4169 /* Executes all binaries in the directories in parallel and waits
4170 * for them to finish. Optionally a timeout is applied. If a file
4171 * with the same name exists in more than one directory, the
4172 * earliest one wins. */
4174 executor_pid = fork();
4175 if (executor_pid < 0) {
4176 log_error_errno(errno, "Failed to fork: %m");
4179 } else if (executor_pid == 0) {
4180 r = do_execute(dirs, timeout, argv);
4181 _exit(r < 0 ? EXIT_FAILURE : EXIT_SUCCESS);
4184 wait_for_terminate_and_warn(name, executor_pid, true);
4187 int kill_and_sigcont(pid_t pid, int sig) {
4190 r = kill(pid, sig) < 0 ? -errno : 0;
4198 bool nulstr_contains(const char*nulstr, const char *needle) {
4204 NULSTR_FOREACH(i, nulstr)
4205 if (streq(i, needle))
/* Returns true if the file /run/plymouth/pid exists (checked with
 * access(..., F_OK)). */
4211 bool plymouth_running(void) {
4212 return access("/run/plymouth/pid", F_OK) >= 0;
4215 char* strshorten(char *s, size_t l) {
4224 static bool hostname_valid_char(char c) {
4226 (c >= 'a' && c <= 'z') ||
4227 (c >= 'A' && c <= 'Z') ||
4228 (c >= '0' && c <= '9') ||
4234 bool hostname_is_valid(const char *s) {
4241 for (p = s, dot = true; *p; p++) {
4248 if (!hostname_valid_char(*p))
4258 if (p-s > HOST_NAME_MAX)
4264 char* hostname_cleanup(char *s, bool lowercase) {
4268 for (p = s, d = s, dot = true; *p; p++) {
4275 } else if (hostname_valid_char(*p)) {
4276 *(d++) = lowercase ? tolower(*p) : *p;
4287 strshorten(s, HOST_NAME_MAX);
4292 bool machine_name_is_valid(const char *s) {
4294 if (!hostname_is_valid(s))
4297 /* Machine names should be useful hostnames, but also be
4298 * useful in unit names, hence we enforce a stricter length
/* Checks for a hang-up condition without blocking: poll()s with a
 * timeout of 0 for POLLIN|POLLHUP and returns the POLLHUP bit of the
 * reported events (non-zero if set). */
4307 int pipe_eof(int fd) {
4308 struct pollfd pollfd = {
4310 .events = POLLIN|POLLHUP,
4315 r = poll(&pollfd, 1, 0);
4322 return pollfd.revents & POLLHUP;
4325 int fd_wait_for_event(int fd, int event, usec_t t) {
4327 struct pollfd pollfd = {
4335 r = ppoll(&pollfd, 1, t == USEC_INFINITY ? NULL : timespec_store(&ts, t), NULL);
4342 return pollfd.revents;
4345 int fopen_temporary(const char *path, FILE **_f, char **_temp_path) {
4354 r = tempfn_xxxxxx(path, &t);
4358 fd = mkostemp_safe(t, O_WRONLY|O_CLOEXEC);
4364 f = fdopen(fd, "we");
4377 int terminal_vhangup_fd(int fd) {
4380 if (ioctl(fd, TIOCVHANGUP) < 0)
/* Opens the terminal called name via open_terminal() and returns the
 * result of terminal_vhangup_fd() on the opened fd. The fd is declared
 * with _cleanup_close_. */
4386 int terminal_vhangup(const char *name) {
4387 _cleanup_close_ int fd;
4389 fd = open_terminal(name, O_RDWR|O_NOCTTY|O_CLOEXEC);
4393 return terminal_vhangup_fd(fd);
4396 int vt_disallocate(const char *name) {
4400 /* Deallocate the VT if possible. If not possible
4401 * (i.e. because it is the active one), at least clear it
4402 * entirely (including the scrollback buffer) */
4404 if (!startswith(name, "/dev/"))
4407 if (!tty_is_vc(name)) {
4408 /* So this is not a VT. I guess we cannot deallocate
4409 * it then. But let's at least clear the screen */
4411 fd = open_terminal(name, O_RDWR|O_NOCTTY|O_CLOEXEC);
4416 "\033[r" /* clear scrolling region */
4417 "\033[H" /* move home */
4418 "\033[2J", /* clear screen */
4425 if (!startswith(name, "/dev/tty"))
4428 r = safe_atou(name+8, &u);
4435 /* Try to deallocate */
4436 fd = open_terminal("/dev/tty0", O_RDWR|O_NOCTTY|O_CLOEXEC);
4440 r = ioctl(fd, VT_DISALLOCATE, u);
4449 /* Couldn't deallocate, so let's clear it fully with
4451 fd = open_terminal(name, O_RDWR|O_NOCTTY|O_CLOEXEC);
4456 "\033[r" /* clear scrolling region */
4457 "\033[H" /* move home */
4458 "\033[3J", /* clear screen including scrollback, requires Linux 2.6.40 */
/* Creates the symlink under a temporary name derived from "to" by
 * tempfn_random(), then rename()s it onto "to", so that the final
 * name is put in place by a single rename step. */
4465 int symlink_atomic(const char *from, const char *to) {
4466 _cleanup_free_ char *t = NULL;
4472 r = tempfn_random(to, &t);
4476 if (symlink(from, t) < 0)
4479 if (rename(t, to) < 0) {
/* Creates the node with mknod() under a temporary name derived from
 * "path" by tempfn_random(), then rename()s it onto "path", so that
 * the final name is put in place by a single rename step. */
4487 int mknod_atomic(const char *path, mode_t mode, dev_t dev) {
4488 _cleanup_free_ char *t = NULL;
4493 r = tempfn_random(path, &t);
4497 if (mknod(t, mode, dev) < 0)
4500 if (rename(t, path) < 0) {
/* Creates the FIFO with mkfifo() under a temporary name derived from
 * "path" by tempfn_random(), then rename()s it onto "path", so that
 * the final name is put in place by a single rename step. */
4508 int mkfifo_atomic(const char *path, mode_t mode) {
4509 _cleanup_free_ char *t = NULL;
4514 r = tempfn_random(path, &t);
4518 if (mkfifo(t, mode) < 0)
4521 if (rename(t, path) < 0) {
4529 bool display_is_local(const char *display) {
4533 display[0] == ':' &&
4534 display[1] >= '0' &&
4538 int socket_from_display(const char *display, char **path) {
4545 if (!display_is_local(display))
4548 k = strspn(display+1, "0123456789");
4550 f = new(char, strlen("/tmp/.X11-unix/X") + k + 1);
4554 c = stpcpy(f, "/tmp/.X11-unix/X");
4555 memcpy(c, display+1, k);
4564 const char **username,
4565 uid_t *uid, gid_t *gid,
4567 const char **shell) {
4575 /* We enforce some special rules for uid=0: in order to avoid
4576 * NSS lookups for root we hardcode its data. */
4578 if (streq(*username, "root") || streq(*username, "0")) {
4596 if (parse_uid(*username, &u) >= 0) {
4600 /* If there are multiple users with the same id, make
4601 * sure to leave $USER to the configured value instead
4602 * of the first occurrence in the database. However if
4603 * the uid was configured by a numeric uid, then let's
4604 * pick the real username from /etc/passwd. */
4606 *username = p->pw_name;
4609 p = getpwnam(*username);
4613 return errno > 0 ? -errno : -ESRCH;
4625 *shell = p->pw_shell;
4630 char* uid_to_name(uid_t uid) {
4635 return strdup("root");
4639 return strdup(p->pw_name);
4641 if (asprintf(&r, UID_FMT, uid) < 0)
4647 char* gid_to_name(gid_t gid) {
4652 return strdup("root");
4656 return strdup(p->gr_name);
4658 if (asprintf(&r, GID_FMT, gid) < 0)
4664 int get_group_creds(const char **groupname, gid_t *gid) {
4670 /* We enforce some special rules for gid=0: in order to avoid
4671 * NSS lookups for root we hardcode its data. */
4673 if (streq(*groupname, "root") || streq(*groupname, "0")) {
4674 *groupname = "root";
4682 if (parse_gid(*groupname, &id) >= 0) {
4687 *groupname = g->gr_name;
4690 g = getgrnam(*groupname);
4694 return errno > 0 ? -errno : -ESRCH;
4702 int in_gid(gid_t gid) {
4704 int ngroups_max, r, i;
4706 if (getgid() == gid)
4709 if (getegid() == gid)
4712 ngroups_max = sysconf(_SC_NGROUPS_MAX);
4713 assert(ngroups_max > 0);
4715 gids = alloca(sizeof(gid_t) * ngroups_max);
4717 r = getgroups(ngroups_max, gids);
4721 for (i = 0; i < r; i++)
4728 int in_group(const char *name) {
4732 r = get_group_creds(&name, &gid);
4739 int glob_exists(const char *path) {
4740 _cleanup_globfree_ glob_t g = {};
4746 k = glob(path, GLOB_NOSORT|GLOB_BRACE, NULL, &g);
4748 if (k == GLOB_NOMATCH)
4750 else if (k == GLOB_NOSPACE)
4753 return !strv_isempty(g.gl_pathv);
4755 return errno ? -errno : -EIO;
4758 int glob_extend(char ***strv, const char *path) {
4759 _cleanup_globfree_ glob_t g = {};
4764 k = glob(path, GLOB_NOSORT|GLOB_BRACE, NULL, &g);
4766 if (k == GLOB_NOMATCH)
4768 else if (k == GLOB_NOSPACE)
4770 else if (k != 0 || strv_isempty(g.gl_pathv))
4771 return errno ? -errno : -EIO;
4773 STRV_FOREACH(p, g.gl_pathv) {
4774 k = strv_extend(strv, *p);
4782 int dirent_ensure_type(DIR *d, struct dirent *de) {
4788 if (de->d_type != DT_UNKNOWN)
4791 if (fstatat(dirfd(d), de->d_name, &st, AT_SYMLINK_NOFOLLOW) < 0)
4795 S_ISREG(st.st_mode) ? DT_REG :
4796 S_ISDIR(st.st_mode) ? DT_DIR :
4797 S_ISLNK(st.st_mode) ? DT_LNK :
4798 S_ISFIFO(st.st_mode) ? DT_FIFO :
4799 S_ISSOCK(st.st_mode) ? DT_SOCK :
4800 S_ISCHR(st.st_mode) ? DT_CHR :
4801 S_ISBLK(st.st_mode) ? DT_BLK :
4807 int get_files_in_directory(const char *path, char ***list) {
4808 _cleanup_closedir_ DIR *d = NULL;
4809 size_t bufsize = 0, n = 0;
4810 _cleanup_strv_free_ char **l = NULL;
4814 /* Returns all files in a directory in *list, and the number
4815 * of files as return value. If list is NULL returns only the
4827 if (!de && errno != 0)
4832 dirent_ensure_type(d, de);
4834 if (!dirent_is_file(de))
4838 /* one extra slot is needed for the terminating NULL */
4839 if (!GREEDY_REALLOC(l, bufsize, n + 2))
4842 l[n] = strdup(de->d_name);
4853 l = NULL; /* avoid freeing */
4859 char *strjoin(const char *x, ...) {
4873 t = va_arg(ap, const char *);
4878 if (n > ((size_t) -1) - l) {
4902 t = va_arg(ap, const char *);
/* Determines whether the calling thread is the main thread by
 * comparing getpid() with gettid(). The answer is cached per thread:
 * 0 means "not determined yet", 1 means the IDs matched, -1 means
 * they differed. */
4916 bool is_main_thread(void) {
4917 static thread_local int cached = 0;
4919 if (_unlikely_(cached == 0))
4920 cached = getpid() == gettid() ? 1 : -1;
4925 int block_get_whole_disk(dev_t d, dev_t *ret) {
4932 /* If it has a queue this is good enough for us */
4933 if (asprintf(&p, "/sys/dev/block/%u:%u/queue", major(d), minor(d)) < 0)
4936 r = access(p, F_OK);
4944 /* If it is a partition find the originating device */
4945 if (asprintf(&p, "/sys/dev/block/%u:%u/partition", major(d), minor(d)) < 0)
4948 r = access(p, F_OK);
4954 /* Get parent dev_t */
4955 if (asprintf(&p, "/sys/dev/block/%u:%u/../dev", major(d), minor(d)) < 0)
4958 r = read_one_line_file(p, &s);
4964 r = sscanf(s, "%u:%u", &m, &n);
4970 /* Only return this if it is really good enough for us. */
4971 if (asprintf(&p, "/sys/dev/block/%u:%u/queue", m, n) < 0)
4974 r = access(p, F_OK);
4978 *ret = makedev(m, n);
4985 static const char *const ioprio_class_table[] = {
4986 [IOPRIO_CLASS_NONE] = "none",
4987 [IOPRIO_CLASS_RT] = "realtime",
4988 [IOPRIO_CLASS_BE] = "best-effort",
4989 [IOPRIO_CLASS_IDLE] = "idle"
4992 DEFINE_STRING_TABLE_LOOKUP_WITH_FALLBACK(ioprio_class, int, INT_MAX);
4994 static const char *const sigchld_code_table[] = {
4995 [CLD_EXITED] = "exited",
4996 [CLD_KILLED] = "killed",
4997 [CLD_DUMPED] = "dumped",
4998 [CLD_TRAPPED] = "trapped",
4999 [CLD_STOPPED] = "stopped",
5000 [CLD_CONTINUED] = "continued",
5003 DEFINE_STRING_TABLE_LOOKUP(sigchld_code, int);
5005 static const char *const log_facility_unshifted_table[LOG_NFACILITIES] = {
5006 [LOG_FAC(LOG_KERN)] = "kern",
5007 [LOG_FAC(LOG_USER)] = "user",
5008 [LOG_FAC(LOG_MAIL)] = "mail",
5009 [LOG_FAC(LOG_DAEMON)] = "daemon",
5010 [LOG_FAC(LOG_AUTH)] = "auth",
5011 [LOG_FAC(LOG_SYSLOG)] = "syslog",
5012 [LOG_FAC(LOG_LPR)] = "lpr",
5013 [LOG_FAC(LOG_NEWS)] = "news",
5014 [LOG_FAC(LOG_UUCP)] = "uucp",
5015 [LOG_FAC(LOG_CRON)] = "cron",
5016 [LOG_FAC(LOG_AUTHPRIV)] = "authpriv",
5017 [LOG_FAC(LOG_FTP)] = "ftp",
5018 [LOG_FAC(LOG_LOCAL0)] = "local0",
5019 [LOG_FAC(LOG_LOCAL1)] = "local1",
5020 [LOG_FAC(LOG_LOCAL2)] = "local2",
5021 [LOG_FAC(LOG_LOCAL3)] = "local3",
5022 [LOG_FAC(LOG_LOCAL4)] = "local4",
5023 [LOG_FAC(LOG_LOCAL5)] = "local5",
5024 [LOG_FAC(LOG_LOCAL6)] = "local6",
5025 [LOG_FAC(LOG_LOCAL7)] = "local7"
5028 DEFINE_STRING_TABLE_LOOKUP_WITH_FALLBACK(log_facility_unshifted, int, LOG_FAC(~0));
5030 static const char *const log_level_table[] = {
5031 [LOG_EMERG] = "emerg",
5032 [LOG_ALERT] = "alert",
5033 [LOG_CRIT] = "crit",
5035 [LOG_WARNING] = "warning",
5036 [LOG_NOTICE] = "notice",
5037 [LOG_INFO] = "info",
5038 [LOG_DEBUG] = "debug"
5041 DEFINE_STRING_TABLE_LOOKUP_WITH_FALLBACK(log_level, int, LOG_DEBUG);
5043 static const char* const sched_policy_table[] = {
5044 [SCHED_OTHER] = "other",
5045 [SCHED_BATCH] = "batch",
5046 [SCHED_IDLE] = "idle",
5047 [SCHED_FIFO] = "fifo",
5051 DEFINE_STRING_TABLE_LOOKUP_WITH_FALLBACK(sched_policy, int, INT_MAX);
5053 static const char* const rlimit_table[_RLIMIT_MAX] = {
5054 [RLIMIT_CPU] = "LimitCPU",
5055 [RLIMIT_FSIZE] = "LimitFSIZE",
5056 [RLIMIT_DATA] = "LimitDATA",
5057 [RLIMIT_STACK] = "LimitSTACK",
5058 [RLIMIT_CORE] = "LimitCORE",
5059 [RLIMIT_RSS] = "LimitRSS",
5060 [RLIMIT_NOFILE] = "LimitNOFILE",
5061 [RLIMIT_AS] = "LimitAS",
5062 [RLIMIT_NPROC] = "LimitNPROC",
5063 [RLIMIT_MEMLOCK] = "LimitMEMLOCK",
5064 [RLIMIT_LOCKS] = "LimitLOCKS",
5065 [RLIMIT_SIGPENDING] = "LimitSIGPENDING",
5066 [RLIMIT_MSGQUEUE] = "LimitMSGQUEUE",
5067 [RLIMIT_NICE] = "LimitNICE",
5068 [RLIMIT_RTPRIO] = "LimitRTPRIO",
5069 [RLIMIT_RTTIME] = "LimitRTTIME"
5072 DEFINE_STRING_TABLE_LOOKUP(rlimit, int);
5074 static const char* const ip_tos_table[] = {
5075 [IPTOS_LOWDELAY] = "low-delay",
5076 [IPTOS_THROUGHPUT] = "throughput",
5077 [IPTOS_RELIABILITY] = "reliability",
5078 [IPTOS_LOWCOST] = "low-cost",
5081 DEFINE_STRING_TABLE_LOOKUP_WITH_FALLBACK(ip_tos, int, 0xff);
5083 static const char *const __signal_table[] = {
5100 [SIGSTKFLT] = "STKFLT", /* Linux on SPARC doesn't know SIGSTKFLT */
5111 [SIGVTALRM] = "VTALRM",
5113 [SIGWINCH] = "WINCH",
5119 DEFINE_PRIVATE_STRING_TABLE_LOOKUP(__signal, int);
5121 const char *signal_to_string(int signo) {
5122 static thread_local char buf[sizeof("RTMIN+")-1 + DECIMAL_STR_MAX(int) + 1];
5125 name = __signal_to_string(signo);
5129 if (signo >= SIGRTMIN && signo <= SIGRTMAX)
5130 snprintf(buf, sizeof(buf), "RTMIN+%d", signo - SIGRTMIN);
5132 snprintf(buf, sizeof(buf), "%d", signo);
5137 int signal_from_string(const char *s) {
5142 signo = __signal_from_string(s);
5146 if (startswith(s, "RTMIN+")) {
5150 if (safe_atou(s, &u) >= 0) {
5151 signo = (int) u + offset;
5152 if (signo > 0 && signo < _NSIG)
5158 bool kexec_loaded(void) {
5159 bool loaded = false;
5162 if (read_one_line_file("/sys/kernel/kexec_loaded", &s) >= 0) {
5170 int prot_from_flags(int flags) {
5172 switch (flags & O_ACCMODE) {
5181 return PROT_READ|PROT_WRITE;
5188 char *format_bytes(char *buf, size_t l, off_t t) {
5191 static const struct {
5195 { "E", 1024ULL*1024ULL*1024ULL*1024ULL*1024ULL*1024ULL },
5196 { "P", 1024ULL*1024ULL*1024ULL*1024ULL*1024ULL },
5197 { "T", 1024ULL*1024ULL*1024ULL*1024ULL },
5198 { "G", 1024ULL*1024ULL*1024ULL },
5199 { "M", 1024ULL*1024ULL },
5203 if (t == (off_t) -1)
5206 for (i = 0; i < ELEMENTSOF(table); i++) {
5208 if (t >= table[i].factor) {
5211 (unsigned long long) (t / table[i].factor),
5212 (unsigned long long) (((t*10ULL) / table[i].factor) % 10ULL),
5219 snprintf(buf, l, "%lluB", (unsigned long long) t);
5227 void* memdup(const void *p, size_t l) {
5240 int fd_inc_sndbuf(int fd, size_t n) {
5242 socklen_t l = sizeof(value);
5244 r = getsockopt(fd, SOL_SOCKET, SO_SNDBUF, &value, &l);
5245 if (r >= 0 && l == sizeof(value) && (size_t) value >= n*2)
5248 /* If we have the privileges we will ignore the kernel limit. */
5251 if (setsockopt(fd, SOL_SOCKET, SO_SNDBUFFORCE, &value, sizeof(value)) < 0)
5252 if (setsockopt(fd, SOL_SOCKET, SO_SNDBUF, &value, sizeof(value)) < 0)
5258 int fd_inc_rcvbuf(int fd, size_t n) {
5260 socklen_t l = sizeof(value);
5262 r = getsockopt(fd, SOL_SOCKET, SO_RCVBUF, &value, &l);
5263 if (r >= 0 && l == sizeof(value) && (size_t) value >= n*2)
5266 /* If we have the privileges we will ignore the kernel limit. */
5269 if (setsockopt(fd, SOL_SOCKET, SO_RCVBUFFORCE, &value, sizeof(value)) < 0)
5270 if (setsockopt(fd, SOL_SOCKET, SO_RCVBUF, &value, sizeof(value)) < 0)
5275 int fork_agent(pid_t *pid, const int except[], unsigned n_except, const char *path, ...) {
5276 bool stdout_is_tty, stderr_is_tty;
5277 pid_t parent_pid, agent_pid;
5278 sigset_t ss, saved_ss;
5286 /* Spawns a temporary TTY agent, making sure it goes away when
5289 parent_pid = getpid();
5291 /* First we temporarily block all signals, so that the new
5292 * child has them blocked initially. This way, we can be sure
5293 * that SIGTERMs we might send to the agent are not lost. */
5294 assert_se(sigfillset(&ss) >= 0);
5295 assert_se(sigprocmask(SIG_SETMASK, &ss, &saved_ss) >= 0);
5298 if (agent_pid < 0) {
5299 assert_se(sigprocmask(SIG_SETMASK, &saved_ss, NULL) >= 0);
5303 if (agent_pid != 0) {
5304 assert_se(sigprocmask(SIG_SETMASK, &saved_ss, NULL) >= 0);
5311 * Make sure the agent goes away when the parent dies */
5312 if (prctl(PR_SET_PDEATHSIG, SIGTERM) < 0)
5313 _exit(EXIT_FAILURE);
5315 /* Make sure we actually can kill the agent, if we need to, in
5316 * case somebody invoked us from a shell script that trapped
5317 * SIGTERM or so... */
5318 reset_all_signal_handlers();
5319 reset_signal_mask();
5321 /* Check whether our parent died before we were able
5322 * to set the death signal and unblock the signals */
5323 if (getppid() != parent_pid)
5324 _exit(EXIT_SUCCESS);
5326 /* Don't leak fds to the agent */
5327 close_all_fds(except, n_except);
5329 stdout_is_tty = isatty(STDOUT_FILENO);
5330 stderr_is_tty = isatty(STDERR_FILENO);
5332 if (!stdout_is_tty || !stderr_is_tty) {
5335 /* Detach from stdout/stderr and reopen
5336 * /dev/tty for them. This is important to
5337 * ensure that when systemctl is started via
5338 * popen() or a similar call that expects to
5339 * read EOF we actually do generate EOF and
5340 * not delay this indefinitely because we
5341 * keep an unused copy of stdout/stderr around. */
5342 fd = open("/dev/tty", O_WRONLY);
5344 log_error_errno(errno, "Failed to open /dev/tty: %m");
5345 _exit(EXIT_FAILURE);
5349 dup2(fd, STDOUT_FILENO);
5352 dup2(fd, STDERR_FILENO);
5358 /* Count arguments */
5360 for (n = 0; va_arg(ap, char*); n++)
5365 l = alloca(sizeof(char *) * (n + 1));
5367 /* Fill in arguments */
5369 for (i = 0; i <= n; i++)
5370 l[i] = va_arg(ap, char*);
5374 _exit(EXIT_FAILURE);
5377 int setrlimit_closest(int resource, const struct rlimit *rlim) {
5378 struct rlimit highest, fixed;
5382 if (setrlimit(resource, rlim) >= 0)
5388 /* So we failed to set the desired setrlimit, then let's try
5389 * to get as close as we can */
5390 assert_se(getrlimit(resource, &highest) == 0);
5392 fixed.rlim_cur = MIN(rlim->rlim_cur, highest.rlim_max);
5393 fixed.rlim_max = MIN(rlim->rlim_max, highest.rlim_max);
5395 if (setrlimit(resource, &fixed) < 0)
5401 int getenv_for_pid(pid_t pid, const char *field, char **_value) {
5402 _cleanup_fclose_ FILE *f = NULL;
5413 path = procfs_file_alloca(pid, "environ");
5415 f = fopen(path, "re");
5423 char line[LINE_MAX];
5426 for (i = 0; i < sizeof(line)-1; i++) {
5430 if (_unlikely_(c == EOF)) {
5440 if (memcmp(line, field, l) == 0 && line[l] == '=') {
5441 value = strdup(line + l + 1);
5455 bool is_valid_documentation_url(const char *url) {
5458 if (startswith(url, "http://") && url[7])
5461 if (startswith(url, "https://") && url[8])
5464 if (startswith(url, "file:") && url[5])
5467 if (startswith(url, "info:") && url[5])
5470 if (startswith(url, "man:") && url[4])
5476 bool in_initrd(void) {
5477 static int saved = -1;
5483 /* We make two checks here:
5485 * 1. the flag file /etc/initrd-release must exist
5486 * 2. the root file system must be a memory file system
5488 * The second check is extra paranoia, since misdetecting an
5489 * initrd can have very bad consequences due to the initrd
5490 * emptying when transitioning to the main systemd.
5493 saved = access("/etc/initrd-release", F_OK) >= 0 &&
5494 statfs("/", &s) >= 0 &&
5495 is_temporary_fs(&s);
5500 void warn_melody(void) {
5501 _cleanup_close_ int fd = -1;
5503 fd = open("/dev/console", O_WRONLY|O_CLOEXEC|O_NOCTTY);
5507 /* Yeah, this is synchronous. Kinda sucks. But well... */
5509 ioctl(fd, KIOCSOUND, (int)(1193180/440));
5510 usleep(125*USEC_PER_MSEC);
5512 ioctl(fd, KIOCSOUND, (int)(1193180/220));
5513 usleep(125*USEC_PER_MSEC);
5515 ioctl(fd, KIOCSOUND, (int)(1193180/220));
5516 usleep(125*USEC_PER_MSEC);
5518 ioctl(fd, KIOCSOUND, 0);
5521 int make_console_stdio(void) {
5524 /* Make /dev/console the controlling terminal and stdin/stdout/stderr */
5526 fd = acquire_terminal("/dev/console", false, true, true, USEC_INFINITY);
5528 return log_error_errno(fd, "Failed to acquire terminal: %m");
5532 return log_error_errno(r, "Failed to duplicate terminal fd: %m");
5537 int get_home_dir(char **_h) {
5545 /* Take the user specified one */
5546 e = secure_getenv("HOME");
5547 if (e && path_is_absolute(e)) {
5556 /* Hardcode home directory for root to avoid NSS */
5559 h = strdup("/root");
5567 /* Check the database... */
5571 return errno > 0 ? -errno : -ESRCH;
5573 if (!path_is_absolute(p->pw_dir))
5576 h = strdup(p->pw_dir);
5584 int get_shell(char **_s) {
5592 /* Take the user specified one */
5593 e = getenv("SHELL");
5603 /* Hardcode shell for root to avoid NSS */
5606 s = strdup("/bin/sh");
5614 /* Check the database... */
5618 return errno > 0 ? -errno : -ESRCH;
5620 if (!path_is_absolute(p->pw_shell))
5623 s = strdup(p->pw_shell);
5631 bool filename_is_valid(const char *p) {
5645 if (strlen(p) > FILENAME_MAX)
5651 bool string_is_safe(const char *p) {
5657 for (t = p; *t; t++) {
5658 if (*t > 0 && *t < ' ')
5661 if (strchr("\\\"\'\0x7f", *t))
5669 * Check if a string contains control characters. If 'ok' is non-NULL
5670 * it may be a string containing additional CCs to be considered OK.
5672 bool string_has_cc(const char *p, const char *ok) {
5677 for (t = p; *t; t++) {
5678 if (ok && strchr(ok, *t))
5681 if (*t > 0 && *t < ' ')
5691 bool path_is_safe(const char *p) {
5696 if (streq(p, "..") || startswith(p, "../") || endswith(p, "/..") || strstr(p, "/../"))
5699 if (strlen(p) > PATH_MAX)
5702 /* The following two checks are not really dangerous, but hey, they still are confusing */
5703 if (streq(p, ".") || startswith(p, "./") || endswith(p, "/.") || strstr(p, "/./"))
5706 if (strstr(p, "//"))
5712 /* hey glibc, APIs with callbacks without a user pointer are so useless */
5713 void *xbsearch_r(const void *key, const void *base, size_t nmemb, size_t size,
5714 int (*compar) (const void *, const void *, void *), void *arg) {
5723 p = (void *)(((const char *) base) + (idx * size));
5724 comparison = compar(key, p, arg);
5727 else if (comparison > 0)
5735 bool is_locale_utf8(void) {
5737 static int cached_answer = -1;
5739 if (cached_answer >= 0)
5742 if (!setlocale(LC_ALL, "")) {
5743 cached_answer = true;
5747 set = nl_langinfo(CODESET);
5749 cached_answer = true;
5753 if (streq(set, "UTF-8")) {
5754 cached_answer = true;
5758 /* For LC_CTYPE=="C" return true, because CTYPE is effectively
5759 * unset and everything can do UTF-8 nowadays. */
5760 set = setlocale(LC_CTYPE, NULL);
5762 cached_answer = true;
5766 /* Check result, but ignore the result if C was set
5770 !getenv("LC_ALL") &&
5771 !getenv("LC_CTYPE") &&
5775 return (bool) cached_answer;
5778 const char *draw_special_char(DrawSpecialChar ch) {
5779 static const char *draw_table[2][_DRAW_SPECIAL_CHAR_MAX] = {
5782 [DRAW_TREE_VERTICAL] = "\342\224\202 ", /* │ */
5783 [DRAW_TREE_BRANCH] = "\342\224\234\342\224\200", /* ├─ */
5784 [DRAW_TREE_RIGHT] = "\342\224\224\342\224\200", /* └─ */
5785 [DRAW_TREE_SPACE] = " ", /* */
5786 [DRAW_TRIANGULAR_BULLET] = "\342\200\243", /* ‣ */
5787 [DRAW_BLACK_CIRCLE] = "\342\227\217", /* ● */
5788 [DRAW_ARROW] = "\342\206\222", /* → */
5789 [DRAW_DASH] = "\342\200\223", /* – */
5792 /* ASCII fallback */ {
5793 [DRAW_TREE_VERTICAL] = "| ",
5794 [DRAW_TREE_BRANCH] = "|-",
5795 [DRAW_TREE_RIGHT] = "`-",
5796 [DRAW_TREE_SPACE] = " ",
5797 [DRAW_TRIANGULAR_BULLET] = ">",
5798 [DRAW_BLACK_CIRCLE] = "*",
5799 [DRAW_ARROW] = "->",
5804 return draw_table[!is_locale_utf8()][ch];
5807 char *strreplace(const char *text, const char *old_string, const char *new_string) {
5810 size_t l, old_len, new_len;
5816 old_len = strlen(old_string);
5817 new_len = strlen(new_string);
5830 if (!startswith(f, old_string)) {
5836 nl = l - old_len + new_len;
5837 a = realloc(r, nl + 1);
5845 t = stpcpy(t, new_string);
5857 char *strip_tab_ansi(char **ibuf, size_t *_isz) {
5858 const char *i, *begin = NULL;
5863 } state = STATE_OTHER;
5865 size_t osz = 0, isz;
5871 /* Strips ANSI color and replaces TABs by 8 spaces */
5873 isz = _isz ? *_isz : strlen(*ibuf);
5875 f = open_memstream(&obuf, &osz);
5879 for (i = *ibuf; i < *ibuf + isz + 1; i++) {
5884 if (i >= *ibuf + isz) /* EOT */
5886 else if (*i == '\x1B')
5887 state = STATE_ESCAPE;
5888 else if (*i == '\t')
5895 if (i >= *ibuf + isz) { /* EOT */
5898 } else if (*i == '[') {
5899 state = STATE_BRACKET;
5904 state = STATE_OTHER;
5911 if (i >= *ibuf + isz || /* EOT */
5912 (!(*i >= '0' && *i <= '9') && *i != ';' && *i != 'm')) {
5915 state = STATE_OTHER;
5917 } else if (*i == 'm')
5918 state = STATE_OTHER;
5940 int on_ac_power(void) {
5941 bool found_offline = false, found_online = false;
5942 _cleanup_closedir_ DIR *d = NULL;
5944 d = opendir("/sys/class/power_supply");
5950 _cleanup_close_ int fd = -1, device = -1;
5956 if (!de && errno != 0)
5962 if (hidden_file(de->d_name))
5965 device = openat(dirfd(d), de->d_name, O_DIRECTORY|O_RDONLY|O_CLOEXEC|O_NOCTTY);
5967 if (errno == ENOENT || errno == ENOTDIR)
5973 fd = openat(device, "type", O_RDONLY|O_CLOEXEC|O_NOCTTY);
5975 if (errno == ENOENT)
5981 n = read(fd, contents, sizeof(contents));
5985 if (n != 6 || memcmp(contents, "Mains\n", 6))
5989 fd = openat(device, "online", O_RDONLY|O_CLOEXEC|O_NOCTTY);
5991 if (errno == ENOENT)
5997 n = read(fd, contents, sizeof(contents));
6001 if (n != 2 || contents[1] != '\n')
6004 if (contents[0] == '1') {
6005 found_online = true;
6007 } else if (contents[0] == '0')
6008 found_offline = true;
6013 return found_online || !found_offline;
6016 static int search_and_fopen_internal(const char *path, const char *mode, const char *root, char **search, FILE **_f) {
6023 if (!path_strv_resolve_uniq(search, root))
6026 STRV_FOREACH(i, search) {
6027 _cleanup_free_ char *p = NULL;
6031 p = strjoin(root, *i, "/", path, NULL);
6033 p = strjoin(*i, "/", path, NULL);
6043 if (errno != ENOENT)
6050 int search_and_fopen(const char *path, const char *mode, const char *root, const char **search, FILE **_f) {
6051 _cleanup_strv_free_ char **copy = NULL;
6057 if (path_is_absolute(path)) {
6060 f = fopen(path, mode);
6069 copy = strv_copy((char**) search);
6073 return search_and_fopen_internal(path, mode, root, copy, _f);
6076 int search_and_fopen_nulstr(const char *path, const char *mode, const char *root, const char *search, FILE **_f) {
6077 _cleanup_strv_free_ char **s = NULL;
6079 if (path_is_absolute(path)) {
6082 f = fopen(path, mode);
6091 s = strv_split_nulstr(search);
6095 return search_and_fopen_internal(path, mode, root, s, _f);
6098 char *strextend(char **x, ...) {
6105 l = f = *x ? strlen(*x) : 0;
6112 t = va_arg(ap, const char *);
6117 if (n > ((size_t) -1) - l) {
6126 r = realloc(*x, l+1);
6136 t = va_arg(ap, const char *);
6150 char *strrep(const char *s, unsigned n) {
6158 p = r = malloc(l * n + 1);
6162 for (i = 0; i < n; i++)
6169 void* greedy_realloc(void **p, size_t *allocated, size_t need, size_t size) {
6176 if (*allocated >= need)
6179 newalloc = MAX(need * 2, 64u / size);
6180 a = newalloc * size;
6182 /* check for overflows */
6183 if (a < size * need)
6191 *allocated = newalloc;
6195 void* greedy_realloc0(void **p, size_t *allocated, size_t need, size_t size) {
6204 q = greedy_realloc(p, allocated, need, size);
6208 if (*allocated > prev)
6209 memzero(q + prev * size, (*allocated - prev) * size);
6214 bool id128_is_valid(const char *s) {
6220 /* Simple formatted 128bit hex string */
6222 for (i = 0; i < l; i++) {
6225 if (!(c >= '0' && c <= '9') &&
6226 !(c >= 'a' && c <= 'z') &&
6227 !(c >= 'A' && c <= 'Z'))
6231 } else if (l == 36) {
6233 /* Formatted UUID */
6235 for (i = 0; i < l; i++) {
6238 if ((i == 8 || i == 13 || i == 18 || i == 23)) {
6242 if (!(c >= '0' && c <= '9') &&
6243 !(c >= 'a' && c <= 'z') &&
6244 !(c >= 'A' && c <= 'Z'))
6255 int split_pair(const char *s, const char *sep, char **l, char **r) {
6270 a = strndup(s, x - s);
6274 b = strdup(x + strlen(sep));
6286 int shall_restore_state(void) {
6287 _cleanup_free_ char *value = NULL;
6290 r = get_proc_cmdline_key("systemd.restore_state=", &value);
6296 return parse_boolean(value) != 0;
6299 int proc_cmdline(char **ret) {
6302 if (detect_container(NULL) > 0)
6303 return get_process_cmdline(1, 0, false, ret);
6305 return read_one_line_file("/proc/cmdline", ret);
6308 int parse_proc_cmdline(int (*parse_item)(const char *key, const char *value)) {
6309 _cleanup_free_ char *line = NULL;
6315 r = proc_cmdline(&line);
6321 _cleanup_free_ char *word = NULL;
6324 r = unquote_first_word(&p, &word, true);
6330 /* Filter out arguments that are intended only for the
6332 if (!in_initrd() && startswith(word, "rd."))
6335 value = strchr(word, '=');
6339 r = parse_item(word, value);
6347 int get_proc_cmdline_key(const char *key, char **value) {
6348 _cleanup_free_ char *line = NULL, *ret = NULL;
6355 r = proc_cmdline(&line);
6361 _cleanup_free_ char *word = NULL;
6364 r = unquote_first_word(&p, &word, true);
6370 /* Filter out arguments that are intended only for the
6372 if (!in_initrd() && startswith(word, "rd."))
6376 e = startswith(word, key);
6380 r = free_and_strdup(&ret, e);
6386 if (streq(word, key))
6400 int container_get_leader(const char *machine, pid_t *pid) {
6401 _cleanup_free_ char *s = NULL, *class = NULL;
6409 p = strappenda("/run/systemd/machines/", machine);
6410 r = parse_env_file(p, NEWLINE, "LEADER", &s, "CLASS", &class, NULL);
6418 if (!streq_ptr(class, "container"))
6421 r = parse_pid(s, &leader);
6431 int namespace_open(pid_t pid, int *pidns_fd, int *mntns_fd, int *netns_fd, int *root_fd) {
6432 _cleanup_close_ int pidnsfd = -1, mntnsfd = -1, netnsfd = -1;
6440 mntns = procfs_file_alloca(pid, "ns/mnt");
6441 mntnsfd = open(mntns, O_RDONLY|O_NOCTTY|O_CLOEXEC);
6449 pidns = procfs_file_alloca(pid, "ns/pid");
6450 pidnsfd = open(pidns, O_RDONLY|O_NOCTTY|O_CLOEXEC);
6458 netns = procfs_file_alloca(pid, "ns/net");
6459 netnsfd = open(netns, O_RDONLY|O_NOCTTY|O_CLOEXEC);
6467 root = procfs_file_alloca(pid, "root");
6468 rfd = open(root, O_RDONLY|O_NOCTTY|O_CLOEXEC|O_DIRECTORY);
6474 *pidns_fd = pidnsfd;
6477 *mntns_fd = mntnsfd;
6480 *netns_fd = netnsfd;
6485 pidnsfd = mntnsfd = netnsfd = -1;
6490 int namespace_enter(int pidns_fd, int mntns_fd, int netns_fd, int root_fd) {
6493 if (setns(pidns_fd, CLONE_NEWPID) < 0)
6497 if (setns(mntns_fd, CLONE_NEWNS) < 0)
6501 if (setns(netns_fd, CLONE_NEWNET) < 0)
6505 if (fchdir(root_fd) < 0)
6508 if (chroot(".") < 0)
6512 if (setresgid(0, 0, 0) < 0)
6515 if (setgroups(0, NULL) < 0)
6518 if (setresuid(0, 0, 0) < 0)
6524 bool pid_is_unwaited(pid_t pid) {
6525 /* Checks whether a PID is still valid at all, including a zombie */
6530 if (kill(pid, 0) >= 0)
6533 return errno != ESRCH;
6536 bool pid_is_alive(pid_t pid) {
6539 /* Checks whether a PID is still valid and not a zombie */
6544 r = get_process_state(pid);
6545 if (r == -ENOENT || r == 'Z')
6551 int getpeercred(int fd, struct ucred *ucred) {
6552 socklen_t n = sizeof(struct ucred);
6559 r = getsockopt(fd, SOL_SOCKET, SO_PEERCRED, &u, &n);
6563 if (n != sizeof(struct ucred))
6566 /* Check if the data is actually useful and not suppressed due
6567 * to namespacing issues */
6570 if (u.uid == UID_INVALID)
6572 if (u.gid == GID_INVALID)
6579 int getpeersec(int fd, char **ret) {
6591 r = getsockopt(fd, SOL_SOCKET, SO_PEERSEC, s, &n);
6595 if (errno != ERANGE)
6602 r = getsockopt(fd, SOL_SOCKET, SO_PEERSEC, s, &n);
6618 /* This is much like mkostemp() but is subject to umask(). */
6619 int mkostemp_safe(char *pattern, int flags) {
6620 _cleanup_umask_ mode_t u;
6627 fd = mkostemp(pattern, flags);
6634 int open_tmpfile(const char *path, int flags) {
6641 /* Try O_TMPFILE first, if it is supported */
6642 fd = open(path, flags|O_TMPFILE, S_IRUSR|S_IWUSR);
6647 /* Fall back to unguessable name + unlinking */
6648 p = strappenda(path, "/systemd-tmp-XXXXXX");
6650 fd = mkostemp_safe(p, flags);
6658 int fd_warn_permissions(const char *path, int fd) {
6661 if (fstat(fd, &st) < 0)
6664 if (st.st_mode & 0111)
6665 log_warning("Configuration file %s is marked executable. Please remove executable permission bits. Proceeding anyway.", path);
6667 if (st.st_mode & 0002)
6668 log_warning("Configuration file %s is marked world-writable. Please remove world writability permission bits. Proceeding anyway.", path);
6670 if (getpid() == 1 && (st.st_mode & 0044) != 0044)
6671 log_warning("Configuration file %s is marked world-inaccessible. This has no effect as configuration data is accessible via APIs without restrictions. Proceeding anyway.", path);
6676 unsigned long personality_from_string(const char *p) {
6678 /* Parse a personality specifier. We introduce our own
6679 * identifiers that indicate specific ABIs, rather than just
6680 * hints regarding the register size, since we want to keep
6681 * things open for multiple locally supported ABIs for the
6682 * same register size. We try to reuse the ABI identifiers
6683 * used by libseccomp. */
6685 #if defined(__x86_64__)
6687 if (streq(p, "x86"))
6690 if (streq(p, "x86-64"))
6693 #elif defined(__i386__)
6695 if (streq(p, "x86"))
6699 /* personality(7) documents that 0xffffffffUL is used for
6700 * querying the current personality, hence let's use that here
6701 * as error indicator. */
6702 return 0xffffffffUL;
6705 const char* personality_to_string(unsigned long p) {
6707 #if defined(__x86_64__)
6709 if (p == PER_LINUX32)
6715 #elif defined(__i386__)
6724 uint64_t physical_memory(void) {
6727 /* We return this as uint64_t in case we are running as 32bit
6728 * process on a 64bit kernel with huge amounts of memory */
6730 mem = sysconf(_SC_PHYS_PAGES);
6733 return (uint64_t) mem * (uint64_t) page_size();
6736 void hexdump(FILE *f, const void *p, size_t s) {
6737 const uint8_t *b = p;
6740 assert(s == 0 || b);
6745 fprintf(f, "%04x ", n);
6747 for (i = 0; i < 16; i++) {
6752 fprintf(f, "%02x ", b[i]);
6760 for (i = 0; i < 16; i++) {
6765 fputc(isprint(b[i]) ? (char) b[i] : '.', f);
6779 int update_reboot_param_file(const char *param) {
6784 r = write_string_file(REBOOT_PARAM_FILE, param);
6786 log_error("Failed to write reboot param to "
6787 REBOOT_PARAM_FILE": %s", strerror(-r));
6789 unlink(REBOOT_PARAM_FILE);
6794 int umount_recursive(const char *prefix, int flags) {
6798 /* Try to umount everything recursively below a
6799 * directory. Also, take care of stacked mounts, and keep
6800 * unmounting them until they are gone. */
6803 _cleanup_fclose_ FILE *proc_self_mountinfo = NULL;
6808 proc_self_mountinfo = fopen("/proc/self/mountinfo", "re");
6809 if (!proc_self_mountinfo)
6813 _cleanup_free_ char *path = NULL, *p = NULL;
6816 k = fscanf(proc_self_mountinfo,
6817 "%*s " /* (1) mount id */
6818 "%*s " /* (2) parent id */
6819 "%*s " /* (3) major:minor */
6820 "%*s " /* (4) root */
6821 "%ms " /* (5) mount point */
6822 "%*s" /* (6) mount options */
6823 "%*[^-]" /* (7) optional fields */
6824 "- " /* (8) separator */
6825 "%*s " /* (9) file system type */
6826 "%*s" /* (10) mount source */
6827 "%*s" /* (11) mount options 2 */
6828 "%*[^\n]", /* some rubbish at the end */
6837 p = cunescape(path);
6841 if (!path_startswith(p, prefix))
6844 if (umount2(p, flags) < 0) {
6860 static int get_mount_flags(const char *path, unsigned long *flags) {
6863 if (statvfs(path, &buf) < 0)
6865 *flags = buf.f_flag;
6869 int bind_remount_recursive(const char *prefix, bool ro) {
6870 _cleanup_set_free_free_ Set *done = NULL;
6871 _cleanup_free_ char *cleaned = NULL;
6874 /* Recursively remount a directory (and all its submounts)
6875 * read-only or read-write. If the directory is already
6876 * mounted, we reuse the mount and simply mark it
6877 * MS_BIND|MS_RDONLY (or remove the MS_RDONLY for read-write
6878 * operation). If it isn't we first make it one. Afterwards we
6879 * apply MS_BIND|MS_RDONLY (or remove MS_RDONLY) to all
6880 * submounts we can access, too. When mounts are stacked on
6881 * the same mount point we only care for each individual
6882 * "top-level" mount on each point, as we cannot
6883 * influence/access the underlying mounts anyway. We do not
6884 * have any effect on future submounts that might get
6885 * propagated, they might be writable. This includes future
6886 * submounts that have been triggered via autofs. */
6888 cleaned = strdup(prefix);
6892 path_kill_slashes(cleaned);
6894 done = set_new(&string_hash_ops);
6899 _cleanup_fclose_ FILE *proc_self_mountinfo = NULL;
6900 _cleanup_set_free_free_ Set *todo = NULL;
6901 bool top_autofs = false;
6903 unsigned long orig_flags;
6905 todo = set_new(&string_hash_ops);
6909 proc_self_mountinfo = fopen("/proc/self/mountinfo", "re");
6910 if (!proc_self_mountinfo)
6914 _cleanup_free_ char *path = NULL, *p = NULL, *type = NULL;
6917 k = fscanf(proc_self_mountinfo,
6918 "%*s " /* (1) mount id */
6919 "%*s " /* (2) parent id */
6920 "%*s " /* (3) major:minor */
6921 "%*s " /* (4) root */
6922 "%ms " /* (5) mount point */
6923 "%*s" /* (6) mount options (superblock) */
6924 "%*[^-]" /* (7) optional fields */
6925 "- " /* (8) separator */
6926 "%ms " /* (9) file system type */
6927 "%*s" /* (10) mount source */
6928 "%*s" /* (11) mount options (bind mount) */
6929 "%*[^\n]", /* some rubbish at the end */
6939 p = cunescape(path);
6943 /* Let's ignore autofs mounts. If they aren't
6944 * triggered yet, we want to avoid triggering
6945 * them, as we don't make any guarantees for
6946 * future submounts anyway. If they are
6947 * already triggered, then we will find
6948 * another entry for this. */
6949 if (streq(type, "autofs")) {
6950 top_autofs = top_autofs || path_equal(cleaned, p);
6954 if (path_startswith(p, cleaned) &&
6955 !set_contains(done, p)) {
6957 r = set_consume(todo, p);
6967 /* If we have no submounts to process anymore and if
6968 * the root is either already done, or an autofs, we
6970 if (set_isempty(todo) &&
6971 (top_autofs || set_contains(done, cleaned)))
6974 if (!set_contains(done, cleaned) &&
6975 !set_contains(todo, cleaned)) {
6976 /* The prefix directory itself is not yet a
6977 * mount, make it one. */
6978 if (mount(cleaned, cleaned, NULL, MS_BIND|MS_REC, NULL) < 0)
6982 (void) get_mount_flags(cleaned, &orig_flags);
6983 orig_flags &= ~MS_RDONLY;
6985 if (mount(NULL, prefix, NULL, orig_flags|MS_BIND|MS_REMOUNT|(ro ? MS_RDONLY : 0), NULL) < 0)
6988 x = strdup(cleaned);
6992 r = set_consume(done, x);
6997 while ((x = set_steal_first(todo))) {
6999 r = set_consume(done, x);
7005 /* Try to reuse the original flag set, but
7006 * don't care for errors, in case of
7007 * obstructed mounts */
7009 (void) get_mount_flags(x, &orig_flags);
7010 orig_flags &= ~MS_RDONLY;
7012 if (mount(NULL, x, NULL, orig_flags|MS_BIND|MS_REMOUNT|(ro ? MS_RDONLY : 0), NULL) < 0) {
7014 /* Deal with mount points that are
7015 * obstructed by a later mount */
7017 if (errno != ENOENT)
7025 int fflush_and_check(FILE *f) {
7032 return errno ? -errno : -EIO;
7037 int tempfn_xxxxxx(const char *p, char **ret) {
7049 * /foo/bar/.#waldoXXXXXX
7053 if (!filename_is_valid(fn))
7056 t = new(char, strlen(p) + 2 + 6 + 1);
7060 strcpy(stpcpy(stpcpy(mempcpy(t, p, fn - p), ".#"), fn), "XXXXXX");
7062 *ret = path_kill_slashes(t);
7066 int tempfn_random(const char *p, char **ret) {
7080 * /foo/bar/.#waldobaa2a261115984a9
7084 if (!filename_is_valid(fn))
7087 t = new(char, strlen(p) + 2 + 16 + 1);
7091 x = stpcpy(stpcpy(mempcpy(t, p, fn - p), ".#"), fn);
7094 for (i = 0; i < 16; i++) {
7095 *(x++) = hexchar(u & 0xF);
7101 *ret = path_kill_slashes(t);
7105 int tempfn_random_child(const char *p, char **ret) {
7116 * /foo/bar/waldo/.#3c2b6219aa75d7d0
7119 t = new(char, strlen(p) + 3 + 16 + 1);
7123 x = stpcpy(stpcpy(t, p), "/.#");
7126 for (i = 0; i < 16; i++) {
7127 *(x++) = hexchar(u & 0xF);
7133 *ret = path_kill_slashes(t);
7137 /* Check whether the hostname refers to the local host */
7138 bool is_localhost(const char *hostname) {
7141 /* This tries to identify local host and domain names
7142 * described in RFC6761 plus the redhatism of .localdomain */
7144 return streq(hostname, "localhost") ||
7145 streq(hostname, "localhost.") ||
7146 streq(hostname, "localdomain.") ||
7147 streq(hostname, "localdomain") ||
7148 endswith(hostname, ".localhost") ||
7149 endswith(hostname, ".localhost.") ||
7150 endswith(hostname, ".localdomain") ||
7151 endswith(hostname, ".localdomain.");
7154 int take_password_lock(const char *root) {
7156 struct flock flock = {
7158 .l_whence = SEEK_SET,
7166 /* This is roughly the same as lckpwdf(), but not as awful. We
7167 * don't want to use alarm() and signals, hence we implement
7168 * our own trivial version of this.
7170 * Note that shadow-utils also takes per-database locks in
7171 * addition to lckpwdf(). However, we don't, given that they
7172 * are redundant as they invoke lckpwdf() first and keep
7173 * it during everything they do. The per-database locks are
7174 * awfully racy, and thus we just won't do them. */
7177 path = strappenda(root, "/etc/.pwd.lock");
7179 path = "/etc/.pwd.lock";
7181 fd = open(path, O_WRONLY|O_CREAT|O_CLOEXEC|O_NOCTTY|O_NOFOLLOW, 0600);
7185 r = fcntl(fd, F_SETLKW, &flock);
7194 int is_symlink(const char *path) {
7197 if (lstat(path, &info) < 0)
7200 return !!S_ISLNK(info.st_mode);
7203 int is_dir(const char* path, bool follow) {
7208 r = stat(path, &st);
7210 r = lstat(path, &st);
7214 return !!S_ISDIR(st.st_mode);
7217 int unquote_first_word(const char **p, char **ret, bool relax) {
7218 _cleanup_free_ char *s = NULL;
7219 size_t allocated = 0, sz = 0;
7226 SINGLE_QUOTE_ESCAPE,
7228 DOUBLE_QUOTE_ESCAPE,
7236 /* Parses the first word of a string, and returns it in
7237 * *ret. Removes all quotes in the process. When parsing fails
7238 * (because of an uneven number of quotes or similar), leaves
7239 * the pointer *p at the first invalid character. */
7249 else if (strchr(WHITESPACE, c))
7259 state = SINGLE_QUOTE;
7261 state = VALUE_ESCAPE;
7263 state = DOUBLE_QUOTE;
7264 else if (strchr(WHITESPACE, c))
7267 if (!GREEDY_REALLOC(s, allocated, sz+2))
7282 if (!GREEDY_REALLOC(s, allocated, sz+2))
7295 } else if (c == '\'')
7298 state = SINGLE_QUOTE_ESCAPE;
7300 if (!GREEDY_REALLOC(s, allocated, sz+2))
7308 case SINGLE_QUOTE_ESCAPE:
7315 if (!GREEDY_REALLOC(s, allocated, sz+2))
7319 state = SINGLE_QUOTE;
7328 state = DOUBLE_QUOTE_ESCAPE;
7330 if (!GREEDY_REALLOC(s, allocated, sz+2))
7338 case DOUBLE_QUOTE_ESCAPE:
7345 if (!GREEDY_REALLOC(s, allocated, sz+2))
7349 state = DOUBLE_QUOTE;
7355 if (!strchr(WHITESPACE, c))
/* Variadic front-end to unquote_first_word(): parses several words from
 * *p in one call. The variable arguments are "char **" output locations.
 * They are walked once to count the expected words and a second time to
 * hand out the results. In between, the words are collected in a
 * temporary array obtained from newa0(), each one parsed with
 * relax == false.
 * NOTE(review): the argument list is presumably terminated by a NULL
 * entry, and the return value is presumably the number of words parsed or
 * a negative errno; confirm. */
7377 int unquote_many_words(const char **p, ...) {
7382 /* Parses a number of words from a string, stripping any
7383 * quotes if necessary. */
7387 /* Count how many words are expected */
7390 if (!va_arg(ap, char **))
7399 /* Read all words into a temporary array */
7400 l = newa0(char*, n);
7401 for (c = 0; c < n; c++) {
7403 r = unquote_first_word(p, &l[c], false);
/* NOTE(review): this loop over the entries below c presumably frees the
 * words parsed so far when the current one failed; confirm. */
7407 for (j = 0; j < c; j++)
7417 /* If we managed to parse all words, return them in the passed
7420 for (i = 0; i < n; i++) {
7423 v = va_arg(ap, char **);
/* Stores a copy of s in *p in place of the string previously held there.
 * NOTE(review): the handling of a NULL s, of allocation failure and the
 * return values are not evident here; confirm before relying on them. */
7433 int free_and_strdup(char **p, const char *s) {
7438 /* Replaces a string pointer with an strdup()ed new string,
7439 * possibly freeing the old one. */
/* Sets the system hostname to s. The current name is first read with
 * gethostname() into a zero-initialized buffer of HOST_NAME_MAX + 1 bytes.
 * NOTE(review): as the function name suggests, sethostname() is presumably
 * skipped when the current name already equals s; confirm, along with the
 * return values. */
7454 int sethostname_idempotent(const char *s) {
7456 char buf[HOST_NAME_MAX + 1] = {};
7460 r = gethostname(buf, sizeof(buf));
/* The length handed to sethostname() excludes the terminating NUL. */
7467 r = sethostname(s, strlen(s));
/* Looks up the name of the slave pseudo-terminal that belongs to the
 * master fd by calling ptsname_r() with the buffer c of size l.
 * NOTE(review): ERANGE is singled out below, so the buffer is presumably
 * enlarged and the call retried in that case, with the final string
 * handed back in *ret; confirm. */
7474 int ptsname_malloc(int fd, char **ret) {
7487 if (ptsname_r(fd, c, l) == 0) {
7491 if (errno != ERANGE) {
/* Opens a pty master with posix_openpt(flags) from within the namespaces
 * of process pid and transfers the resulting fd to the calling process.
 * The work is done in a child process: it enters the namespaces obtained
 * through namespace_open(), opens the master and sends it over a socket
 * pair as SCM_RIGHTS ancillary data. The parent waits for the child,
 * checks for a clean EXIT_SUCCESS exit and then looks for the fd in the
 * received control messages.
 * NOTE(review): presumably returns the received fd, or a negative errno
 * on failure; confirm. */
7501 int openpt_in_namespace(pid_t pid, int flags) {
7502 _cleanup_close_ int pidnsfd = -1, mntnsfd = -1, rootfd = -1;
7503 _cleanup_close_pair_ int pair[2] = { -1, -1 };
7505 struct cmsghdr cmsghdr;
/* Ancillary data buffer with room for a single int, i.e. one fd. */
7506 uint8_t buf[CMSG_SPACE(sizeof(int))];
7508 struct msghdr mh = {
7509 .msg_control = &control,
7510 .msg_controllen = sizeof(control),
7512 struct cmsghdr *cmsg;
/* The network namespace slot is passed as NULL, i.e. it is not requested. */
7519 r = namespace_open(pid, &pidnsfd, &mntnsfd, NULL, &rootfd);
7523 if (socketpair(AF_UNIX, SOCK_DGRAM, 0, pair) < 0)
/* Child side: the receiving end pair[0] is not needed here. */
7533 pair[0] = safe_close(pair[0]);
7535 r = namespace_enter(pidnsfd, mntnsfd, -1, rootfd);
7537 _exit(EXIT_FAILURE);
7539 master = posix_openpt(flags);
7541 _exit(EXIT_FAILURE);
/* Build one SCM_RIGHTS control message that carries the master fd. */
7543 cmsg = CMSG_FIRSTHDR(&mh);
7544 cmsg->cmsg_level = SOL_SOCKET;
7545 cmsg->cmsg_type = SCM_RIGHTS;
7546 cmsg->cmsg_len = CMSG_LEN(sizeof(int));
7547 memcpy(CMSG_DATA(cmsg), &master, sizeof(int));
/* Trim the control length to the one header that was filled in. */
7549 mh.msg_controllen = cmsg->cmsg_len;
7551 if (sendmsg(pair[1], &mh, MSG_NOSIGNAL) < 0)
7552 _exit(EXIT_FAILURE);
7554 _exit(EXIT_SUCCESS);
/* Parent side: the sending end pair[1] is not needed here. */
7557 pair[1] = safe_close(pair[1]);
7559 r = wait_for_terminate(child, &si);
/* Anything but a regular exit with EXIT_SUCCESS counts as failure. */
7562 if (si.si_code != CLD_EXITED || si.si_status != EXIT_SUCCESS)
/* MSG_CMSG_CLOEXEC marks the received fd close-on-exec. */
7565 if (recvmsg(pair[0], &mh, MSG_NOSIGNAL|MSG_CMSG_CLOEXEC) < 0)
7568 for (cmsg = CMSG_FIRSTHDR(&mh); cmsg; cmsg = CMSG_NXTHDR(&mh, cmsg))
7569 if (cmsg->cmsg_level == SOL_SOCKET && cmsg->cmsg_type == SCM_RIGHTS) {
7573 fds = (int*) CMSG_DATA(cmsg);
/* Number of fds in this message: payload size divided by sizeof(int). */
7574 n_fds = (cmsg->cmsg_len - CMSG_LEN(0)) / sizeof(int);
/* NOTE(review): presumably reached when an unexpected number of fds was
 * received, so that none of them leaks; confirm. */
7577 close_many(fds, n_fds);
/* Reads the extended attribute "attribute" of the file "filename", which
 * is looked up relative to dirfd, into value (size bytes available). The
 * file is opened read-only with openat() and the attribute is then
 * fetched with fgetxattr() on that fd. AT_SYMLINK_NOFOLLOW in flags is
 * translated into O_NOFOLLOW for the open; O_NOATIME is always requested.
 * NOTE(review): presumably returns the attribute length or a negative
 * errno; confirm. */
7587 ssize_t fgetxattrat_fake(int dirfd, const char *filename, const char *attribute, void *value, size_t size, int flags) {
7588 _cleanup_close_ int fd = -1;
7591 /* The kernel doesn't have a fgetxattrat() command, hence let's emulate one */
7593 fd = openat(dirfd, filename, O_RDONLY|O_CLOEXEC|O_NOCTTY|O_NOATIME|(flags & AT_SYMLINK_NOFOLLOW ? O_NOFOLLOW : 0));
7597 l = fgetxattr(fd, attribute, value, size);
/* Helper shared by the *_getcrtime() functions: turns the raw le64_t
 * creation timestamp "le" into *usec. The values 0 and (uint64_t) -1 get
 * special treatment.
 * NOTE(review): u is presumably "le" converted to host byte order, and the
 * two special values are presumably rejected with an error; confirm. */
7604 static int parse_crtime(le64_t le, usec_t *usec) {
7610 if (u == 0 || u == (uint64_t) -1)
/* Reads the creation time of the file behind fd from its
 * "user.crtime_usec" extended attribute and decodes it into *usec with
 * parse_crtime(). The attribute must be exactly sizeof(le) bytes long.
 * NOTE(review): a read failure or a size mismatch presumably yields a
 * negative errno; confirm. */
7617 int fd_getcrtime(int fd, usec_t *usec) {
7624 /* Until Linux gets a real concept of birthtime/creation time,
7625 * let's fake one with xattrs */
7627 n = fgetxattr(fd, "user.crtime_usec", &le, sizeof(le));
7630 if (n != sizeof(le))
7633 return parse_crtime(le, usec);
/* Like fd_getcrtime(), but for the file "name" looked up relative to
 * dirfd: the "user.crtime_usec" extended attribute is read through
 * fgetxattrat_fake(), which also receives flags, and decoded into *usec
 * with parse_crtime(). The attribute must be exactly sizeof(le) bytes.
 * NOTE(review): a read failure or a size mismatch presumably yields a
 * negative errno; confirm. */
7636 int fd_getcrtime_at(int dirfd, const char *name, usec_t *usec, int flags) {
7640 n = fgetxattrat_fake(dirfd, name, "user.crtime_usec", &le, sizeof(le), flags);
7643 if (n != sizeof(le))
7646 return parse_crtime(le, usec);
/* Path-based counterpart of fd_getcrtime(): reads the "user.crtime_usec"
 * extended attribute of p with getxattr() and decodes it into *usec with
 * parse_crtime(). The attribute must be exactly sizeof(le) bytes long.
 * NOTE(review): a read failure or a size mismatch presumably yields a
 * negative errno; confirm. */
7649 int path_getcrtime(const char *p, usec_t *usec) {
7656 n = getxattr(p, "user.crtime_usec", &le, sizeof(le));
7659 if (n != sizeof(le))
7662 return parse_crtime(le, usec);
/* Records a creation time on fd by storing it as a little-endian 64-bit
 * value in the "user.crtime_usec" extended attribute.
 * NOTE(review): the current CLOCK_REALTIME time replaces usec under a
 * condition that is not evident here (presumably when the caller passed
 * no usable value); confirm, along with the return values. */
7665 int fd_setcrtime(int fd, usec_t usec) {
7671 usec = now(CLOCK_REALTIME);
7673 le = htole64((uint64_t) usec);
/* Flags 0: the attribute is created if missing and replaced otherwise. */
7674 if (fsetxattr(fd, "user.crtime_usec", &le, sizeof(le), 0) < 0)
/* Tells whether the file descriptors a and b refer to the same thing.
 * kcmp() with KCMP_FILE is tried first. When the kernel lacks it (ENOSYS)
 * the comparison falls back to fstat() data (file type, device, inode)
 * followed by the F_GETFL flags of both fds.
 * NOTE(review): presumably returns 1 (same), 0 (different) or a negative
 * errno; confirm. */
7680 int same_fd(int a, int b) {
7681 struct stat sta, stb;
7688 /* Compares two file descriptors. Note that semantics are
7689 * quite different depending on whether we have kcmp() or we
7690 * don't. If we have kcmp() this will only return true for
7691 * dup()ed file descriptors, but not otherwise. If we don't
7692 * have kcmp() this will also return true for two fds of the same
7693 * file, created by separate open() calls. Since we use this
7694 * call mostly for filtering out duplicates in the fd store
7695 * this difference hopefully doesn't matter too much. */
7700 /* Try to use kcmp() if we have it. */
/* The same pid is given twice: both fds are looked up in one process. */
7702 r = kcmp(pid, pid, KCMP_FILE, a, b);
7707 if (errno != ENOSYS)
7710 /* We don't have kcmp(), use fstat() instead. */
7711 if (fstat(a, &sta) < 0)
7714 if (fstat(b, &stb) < 0)
/* Compare the file type bits of both fds. */
7717 if ((sta.st_mode & S_IFMT) != (stb.st_mode & S_IFMT))
7720 /* We consider all device fds different, since two device fds
7721 * might refer to quite different device contexts even though
7722 * they share the same inode and backing dev_t. */
7724 if (S_ISCHR(sta.st_mode) || S_ISBLK(sta.st_mode))
/* Compare device and inode number of both fds. */
7727 if (sta.st_dev != stb.st_dev || sta.st_ino != stb.st_ino)
7730 /* The fds refer to the same inode on disk, let's also check
7731 * if they have the same fd flags. This is useful to
7732 * distuingish the read and write side of a pipe created with
7734 fa = fcntl(a, F_GETFL);
7738 fb = fcntl(b, F_GETFL);
/* Sets or clears the file attribute bits given in mask on fd, depending
 * on b. The current flags are read with FS_IOC_GETFLAGS and the new value
 * is written back with FS_IOC_SETFLAGS.
 * NOTE(review): presumably b == true sets the bits and b == false clears
 * them, and nothing is written when the value would not change; confirm,
 * along with the return values. */
7745 int chattr_fd(int fd, bool b, unsigned mask) {
7746 unsigned old_attr, new_attr;
7753 if (ioctl(fd, FS_IOC_GETFLAGS, &old_attr) < 0)
7757 new_attr = old_attr | mask;
7759 new_attr = old_attr & ~mask;
/* Check whether the requested state is already in effect. */
7761 if (new_attr == old_attr)
7764 if (ioctl(fd, FS_IOC_SETFLAGS, &new_attr) < 0)
/* Path-based variant of chattr_fd(): opens p read-only, refusing to follow
 * a symlink in the last path component (O_NOFOLLOW), and applies
 * chattr_fd() with the same b and mask to the resulting fd.
 * NOTE(review): an open() failure presumably yields a negative errno;
 * confirm. */
7770 int chattr_path(const char *p, bool b, unsigned mask) {
7771 _cleanup_close_ int fd = -1;
7778 fd = open(p, O_RDONLY|O_CLOEXEC|O_NOCTTY|O_NOFOLLOW);
7782 return chattr_fd(fd, b, mask);
/* Reads the file attribute flags of fd into *ret using the
 * FS_IOC_GETFLAGS ioctl.
 * NOTE(review): an ioctl() failure presumably yields a negative errno;
 * confirm. */
7785 int read_attr_fd(int fd, unsigned *ret) {
7788 if (ioctl(fd, FS_IOC_GETFLAGS, ret) < 0)
/* Path-based variant of read_attr_fd(): opens p read-only, refusing to
 * follow a symlink in the last path component (O_NOFOLLOW), and reads the
 * file attribute flags of the resulting fd into *ret.
 * NOTE(review): an open() failure presumably yields a negative errno;
 * confirm. */
7794 int read_attr_path(const char *p, unsigned *ret) {
7795 _cleanup_close_ int fd = -1;
7800 fd = open(p, O_RDONLY|O_CLOEXEC|O_NOCTTY|O_NOFOLLOW);
7804 return read_attr_fd(fd, ret);
/* Creates the lock file p if necessary (mode 0600) and takes a lock on it.
 * "operation" uses the flock() constants: LOCK_EX asks for a write lock,
 * anything else for a read lock, and LOCK_NB selects the non-blocking
 * request. Open file description locks (F_OFD_SETLK / F_OFD_SETLKW) are
 * tried first; flock() is the fallback when the kernel answers EINVAL.
 * After locking, the link count of the file is inspected so that a file
 * already removed by a previous owner is not used.
 * On success the lock is described in *ret (ret->operation is set here).
 * NOTE(review): after closing the fd of a removed file the procedure is
 * presumably retried from the open(); confirm. */
7807 int make_lock_file(const char *p, int operation, LockFile *ret) {
7808 _cleanup_close_ int fd = -1;
7809 _cleanup_free_ char *t = NULL;
7813 * We use UNPOSIX locks if they are available. They have nice
7814 * semantics, and are mostly compatible with NFS. However,
7815 * they are only available on new kernels. When we detect we
7816 * are running on an older kernel, then we fall back to good
7817 * old BSD locks. They also have nice semantics, but are
7818 * slightly problematic on NFS, where they are upgraded to
7819 * POSIX locks, even though locally they are orthogonal to
7829 .l_type = (operation & ~LOCK_NB) == LOCK_EX ? F_WRLCK : F_RDLCK,
7830 .l_whence = SEEK_SET,
7834 fd = open(p, O_CREAT|O_RDWR|O_NOFOLLOW|O_CLOEXEC|O_NOCTTY, 0600);
/* Non-blocking requests use F_OFD_SETLK, blocking ones F_OFD_SETLKW. */
7838 r = fcntl(fd, (operation & LOCK_NB) ? F_OFD_SETLK : F_OFD_SETLKW, &fl);
7841 /* If the kernel is too old, use good old BSD locks */
7842 if (errno == EINVAL)
7843 r = flock(fd, operation);
/* A contended non-blocking lock (EAGAIN) is reported as -EBUSY. */
7846 return errno == EAGAIN ? -EBUSY : -errno;
7849 /* If we acquired the lock, let's check if the file
7850 * still exists in the file system. If not, then the
7851 * previous exclusive owner removed it and then closed
7852 * it. In such a case our acquired lock is worthless,
7853 * hence try again. */
/* A positive link count means the file still has a name on disk. */
7858 if (st.st_nlink > 0)
7861 fd = safe_close(fd);
7866 ret->operation = operation;
/* Takes a lock on behalf of the file p by locking a companion file whose
 * name is ".#" + fn + ".lck", placed behind the same leading part of p.
 * The actual locking is delegated to make_lock_file().
 * NOTE(review): fn is presumably the last path component of p; an fn that
 * fails filename_is_valid() is presumably rejected with an error;
 * confirm. */
7874 int make_lock_file_for(const char *p, int operation, LockFile *ret) {
7882 if (!filename_is_valid(fn))
/* Room for p, ".#" (2), ".lck" (4) and the terminating NUL (1). */
7885 t = newa(char, strlen(p) + 2 + 4 + 1);
/* First fn - p bytes of p, then ".#", then fn, then ".lck". */
7886 stpcpy(stpcpy(stpcpy(mempcpy(t, p, fn - p), ".#"), fn), ".lck");
7888 return make_lock_file(t, operation, ret);
/* Releases the lock file described by f. A lock held in shared mode is
 * first tried to be upgraded, without blocking, to an exclusive one: an
 * open file description lock is attempted and flock() is the fallback
 * when the kernel answers EINVAL. When the lock is exclusive the lock
 * file is unlinked. The fd is closed afterwards.
 * NOTE(review): further cleanup of *f may follow the close; confirm. */
7891 void release_lock_file(LockFile *f) {
7899 /* If we are the exclusive owner we can safely delete
7900 * the lock file itself. If we are not the exclusive
7901 * owner, we can try becoming it. */
7904 (f->operation & ~LOCK_NB) == LOCK_SH) {
7905 static const struct flock fl = {
7907 .l_whence = SEEK_SET,
7910 r = fcntl(f->fd, F_OFD_SETLK, &fl);
7911 if (r < 0 && errno == EINVAL)
7912 r = flock(f->fd, LOCK_EX|LOCK_NB);
/* NOTE(review): presumably only reached when the upgrade succeeded;
 * confirm. */
7915 f->operation = LOCK_EX|LOCK_NB;
7918 if ((f->operation & ~LOCK_NB) == LOCK_EX)
7919 unlink_noerrno(f->path);
7925 f->fd = safe_close(f->fd);