1 /*-*- Mode: C; c-basic-offset: 8; indent-tabs-mode: nil -*-*/
4 This file is part of systemd.
6 Copyright 2010 Lennart Poettering
8 systemd is free software; you can redistribute it and/or modify it
9 under the terms of the GNU Lesser General Public License as published by
10 the Free Software Foundation; either version 2.1 of the License, or
11 (at your option) any later version.
13 systemd is distributed in the hope that it will be useful, but
14 WITHOUT ANY WARRANTY; without even the implied warranty of
15 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
16 Lesser General Public License for more details.
18 You should have received a copy of the GNU Lesser General Public License
19 along with systemd; If not, see <http://www.gnu.org/licenses/>.
32 #include <sys/resource.h>
33 #include <linux/sched.h>
34 #include <sys/types.h>
38 #include <sys/ioctl.h>
40 #include <linux/tiocl.h>
45 #include <sys/prctl.h>
46 #include <sys/utsname.h>
48 #include <netinet/ip.h>
56 #include <sys/mount.h>
57 #include <linux/magic.h>
61 #include <sys/personality.h>
62 #include <sys/xattr.h>
63 #include <sys/statvfs.h>
67 /* When we include libgen.h because we need dirname() we immediately
68 * undefine basename() since libgen.h defines it as a macro to the XDG
69 * version which is really broken. */
73 #ifdef HAVE_SYS_AUXV_H
85 #include "path-util.h"
86 #include "exit-status.h"
90 #include "device-nodes.h"
95 #include "sparse-endian.h"
98 char **saved_argv = NULL;
100 static volatile unsigned cached_columns = 0;
101 static volatile unsigned cached_lines = 0;
103 size_t page_size(void) {
104 static thread_local size_t pgsz = 0;
107 if (_likely_(pgsz > 0))
110 r = sysconf(_SC_PAGESIZE);
117 bool streq_ptr(const char *a, const char *b) {
119 /* Like streq(), but tries to make sense of NULL pointers */
130 char* endswith(const char *s, const char *postfix) {
137 pl = strlen(postfix);
140 return (char*) s + sl;
145 if (memcmp(s + sl - pl, postfix, pl) != 0)
148 return (char*) s + sl - pl;
151 char* first_word(const char *s, const char *word) {
158 /* Checks if the string starts with the specified word, either
159 * followed by NUL or by whitespace. Returns a pointer to the
160 * NUL or the first character after the whitespace. */
171 if (memcmp(s, word, wl) != 0)
178 if (!strchr(WHITESPACE, *p))
181 p += strspn(p, WHITESPACE);
185 static size_t cescape_char(char c, char *buf) {
186 char * buf_old = buf;
232 /* For special chars we prefer octal over
233 * hexadecimal encoding, simply because glib's
234 * g_strescape() does the same */
235 if ((c < ' ') || (c >= 127)) {
237 *(buf++) = octchar((unsigned char) c >> 6);
238 *(buf++) = octchar((unsigned char) c >> 3);
239 *(buf++) = octchar((unsigned char) c);
245 return buf - buf_old;
248 int close_nointr(int fd) {
255 * Just ignore EINTR; a retry loop is the wrong thing to do on
258 * http://lkml.indiana.edu/hypermail/linux/kernel/0509.1/0877.html
259 * https://bugzilla.gnome.org/show_bug.cgi?id=682819
260 * http://utcc.utoronto.ca/~cks/space/blog/unix/CloseEINTR
261 * https://sites.google.com/site/michaelsafyan/software-engineering/checkforeintrwheninvokingclosethinkagain
269 int safe_close(int fd) {
272 * Like close_nointr() but cannot fail. Guarantees errno is
273 * unchanged. Is a NOP with negative fds passed, and returns
274 * -1, so that it can be used in this syntax:
276 * fd = safe_close(fd);
282 /* The kernel might return pretty much any error code
283 * via close(), but the fd will be closed anyway. The
284 * only condition we want to check for here is whether
285 * the fd was invalid at all... */
287 assert_se(close_nointr(fd) != -EBADF);
293 void close_many(const int fds[], unsigned n_fd) {
296 assert(fds || n_fd <= 0);
298 for (i = 0; i < n_fd; i++)
302 int unlink_noerrno(const char *path) {
313 int parse_boolean(const char *v) {
316 if (streq(v, "1") || strcaseeq(v, "yes") || strcaseeq(v, "y") || strcaseeq(v, "true") || strcaseeq(v, "t") || strcaseeq(v, "on"))
318 else if (streq(v, "0") || strcaseeq(v, "no") || strcaseeq(v, "n") || strcaseeq(v, "false") || strcaseeq(v, "f") || strcaseeq(v, "off"))
324 int parse_pid(const char *s, pid_t* ret_pid) {
325 unsigned long ul = 0;
332 r = safe_atolu(s, &ul);
338 if ((unsigned long) pid != ul)
348 int parse_uid(const char *s, uid_t* ret_uid) {
349 unsigned long ul = 0;
356 r = safe_atolu(s, &ul);
362 if ((unsigned long) uid != ul)
365 /* Some libc APIs use UID_INVALID as special placeholder */
366 if (uid == (uid_t) 0xFFFFFFFF)
369 /* A long time ago UIDs where 16bit, hence explicitly avoid the 16bit -1 too */
370 if (uid == (uid_t) 0xFFFF)
377 int safe_atou(const char *s, unsigned *ret_u) {
385 l = strtoul(s, &x, 0);
387 if (!x || x == s || *x || errno)
388 return errno > 0 ? -errno : -EINVAL;
390 if ((unsigned long) (unsigned) l != l)
393 *ret_u = (unsigned) l;
397 int safe_atoi(const char *s, int *ret_i) {
405 l = strtol(s, &x, 0);
407 if (!x || x == s || *x || errno)
408 return errno > 0 ? -errno : -EINVAL;
410 if ((long) (int) l != l)
417 int safe_atou8(const char *s, uint8_t *ret) {
425 l = strtoul(s, &x, 0);
427 if (!x || x == s || *x || errno)
428 return errno > 0 ? -errno : -EINVAL;
430 if ((unsigned long) (uint8_t) l != l)
437 int safe_atou16(const char *s, uint16_t *ret) {
445 l = strtoul(s, &x, 0);
447 if (!x || x == s || *x || errno)
448 return errno > 0 ? -errno : -EINVAL;
450 if ((unsigned long) (uint16_t) l != l)
457 int safe_atoi16(const char *s, int16_t *ret) {
465 l = strtol(s, &x, 0);
467 if (!x || x == s || *x || errno)
468 return errno > 0 ? -errno : -EINVAL;
470 if ((long) (int16_t) l != l)
477 int safe_atollu(const char *s, long long unsigned *ret_llu) {
479 unsigned long long l;
485 l = strtoull(s, &x, 0);
487 if (!x || x == s || *x || errno)
488 return errno ? -errno : -EINVAL;
494 int safe_atolli(const char *s, long long int *ret_lli) {
502 l = strtoll(s, &x, 0);
504 if (!x || x == s || *x || errno)
505 return errno ? -errno : -EINVAL;
511 int safe_atod(const char *s, double *ret_d) {
519 loc = newlocale(LC_NUMERIC_MASK, "C", (locale_t) 0);
520 if (loc == (locale_t) 0)
524 d = strtod_l(s, &x, loc);
526 if (!x || x == s || *x || errno) {
528 return errno ? -errno : -EINVAL;
536 static size_t strcspn_escaped(const char *s, const char *reject) {
537 bool escaped = false;
540 for (n=0; s[n]; n++) {
543 else if (s[n] == '\\')
545 else if (strchr(reject, s[n]))
549 /* if s ends in \, return index of previous char */
553 /* Split a string into words. */
554 const char* split(const char **state, size_t *l, const char *separator, bool quoted) {
560 assert(**state == '\0');
564 current += strspn(current, separator);
570 if (quoted && strchr("\'\"", *current)) {
571 char quotechars[2] = {*current, '\0'};
573 *l = strcspn_escaped(current + 1, quotechars);
574 if (current[*l + 1] == '\0' ||
575 (current[*l + 2] && !strchr(separator, current[*l + 2]))) {
576 /* right quote missing or garbage at the end */
580 assert(current[*l + 1] == quotechars[0]);
581 *state = current++ + *l + 2;
583 *l = strcspn_escaped(current, separator);
584 if (current[*l] && !strchr(separator, current[*l])) {
585 /* unfinished escape */
589 *state = current + *l;
591 *l = strcspn(current, separator);
592 *state = current + *l;
598 int get_parent_of_pid(pid_t pid, pid_t *_ppid) {
600 _cleanup_free_ char *line = NULL;
612 p = procfs_file_alloca(pid, "stat");
613 r = read_one_line_file(p, &line);
617 /* Let's skip the pid and comm fields. The latter is enclosed
618 * in () but does not escape any () in its value, so let's
619 * skip over it manually */
621 p = strrchr(line, ')');
633 if ((long unsigned) (pid_t) ppid != ppid)
636 *_ppid = (pid_t) ppid;
641 int fchmod_umask(int fd, mode_t m) {
646 r = fchmod(fd, m & (~u)) < 0 ? -errno : 0;
652 char *truncate_nl(char *s) {
655 s[strcspn(s, NEWLINE)] = 0;
659 int get_process_state(pid_t pid) {
663 _cleanup_free_ char *line = NULL;
667 p = procfs_file_alloca(pid, "stat");
668 r = read_one_line_file(p, &line);
672 p = strrchr(line, ')');
678 if (sscanf(p, " %c", &state) != 1)
681 return (unsigned char) state;
684 int get_process_comm(pid_t pid, char **name) {
691 p = procfs_file_alloca(pid, "comm");
693 r = read_one_line_file(p, name);
700 int get_process_cmdline(pid_t pid, size_t max_length, bool comm_fallback, char **line) {
701 _cleanup_fclose_ FILE *f = NULL;
709 p = procfs_file_alloca(pid, "cmdline");
715 if (max_length == 0) {
716 size_t len = 0, allocated = 0;
718 while ((c = getc(f)) != EOF) {
720 if (!GREEDY_REALLOC(r, allocated, len+2)) {
725 r[len++] = isprint(c) ? c : ' ';
735 r = new(char, max_length);
741 while ((c = getc(f)) != EOF) {
763 size_t n = MIN(left-1, 3U);
770 /* Kernel threads have no argv[] */
772 _cleanup_free_ char *t = NULL;
780 h = get_process_comm(pid, &t);
784 r = strjoin("[", t, "]", NULL);
793 int is_kernel_thread(pid_t pid) {
805 p = procfs_file_alloca(pid, "cmdline");
810 count = fread(&c, 1, 1, f);
814 /* Kernel threads have an empty cmdline */
817 return eof ? 1 : -errno;
822 int get_process_capeff(pid_t pid, char **capeff) {
828 p = procfs_file_alloca(pid, "status");
830 return get_status_field(p, "\nCapEff:", capeff);
833 static int get_process_link_contents(const char *proc_file, char **name) {
839 r = readlink_malloc(proc_file, name);
841 return r == -ENOENT ? -ESRCH : r;
846 int get_process_exe(pid_t pid, char **name) {
853 p = procfs_file_alloca(pid, "exe");
854 r = get_process_link_contents(p, name);
858 d = endswith(*name, " (deleted)");
865 static int get_process_id(pid_t pid, const char *field, uid_t *uid) {
866 _cleanup_fclose_ FILE *f = NULL;
876 p = procfs_file_alloca(pid, "status");
881 FOREACH_LINE(line, f, return -errno) {
886 if (startswith(l, field)) {
888 l += strspn(l, WHITESPACE);
890 l[strcspn(l, WHITESPACE)] = 0;
892 return parse_uid(l, uid);
899 int get_process_uid(pid_t pid, uid_t *uid) {
900 return get_process_id(pid, "Uid:", uid);
903 int get_process_gid(pid_t pid, gid_t *gid) {
904 assert_cc(sizeof(uid_t) == sizeof(gid_t));
905 return get_process_id(pid, "Gid:", gid);
908 int get_process_cwd(pid_t pid, char **cwd) {
913 p = procfs_file_alloca(pid, "cwd");
915 return get_process_link_contents(p, cwd);
918 int get_process_root(pid_t pid, char **root) {
923 p = procfs_file_alloca(pid, "root");
925 return get_process_link_contents(p, root);
928 int get_process_environ(pid_t pid, char **env) {
929 _cleanup_fclose_ FILE *f = NULL;
930 _cleanup_free_ char *outcome = NULL;
933 size_t allocated = 0, sz = 0;
938 p = procfs_file_alloca(pid, "environ");
944 while ((c = fgetc(f)) != EOF) {
945 if (!GREEDY_REALLOC(outcome, allocated, sz + 5))
949 outcome[sz++] = '\n';
951 sz += cescape_char(c, outcome + sz);
961 char *strnappend(const char *s, const char *suffix, size_t b) {
969 return strndup(suffix, b);
978 if (b > ((size_t) -1) - a)
981 r = new(char, a+b+1);
986 memcpy(r+a, suffix, b);
992 char *strappend(const char *s, const char *suffix) {
993 return strnappend(s, suffix, suffix ? strlen(suffix) : 0);
996 int readlinkat_malloc(int fd, const char *p, char **ret) {
1011 n = readlinkat(fd, p, c, l-1);
1018 if ((size_t) n < l-1) {
1029 int readlink_malloc(const char *p, char **ret) {
1030 return readlinkat_malloc(AT_FDCWD, p, ret);
1033 int readlink_value(const char *p, char **ret) {
1034 _cleanup_free_ char *link = NULL;
1038 r = readlink_malloc(p, &link);
1042 value = basename(link);
1046 value = strdup(value);
1055 int readlink_and_make_absolute(const char *p, char **r) {
1056 _cleanup_free_ char *target = NULL;
1063 j = readlink_malloc(p, &target);
1067 k = file_in_same_dir(p, target);
1075 int readlink_and_canonicalize(const char *p, char **r) {
1082 j = readlink_and_make_absolute(p, &t);
1086 s = canonicalize_file_name(t);
1093 path_kill_slashes(*r);
1098 int reset_all_signal_handlers(void) {
1101 for (sig = 1; sig < _NSIG; sig++) {
1102 struct sigaction sa = {
1103 .sa_handler = SIG_DFL,
1104 .sa_flags = SA_RESTART,
1107 /* These two cannot be caught... */
1108 if (sig == SIGKILL || sig == SIGSTOP)
1111 /* On Linux the first two RT signals are reserved by
1112 * glibc, and sigaction() will return EINVAL for them. */
1113 if ((sigaction(sig, &sa, NULL) < 0))
1114 if (errno != EINVAL && r == 0)
1121 int reset_signal_mask(void) {
1124 if (sigemptyset(&ss) < 0)
1127 if (sigprocmask(SIG_SETMASK, &ss, NULL) < 0)
1133 char *strstrip(char *s) {
1136 /* Drops trailing whitespace. Modifies the string in
1137 * place. Returns pointer to first non-space character */
1139 s += strspn(s, WHITESPACE);
1141 for (e = strchr(s, 0); e > s; e --)
1142 if (!strchr(WHITESPACE, e[-1]))
1150 char *delete_chars(char *s, const char *bad) {
1153 /* Drops all whitespace, regardless where in the string */
1155 for (f = s, t = s; *f; f++) {
1156 if (strchr(bad, *f))
1167 char *file_in_same_dir(const char *path, const char *filename) {
1174 /* This removes the last component of path and appends
1175 * filename, unless the latter is absolute anyway or the
1178 if (path_is_absolute(filename))
1179 return strdup(filename);
1181 e = strrchr(path, '/');
1183 return strdup(filename);
1185 k = strlen(filename);
1186 ret = new(char, (e + 1 - path) + k + 1);
1190 memcpy(mempcpy(ret, path, e + 1 - path), filename, k + 1);
1194 int rmdir_parents(const char *path, const char *stop) {
1203 /* Skip trailing slashes */
1204 while (l > 0 && path[l-1] == '/')
1210 /* Skip last component */
1211 while (l > 0 && path[l-1] != '/')
1214 /* Skip trailing slashes */
1215 while (l > 0 && path[l-1] == '/')
1221 if (!(t = strndup(path, l)))
1224 if (path_startswith(stop, t)) {
1233 if (errno != ENOENT)
1240 char hexchar(int x) {
1241 static const char table[16] = "0123456789abcdef";
1243 return table[x & 15];
1246 int unhexchar(char c) {
1248 if (c >= '0' && c <= '9')
1251 if (c >= 'a' && c <= 'f')
1252 return c - 'a' + 10;
1254 if (c >= 'A' && c <= 'F')
1255 return c - 'A' + 10;
1260 char *hexmem(const void *p, size_t l) {
1264 z = r = malloc(l * 2 + 1);
1268 for (x = p; x < (const uint8_t*) p + l; x++) {
1269 *(z++) = hexchar(*x >> 4);
1270 *(z++) = hexchar(*x & 15);
1277 void *unhexmem(const char *p, size_t l) {
1283 z = r = malloc((l + 1) / 2 + 1);
1287 for (x = p; x < p + l; x += 2) {
1290 a = unhexchar(x[0]);
1292 b = unhexchar(x[1]);
1296 *(z++) = (uint8_t) a << 4 | (uint8_t) b;
1303 char octchar(int x) {
1304 return '0' + (x & 7);
1307 int unoctchar(char c) {
1309 if (c >= '0' && c <= '7')
1315 char decchar(int x) {
1316 return '0' + (x % 10);
1319 int undecchar(char c) {
1321 if (c >= '0' && c <= '9')
1327 char *cescape(const char *s) {
1333 /* Does C style string escaping. */
1335 r = new(char, strlen(s)*4 + 1);
1339 for (f = s, t = r; *f; f++)
1340 t += cescape_char(*f, t);
1347 char *cunescape_length_with_prefix(const char *s, size_t length, const char *prefix) {
1354 /* Undoes C style string escaping, and optionally prefixes it. */
1356 pl = prefix ? strlen(prefix) : 0;
1358 r = new(char, pl+length+1);
1363 memcpy(r, prefix, pl);
1365 for (f = s, t = r + pl; f < s + length; f++) {
1366 size_t remaining = s + length - f;
1367 assert(remaining > 0);
1369 if (*f != '\\') { /* a literal literal */
1374 if (--remaining == 0) { /* copy trailing backslash verbatim */
1415 /* This is an extension of the XDG syntax files */
1420 /* hexadecimal encoding */
1423 if (remaining >= 2) {
1424 a = unhexchar(f[1]);
1425 b = unhexchar(f[2]);
1428 if (a < 0 || b < 0 || (a == 0 && b == 0)) {
1429 /* Invalid escape code, let's take it literal then */
1433 *(t++) = (char) ((a << 4) | b);
1448 /* octal encoding */
1449 int a = -1, b = -1, c = -1;
1451 if (remaining >= 3) {
1452 a = unoctchar(f[0]);
1453 b = unoctchar(f[1]);
1454 c = unoctchar(f[2]);
1457 if (a < 0 || b < 0 || c < 0 || (a == 0 && b == 0 && c == 0)) {
1458 /* Invalid escape code, let's take it literal then */
1462 *(t++) = (char) ((a << 6) | (b << 3) | c);
1470 /* Invalid escape code, let's take it literal then */
1481 char *cunescape_length(const char *s, size_t length) {
1482 return cunescape_length_with_prefix(s, length, NULL);
1485 char *cunescape(const char *s) {
1488 return cunescape_length(s, strlen(s));
1491 char *xescape(const char *s, const char *bad) {
1495 /* Escapes all chars in bad, in addition to \ and all special
1496 * chars, in \xFF style escaping. May be reversed with
1499 r = new(char, strlen(s) * 4 + 1);
1503 for (f = s, t = r; *f; f++) {
1505 if ((*f < ' ') || (*f >= 127) ||
1506 (*f == '\\') || strchr(bad, *f)) {
1509 *(t++) = hexchar(*f >> 4);
1510 *(t++) = hexchar(*f);
1520 char *ascii_strlower(char *t) {
1525 for (p = t; *p; p++)
1526 if (*p >= 'A' && *p <= 'Z')
1527 *p = *p - 'A' + 'a';
1532 _pure_ static bool hidden_file_allow_backup(const char *filename) {
1536 filename[0] == '.' ||
1537 streq(filename, "lost+found") ||
1538 streq(filename, "aquota.user") ||
1539 streq(filename, "aquota.group") ||
1540 endswith(filename, ".rpmnew") ||
1541 endswith(filename, ".rpmsave") ||
1542 endswith(filename, ".rpmorig") ||
1543 endswith(filename, ".dpkg-old") ||
1544 endswith(filename, ".dpkg-new") ||
1545 endswith(filename, ".dpkg-tmp") ||
1546 endswith(filename, ".dpkg-dist") ||
1547 endswith(filename, ".dpkg-bak") ||
1548 endswith(filename, ".dpkg-backup") ||
1549 endswith(filename, ".dpkg-remove") ||
1550 endswith(filename, ".swp");
1553 bool hidden_file(const char *filename) {
1556 if (endswith(filename, "~"))
1559 return hidden_file_allow_backup(filename);
1562 int fd_nonblock(int fd, bool nonblock) {
1567 flags = fcntl(fd, F_GETFL, 0);
1572 nflags = flags | O_NONBLOCK;
1574 nflags = flags & ~O_NONBLOCK;
1576 if (nflags == flags)
1579 if (fcntl(fd, F_SETFL, nflags) < 0)
1585 int fd_cloexec(int fd, bool cloexec) {
1590 flags = fcntl(fd, F_GETFD, 0);
1595 nflags = flags | FD_CLOEXEC;
1597 nflags = flags & ~FD_CLOEXEC;
1599 if (nflags == flags)
1602 if (fcntl(fd, F_SETFD, nflags) < 0)
1608 _pure_ static bool fd_in_set(int fd, const int fdset[], unsigned n_fdset) {
1611 assert(n_fdset == 0 || fdset);
1613 for (i = 0; i < n_fdset; i++)
1620 int close_all_fds(const int except[], unsigned n_except) {
1621 _cleanup_closedir_ DIR *d = NULL;
1625 assert(n_except == 0 || except);
1627 d = opendir("/proc/self/fd");
1632 /* When /proc isn't available (for example in chroots)
1633 * the fallback is brute forcing through the fd
1636 assert_se(getrlimit(RLIMIT_NOFILE, &rl) >= 0);
1637 for (fd = 3; fd < (int) rl.rlim_max; fd ++) {
1639 if (fd_in_set(fd, except, n_except))
1642 if (close_nointr(fd) < 0)
1643 if (errno != EBADF && r == 0)
1650 while ((de = readdir(d))) {
1653 if (hidden_file(de->d_name))
1656 if (safe_atoi(de->d_name, &fd) < 0)
1657 /* Let's better ignore this, just in case */
1666 if (fd_in_set(fd, except, n_except))
1669 if (close_nointr(fd) < 0) {
1670 /* Valgrind has its own FD and doesn't want to have it closed */
1671 if (errno != EBADF && r == 0)
1679 bool chars_intersect(const char *a, const char *b) {
1682 /* Returns true if any of the chars in a are in b. */
1683 for (p = a; *p; p++)
1690 bool fstype_is_network(const char *fstype) {
1691 static const char table[] =
1706 x = startswith(fstype, "fuse.");
1710 return nulstr_contains(table, fstype);
1714 _cleanup_close_ int fd;
1716 fd = open_terminal("/dev/tty0", O_RDWR|O_NOCTTY|O_CLOEXEC);
1722 TIOCL_GETKMSGREDIRECT,
1726 if (ioctl(fd, TIOCLINUX, tiocl) < 0)
1729 vt = tiocl[0] <= 0 ? 1 : tiocl[0];
1732 if (ioctl(fd, VT_ACTIVATE, vt) < 0)
1738 int read_one_char(FILE *f, char *ret, usec_t t, bool *need_nl) {
1739 struct termios old_termios, new_termios;
1740 char c, line[LINE_MAX];
1745 if (tcgetattr(fileno(f), &old_termios) >= 0) {
1746 new_termios = old_termios;
1748 new_termios.c_lflag &= ~ICANON;
1749 new_termios.c_cc[VMIN] = 1;
1750 new_termios.c_cc[VTIME] = 0;
1752 if (tcsetattr(fileno(f), TCSADRAIN, &new_termios) >= 0) {
1755 if (t != USEC_INFINITY) {
1756 if (fd_wait_for_event(fileno(f), POLLIN, t) <= 0) {
1757 tcsetattr(fileno(f), TCSADRAIN, &old_termios);
1762 k = fread(&c, 1, 1, f);
1764 tcsetattr(fileno(f), TCSADRAIN, &old_termios);
1770 *need_nl = c != '\n';
1777 if (t != USEC_INFINITY) {
1778 if (fd_wait_for_event(fileno(f), POLLIN, t) <= 0)
1783 if (!fgets(line, sizeof(line), f))
1784 return errno ? -errno : -EIO;
1788 if (strlen(line) != 1)
1798 int ask_char(char *ret, const char *replies, const char *text, ...) {
1808 bool need_nl = true;
1811 fputs(ANSI_HIGHLIGHT_ON, stdout);
1818 fputs(ANSI_HIGHLIGHT_OFF, stdout);
1822 r = read_one_char(stdin, &c, USEC_INFINITY, &need_nl);
1825 if (r == -EBADMSG) {
1826 puts("Bad input, please try again.");
1837 if (strchr(replies, c)) {
1842 puts("Read unexpected character, please try again.");
1846 int ask_string(char **ret, const char *text, ...) {
1851 char line[LINE_MAX];
1855 fputs(ANSI_HIGHLIGHT_ON, stdout);
1862 fputs(ANSI_HIGHLIGHT_OFF, stdout);
1867 if (!fgets(line, sizeof(line), stdin))
1868 return errno ? -errno : -EIO;
1870 if (!endswith(line, "\n"))
1889 int reset_terminal_fd(int fd, bool switch_to_text) {
1890 struct termios termios;
1893 /* Set terminal to some sane defaults */
1897 /* We leave locked terminal attributes untouched, so that
1898 * Plymouth may set whatever it wants to set, and we don't
1899 * interfere with that. */
1901 /* Disable exclusive mode, just in case */
1902 ioctl(fd, TIOCNXCL);
1904 /* Switch to text mode */
1906 ioctl(fd, KDSETMODE, KD_TEXT);
1908 /* Enable console unicode mode */
1909 ioctl(fd, KDSKBMODE, K_UNICODE);
1911 if (tcgetattr(fd, &termios) < 0) {
1916 /* We only reset the stuff that matters to the software. How
1917 * hardware is set up we don't touch assuming that somebody
1918 * else will do that for us */
1920 termios.c_iflag &= ~(IGNBRK | BRKINT | ISTRIP | INLCR | IGNCR | IUCLC);
1921 termios.c_iflag |= ICRNL | IMAXBEL | IUTF8;
1922 termios.c_oflag |= ONLCR;
1923 termios.c_cflag |= CREAD;
1924 termios.c_lflag = ISIG | ICANON | IEXTEN | ECHO | ECHOE | ECHOK | ECHOCTL | ECHOPRT | ECHOKE;
1926 termios.c_cc[VINTR] = 03; /* ^C */
1927 termios.c_cc[VQUIT] = 034; /* ^\ */
1928 termios.c_cc[VERASE] = 0177;
1929 termios.c_cc[VKILL] = 025; /* ^X */
1930 termios.c_cc[VEOF] = 04; /* ^D */
1931 termios.c_cc[VSTART] = 021; /* ^Q */
1932 termios.c_cc[VSTOP] = 023; /* ^S */
1933 termios.c_cc[VSUSP] = 032; /* ^Z */
1934 termios.c_cc[VLNEXT] = 026; /* ^V */
1935 termios.c_cc[VWERASE] = 027; /* ^W */
1936 termios.c_cc[VREPRINT] = 022; /* ^R */
1937 termios.c_cc[VEOL] = 0;
1938 termios.c_cc[VEOL2] = 0;
1940 termios.c_cc[VTIME] = 0;
1941 termios.c_cc[VMIN] = 1;
1943 if (tcsetattr(fd, TCSANOW, &termios) < 0)
1947 /* Just in case, flush all crap out */
1948 tcflush(fd, TCIOFLUSH);
1953 int reset_terminal(const char *name) {
1954 _cleanup_close_ int fd = -1;
1956 fd = open_terminal(name, O_RDWR|O_NOCTTY|O_CLOEXEC);
1960 return reset_terminal_fd(fd, true);
1963 int open_terminal(const char *name, int mode) {
1968 * If a TTY is in the process of being closed opening it might
1969 * cause EIO. This is horribly awful, but unlikely to be
1970 * changed in the kernel. Hence we work around this problem by
1971 * retrying a couple of times.
1973 * https://bugs.launchpad.net/ubuntu/+source/linux/+bug/554172/comments/245
1976 assert(!(mode & O_CREAT));
1979 fd = open(name, mode, 0);
1986 /* Max 1s in total */
1990 usleep(50 * USEC_PER_MSEC);
2008 int flush_fd(int fd) {
2009 struct pollfd pollfd = {
2019 r = poll(&pollfd, 1, 0);
2029 l = read(fd, buf, sizeof(buf));
2035 if (errno == EAGAIN)
2044 int acquire_terminal(
2048 bool ignore_tiocstty_eperm,
2051 int fd = -1, notify = -1, r = 0, wd = -1;
2056 /* We use inotify to be notified when the tty is closed. We
2057 * create the watch before checking if we can actually acquire
2058 * it, so that we don't lose any event.
2060 * Note: strictly speaking this actually watches for the
2061 * device being closed, it does *not* really watch whether a
2062 * tty loses its controlling process. However, unless some
2063 * rogue process uses TIOCNOTTY on /dev/tty *after* closing
2064 * its tty otherwise this will not become a problem. As long
2065 * as the administrator makes sure not configure any service
2066 * on the same tty as an untrusted user this should not be a
2067 * problem. (Which he probably should not do anyway.) */
2069 if (timeout != USEC_INFINITY)
2070 ts = now(CLOCK_MONOTONIC);
2072 if (!fail && !force) {
2073 notify = inotify_init1(IN_CLOEXEC | (timeout != USEC_INFINITY ? IN_NONBLOCK : 0));
2079 wd = inotify_add_watch(notify, name, IN_CLOSE);
2087 struct sigaction sa_old, sa_new = {
2088 .sa_handler = SIG_IGN,
2089 .sa_flags = SA_RESTART,
2093 r = flush_fd(notify);
2098 /* We pass here O_NOCTTY only so that we can check the return
2099 * value TIOCSCTTY and have a reliable way to figure out if we
2100 * successfully became the controlling process of the tty */
2101 fd = open_terminal(name, O_RDWR|O_NOCTTY|O_CLOEXEC);
2105 /* Temporarily ignore SIGHUP, so that we don't get SIGHUP'ed
2106 * if we already own the tty. */
2107 assert_se(sigaction(SIGHUP, &sa_new, &sa_old) == 0);
2109 /* First, try to get the tty */
2110 if (ioctl(fd, TIOCSCTTY, force) < 0)
2113 assert_se(sigaction(SIGHUP, &sa_old, NULL) == 0);
2115 /* Sometimes it makes sense to ignore TIOCSCTTY
2116 * returning EPERM, i.e. when very likely we already
2117 * are have this controlling terminal. */
2118 if (r < 0 && r == -EPERM && ignore_tiocstty_eperm)
2121 if (r < 0 && (force || fail || r != -EPERM)) {
2130 assert(notify >= 0);
2133 union inotify_event_buffer buffer;
2134 struct inotify_event *e;
2137 if (timeout != USEC_INFINITY) {
2140 n = now(CLOCK_MONOTONIC);
2141 if (ts + timeout < n) {
2146 r = fd_wait_for_event(fd, POLLIN, ts + timeout - n);
2156 l = read(notify, &buffer, sizeof(buffer));
2158 if (errno == EINTR || errno == EAGAIN)
2165 FOREACH_INOTIFY_EVENT(e, buffer, l) {
2166 if (e->wd != wd || !(e->mask & IN_CLOSE)) {
2175 /* We close the tty fd here since if the old session
2176 * ended our handle will be dead. It's important that
2177 * we do this after sleeping, so that we don't enter
2178 * an endless loop. */
2179 fd = safe_close(fd);
2184 r = reset_terminal_fd(fd, true);
2186 log_warning_errno(r, "Failed to reset terminal: %m");
2197 int release_terminal(void) {
2198 static const struct sigaction sa_new = {
2199 .sa_handler = SIG_IGN,
2200 .sa_flags = SA_RESTART,
2203 _cleanup_close_ int fd = -1;
2204 struct sigaction sa_old;
2207 fd = open("/dev/tty", O_RDWR|O_NOCTTY|O_NDELAY|O_CLOEXEC);
2211 /* Temporarily ignore SIGHUP, so that we don't get SIGHUP'ed
2212 * by our own TIOCNOTTY */
2213 assert_se(sigaction(SIGHUP, &sa_new, &sa_old) == 0);
2215 if (ioctl(fd, TIOCNOTTY) < 0)
2218 assert_se(sigaction(SIGHUP, &sa_old, NULL) == 0);
2223 int sigaction_many(const struct sigaction *sa, ...) {
2228 while ((sig = va_arg(ap, int)) > 0)
2229 if (sigaction(sig, sa, NULL) < 0)
2236 int ignore_signals(int sig, ...) {
2237 struct sigaction sa = {
2238 .sa_handler = SIG_IGN,
2239 .sa_flags = SA_RESTART,
2244 if (sigaction(sig, &sa, NULL) < 0)
2248 while ((sig = va_arg(ap, int)) > 0)
2249 if (sigaction(sig, &sa, NULL) < 0)
2256 int default_signals(int sig, ...) {
2257 struct sigaction sa = {
2258 .sa_handler = SIG_DFL,
2259 .sa_flags = SA_RESTART,
2264 if (sigaction(sig, &sa, NULL) < 0)
2268 while ((sig = va_arg(ap, int)) > 0)
2269 if (sigaction(sig, &sa, NULL) < 0)
2276 void safe_close_pair(int p[]) {
2280 /* Special case pairs which use the same fd in both
2282 p[0] = p[1] = safe_close(p[0]);
2286 p[0] = safe_close(p[0]);
2287 p[1] = safe_close(p[1]);
2290 ssize_t loop_read(int fd, void *buf, size_t nbytes, bool do_poll) {
2297 while (nbytes > 0) {
2300 k = read(fd, p, nbytes);
2305 if (errno == EAGAIN && do_poll) {
2307 /* We knowingly ignore any return value here,
2308 * and expect that any error/EOF is reported
2311 fd_wait_for_event(fd, POLLIN, USEC_INFINITY);
2315 return n > 0 ? n : -errno;
2329 int loop_read_exact(int fd, void *buf, size_t nbytes, bool do_poll) {
2332 n = loop_read(fd, buf, nbytes, do_poll);
2335 if ((size_t) n != nbytes)
2340 int loop_write(int fd, const void *buf, size_t nbytes, bool do_poll) {
2341 const uint8_t *p = buf;
2348 while (nbytes > 0) {
2351 k = write(fd, p, nbytes);
2356 if (errno == EAGAIN && do_poll) {
2357 /* We knowingly ignore any return value here,
2358 * and expect that any error/EOF is reported
2361 fd_wait_for_event(fd, POLLOUT, USEC_INFINITY);
2368 if (k == 0) /* Can't really happen */
2378 int parse_size(const char *t, off_t base, off_t *size) {
2380 /* Soo, sometimes we want to parse IEC binary suffxies, and
2381 * sometimes SI decimal suffixes. This function can parse
2382 * both. Which one is the right way depends on the
2383 * context. Wikipedia suggests that SI is customary for
2384 * hardrware metrics and network speeds, while IEC is
2385 * customary for most data sizes used by software and volatile
2386 * (RAM) memory. Hence be careful which one you pick!
2388 * In either case we use just K, M, G as suffix, and not Ki,
2389 * Mi, Gi or so (as IEC would suggest). That's because that's
2390 * frickin' ugly. But this means you really need to make sure
2391 * to document which base you are parsing when you use this
2396 unsigned long long factor;
2399 static const struct table iec[] = {
2400 { "E", 1024ULL*1024ULL*1024ULL*1024ULL*1024ULL*1024ULL },
2401 { "P", 1024ULL*1024ULL*1024ULL*1024ULL*1024ULL },
2402 { "T", 1024ULL*1024ULL*1024ULL*1024ULL },
2403 { "G", 1024ULL*1024ULL*1024ULL },
2404 { "M", 1024ULL*1024ULL },
2410 static const struct table si[] = {
2411 { "E", 1000ULL*1000ULL*1000ULL*1000ULL*1000ULL*1000ULL },
2412 { "P", 1000ULL*1000ULL*1000ULL*1000ULL*1000ULL },
2413 { "T", 1000ULL*1000ULL*1000ULL*1000ULL },
2414 { "G", 1000ULL*1000ULL*1000ULL },
2415 { "M", 1000ULL*1000ULL },
2421 const struct table *table;
2423 unsigned long long r = 0;
2424 unsigned n_entries, start_pos = 0;
2427 assert(base == 1000 || base == 1024);
2432 n_entries = ELEMENTSOF(si);
2435 n_entries = ELEMENTSOF(iec);
2441 unsigned long long l2;
2447 l = strtoll(p, &e, 10);
2460 if (*e >= '0' && *e <= '9') {
2463 /* strotoull itself would accept space/+/- */
2464 l2 = strtoull(e, &e2, 10);
2466 if (errno == ERANGE)
2469 /* Ignore failure. E.g. 10.M is valid */
2476 e += strspn(e, WHITESPACE);
2478 for (i = start_pos; i < n_entries; i++)
2479 if (startswith(e, table[i].suffix)) {
2480 unsigned long long tmp;
2481 if ((unsigned long long) l + (frac > 0) > ULLONG_MAX / table[i].factor)
2483 tmp = l * table[i].factor + (unsigned long long) (frac * table[i].factor);
2484 if (tmp > ULLONG_MAX - r)
2488 if ((unsigned long long) (off_t) r != r)
2491 p = e + strlen(table[i].suffix);
2507 int make_stdio(int fd) {
2512 r = dup2(fd, STDIN_FILENO);
2513 s = dup2(fd, STDOUT_FILENO);
2514 t = dup2(fd, STDERR_FILENO);
2519 if (r < 0 || s < 0 || t < 0)
2522 /* Explicitly unset O_CLOEXEC, since if fd was < 3, then
2523 * dup2() was a NOP and the bit hence possibly set. */
2524 fd_cloexec(STDIN_FILENO, false);
2525 fd_cloexec(STDOUT_FILENO, false);
2526 fd_cloexec(STDERR_FILENO, false);
2531 int make_null_stdio(void) {
2534 null_fd = open("/dev/null", O_RDWR|O_NOCTTY);
2538 return make_stdio(null_fd);
2541 bool is_device_path(const char *path) {
2543 /* Returns true on paths that refer to a device, either in
2544 * sysfs or in /dev */
2547 path_startswith(path, "/dev/") ||
2548 path_startswith(path, "/sys/");
2551 int dir_is_empty(const char *path) {
2552 _cleanup_closedir_ DIR *d;
2563 if (!de && errno != 0)
2569 if (!hidden_file(de->d_name))
2574 char* dirname_malloc(const char *path) {
2575 char *d, *dir, *dir2;
2592 int dev_urandom(void *p, size_t n) {
2593 static int have_syscall = -1;
2595 _cleanup_close_ int fd = -1;
2598 /* Gathers some randomness from the kernel. This call will
2599 * never block, and will always return some data from the
2600 * kernel, regardless if the random pool is fully initialized
2601 * or not. It thus makes no guarantee for the quality of the
2602 * returned entropy, but is good enough for or usual usecases
2603 * of seeding the hash functions for hashtable */
2605 /* Use the getrandom() syscall unless we know we don't have
2606 * it, or when the requested size is too large for it. */
2607 if (have_syscall != 0 || (size_t) (int) n != n) {
2608 r = getrandom(p, n, GRND_NONBLOCK);
2610 have_syscall = true;
2615 if (errno == ENOSYS)
2616 /* we lack the syscall, continue with
2617 * reading from /dev/urandom */
2618 have_syscall = false;
2619 else if (errno == EAGAIN)
2620 /* not enough entropy for now. Let's
2621 * remember to use the syscall the
2622 * next time, again, but also read
2623 * from /dev/urandom for now, which
2624 * doesn't care about the current
2625 * amount of entropy. */
2626 have_syscall = true;
2630 /* too short read? */
2634 fd = open("/dev/urandom", O_RDONLY|O_CLOEXEC|O_NOCTTY);
2636 return errno == ENOENT ? -ENOSYS : -errno;
2638 return loop_read_exact(fd, p, n, true);
2641 void initialize_srand(void) {
2642 static bool srand_called = false;
2644 #ifdef HAVE_SYS_AUXV_H
2653 #ifdef HAVE_SYS_AUXV_H
2654 /* The kernel provides us with a bit of entropy in auxv, so
2655 * let's try to make use of that to seed the pseudo-random
2656 * generator. It's better than nothing... */
2658 auxv = (void*) getauxval(AT_RANDOM);
2660 x ^= *(unsigned*) auxv;
2663 x ^= (unsigned) now(CLOCK_REALTIME);
2664 x ^= (unsigned) gettid();
2667 srand_called = true;
2670 void random_bytes(void *p, size_t n) {
2674 r = dev_urandom(p, n);
2678 /* If some idiot made /dev/urandom unavailable to us, he'll
2679 * get a PRNG instead. */
2683 for (q = p; q < (uint8_t*) p + n; q ++)
2687 void rename_process(const char name[8]) {
2690 /* This is a like a poor man's setproctitle(). It changes the
2691 * comm field, argv[0], and also the glibc's internally used
2692 * name of the process. For the first one a limit of 16 chars
2693 * applies, to the second one usually one of 10 (i.e. length
2694 * of "/sbin/init"), to the third one one of 7 (i.e. length of
2695 * "systemd"). If you pass a longer string it will be
2698 prctl(PR_SET_NAME, name);
2700 if (program_invocation_name)
2701 strncpy(program_invocation_name, name, strlen(program_invocation_name));
2703 if (saved_argc > 0) {
2707 strncpy(saved_argv[0], name, strlen(saved_argv[0]));
2709 for (i = 1; i < saved_argc; i++) {
2713 memzero(saved_argv[i], strlen(saved_argv[i]));
2718 void sigset_add_many(sigset_t *ss, ...) {
2725 while ((sig = va_arg(ap, int)) > 0)
2726 assert_se(sigaddset(ss, sig) == 0);
2730 int sigprocmask_many(int how, ...) {
2735 assert_se(sigemptyset(&ss) == 0);
2738 while ((sig = va_arg(ap, int)) > 0)
2739 assert_se(sigaddset(&ss, sig) == 0);
2742 if (sigprocmask(how, &ss, NULL) < 0)
2748 char* gethostname_malloc(void) {
2751 assert_se(uname(&u) >= 0);
2753 if (!isempty(u.nodename) && !streq(u.nodename, "(none)"))
2754 return strdup(u.nodename);
2756 return strdup(u.sysname);
2759 bool hostname_is_set(void) {
2762 assert_se(uname(&u) >= 0);
2764 return !isempty(u.nodename) && !streq(u.nodename, "(none)");
2767 char *lookup_uid(uid_t uid) {
2770 _cleanup_free_ char *buf = NULL;
2771 struct passwd pwbuf, *pw = NULL;
2773 /* Shortcut things to avoid NSS lookups */
2775 return strdup("root");
2777 bufsize = sysconf(_SC_GETPW_R_SIZE_MAX);
2781 buf = malloc(bufsize);
2785 if (getpwuid_r(uid, &pwbuf, buf, bufsize, &pw) == 0 && pw)
2786 return strdup(pw->pw_name);
2788 if (asprintf(&name, UID_FMT, uid) < 0)
2794 char* getlogname_malloc(void) {
2798 if (isatty(STDIN_FILENO) && fstat(STDIN_FILENO, &st) >= 0)
2803 return lookup_uid(uid);
2806 char *getusername_malloc(void) {
2813 return lookup_uid(getuid());
2816 int getttyname_malloc(int fd, char **ret) {
2826 r = ttyname_r(fd, path, sizeof(path));
2831 p = startswith(path, "/dev/");
2832 c = strdup(p ?: path);
2849 int getttyname_harder(int fd, char **r) {
2853 k = getttyname_malloc(fd, &s);
2857 if (streq(s, "tty")) {
2859 return get_ctty(0, NULL, r);
2866 int get_ctty_devnr(pid_t pid, dev_t *d) {
2868 _cleanup_free_ char *line = NULL;
2870 unsigned long ttynr;
2874 p = procfs_file_alloca(pid, "stat");
2875 r = read_one_line_file(p, &line);
2879 p = strrchr(line, ')');
2889 "%*d " /* session */
2894 if (major(ttynr) == 0 && minor(ttynr) == 0)
2903 int get_ctty(pid_t pid, dev_t *_devnr, char **r) {
2904 char fn[sizeof("/dev/char/")-1 + 2*DECIMAL_STR_MAX(unsigned) + 1 + 1], *b = NULL;
2905 _cleanup_free_ char *s = NULL;
2912 k = get_ctty_devnr(pid, &devnr);
2916 sprintf(fn, "/dev/char/%u:%u", major(devnr), minor(devnr));
2918 k = readlink_malloc(fn, &s);
2924 /* This is an ugly hack */
2925 if (major(devnr) == 136) {
2926 asprintf(&b, "pts/%u", minor(devnr));
2930 /* Probably something like the ptys which have no
2931 * symlink in /dev/char. Let's return something
2932 * vaguely useful. */
2938 if (startswith(s, "/dev/"))
2940 else if (startswith(s, "../"))
2958 int rm_rf_children_dangerous(int fd, bool only_dirs, bool honour_sticky, struct stat *root_dev) {
2959 _cleanup_closedir_ DIR *d = NULL;
2964 /* This returns the first error we run into, but nevertheless
2965 * tries to go on. This closes the passed fd. */
2971 return errno == ENOENT ? 0 : -errno;
2976 bool is_dir, keep_around;
2983 if (errno != 0 && ret == 0)
2988 if (streq(de->d_name, ".") || streq(de->d_name, ".."))
2991 if (de->d_type == DT_UNKNOWN ||
2993 (de->d_type == DT_DIR && root_dev)) {
2994 if (fstatat(fd, de->d_name, &st, AT_SYMLINK_NOFOLLOW) < 0) {
2995 if (ret == 0 && errno != ENOENT)
3000 is_dir = S_ISDIR(st.st_mode);
3003 (st.st_uid == 0 || st.st_uid == getuid()) &&
3004 (st.st_mode & S_ISVTX);
3006 is_dir = de->d_type == DT_DIR;
3007 keep_around = false;
3013 /* if root_dev is set, remove subdirectories only, if device is same as dir */
3014 if (root_dev && st.st_dev != root_dev->st_dev)
3017 subdir_fd = openat(fd, de->d_name,
3018 O_RDONLY|O_NONBLOCK|O_DIRECTORY|O_CLOEXEC|O_NOFOLLOW|O_NOATIME);
3019 if (subdir_fd < 0) {
3020 if (ret == 0 && errno != ENOENT)
3025 r = rm_rf_children_dangerous(subdir_fd, only_dirs, honour_sticky, root_dev);
3026 if (r < 0 && ret == 0)
3030 if (unlinkat(fd, de->d_name, AT_REMOVEDIR) < 0) {
3031 if (ret == 0 && errno != ENOENT)
3035 } else if (!only_dirs && !keep_around) {
3037 if (unlinkat(fd, de->d_name, 0) < 0) {
3038 if (ret == 0 && errno != ENOENT)
3045 _pure_ static int is_temporary_fs(struct statfs *s) {
3048 return F_TYPE_EQUAL(s->f_type, TMPFS_MAGIC) ||
3049 F_TYPE_EQUAL(s->f_type, RAMFS_MAGIC);
3052 int is_fd_on_temporary_fs(int fd) {
3055 if (fstatfs(fd, &s) < 0)
3058 return is_temporary_fs(&s);
3061 int rm_rf_children(int fd, bool only_dirs, bool honour_sticky, struct stat *root_dev) {
3066 if (fstatfs(fd, &s) < 0) {
3071 /* We refuse to clean disk file systems with this call. This
3072 * is extra paranoia just to be sure we never ever remove
3074 if (!is_temporary_fs(&s)) {
3075 log_error("Attempted to remove disk file system, and we can't allow that.");
3080 return rm_rf_children_dangerous(fd, only_dirs, honour_sticky, root_dev);
3083 static int file_is_priv_sticky(const char *p) {
3088 if (lstat(p, &st) < 0)
3092 (st.st_uid == 0 || st.st_uid == getuid()) &&
3093 (st.st_mode & S_ISVTX);
3096 static int rm_rf_internal(const char *path, bool only_dirs, bool delete_root, bool honour_sticky, bool dangerous) {
3102 /* We refuse to clean the root file system with this
3103 * call. This is extra paranoia to never cause a really
3104 * seriously broken system. */
3105 if (path_equal(path, "/")) {
3106 log_error("Attempted to remove entire root file system, and we can't allow that.");
3110 fd = open(path, O_RDONLY|O_NONBLOCK|O_DIRECTORY|O_CLOEXEC|O_NOFOLLOW|O_NOATIME);
3113 if (errno != ENOTDIR && errno != ELOOP)
3117 if (statfs(path, &s) < 0)
3120 if (!is_temporary_fs(&s)) {
3121 log_error("Attempted to remove disk file system, and we can't allow that.");
3126 if (delete_root && !only_dirs)
3127 if (unlink(path) < 0 && errno != ENOENT)
3134 if (fstatfs(fd, &s) < 0) {
3139 if (!is_temporary_fs(&s)) {
3140 log_error("Attempted to remove disk file system, and we can't allow that.");
3146 r = rm_rf_children_dangerous(fd, only_dirs, honour_sticky, NULL);
3149 if (honour_sticky && file_is_priv_sticky(path) > 0)
3152 if (rmdir(path) < 0 && errno != ENOENT) {
3161 int rm_rf(const char *path, bool only_dirs, bool delete_root, bool honour_sticky) {
3162 return rm_rf_internal(path, only_dirs, delete_root, honour_sticky, false);
3165 int rm_rf_dangerous(const char *path, bool only_dirs, bool delete_root, bool honour_sticky) {
3166 return rm_rf_internal(path, only_dirs, delete_root, honour_sticky, true);
3169 int chmod_and_chown(const char *path, mode_t mode, uid_t uid, gid_t gid) {
3172 /* Under the assumption that we are running privileged we
3173 * first change the access mode and only then hand out
3174 * ownership to avoid a window where access is too open. */
3176 if (mode != MODE_INVALID)
3177 if (chmod(path, mode) < 0)
3180 if (uid != UID_INVALID || gid != GID_INVALID)
3181 if (chown(path, uid, gid) < 0)
3187 int fchmod_and_fchown(int fd, mode_t mode, uid_t uid, gid_t gid) {
3190 /* Under the assumption that we are running privileged we
3191 * first change the access mode and only then hand out
3192 * ownership to avoid a window where access is too open. */
3194 if (mode != MODE_INVALID)
3195 if (fchmod(fd, mode) < 0)
3198 if (uid != UID_INVALID || gid != GID_INVALID)
3199 if (fchown(fd, uid, gid) < 0)
3205 cpu_set_t* cpu_set_malloc(unsigned *ncpus) {
3209 /* Allocates the cpuset in the right size */
3212 if (!(r = CPU_ALLOC(n)))
3215 if (sched_getaffinity(0, CPU_ALLOC_SIZE(n), r) >= 0) {
3216 CPU_ZERO_S(CPU_ALLOC_SIZE(n), r);
3226 if (errno != EINVAL)
3233 int status_vprintf(const char *status, bool ellipse, bool ephemeral, const char *format, va_list ap) {
3234 static const char status_indent[] = " "; /* "[" STATUS "] " */
3235 _cleanup_free_ char *s = NULL;
3236 _cleanup_close_ int fd = -1;
3237 struct iovec iovec[6] = {};
3239 static bool prev_ephemeral;
3243 /* This is independent of logging, as status messages are
3244 * optional and go exclusively to the console. */
3246 if (vasprintf(&s, format, ap) < 0)
3249 fd = open_terminal("/dev/console", O_WRONLY|O_NOCTTY|O_CLOEXEC);
3262 sl = status ? sizeof(status_indent)-1 : 0;
3268 e = ellipsize(s, emax, 50);
3276 IOVEC_SET_STRING(iovec[n++], "\r" ANSI_ERASE_TO_END_OF_LINE);
3277 prev_ephemeral = ephemeral;
3280 if (!isempty(status)) {
3281 IOVEC_SET_STRING(iovec[n++], "[");
3282 IOVEC_SET_STRING(iovec[n++], status);
3283 IOVEC_SET_STRING(iovec[n++], "] ");
3285 IOVEC_SET_STRING(iovec[n++], status_indent);
3288 IOVEC_SET_STRING(iovec[n++], s);
3290 IOVEC_SET_STRING(iovec[n++], "\n");
3292 if (writev(fd, iovec, n) < 0)
3298 int status_printf(const char *status, bool ellipse, bool ephemeral, const char *format, ...) {
3304 va_start(ap, format);
3305 r = status_vprintf(status, ellipse, ephemeral, format, ap);
3311 char *replace_env(const char *format, char **env) {
3318 const char *e, *word = format;
3323 for (e = format; *e; e ++) {
3334 k = strnappend(r, word, e-word-1);
3344 } else if (*e == '$') {
3345 k = strnappend(r, word, e-word);
3362 t = strempty(strv_env_get_n(env, word+2, e-word-2));
3364 k = strappend(r, t);
3378 k = strnappend(r, word, e-word);
3390 char **replace_env_argv(char **argv, char **env) {
3392 unsigned k = 0, l = 0;
3394 l = strv_length(argv);
3396 ret = new(char*, l+1);
3400 STRV_FOREACH(i, argv) {
3402 /* If $FOO appears as single word, replace it by the split up variable */
3403 if ((*i)[0] == '$' && (*i)[1] != '{') {
3408 e = strv_env_get(env, *i+1);
3412 r = strv_split_quoted(&m, e, true);
3424 w = realloc(ret, sizeof(char*) * (l+1));
3434 memcpy(ret + k, m, q * sizeof(char*));
3442 /* If ${FOO} appears as part of a word, replace it by the variable as-is */
3443 ret[k] = replace_env(*i, env);
3455 int fd_columns(int fd) {
3456 struct winsize ws = {};
3458 if (ioctl(fd, TIOCGWINSZ, &ws) < 0)
3467 unsigned columns(void) {
3471 if (_likely_(cached_columns > 0))
3472 return cached_columns;
3475 e = getenv("COLUMNS");
3477 (void) safe_atoi(e, &c);
3480 c = fd_columns(STDOUT_FILENO);
3486 return cached_columns;
3489 int fd_lines(int fd) {
3490 struct winsize ws = {};
3492 if (ioctl(fd, TIOCGWINSZ, &ws) < 0)
3501 unsigned lines(void) {
3505 if (_likely_(cached_lines > 0))
3506 return cached_lines;
3509 e = getenv("LINES");
3511 (void) safe_atoi(e, &l);
3514 l = fd_lines(STDOUT_FILENO);
3520 return cached_lines;
3523 /* intended to be used as a SIGWINCH sighandler */
3524 void columns_lines_cache_reset(int signum) {
3530 static int cached_on_tty = -1;
3532 if (_unlikely_(cached_on_tty < 0))
3533 cached_on_tty = isatty(STDOUT_FILENO) > 0;
3535 return cached_on_tty;
3538 int files_same(const char *filea, const char *fileb) {
3541 if (stat(filea, &a) < 0)
3544 if (stat(fileb, &b) < 0)
3547 return a.st_dev == b.st_dev &&
3548 a.st_ino == b.st_ino;
3551 int running_in_chroot(void) {
3554 ret = files_same("/proc/1/root", "/");
3561 static char *ascii_ellipsize_mem(const char *s, size_t old_length, size_t new_length, unsigned percent) {
3566 assert(percent <= 100);
3567 assert(new_length >= 3);
3569 if (old_length <= 3 || old_length <= new_length)
3570 return strndup(s, old_length);
3572 r = new0(char, new_length+1);
3576 x = (new_length * percent) / 100;
3578 if (x > new_length - 3)
3586 s + old_length - (new_length - x - 3),
3587 new_length - x - 3);
3592 char *ellipsize_mem(const char *s, size_t old_length, size_t new_length, unsigned percent) {
3596 unsigned k, len, len2;
3599 assert(percent <= 100);
3600 assert(new_length >= 3);
3602 /* if no multibyte characters use ascii_ellipsize_mem for speed */
3603 if (ascii_is_valid(s))
3604 return ascii_ellipsize_mem(s, old_length, new_length, percent);
3606 if (old_length <= 3 || old_length <= new_length)
3607 return strndup(s, old_length);
3609 x = (new_length * percent) / 100;
3611 if (x > new_length - 3)
3615 for (i = s; k < x && i < s + old_length; i = utf8_next_char(i)) {
3618 c = utf8_encoded_to_unichar(i);
3621 k += unichar_iswide(c) ? 2 : 1;
3624 if (k > x) /* last character was wide and went over quota */
3627 for (j = s + old_length; k < new_length && j > i; ) {
3630 j = utf8_prev_char(j);
3631 c = utf8_encoded_to_unichar(j);
3634 k += unichar_iswide(c) ? 2 : 1;
3638 /* we don't actually need to ellipsize */
3640 return memdup(s, old_length + 1);
3642 /* make space for ellipsis */
3643 j = utf8_next_char(j);
3646 len2 = s + old_length - j;
3647 e = new(char, len + 3 + len2 + 1);
3652 printf("old_length=%zu new_length=%zu x=%zu len=%u len2=%u k=%u\n",
3653 old_length, new_length, x, len, len2, k);
3657 e[len] = 0xe2; /* tri-dot ellipsis: … */
3661 memcpy(e + len + 3, j, len2 + 1);
3666 char *ellipsize(const char *s, size_t length, unsigned percent) {
3667 return ellipsize_mem(s, strlen(s), length, percent);
3670 int touch_file(const char *path, bool parents, usec_t stamp, uid_t uid, gid_t gid, mode_t mode) {
3671 _cleanup_close_ int fd;
3677 mkdir_parents(path, 0755);
3679 fd = open(path, O_WRONLY|O_CREAT|O_CLOEXEC|O_NOCTTY, mode > 0 ? mode : 0644);
3684 r = fchmod(fd, mode);
3689 if (uid != UID_INVALID || gid != GID_INVALID) {
3690 r = fchown(fd, uid, gid);
3695 if (stamp != USEC_INFINITY) {
3696 struct timespec ts[2];
3698 timespec_store(&ts[0], stamp);
3700 r = futimens(fd, ts);
3702 r = futimens(fd, NULL);
3709 int touch(const char *path) {
3710 return touch_file(path, false, USEC_INFINITY, UID_INVALID, GID_INVALID, 0);
3713 char *unquote(const char *s, const char* quotes) {
3717 /* This is rather stupid, simply removes the heading and
3718 * trailing quotes if there is one. Doesn't care about
3719 * escaping or anything. We should make this smarter one
3726 if (strchr(quotes, s[0]) && s[l-1] == s[0])
3727 return strndup(s+1, l-2);
3732 char *normalize_env_assignment(const char *s) {
3733 _cleanup_free_ char *value = NULL;
3737 eq = strchr(s, '=');
3747 memmove(r, t, strlen(t) + 1);
3752 name = strndupa(s, eq - s);
3753 p = strdupa(eq + 1);
3755 value = unquote(strstrip(p), QUOTES);
3759 return strjoin(strstrip(name), "=", value, NULL);
3762 int wait_for_terminate(pid_t pid, siginfo_t *status) {
3773 if (waitid(P_PID, pid, status, WEXITED) < 0) {
3787 * < 0 : wait_for_terminate() failed to get the state of the
3788 * process, the process was terminated by a signal, or
3789 * failed for an unknown reason.
3790 * >=0 : The process terminated normally, and its exit code is
3793 * That is, success is indicated by a return value of zero, and an
3794 * error is indicated by a non-zero value.
3796 * A warning is emitted if the process terminates abnormally,
3797 * and also if it returns non-zero unless check_exit_code is true.
3799 int wait_for_terminate_and_warn(const char *name, pid_t pid, bool check_exit_code) {
3806 r = wait_for_terminate(pid, &status);
3808 return log_warning_errno(r, "Failed to wait for %s: %m", name);
3810 if (status.si_code == CLD_EXITED) {
3811 if (status.si_status != 0)
3812 log_full(check_exit_code ? LOG_WARNING : LOG_DEBUG,
3813 "%s failed with error code %i.", name, status.si_status);
3815 log_debug("%s succeeded.", name);
3817 return status.si_status;
3818 } else if (status.si_code == CLD_KILLED ||
3819 status.si_code == CLD_DUMPED) {
3821 log_warning("%s terminated by signal %s.", name, signal_to_string(status.si_status));
3825 log_warning("%s failed due to unknown reason.", name);
3829 noreturn void freeze(void) {
3831 /* Make sure nobody waits for us on a socket anymore */
3832 close_all_fds(NULL, 0);
3840 bool null_or_empty(struct stat *st) {
3843 if (S_ISREG(st->st_mode) && st->st_size <= 0)
3846 if (S_ISCHR(st->st_mode) || S_ISBLK(st->st_mode))
3852 int null_or_empty_path(const char *fn) {
3857 if (stat(fn, &st) < 0)
3860 return null_or_empty(&st);
3863 int null_or_empty_fd(int fd) {
3868 if (fstat(fd, &st) < 0)
3871 return null_or_empty(&st);
3874 DIR *xopendirat(int fd, const char *name, int flags) {
3878 assert(!(flags & O_CREAT));
3880 nfd = openat(fd, name, O_RDONLY|O_NONBLOCK|O_DIRECTORY|O_CLOEXEC|flags, 0);
3893 int signal_from_string_try_harder(const char *s) {
3897 signo = signal_from_string(s);
3899 if (startswith(s, "SIG"))
3900 return signal_from_string(s+3);
3905 static char *tag_to_udev_node(const char *tagvalue, const char *by) {
3906 _cleanup_free_ char *t = NULL, *u = NULL;
3909 u = unquote(tagvalue, "\"\'");
3913 enc_len = strlen(u) * 4 + 1;
3914 t = new(char, enc_len);
3918 if (encode_devnode_name(u, t, enc_len) < 0)
3921 return strjoin("/dev/disk/by-", by, "/", t, NULL);
3924 char *fstab_node_to_udev_node(const char *p) {
3927 if (startswith(p, "LABEL="))
3928 return tag_to_udev_node(p+6, "label");
3930 if (startswith(p, "UUID="))
3931 return tag_to_udev_node(p+5, "uuid");
3933 if (startswith(p, "PARTUUID="))
3934 return tag_to_udev_node(p+9, "partuuid");
3936 if (startswith(p, "PARTLABEL="))
3937 return tag_to_udev_node(p+10, "partlabel");
3942 bool tty_is_vc(const char *tty) {
3945 return vtnr_from_tty(tty) >= 0;
3948 bool tty_is_console(const char *tty) {
3951 if (startswith(tty, "/dev/"))
3954 return streq(tty, "console");
3957 int vtnr_from_tty(const char *tty) {
3962 if (startswith(tty, "/dev/"))
3965 if (!startswith(tty, "tty") )
3968 if (tty[3] < '0' || tty[3] > '9')
3971 r = safe_atoi(tty+3, &i);
3975 if (i < 0 || i > 63)
3981 char *resolve_dev_console(char **active) {
3984 /* Resolve where /dev/console is pointing to, if /sys is actually ours
3985 * (i.e. not read-only-mounted which is a sign for container setups) */
3987 if (path_is_read_only_fs("/sys") > 0)
3990 if (read_one_line_file("/sys/class/tty/console/active", active) < 0)
3993 /* If multiple log outputs are configured the last one is what
3994 * /dev/console points to */
3995 tty = strrchr(*active, ' ');
4001 if (streq(tty, "tty0")) {
4004 /* Get the active VC (e.g. tty1) */
4005 if (read_one_line_file("/sys/class/tty/tty0/active", &tmp) >= 0) {
4007 tty = *active = tmp;
4014 bool tty_is_vc_resolve(const char *tty) {
4015 _cleanup_free_ char *active = NULL;
4019 if (startswith(tty, "/dev/"))
4022 if (streq(tty, "console")) {
4023 tty = resolve_dev_console(&active);
4028 return tty_is_vc(tty);
4031 const char *default_term_for_tty(const char *tty) {
4034 return tty_is_vc_resolve(tty) ? "TERM=linux" : "TERM=vt220";
4037 bool dirent_is_file(const struct dirent *de) {
4040 if (hidden_file(de->d_name))
4043 if (de->d_type != DT_REG &&
4044 de->d_type != DT_LNK &&
4045 de->d_type != DT_UNKNOWN)
4051 bool dirent_is_file_with_suffix(const struct dirent *de, const char *suffix) {
4054 if (de->d_type != DT_REG &&
4055 de->d_type != DT_LNK &&
4056 de->d_type != DT_UNKNOWN)
4059 if (hidden_file_allow_backup(de->d_name))
4062 return endswith(de->d_name, suffix);
4065 static int do_execute(char **directories, usec_t timeout, char *argv[]) {
4066 _cleanup_hashmap_free_free_ Hashmap *pids = NULL;
4067 _cleanup_set_free_free_ Set *seen = NULL;
4070 /* We fork this all off from a child process so that we can
4071 * somewhat cleanly make use of SIGALRM to set a time limit */
4073 reset_all_signal_handlers();
4074 reset_signal_mask();
4076 assert_se(prctl(PR_SET_PDEATHSIG, SIGTERM) == 0);
4078 pids = hashmap_new(NULL);
4082 seen = set_new(&string_hash_ops);
4086 STRV_FOREACH(directory, directories) {
4087 _cleanup_closedir_ DIR *d;
4090 d = opendir(*directory);
4092 if (errno == ENOENT)
4095 return log_error_errno(errno, "Failed to open directory %s: %m", *directory);
4098 FOREACH_DIRENT(de, d, break) {
4099 _cleanup_free_ char *path = NULL;
4103 if (!dirent_is_file(de))
4106 if (set_contains(seen, de->d_name)) {
4107 log_debug("%1$s/%2$s skipped (%2$s was already seen).", *directory, de->d_name);
4111 r = set_put_strdup(seen, de->d_name);
4115 path = strjoin(*directory, "/", de->d_name, NULL);
4119 if (null_or_empty_path(path)) {
4120 log_debug("%s is empty (a mask).", path);
4123 log_debug("%s will be executed.", path);
4127 log_error_errno(errno, "Failed to fork: %m");
4129 } else if (pid == 0) {
4132 assert_se(prctl(PR_SET_PDEATHSIG, SIGTERM) == 0);
4142 return log_error_errno(errno, "Failed to execute %s: %m", path);
4145 log_debug("Spawned %s as " PID_FMT ".", path, pid);
4147 r = hashmap_put(pids, UINT_TO_PTR(pid), path);
4154 /* Abort execution of this process after the timout. We simply
4155 * rely on SIGALRM as default action terminating the process,
4156 * and turn on alarm(). */
4158 if (timeout != USEC_INFINITY)
4159 alarm((timeout + USEC_PER_SEC - 1) / USEC_PER_SEC);
4161 while (!hashmap_isempty(pids)) {
4162 _cleanup_free_ char *path = NULL;
4165 pid = PTR_TO_UINT(hashmap_first_key(pids));
4168 path = hashmap_remove(pids, UINT_TO_PTR(pid));
4171 wait_for_terminate_and_warn(path, pid, true);
4177 void execute_directories(const char* const* directories, usec_t timeout, char *argv[]) {
4181 char **dirs = (char**) directories;
4183 assert(!strv_isempty(dirs));
4185 name = basename(dirs[0]);
4186 assert(!isempty(name));
4188 /* Executes all binaries in the directories in parallel and waits
4189 * for them to finish. Optionally a timeout is applied. If a file
4190 * with the same name exists in more than one directory, the
4191 * earliest one wins. */
4193 executor_pid = fork();
4194 if (executor_pid < 0) {
4195 log_error_errno(errno, "Failed to fork: %m");
4198 } else if (executor_pid == 0) {
4199 r = do_execute(dirs, timeout, argv);
4200 _exit(r < 0 ? EXIT_FAILURE : EXIT_SUCCESS);
4203 wait_for_terminate_and_warn(name, executor_pid, true);
4206 int kill_and_sigcont(pid_t pid, int sig) {
4209 r = kill(pid, sig) < 0 ? -errno : 0;
4217 bool nulstr_contains(const char*nulstr, const char *needle) {
4223 NULSTR_FOREACH(i, nulstr)
4224 if (streq(i, needle))
4230 bool plymouth_running(void) {
4231 return access("/run/plymouth/pid", F_OK) >= 0;
4234 char* strshorten(char *s, size_t l) {
4243 static bool hostname_valid_char(char c) {
4245 (c >= 'a' && c <= 'z') ||
4246 (c >= 'A' && c <= 'Z') ||
4247 (c >= '0' && c <= '9') ||
4253 bool hostname_is_valid(const char *s) {
4260 /* Doesn't accept empty hostnames, hostnames with trailing or
4261 * leading dots, and hostnames with multiple dots in a
4262 * sequence. Also ensures that the length stays below
4265 for (p = s, dot = true; *p; p++) {
4272 if (!hostname_valid_char(*p))
4282 if (p-s > HOST_NAME_MAX)
4288 char* hostname_cleanup(char *s, bool lowercase) {
4292 for (p = s, d = s, dot = true; *p; p++) {
4299 } else if (hostname_valid_char(*p)) {
4300 *(d++) = lowercase ? tolower(*p) : *p;
4311 strshorten(s, HOST_NAME_MAX);
4316 bool machine_name_is_valid(const char *s) {
4318 if (!hostname_is_valid(s))
4321 /* Machine names should be useful hostnames, but also be
4322 * useful in unit names, hence we enforce a stricter length
4331 int pipe_eof(int fd) {
4332 struct pollfd pollfd = {
4334 .events = POLLIN|POLLHUP,
4339 r = poll(&pollfd, 1, 0);
4346 return pollfd.revents & POLLHUP;
4349 int fd_wait_for_event(int fd, int event, usec_t t) {
4351 struct pollfd pollfd = {
4359 r = ppoll(&pollfd, 1, t == USEC_INFINITY ? NULL : timespec_store(&ts, t), NULL);
4366 return pollfd.revents;
4369 int fopen_temporary(const char *path, FILE **_f, char **_temp_path) {
4378 r = tempfn_xxxxxx(path, &t);
4382 fd = mkostemp_safe(t, O_WRONLY|O_CLOEXEC);
4388 f = fdopen(fd, "we");
4401 int terminal_vhangup_fd(int fd) {
4404 if (ioctl(fd, TIOCVHANGUP) < 0)
4410 int terminal_vhangup(const char *name) {
4411 _cleanup_close_ int fd;
4413 fd = open_terminal(name, O_RDWR|O_NOCTTY|O_CLOEXEC);
4417 return terminal_vhangup_fd(fd);
4420 int vt_disallocate(const char *name) {
4424 /* Deallocate the VT if possible. If not possible
4425 * (i.e. because it is the active one), at least clear it
4426 * entirely (including the scrollback buffer) */
4428 if (!startswith(name, "/dev/"))
4431 if (!tty_is_vc(name)) {
4432 /* So this is not a VT. I guess we cannot deallocate
4433 * it then. But let's at least clear the screen */
4435 fd = open_terminal(name, O_RDWR|O_NOCTTY|O_CLOEXEC);
4440 "\033[r" /* clear scrolling region */
4441 "\033[H" /* move home */
4442 "\033[2J", /* clear screen */
4449 if (!startswith(name, "/dev/tty"))
4452 r = safe_atou(name+8, &u);
4459 /* Try to deallocate */
4460 fd = open_terminal("/dev/tty0", O_RDWR|O_NOCTTY|O_CLOEXEC);
4464 r = ioctl(fd, VT_DISALLOCATE, u);
4473 /* Couldn't deallocate, so let's clear it fully with
4475 fd = open_terminal(name, O_RDWR|O_NOCTTY|O_CLOEXEC);
4480 "\033[r" /* clear scrolling region */
4481 "\033[H" /* move home */
4482 "\033[3J", /* clear screen including scrollback, requires Linux 2.6.40 */
4489 int symlink_atomic(const char *from, const char *to) {
4490 _cleanup_free_ char *t = NULL;
4496 r = tempfn_random(to, &t);
4500 if (symlink(from, t) < 0)
4503 if (rename(t, to) < 0) {
4511 int mknod_atomic(const char *path, mode_t mode, dev_t dev) {
4512 _cleanup_free_ char *t = NULL;
4517 r = tempfn_random(path, &t);
4521 if (mknod(t, mode, dev) < 0)
4524 if (rename(t, path) < 0) {
4532 int mkfifo_atomic(const char *path, mode_t mode) {
4533 _cleanup_free_ char *t = NULL;
4538 r = tempfn_random(path, &t);
4542 if (mkfifo(t, mode) < 0)
4545 if (rename(t, path) < 0) {
4553 bool display_is_local(const char *display) {
4557 display[0] == ':' &&
4558 display[1] >= '0' &&
4562 int socket_from_display(const char *display, char **path) {
4569 if (!display_is_local(display))
4572 k = strspn(display+1, "0123456789");
4574 f = new(char, strlen("/tmp/.X11-unix/X") + k + 1);
4578 c = stpcpy(f, "/tmp/.X11-unix/X");
4579 memcpy(c, display+1, k);
4588 const char **username,
4589 uid_t *uid, gid_t *gid,
4591 const char **shell) {
4599 /* We enforce some special rules for uid=0: in order to avoid
4600 * NSS lookups for root we hardcode its data. */
4602 if (streq(*username, "root") || streq(*username, "0")) {
4620 if (parse_uid(*username, &u) >= 0) {
4624 /* If there are multiple users with the same id, make
4625 * sure to leave $USER to the configured value instead
4626 * of the first occurrence in the database. However if
4627 * the uid was configured by a numeric uid, then let's
4628 * pick the real username from /etc/passwd. */
4630 *username = p->pw_name;
4633 p = getpwnam(*username);
4637 return errno > 0 ? -errno : -ESRCH;
4649 *shell = p->pw_shell;
4654 char* uid_to_name(uid_t uid) {
4659 return strdup("root");
4663 return strdup(p->pw_name);
4665 if (asprintf(&r, UID_FMT, uid) < 0)
4671 char* gid_to_name(gid_t gid) {
4676 return strdup("root");
4680 return strdup(p->gr_name);
4682 if (asprintf(&r, GID_FMT, gid) < 0)
4688 int get_group_creds(const char **groupname, gid_t *gid) {
4694 /* We enforce some special rules for gid=0: in order to avoid
4695 * NSS lookups for root we hardcode its data. */
4697 if (streq(*groupname, "root") || streq(*groupname, "0")) {
4698 *groupname = "root";
4706 if (parse_gid(*groupname, &id) >= 0) {
4711 *groupname = g->gr_name;
4714 g = getgrnam(*groupname);
4718 return errno > 0 ? -errno : -ESRCH;
4726 int in_gid(gid_t gid) {
4728 int ngroups_max, r, i;
4730 if (getgid() == gid)
4733 if (getegid() == gid)
4736 ngroups_max = sysconf(_SC_NGROUPS_MAX);
4737 assert(ngroups_max > 0);
4739 gids = alloca(sizeof(gid_t) * ngroups_max);
4741 r = getgroups(ngroups_max, gids);
4745 for (i = 0; i < r; i++)
4752 int in_group(const char *name) {
4756 r = get_group_creds(&name, &gid);
4763 int glob_exists(const char *path) {
4764 _cleanup_globfree_ glob_t g = {};
4770 k = glob(path, GLOB_NOSORT|GLOB_BRACE, NULL, &g);
4772 if (k == GLOB_NOMATCH)
4774 else if (k == GLOB_NOSPACE)
4777 return !strv_isempty(g.gl_pathv);
4779 return errno ? -errno : -EIO;
4782 int glob_extend(char ***strv, const char *path) {
4783 _cleanup_globfree_ glob_t g = {};
4788 k = glob(path, GLOB_NOSORT|GLOB_BRACE, NULL, &g);
4790 if (k == GLOB_NOMATCH)
4792 else if (k == GLOB_NOSPACE)
4794 else if (k != 0 || strv_isempty(g.gl_pathv))
4795 return errno ? -errno : -EIO;
4797 STRV_FOREACH(p, g.gl_pathv) {
4798 k = strv_extend(strv, *p);
4806 int dirent_ensure_type(DIR *d, struct dirent *de) {
4812 if (de->d_type != DT_UNKNOWN)
4815 if (fstatat(dirfd(d), de->d_name, &st, AT_SYMLINK_NOFOLLOW) < 0)
4819 S_ISREG(st.st_mode) ? DT_REG :
4820 S_ISDIR(st.st_mode) ? DT_DIR :
4821 S_ISLNK(st.st_mode) ? DT_LNK :
4822 S_ISFIFO(st.st_mode) ? DT_FIFO :
4823 S_ISSOCK(st.st_mode) ? DT_SOCK :
4824 S_ISCHR(st.st_mode) ? DT_CHR :
4825 S_ISBLK(st.st_mode) ? DT_BLK :
4831 int get_files_in_directory(const char *path, char ***list) {
4832 _cleanup_closedir_ DIR *d = NULL;
4833 size_t bufsize = 0, n = 0;
4834 _cleanup_strv_free_ char **l = NULL;
4838 /* Returns all files in a directory in *list, and the number
4839 * of files as return value. If list is NULL returns only the
4851 if (!de && errno != 0)
4856 dirent_ensure_type(d, de);
4858 if (!dirent_is_file(de))
4862 /* one extra slot is needed for the terminating NULL */
4863 if (!GREEDY_REALLOC(l, bufsize, n + 2))
4866 l[n] = strdup(de->d_name);
4877 l = NULL; /* avoid freeing */
4883 char *strjoin(const char *x, ...) {
4897 t = va_arg(ap, const char *);
4902 if (n > ((size_t) -1) - l) {
4926 t = va_arg(ap, const char *);
4940 bool is_main_thread(void) {
4941 static thread_local int cached = 0;
4943 if (_unlikely_(cached == 0))
4944 cached = getpid() == gettid() ? 1 : -1;
4949 int block_get_whole_disk(dev_t d, dev_t *ret) {
4956 /* If it has a queue this is good enough for us */
4957 if (asprintf(&p, "/sys/dev/block/%u:%u/queue", major(d), minor(d)) < 0)
4960 r = access(p, F_OK);
4968 /* If it is a partition find the originating device */
4969 if (asprintf(&p, "/sys/dev/block/%u:%u/partition", major(d), minor(d)) < 0)
4972 r = access(p, F_OK);
4978 /* Get parent dev_t */
4979 if (asprintf(&p, "/sys/dev/block/%u:%u/../dev", major(d), minor(d)) < 0)
4982 r = read_one_line_file(p, &s);
4988 r = sscanf(s, "%u:%u", &m, &n);
4994 /* Only return this if it is really good enough for us. */
4995 if (asprintf(&p, "/sys/dev/block/%u:%u/queue", m, n) < 0)
4998 r = access(p, F_OK);
5002 *ret = makedev(m, n);
5009 static const char *const ioprio_class_table[] = {
5010 [IOPRIO_CLASS_NONE] = "none",
5011 [IOPRIO_CLASS_RT] = "realtime",
5012 [IOPRIO_CLASS_BE] = "best-effort",
5013 [IOPRIO_CLASS_IDLE] = "idle"
5016 DEFINE_STRING_TABLE_LOOKUP_WITH_FALLBACK(ioprio_class, int, INT_MAX);
5018 static const char *const sigchld_code_table[] = {
5019 [CLD_EXITED] = "exited",
5020 [CLD_KILLED] = "killed",
5021 [CLD_DUMPED] = "dumped",
5022 [CLD_TRAPPED] = "trapped",
5023 [CLD_STOPPED] = "stopped",
5024 [CLD_CONTINUED] = "continued",
5027 DEFINE_STRING_TABLE_LOOKUP(sigchld_code, int);
5029 static const char *const log_facility_unshifted_table[LOG_NFACILITIES] = {
5030 [LOG_FAC(LOG_KERN)] = "kern",
5031 [LOG_FAC(LOG_USER)] = "user",
5032 [LOG_FAC(LOG_MAIL)] = "mail",
5033 [LOG_FAC(LOG_DAEMON)] = "daemon",
5034 [LOG_FAC(LOG_AUTH)] = "auth",
5035 [LOG_FAC(LOG_SYSLOG)] = "syslog",
5036 [LOG_FAC(LOG_LPR)] = "lpr",
5037 [LOG_FAC(LOG_NEWS)] = "news",
5038 [LOG_FAC(LOG_UUCP)] = "uucp",
5039 [LOG_FAC(LOG_CRON)] = "cron",
5040 [LOG_FAC(LOG_AUTHPRIV)] = "authpriv",
5041 [LOG_FAC(LOG_FTP)] = "ftp",
5042 [LOG_FAC(LOG_LOCAL0)] = "local0",
5043 [LOG_FAC(LOG_LOCAL1)] = "local1",
5044 [LOG_FAC(LOG_LOCAL2)] = "local2",
5045 [LOG_FAC(LOG_LOCAL3)] = "local3",
5046 [LOG_FAC(LOG_LOCAL4)] = "local4",
5047 [LOG_FAC(LOG_LOCAL5)] = "local5",
5048 [LOG_FAC(LOG_LOCAL6)] = "local6",
5049 [LOG_FAC(LOG_LOCAL7)] = "local7"
5052 DEFINE_STRING_TABLE_LOOKUP_WITH_FALLBACK(log_facility_unshifted, int, LOG_FAC(~0));
5054 static const char *const log_level_table[] = {
5055 [LOG_EMERG] = "emerg",
5056 [LOG_ALERT] = "alert",
5057 [LOG_CRIT] = "crit",
5059 [LOG_WARNING] = "warning",
5060 [LOG_NOTICE] = "notice",
5061 [LOG_INFO] = "info",
5062 [LOG_DEBUG] = "debug"
5065 DEFINE_STRING_TABLE_LOOKUP_WITH_FALLBACK(log_level, int, LOG_DEBUG);
5067 static const char* const sched_policy_table[] = {
5068 [SCHED_OTHER] = "other",
5069 [SCHED_BATCH] = "batch",
5070 [SCHED_IDLE] = "idle",
5071 [SCHED_FIFO] = "fifo",
5075 DEFINE_STRING_TABLE_LOOKUP_WITH_FALLBACK(sched_policy, int, INT_MAX);
5077 static const char* const rlimit_table[_RLIMIT_MAX] = {
5078 [RLIMIT_CPU] = "LimitCPU",
5079 [RLIMIT_FSIZE] = "LimitFSIZE",
5080 [RLIMIT_DATA] = "LimitDATA",
5081 [RLIMIT_STACK] = "LimitSTACK",
5082 [RLIMIT_CORE] = "LimitCORE",
5083 [RLIMIT_RSS] = "LimitRSS",
5084 [RLIMIT_NOFILE] = "LimitNOFILE",
5085 [RLIMIT_AS] = "LimitAS",
5086 [RLIMIT_NPROC] = "LimitNPROC",
5087 [RLIMIT_MEMLOCK] = "LimitMEMLOCK",
5088 [RLIMIT_LOCKS] = "LimitLOCKS",
5089 [RLIMIT_SIGPENDING] = "LimitSIGPENDING",
5090 [RLIMIT_MSGQUEUE] = "LimitMSGQUEUE",
5091 [RLIMIT_NICE] = "LimitNICE",
5092 [RLIMIT_RTPRIO] = "LimitRTPRIO",
5093 [RLIMIT_RTTIME] = "LimitRTTIME"
5096 DEFINE_STRING_TABLE_LOOKUP(rlimit, int);
5098 static const char* const ip_tos_table[] = {
5099 [IPTOS_LOWDELAY] = "low-delay",
5100 [IPTOS_THROUGHPUT] = "throughput",
5101 [IPTOS_RELIABILITY] = "reliability",
5102 [IPTOS_LOWCOST] = "low-cost",
5105 DEFINE_STRING_TABLE_LOOKUP_WITH_FALLBACK(ip_tos, int, 0xff);
5107 static const char *const __signal_table[] = {
5124 [SIGSTKFLT] = "STKFLT", /* Linux on SPARC doesn't know SIGSTKFLT */
5135 [SIGVTALRM] = "VTALRM",
5137 [SIGWINCH] = "WINCH",
5143 DEFINE_PRIVATE_STRING_TABLE_LOOKUP(__signal, int);
5145 const char *signal_to_string(int signo) {
5146 static thread_local char buf[sizeof("RTMIN+")-1 + DECIMAL_STR_MAX(int) + 1];
5149 name = __signal_to_string(signo);
5153 if (signo >= SIGRTMIN && signo <= SIGRTMAX)
5154 snprintf(buf, sizeof(buf), "RTMIN+%d", signo - SIGRTMIN);
5156 snprintf(buf, sizeof(buf), "%d", signo);
5161 int signal_from_string(const char *s) {
5166 signo = __signal_from_string(s);
5170 if (startswith(s, "RTMIN+")) {
5174 if (safe_atou(s, &u) >= 0) {
5175 signo = (int) u + offset;
5176 if (signo > 0 && signo < _NSIG)
5182 bool kexec_loaded(void) {
5183 bool loaded = false;
5186 if (read_one_line_file("/sys/kernel/kexec_loaded", &s) >= 0) {
5194 int prot_from_flags(int flags) {
5196 switch (flags & O_ACCMODE) {
5205 return PROT_READ|PROT_WRITE;
5212 char *format_bytes(char *buf, size_t l, off_t t) {
5215 static const struct {
5219 { "E", 1024ULL*1024ULL*1024ULL*1024ULL*1024ULL*1024ULL },
5220 { "P", 1024ULL*1024ULL*1024ULL*1024ULL*1024ULL },
5221 { "T", 1024ULL*1024ULL*1024ULL*1024ULL },
5222 { "G", 1024ULL*1024ULL*1024ULL },
5223 { "M", 1024ULL*1024ULL },
5227 if (t == (off_t) -1)
5230 for (i = 0; i < ELEMENTSOF(table); i++) {
5232 if (t >= table[i].factor) {
5235 (unsigned long long) (t / table[i].factor),
5236 (unsigned long long) (((t*10ULL) / table[i].factor) % 10ULL),
5243 snprintf(buf, l, "%lluB", (unsigned long long) t);
5251 void* memdup(const void *p, size_t l) {
5264 int fd_inc_sndbuf(int fd, size_t n) {
5266 socklen_t l = sizeof(value);
5268 r = getsockopt(fd, SOL_SOCKET, SO_SNDBUF, &value, &l);
5269 if (r >= 0 && l == sizeof(value) && (size_t) value >= n*2)
5272 /* If we have the privileges we will ignore the kernel limit. */
5275 if (setsockopt(fd, SOL_SOCKET, SO_SNDBUFFORCE, &value, sizeof(value)) < 0)
5276 if (setsockopt(fd, SOL_SOCKET, SO_SNDBUF, &value, sizeof(value)) < 0)
5282 int fd_inc_rcvbuf(int fd, size_t n) {
5284 socklen_t l = sizeof(value);
5286 r = getsockopt(fd, SOL_SOCKET, SO_RCVBUF, &value, &l);
5287 if (r >= 0 && l == sizeof(value) && (size_t) value >= n*2)
5290 /* If we have the privileges we will ignore the kernel limit. */
5293 if (setsockopt(fd, SOL_SOCKET, SO_RCVBUFFORCE, &value, sizeof(value)) < 0)
5294 if (setsockopt(fd, SOL_SOCKET, SO_RCVBUF, &value, sizeof(value)) < 0)
5299 int fork_agent(pid_t *pid, const int except[], unsigned n_except, const char *path, ...) {
5300 bool stdout_is_tty, stderr_is_tty;
5301 pid_t parent_pid, agent_pid;
5302 sigset_t ss, saved_ss;
5310 /* Spawns a temporary TTY agent, making sure it goes away when
5313 parent_pid = getpid();
5315 /* First we temporarily block all signals, so that the new
5316 * child has them blocked initially. This way, we can be sure
5317 * that SIGTERMs are not lost we might send to the agent. */
5318 assert_se(sigfillset(&ss) >= 0);
5319 assert_se(sigprocmask(SIG_SETMASK, &ss, &saved_ss) >= 0);
5322 if (agent_pid < 0) {
5323 assert_se(sigprocmask(SIG_SETMASK, &saved_ss, NULL) >= 0);
5327 if (agent_pid != 0) {
5328 assert_se(sigprocmask(SIG_SETMASK, &saved_ss, NULL) >= 0);
5335 * Make sure the agent goes away when the parent dies */
5336 if (prctl(PR_SET_PDEATHSIG, SIGTERM) < 0)
5337 _exit(EXIT_FAILURE);
5339 /* Make sure we actually can kill the agent, if we need to, in
5340 * case somebody invoked us from a shell script that trapped
5341 * SIGTERM or so... */
5342 reset_all_signal_handlers();
5343 reset_signal_mask();
5345 /* Check whether our parent died before we were able
5346 * to set the death signal and unblock the signals */
5347 if (getppid() != parent_pid)
5348 _exit(EXIT_SUCCESS);
5350 /* Don't leak fds to the agent */
5351 close_all_fds(except, n_except);
5353 stdout_is_tty = isatty(STDOUT_FILENO);
5354 stderr_is_tty = isatty(STDERR_FILENO);
5356 if (!stdout_is_tty || !stderr_is_tty) {
5359 /* Detach from stdout/stderr. and reopen
5360 * /dev/tty for them. This is important to
5361 * ensure that when systemctl is started via
5362 * popen() or a similar call that expects to
5363 * read EOF we actually do generate EOF and
5364 * not delay this indefinitely by because we
5365 * keep an unused copy of stdin around. */
5366 fd = open("/dev/tty", O_WRONLY);
5368 log_error_errno(errno, "Failed to open /dev/tty: %m");
5369 _exit(EXIT_FAILURE);
5373 dup2(fd, STDOUT_FILENO);
5376 dup2(fd, STDERR_FILENO);
5382 /* Count arguments */
5384 for (n = 0; va_arg(ap, char*); n++)
5389 l = alloca(sizeof(char *) * (n + 1));
5391 /* Fill in arguments */
5393 for (i = 0; i <= n; i++)
5394 l[i] = va_arg(ap, char*);
5398 _exit(EXIT_FAILURE);
5401 int setrlimit_closest(int resource, const struct rlimit *rlim) {
5402 struct rlimit highest, fixed;
5406 if (setrlimit(resource, rlim) >= 0)
5412 /* So we failed to set the desired setrlimit, then let's try
5413 * to get as close as we can */
5414 assert_se(getrlimit(resource, &highest) == 0);
5416 fixed.rlim_cur = MIN(rlim->rlim_cur, highest.rlim_max);
5417 fixed.rlim_max = MIN(rlim->rlim_max, highest.rlim_max);
5419 if (setrlimit(resource, &fixed) < 0)
5425 int getenv_for_pid(pid_t pid, const char *field, char **_value) {
5426 _cleanup_fclose_ FILE *f = NULL;
5437 path = procfs_file_alloca(pid, "environ");
5439 f = fopen(path, "re");
5447 char line[LINE_MAX];
5450 for (i = 0; i < sizeof(line)-1; i++) {
5454 if (_unlikely_(c == EOF)) {
5464 if (memcmp(line, field, l) == 0 && line[l] == '=') {
5465 value = strdup(line + l + 1);
5479 bool http_etag_is_valid(const char *etag) {
5483 if (!endswith(etag, "\""))
5486 if (!startswith(etag, "\"") && !startswith(etag, "W/\""))
5492 bool http_url_is_valid(const char *url) {
5498 p = startswith(url, "http://");
5500 p = startswith(url, "https://");
5507 return ascii_is_valid(p);
5510 bool documentation_url_is_valid(const char *url) {
5516 if (http_url_is_valid(url))
5519 p = startswith(url, "file:/");
5521 p = startswith(url, "info:");
5523 p = startswith(url, "man:");
5528 return ascii_is_valid(p);
5531 bool in_initrd(void) {
5532 static int saved = -1;
5538 /* We make two checks here:
5540 * 1. the flag file /etc/initrd-release must exist
5541 * 2. the root file system must be a memory file system
5543 * The second check is extra paranoia, since misdetecting an
5544 * initrd can have bad bad consequences due the initrd
5545 * emptying when transititioning to the main systemd.
5548 saved = access("/etc/initrd-release", F_OK) >= 0 &&
5549 statfs("/", &s) >= 0 &&
5550 is_temporary_fs(&s);
5555 void warn_melody(void) {
5556 _cleanup_close_ int fd = -1;
5558 fd = open("/dev/console", O_WRONLY|O_CLOEXEC|O_NOCTTY);
5562 /* Yeah, this is synchronous. Kinda sucks. But well... */
5564 ioctl(fd, KIOCSOUND, (int)(1193180/440));
5565 usleep(125*USEC_PER_MSEC);
5567 ioctl(fd, KIOCSOUND, (int)(1193180/220));
5568 usleep(125*USEC_PER_MSEC);
5570 ioctl(fd, KIOCSOUND, (int)(1193180/220));
5571 usleep(125*USEC_PER_MSEC);
5573 ioctl(fd, KIOCSOUND, 0);
5576 int make_console_stdio(void) {
5579 /* Make /dev/console the controlling terminal and stdin/stdout/stderr */
5581 fd = acquire_terminal("/dev/console", false, true, true, USEC_INFINITY);
5583 return log_error_errno(fd, "Failed to acquire terminal: %m");
5587 return log_error_errno(r, "Failed to duplicate terminal fd: %m");
5592 int get_home_dir(char **_h) {
5600 /* Take the user specified one */
5601 e = secure_getenv("HOME");
5602 if (e && path_is_absolute(e)) {
5611 /* Hardcode home directory for root to avoid NSS */
5614 h = strdup("/root");
5622 /* Check the database... */
5626 return errno > 0 ? -errno : -ESRCH;
5628 if (!path_is_absolute(p->pw_dir))
5631 h = strdup(p->pw_dir);
5639 int get_shell(char **_s) {
5647 /* Take the user specified one */
5648 e = getenv("SHELL");
5658 /* Hardcode home directory for root to avoid NSS */
5661 s = strdup("/bin/sh");
5669 /* Check the database... */
5673 return errno > 0 ? -errno : -ESRCH;
5675 if (!path_is_absolute(p->pw_shell))
5678 s = strdup(p->pw_shell);
5686 bool filename_is_valid(const char *p) {
5700 if (strlen(p) > FILENAME_MAX)
5706 bool string_is_safe(const char *p) {
5712 for (t = p; *t; t++) {
5713 if (*t > 0 && *t < ' ')
5716 if (strchr("\\\"\'\0x7f", *t))
5724 * Check if a string contains control characters. If 'ok' is non-NULL
5725 * it may be a string containing additional CCs to be considered OK.
5727 bool string_has_cc(const char *p, const char *ok) {
5732 for (t = p; *t; t++) {
5733 if (ok && strchr(ok, *t))
5736 if (*t > 0 && *t < ' ')
5746 bool path_is_safe(const char *p) {
5751 if (streq(p, "..") || startswith(p, "../") || endswith(p, "/..") || strstr(p, "/../"))
5754 if (strlen(p) > PATH_MAX)
5757 /* The following two checks are not really dangerous, but hey, they still are confusing */
5758 if (streq(p, ".") || startswith(p, "./") || endswith(p, "/.") || strstr(p, "/./"))
5761 if (strstr(p, "//"))
5767 /* hey glibc, APIs with callbacks without a user pointer are so useless */
5768 void *xbsearch_r(const void *key, const void *base, size_t nmemb, size_t size,
5769 int (*compar) (const void *, const void *, void *), void *arg) {
5778 p = (void *)(((const char *) base) + (idx * size));
5779 comparison = compar(key, p, arg);
5782 else if (comparison > 0)
5790 void init_gettext(void) {
5791 setlocale(LC_ALL, "");
5792 textdomain(GETTEXT_PACKAGE);
5795 bool is_locale_utf8(void) {
5797 static int cached_answer = -1;
5799 if (cached_answer >= 0)
5802 if (!setlocale(LC_ALL, "")) {
5803 cached_answer = true;
5807 set = nl_langinfo(CODESET);
5809 cached_answer = true;
5813 if (streq(set, "UTF-8")) {
5814 cached_answer = true;
5818 /* For LC_CTYPE=="C" return true, because CTYPE is effectly
5819 * unset and everything can do to UTF-8 nowadays. */
5820 set = setlocale(LC_CTYPE, NULL);
5822 cached_answer = true;
5826 /* Check result, but ignore the result if C was set
5830 !getenv("LC_ALL") &&
5831 !getenv("LC_CTYPE") &&
5835 return (bool) cached_answer;
5838 const char *draw_special_char(DrawSpecialChar ch) {
5839 static const char *draw_table[2][_DRAW_SPECIAL_CHAR_MAX] = {
5842 [DRAW_TREE_VERTICAL] = "\342\224\202 ", /* │ */
5843 [DRAW_TREE_BRANCH] = "\342\224\234\342\224\200", /* ├─ */
5844 [DRAW_TREE_RIGHT] = "\342\224\224\342\224\200", /* └─ */
5845 [DRAW_TREE_SPACE] = " ", /* */
5846 [DRAW_TRIANGULAR_BULLET] = "\342\200\243", /* ‣ */
5847 [DRAW_BLACK_CIRCLE] = "\342\227\217", /* ● */
5848 [DRAW_ARROW] = "\342\206\222", /* → */
5849 [DRAW_DASH] = "\342\200\223", /* – */
5852 /* ASCII fallback */ {
5853 [DRAW_TREE_VERTICAL] = "| ",
5854 [DRAW_TREE_BRANCH] = "|-",
5855 [DRAW_TREE_RIGHT] = "`-",
5856 [DRAW_TREE_SPACE] = " ",
5857 [DRAW_TRIANGULAR_BULLET] = ">",
5858 [DRAW_BLACK_CIRCLE] = "*",
5859 [DRAW_ARROW] = "->",
5864 return draw_table[!is_locale_utf8()][ch];
5867 char *strreplace(const char *text, const char *old_string, const char *new_string) {
5870 size_t l, old_len, new_len;
5876 old_len = strlen(old_string);
5877 new_len = strlen(new_string);
5890 if (!startswith(f, old_string)) {
5896 nl = l - old_len + new_len;
5897 a = realloc(r, nl + 1);
5905 t = stpcpy(t, new_string);
5917 char *strip_tab_ansi(char **ibuf, size_t *_isz) {
5918 const char *i, *begin = NULL;
5923 } state = STATE_OTHER;
5925 size_t osz = 0, isz;
5931 /* Strips ANSI color and replaces TABs by 8 spaces */
5933 isz = _isz ? *_isz : strlen(*ibuf);
5935 f = open_memstream(&obuf, &osz);
5939 for (i = *ibuf; i < *ibuf + isz + 1; i++) {
5944 if (i >= *ibuf + isz) /* EOT */
5946 else if (*i == '\x1B')
5947 state = STATE_ESCAPE;
5948 else if (*i == '\t')
5955 if (i >= *ibuf + isz) { /* EOT */
5958 } else if (*i == '[') {
5959 state = STATE_BRACKET;
5964 state = STATE_OTHER;
5971 if (i >= *ibuf + isz || /* EOT */
5972 (!(*i >= '0' && *i <= '9') && *i != ';' && *i != 'm')) {
5975 state = STATE_OTHER;
5977 } else if (*i == 'm')
5978 state = STATE_OTHER;
6000 int on_ac_power(void) {
6001 bool found_offline = false, found_online = false;
6002 _cleanup_closedir_ DIR *d = NULL;
6004 d = opendir("/sys/class/power_supply");
6006 return errno == ENOENT ? true : -errno;
6010 _cleanup_close_ int fd = -1, device = -1;
6016 if (!de && errno != 0)
6022 if (hidden_file(de->d_name))
6025 device = openat(dirfd(d), de->d_name, O_DIRECTORY|O_RDONLY|O_CLOEXEC|O_NOCTTY);
6027 if (errno == ENOENT || errno == ENOTDIR)
6033 fd = openat(device, "type", O_RDONLY|O_CLOEXEC|O_NOCTTY);
6035 if (errno == ENOENT)
6041 n = read(fd, contents, sizeof(contents));
6045 if (n != 6 || memcmp(contents, "Mains\n", 6))
6049 fd = openat(device, "online", O_RDONLY|O_CLOEXEC|O_NOCTTY);
6051 if (errno == ENOENT)
6057 n = read(fd, contents, sizeof(contents));
6061 if (n != 2 || contents[1] != '\n')
6064 if (contents[0] == '1') {
6065 found_online = true;
6067 } else if (contents[0] == '0')
6068 found_offline = true;
6073 return found_online || !found_offline;
6076 static int search_and_fopen_internal(const char *path, const char *mode, const char *root, char **search, FILE **_f) {
6083 if (!path_strv_resolve_uniq(search, root))
6086 STRV_FOREACH(i, search) {
6087 _cleanup_free_ char *p = NULL;
6091 p = strjoin(root, *i, "/", path, NULL);
6093 p = strjoin(*i, "/", path, NULL);
6103 if (errno != ENOENT)
6110 int search_and_fopen(const char *path, const char *mode, const char *root, const char **search, FILE **_f) {
6111 _cleanup_strv_free_ char **copy = NULL;
6117 if (path_is_absolute(path)) {
6120 f = fopen(path, mode);
6129 copy = strv_copy((char**) search);
6133 return search_and_fopen_internal(path, mode, root, copy, _f);
6136 int search_and_fopen_nulstr(const char *path, const char *mode, const char *root, const char *search, FILE **_f) {
6137 _cleanup_strv_free_ char **s = NULL;
6139 if (path_is_absolute(path)) {
6142 f = fopen(path, mode);
6151 s = strv_split_nulstr(search);
6155 return search_and_fopen_internal(path, mode, root, s, _f);
6158 char *strextend(char **x, ...) {
6165 l = f = *x ? strlen(*x) : 0;
6172 t = va_arg(ap, const char *);
6177 if (n > ((size_t) -1) - l) {
6186 r = realloc(*x, l+1);
6196 t = va_arg(ap, const char *);
6210 char *strrep(const char *s, unsigned n) {
6218 p = r = malloc(l * n + 1);
6222 for (i = 0; i < n; i++)
6229 void* greedy_realloc(void **p, size_t *allocated, size_t need, size_t size) {
6236 if (*allocated >= need)
6239 newalloc = MAX(need * 2, 64u / size);
6240 a = newalloc * size;
6242 /* check for overflows */
6243 if (a < size * need)
6251 *allocated = newalloc;
6255 void* greedy_realloc0(void **p, size_t *allocated, size_t need, size_t size) {
6264 q = greedy_realloc(p, allocated, need, size);
6268 if (*allocated > prev)
6269 memzero(q + prev * size, (*allocated - prev) * size);
6274 bool id128_is_valid(const char *s) {
6280 /* Simple formatted 128bit hex string */
6282 for (i = 0; i < l; i++) {
6285 if (!(c >= '0' && c <= '9') &&
6286 !(c >= 'a' && c <= 'z') &&
6287 !(c >= 'A' && c <= 'Z'))
6291 } else if (l == 36) {
6293 /* Formatted UUID */
6295 for (i = 0; i < l; i++) {
6298 if ((i == 8 || i == 13 || i == 18 || i == 23)) {
6302 if (!(c >= '0' && c <= '9') &&
6303 !(c >= 'a' && c <= 'z') &&
6304 !(c >= 'A' && c <= 'Z'))
6315 int split_pair(const char *s, const char *sep, char **l, char **r) {
6330 a = strndup(s, x - s);
6334 b = strdup(x + strlen(sep));
6346 int shall_restore_state(void) {
6347 _cleanup_free_ char *value = NULL;
6350 r = get_proc_cmdline_key("systemd.restore_state=", &value);
6356 return parse_boolean(value) != 0;
6359 int proc_cmdline(char **ret) {
6362 if (detect_container(NULL) > 0)
6363 return get_process_cmdline(1, 0, false, ret);
6365 return read_one_line_file("/proc/cmdline", ret);
6368 int parse_proc_cmdline(int (*parse_item)(const char *key, const char *value)) {
6369 _cleanup_free_ char *line = NULL;
6375 r = proc_cmdline(&line);
6381 _cleanup_free_ char *word = NULL;
6384 r = unquote_first_word(&p, &word, true);
6390 /* Filter out arguments that are intended only for the
6392 if (!in_initrd() && startswith(word, "rd."))
6395 value = strchr(word, '=');
6399 r = parse_item(word, value);
6407 int get_proc_cmdline_key(const char *key, char **value) {
6408 _cleanup_free_ char *line = NULL, *ret = NULL;
6415 r = proc_cmdline(&line);
6421 _cleanup_free_ char *word = NULL;
6424 r = unquote_first_word(&p, &word, true);
6430 /* Filter out arguments that are intended only for the
6432 if (!in_initrd() && startswith(word, "rd."))
6436 e = startswith(word, key);
6440 r = free_and_strdup(&ret, e);
6446 if (streq(word, key))
6460 int container_get_leader(const char *machine, pid_t *pid) {
6461 _cleanup_free_ char *s = NULL, *class = NULL;
6469 p = strjoina("/run/systemd/machines/", machine);
6470 r = parse_env_file(p, NEWLINE, "LEADER", &s, "CLASS", &class, NULL);
6478 if (!streq_ptr(class, "container"))
6481 r = parse_pid(s, &leader);
6491 int namespace_open(pid_t pid, int *pidns_fd, int *mntns_fd, int *netns_fd, int *root_fd) {
6492 _cleanup_close_ int pidnsfd = -1, mntnsfd = -1, netnsfd = -1;
6500 mntns = procfs_file_alloca(pid, "ns/mnt");
6501 mntnsfd = open(mntns, O_RDONLY|O_NOCTTY|O_CLOEXEC);
6509 pidns = procfs_file_alloca(pid, "ns/pid");
6510 pidnsfd = open(pidns, O_RDONLY|O_NOCTTY|O_CLOEXEC);
6518 netns = procfs_file_alloca(pid, "ns/net");
6519 netnsfd = open(netns, O_RDONLY|O_NOCTTY|O_CLOEXEC);
6527 root = procfs_file_alloca(pid, "root");
6528 rfd = open(root, O_RDONLY|O_NOCTTY|O_CLOEXEC|O_DIRECTORY);
6534 *pidns_fd = pidnsfd;
6537 *mntns_fd = mntnsfd;
6540 *netns_fd = netnsfd;
6545 pidnsfd = mntnsfd = netnsfd = -1;
6550 int namespace_enter(int pidns_fd, int mntns_fd, int netns_fd, int root_fd) {
6553 if (setns(pidns_fd, CLONE_NEWPID) < 0)
6557 if (setns(mntns_fd, CLONE_NEWNS) < 0)
6561 if (setns(netns_fd, CLONE_NEWNET) < 0)
6565 if (fchdir(root_fd) < 0)
6568 if (chroot(".") < 0)
6572 if (setresgid(0, 0, 0) < 0)
6575 if (setgroups(0, NULL) < 0)
6578 if (setresuid(0, 0, 0) < 0)
6584 bool pid_is_unwaited(pid_t pid) {
6585 /* Checks whether a PID is still valid at all, including a zombie */
6590 if (kill(pid, 0) >= 0)
6593 return errno != ESRCH;
6596 bool pid_is_alive(pid_t pid) {
6599 /* Checks whether a PID is still valid and not a zombie */
6604 r = get_process_state(pid);
6605 if (r == -ENOENT || r == 'Z')
6611 int getpeercred(int fd, struct ucred *ucred) {
6612 socklen_t n = sizeof(struct ucred);
6619 r = getsockopt(fd, SOL_SOCKET, SO_PEERCRED, &u, &n);
6623 if (n != sizeof(struct ucred))
6626 /* Check if the data is actually useful and not suppressed due
6627 * to namespacing issues */
6630 if (u.uid == UID_INVALID)
6632 if (u.gid == GID_INVALID)
6639 int getpeersec(int fd, char **ret) {
6651 r = getsockopt(fd, SOL_SOCKET, SO_PEERSEC, s, &n);
6655 if (errno != ERANGE)
6662 r = getsockopt(fd, SOL_SOCKET, SO_PEERSEC, s, &n);
6678 /* This is much like like mkostemp() but is subject to umask(). */
6679 int mkostemp_safe(char *pattern, int flags) {
6680 _cleanup_umask_ mode_t u;
6687 fd = mkostemp(pattern, flags);
6694 int open_tmpfile(const char *path, int flags) {
6701 /* Try O_TMPFILE first, if it is supported */
6702 fd = open(path, flags|O_TMPFILE, S_IRUSR|S_IWUSR);
6707 /* Fall back to unguessable name + unlinking */
6708 p = strjoina(path, "/systemd-tmp-XXXXXX");
6710 fd = mkostemp_safe(p, flags);
6718 int fd_warn_permissions(const char *path, int fd) {
6721 if (fstat(fd, &st) < 0)
6724 if (st.st_mode & 0111)
6725 log_warning("Configuration file %s is marked executable. Please remove executable permission bits. Proceeding anyway.", path);
6727 if (st.st_mode & 0002)
6728 log_warning("Configuration file %s is marked world-writable. Please remove world writability permission bits. Proceeding anyway.", path);
6730 if (getpid() == 1 && (st.st_mode & 0044) != 0044)
6731 log_warning("Configuration file %s is marked world-inaccessible. This has no effect as configuration data is accessible via APIs without restrictions. Proceeding anyway.", path);
6736 unsigned long personality_from_string(const char *p) {
6738 /* Parse a personality specifier. We introduce our own
6739 * identifiers that indicate specific ABIs, rather than just
6740 * hints regarding the register size, since we want to keep
6741 * things open for multiple locally supported ABIs for the
6742 * same register size. We try to reuse the ABI identifiers
6743 * used by libseccomp. */
6745 #if defined(__x86_64__)
6747 if (streq(p, "x86"))
6750 if (streq(p, "x86-64"))
6753 #elif defined(__i386__)
6755 if (streq(p, "x86"))
6759 /* personality(7) documents that 0xffffffffUL is used for
6760 * querying the current personality, hence let's use that here
6761 * as error indicator. */
6762 return 0xffffffffUL;
6765 const char* personality_to_string(unsigned long p) {
6767 #if defined(__x86_64__)
6769 if (p == PER_LINUX32)
6775 #elif defined(__i386__)
6784 uint64_t physical_memory(void) {
6787 /* We return this as uint64_t in case we are running as 32bit
6788 * process on a 64bit kernel with huge amounts of memory */
6790 mem = sysconf(_SC_PHYS_PAGES);
6793 return (uint64_t) mem * (uint64_t) page_size();
6796 void hexdump(FILE *f, const void *p, size_t s) {
6797 const uint8_t *b = p;
6800 assert(s == 0 || b);
6805 fprintf(f, "%04x ", n);
6807 for (i = 0; i < 16; i++) {
6812 fprintf(f, "%02x ", b[i]);
6820 for (i = 0; i < 16; i++) {
6825 fputc(isprint(b[i]) ? (char) b[i] : '.', f);
6839 int update_reboot_param_file(const char *param) {
6844 r = write_string_file(REBOOT_PARAM_FILE, param);
6846 log_error("Failed to write reboot param to "
6847 REBOOT_PARAM_FILE": %s", strerror(-r));
6849 unlink(REBOOT_PARAM_FILE);
6854 int umount_recursive(const char *prefix, int flags) {
6858 /* Try to umount everything recursively below a
6859 * directory. Also, take care of stacked mounts, and keep
6860 * unmounting them until they are gone. */
6863 _cleanup_fclose_ FILE *proc_self_mountinfo = NULL;
6868 proc_self_mountinfo = fopen("/proc/self/mountinfo", "re");
6869 if (!proc_self_mountinfo)
6873 _cleanup_free_ char *path = NULL, *p = NULL;
6876 k = fscanf(proc_self_mountinfo,
6877 "%*s " /* (1) mount id */
6878 "%*s " /* (2) parent id */
6879 "%*s " /* (3) major:minor */
6880 "%*s " /* (4) root */
6881 "%ms " /* (5) mount point */
6882 "%*s" /* (6) mount options */
6883 "%*[^-]" /* (7) optional fields */
6884 "- " /* (8) separator */
6885 "%*s " /* (9) file system type */
6886 "%*s" /* (10) mount source */
6887 "%*s" /* (11) mount options 2 */
6888 "%*[^\n]", /* some rubbish at the end */
6897 p = cunescape(path);
6901 if (!path_startswith(p, prefix))
6904 if (umount2(p, flags) < 0) {
6920 static int get_mount_flags(const char *path, unsigned long *flags) {
6923 if (statvfs(path, &buf) < 0)
6925 *flags = buf.f_flag;
6929 int bind_remount_recursive(const char *prefix, bool ro) {
6930 _cleanup_set_free_free_ Set *done = NULL;
6931 _cleanup_free_ char *cleaned = NULL;
6934 /* Recursively remount a directory (and all its submounts)
6935 * read-only or read-write. If the directory is already
6936 * mounted, we reuse the mount and simply mark it
6937 * MS_BIND|MS_RDONLY (or remove the MS_RDONLY for read-write
6938 * operation). If it isn't we first make it one. Afterwards we
6939 * apply MS_BIND|MS_RDONLY (or remove MS_RDONLY) to all
6940 * submounts we can access, too. When mounts are stacked on
6941 * the same mount point we only care for each individual
6942 * "top-level" mount on each point, as we cannot
6943 * influence/access the underlying mounts anyway. We do not
6944 * have any effect on future submounts that might get
6945 * propagated, they migt be writable. This includes future
6946 * submounts that have been triggered via autofs. */
6948 cleaned = strdup(prefix);
6952 path_kill_slashes(cleaned);
6954 done = set_new(&string_hash_ops);
6959 _cleanup_fclose_ FILE *proc_self_mountinfo = NULL;
6960 _cleanup_set_free_free_ Set *todo = NULL;
6961 bool top_autofs = false;
6963 unsigned long orig_flags;
6965 todo = set_new(&string_hash_ops);
6969 proc_self_mountinfo = fopen("/proc/self/mountinfo", "re");
6970 if (!proc_self_mountinfo)
6974 _cleanup_free_ char *path = NULL, *p = NULL, *type = NULL;
6977 k = fscanf(proc_self_mountinfo,
6978 "%*s " /* (1) mount id */
6979 "%*s " /* (2) parent id */
6980 "%*s " /* (3) major:minor */
6981 "%*s " /* (4) root */
6982 "%ms " /* (5) mount point */
6983 "%*s" /* (6) mount options (superblock) */
6984 "%*[^-]" /* (7) optional fields */
6985 "- " /* (8) separator */
6986 "%ms " /* (9) file system type */
6987 "%*s" /* (10) mount source */
6988 "%*s" /* (11) mount options (bind mount) */
6989 "%*[^\n]", /* some rubbish at the end */
6999 p = cunescape(path);
7003 /* Let's ignore autofs mounts. If they aren't
7004 * triggered yet, we want to avoid triggering
7005 * them, as we don't make any guarantees for
7006 * future submounts anyway. If they are
7007 * already triggered, then we will find
7008 * another entry for this. */
7009 if (streq(type, "autofs")) {
7010 top_autofs = top_autofs || path_equal(cleaned, p);
7014 if (path_startswith(p, cleaned) &&
7015 !set_contains(done, p)) {
7017 r = set_consume(todo, p);
7027 /* If we have no submounts to process anymore and if
7028 * the root is either already done, or an autofs, we
7030 if (set_isempty(todo) &&
7031 (top_autofs || set_contains(done, cleaned)))
7034 if (!set_contains(done, cleaned) &&
7035 !set_contains(todo, cleaned)) {
7036 /* The prefix directory itself is not yet a
7037 * mount, make it one. */
7038 if (mount(cleaned, cleaned, NULL, MS_BIND|MS_REC, NULL) < 0)
7042 (void) get_mount_flags(cleaned, &orig_flags);
7043 orig_flags &= ~MS_RDONLY;
7045 if (mount(NULL, prefix, NULL, orig_flags|MS_BIND|MS_REMOUNT|(ro ? MS_RDONLY : 0), NULL) < 0)
7048 x = strdup(cleaned);
7052 r = set_consume(done, x);
7057 while ((x = set_steal_first(todo))) {
7059 r = set_consume(done, x);
7065 /* Try to reuse the original flag set, but
7066 * don't care for errors, in case of
7067 * obstructed mounts */
7069 (void) get_mount_flags(x, &orig_flags);
7070 orig_flags &= ~MS_RDONLY;
7072 if (mount(NULL, x, NULL, orig_flags|MS_BIND|MS_REMOUNT|(ro ? MS_RDONLY : 0), NULL) < 0) {
7074 /* Deal with mount points that are
7075 * obstructed by a later mount */
7077 if (errno != ENOENT)
7085 int fflush_and_check(FILE *f) {
7092 return errno ? -errno : -EIO;
7097 int tempfn_xxxxxx(const char *p, char **ret) {
7109 * /foo/bar/.#waldoXXXXXX
7113 if (!filename_is_valid(fn))
7116 t = new(char, strlen(p) + 2 + 6 + 1);
7120 strcpy(stpcpy(stpcpy(mempcpy(t, p, fn - p), ".#"), fn), "XXXXXX");
7122 *ret = path_kill_slashes(t);
7126 int tempfn_random(const char *p, char **ret) {
7140 * /foo/bar/.#waldobaa2a261115984a9
7144 if (!filename_is_valid(fn))
7147 t = new(char, strlen(p) + 2 + 16 + 1);
7151 x = stpcpy(stpcpy(mempcpy(t, p, fn - p), ".#"), fn);
7154 for (i = 0; i < 16; i++) {
7155 *(x++) = hexchar(u & 0xF);
7161 *ret = path_kill_slashes(t);
7165 int tempfn_random_child(const char *p, char **ret) {
7176 * /foo/bar/waldo/.#3c2b6219aa75d7d0
7179 t = new(char, strlen(p) + 3 + 16 + 1);
7183 x = stpcpy(stpcpy(t, p), "/.#");
7186 for (i = 0; i < 16; i++) {
7187 *(x++) = hexchar(u & 0xF);
7193 *ret = path_kill_slashes(t);
7197 /* make sure the hostname is not "localhost" */
7198 bool is_localhost(const char *hostname) {
7201 /* This tries to identify local host and domain names
7202 * described in RFC6761 plus the redhatism of .localdomain */
7204 return streq(hostname, "localhost") ||
7205 streq(hostname, "localhost.") ||
7206 streq(hostname, "localdomain.") ||
7207 streq(hostname, "localdomain") ||
7208 endswith(hostname, ".localhost") ||
7209 endswith(hostname, ".localhost.") ||
7210 endswith(hostname, ".localdomain") ||
7211 endswith(hostname, ".localdomain.");
7214 int take_password_lock(const char *root) {
7216 struct flock flock = {
7218 .l_whence = SEEK_SET,
7226 /* This is roughly the same as lckpwdf(), but not as awful. We
7227 * don't want to use alarm() and signals, hence we implement
7228 * our own trivial version of this.
7230 * Note that shadow-utils also takes per-database locks in
7231 * addition to lckpwdf(). However, we don't given that they
7232 * are redundant as they they invoke lckpwdf() first and keep
7233 * it during everything they do. The per-database locks are
7234 * awfully racy, and thus we just won't do them. */
7237 path = strjoina(root, "/etc/.pwd.lock");
7239 path = "/etc/.pwd.lock";
7241 fd = open(path, O_WRONLY|O_CREAT|O_CLOEXEC|O_NOCTTY|O_NOFOLLOW, 0600);
7245 r = fcntl(fd, F_SETLKW, &flock);
7254 int is_symlink(const char *path) {
7257 if (lstat(path, &info) < 0)
7260 return !!S_ISLNK(info.st_mode);
7263 int is_dir(const char* path, bool follow) {
7268 r = stat(path, &st);
7270 r = lstat(path, &st);
7274 return !!S_ISDIR(st.st_mode);
7277 int unquote_first_word(const char **p, char **ret, bool relax) {
7278 _cleanup_free_ char *s = NULL;
7279 size_t allocated = 0, sz = 0;
7286 SINGLE_QUOTE_ESCAPE,
7288 DOUBLE_QUOTE_ESCAPE,
7296 /* Parses the first word of a string, and returns it in
7297 * *ret. Removes all quotes in the process. When parsing fails
7298 * (because of an uneven number of quotes or similar), leaves
7299 * the pointer *p at the first invalid character. */
7309 else if (strchr(WHITESPACE, c))
7319 state = SINGLE_QUOTE;
7321 state = VALUE_ESCAPE;
7323 state = DOUBLE_QUOTE;
7324 else if (strchr(WHITESPACE, c))
7327 if (!GREEDY_REALLOC(s, allocated, sz+2))
7342 if (!GREEDY_REALLOC(s, allocated, sz+2))
7355 } else if (c == '\'')
7358 state = SINGLE_QUOTE_ESCAPE;
7360 if (!GREEDY_REALLOC(s, allocated, sz+2))
7368 case SINGLE_QUOTE_ESCAPE:
7375 if (!GREEDY_REALLOC(s, allocated, sz+2))
7379 state = SINGLE_QUOTE;
7388 state = DOUBLE_QUOTE_ESCAPE;
7390 if (!GREEDY_REALLOC(s, allocated, sz+2))
7398 case DOUBLE_QUOTE_ESCAPE:
7405 if (!GREEDY_REALLOC(s, allocated, sz+2))
7409 state = DOUBLE_QUOTE;
7415 if (!strchr(WHITESPACE, c))
7437 int unquote_many_words(const char **p, ...) {
7442 /* Parses a number of words from a string, stripping any
7443 * quotes if necessary. */
7447 /* Count how many words are expected */
7450 if (!va_arg(ap, char **))
7459 /* Read all words into a temporary array */
7460 l = newa0(char*, n);
7461 for (c = 0; c < n; c++) {
7463 r = unquote_first_word(p, &l[c], false);
7467 for (j = 0; j < c; j++)
7477 /* If we managed to parse all words, return them in the passed
7480 for (i = 0; i < n; i++) {
7483 v = va_arg(ap, char **);
7493 int free_and_strdup(char **p, const char *s) {
7498 /* Replaces a string pointer with an strdup()ed new string,
7499 * possibly freeing the old one. */
7514 int sethostname_idempotent(const char *s) {
7516 char buf[HOST_NAME_MAX + 1] = {};
7520 r = gethostname(buf, sizeof(buf));
7527 r = sethostname(s, strlen(s));
7534 int ptsname_malloc(int fd, char **ret) {
7547 if (ptsname_r(fd, c, l) == 0) {
7551 if (errno != ERANGE) {
7561 int openpt_in_namespace(pid_t pid, int flags) {
7562 _cleanup_close_ int pidnsfd = -1, mntnsfd = -1, rootfd = -1;
7563 _cleanup_close_pair_ int pair[2] = { -1, -1 };
7565 struct cmsghdr cmsghdr;
7566 uint8_t buf[CMSG_SPACE(sizeof(int))];
7568 struct msghdr mh = {
7569 .msg_control = &control,
7570 .msg_controllen = sizeof(control),
7572 struct cmsghdr *cmsg;
7579 r = namespace_open(pid, &pidnsfd, &mntnsfd, NULL, &rootfd);
7583 if (socketpair(AF_UNIX, SOCK_DGRAM, 0, pair) < 0)
7593 pair[0] = safe_close(pair[0]);
7595 r = namespace_enter(pidnsfd, mntnsfd, -1, rootfd);
7597 _exit(EXIT_FAILURE);
7599 master = posix_openpt(flags);
7601 _exit(EXIT_FAILURE);
7603 cmsg = CMSG_FIRSTHDR(&mh);
7604 cmsg->cmsg_level = SOL_SOCKET;
7605 cmsg->cmsg_type = SCM_RIGHTS;
7606 cmsg->cmsg_len = CMSG_LEN(sizeof(int));
7607 memcpy(CMSG_DATA(cmsg), &master, sizeof(int));
7609 mh.msg_controllen = cmsg->cmsg_len;
7611 if (sendmsg(pair[1], &mh, MSG_NOSIGNAL) < 0)
7612 _exit(EXIT_FAILURE);
7614 _exit(EXIT_SUCCESS);
7617 pair[1] = safe_close(pair[1]);
7619 r = wait_for_terminate(child, &si);
7622 if (si.si_code != CLD_EXITED || si.si_status != EXIT_SUCCESS)
7625 if (recvmsg(pair[0], &mh, MSG_NOSIGNAL|MSG_CMSG_CLOEXEC) < 0)
7628 for (cmsg = CMSG_FIRSTHDR(&mh); cmsg; cmsg = CMSG_NXTHDR(&mh, cmsg))
7629 if (cmsg->cmsg_level == SOL_SOCKET && cmsg->cmsg_type == SCM_RIGHTS) {
7633 fds = (int*) CMSG_DATA(cmsg);
7634 n_fds = (cmsg->cmsg_len - CMSG_LEN(0)) / sizeof(int);
7637 close_many(fds, n_fds);
7647 ssize_t fgetxattrat_fake(int dirfd, const char *filename, const char *attribute, void *value, size_t size, int flags) {
7648 _cleanup_close_ int fd = -1;
7651 /* The kernel doesn't have a fgetxattrat() command, hence let's emulate one */
7653 fd = openat(dirfd, filename, O_RDONLY|O_CLOEXEC|O_NOCTTY|O_NOATIME|(flags & AT_SYMLINK_NOFOLLOW ? O_NOFOLLOW : 0));
7657 l = fgetxattr(fd, attribute, value, size);
7664 static int parse_crtime(le64_t le, usec_t *usec) {
7670 if (u == 0 || u == (uint64_t) -1)
7677 int fd_getcrtime(int fd, usec_t *usec) {
7684 /* Until Linux gets a real concept of birthtime/creation time,
7685 * let's fake one with xattrs */
7687 n = fgetxattr(fd, "user.crtime_usec", &le, sizeof(le));
7690 if (n != sizeof(le))
7693 return parse_crtime(le, usec);
7696 int fd_getcrtime_at(int dirfd, const char *name, usec_t *usec, int flags) {
7700 n = fgetxattrat_fake(dirfd, name, "user.crtime_usec", &le, sizeof(le), flags);
7703 if (n != sizeof(le))
7706 return parse_crtime(le, usec);
7709 int path_getcrtime(const char *p, usec_t *usec) {
7716 n = getxattr(p, "user.crtime_usec", &le, sizeof(le));
7719 if (n != sizeof(le))
7722 return parse_crtime(le, usec);
7725 int fd_setcrtime(int fd, usec_t usec) {
7731 usec = now(CLOCK_REALTIME);
7733 le = htole64((uint64_t) usec);
7734 if (fsetxattr(fd, "user.crtime_usec", &le, sizeof(le), 0) < 0)
7740 int same_fd(int a, int b) {
7741 struct stat sta, stb;
7748 /* Compares two file descriptors. Note that semantics are
7749 * quite different depending on whether we have kcmp() or we
7750 * don't. If we have kcmp() this will only return true for
7751 * dup()ed file descriptors, but not otherwise. If we don't
7752 * have kcmp() this will also return true for two fds of the same
7753 * file, created by separate open() calls. Since we use this
7754 * call mostly for filtering out duplicates in the fd store
7755 * this difference hopefully doesn't matter too much. */
7760 /* Try to use kcmp() if we have it. */
7762 r = kcmp(pid, pid, KCMP_FILE, a, b);
7767 if (errno != ENOSYS)
7770 /* We don't have kcmp(), use fstat() instead. */
7771 if (fstat(a, &sta) < 0)
7774 if (fstat(b, &stb) < 0)
7777 if ((sta.st_mode & S_IFMT) != (stb.st_mode & S_IFMT))
7780 /* We consider all device fds different, since two device fds
7781 * might refer to quite different device contexts even though
7782 * they share the same inode and backing dev_t. */
7784 if (S_ISCHR(sta.st_mode) || S_ISBLK(sta.st_mode))
7787 if (sta.st_dev != stb.st_dev || sta.st_ino != stb.st_ino)
7790 /* The fds refer to the same inode on disk, let's also check
7791 * if they have the same fd flags. This is useful to
7792 * distuingish the read and write side of a pipe created with
7794 fa = fcntl(a, F_GETFL);
7798 fb = fcntl(b, F_GETFL);
7805 int chattr_fd(int fd, bool b, unsigned mask) {
7806 unsigned old_attr, new_attr;
7813 if (ioctl(fd, FS_IOC_GETFLAGS, &old_attr) < 0)
7817 new_attr = old_attr | mask;
7819 new_attr = old_attr & ~mask;
7821 if (new_attr == old_attr)
7824 if (ioctl(fd, FS_IOC_SETFLAGS, &new_attr) < 0)
7830 int chattr_path(const char *p, bool b, unsigned mask) {
7831 _cleanup_close_ int fd = -1;
7838 fd = open(p, O_RDONLY|O_CLOEXEC|O_NOCTTY|O_NOFOLLOW);
7842 return chattr_fd(fd, b, mask);
7845 int read_attr_fd(int fd, unsigned *ret) {
7848 if (ioctl(fd, FS_IOC_GETFLAGS, ret) < 0)
7854 int read_attr_path(const char *p, unsigned *ret) {
7855 _cleanup_close_ int fd = -1;
7860 fd = open(p, O_RDONLY|O_CLOEXEC|O_NOCTTY|O_NOFOLLOW);
7864 return read_attr_fd(fd, ret);
7867 int make_lock_file(const char *p, int operation, LockFile *ret) {
7868 _cleanup_close_ int fd = -1;
7869 _cleanup_free_ char *t = NULL;
7873 * We use UNPOSIX locks if they are available. They have nice
7874 * semantics, and are mostly compatible with NFS. However,
7875 * they are only available on new kernels. When we detect we
7876 * are running on an older kernel, then we fall back to good
7877 * old BSD locks. They also have nice semantics, but are
7878 * slightly problematic on NFS, where they are upgraded to
7879 * POSIX locks, even though locally they are orthogonal to
7889 .l_type = (operation & ~LOCK_NB) == LOCK_EX ? F_WRLCK : F_RDLCK,
7890 .l_whence = SEEK_SET,
7894 fd = open(p, O_CREAT|O_RDWR|O_NOFOLLOW|O_CLOEXEC|O_NOCTTY, 0600);
7898 r = fcntl(fd, (operation & LOCK_NB) ? F_OFD_SETLK : F_OFD_SETLKW, &fl);
7901 /* If the kernel is too old, use good old BSD locks */
7902 if (errno == EINVAL)
7903 r = flock(fd, operation);
7906 return errno == EAGAIN ? -EBUSY : -errno;
7909 /* If we acquired the lock, let's check if the file
7910 * still exists in the file system. If not, then the
7911 * previous exclusive owner removed it and then closed
7912 * it. In such a case our acquired lock is worthless,
7913 * hence try again. */
7918 if (st.st_nlink > 0)
7921 fd = safe_close(fd);
7926 ret->operation = operation;
7934 int make_lock_file_for(const char *p, int operation, LockFile *ret) {
7942 if (!filename_is_valid(fn))
7945 t = newa(char, strlen(p) + 2 + 4 + 1);
7946 stpcpy(stpcpy(stpcpy(mempcpy(t, p, fn - p), ".#"), fn), ".lck");
7948 return make_lock_file(t, operation, ret);
7951 void release_lock_file(LockFile *f) {
7959 /* If we are the exclusive owner we can safely delete
7960 * the lock file itself. If we are not the exclusive
7961 * owner, we can try becoming it. */
7964 (f->operation & ~LOCK_NB) == LOCK_SH) {
7965 static const struct flock fl = {
7967 .l_whence = SEEK_SET,
7970 r = fcntl(f->fd, F_OFD_SETLK, &fl);
7971 if (r < 0 && errno == EINVAL)
7972 r = flock(f->fd, LOCK_EX|LOCK_NB);
7975 f->operation = LOCK_EX|LOCK_NB;
7978 if ((f->operation & ~LOCK_NB) == LOCK_EX)
7979 unlink_noerrno(f->path);
7985 f->fd = safe_close(f->fd);
7989 static size_t nul_length(const uint8_t *p, size_t sz) {
8004 ssize_t sparse_write(int fd, const void *p, size_t sz, size_t run_length) {
8005 const uint8_t *q, *w, *e;
8013 n = nul_length(q, e - q);
8015 /* If there are more than the specified run length of
8016 * NUL bytes, or if this is the beginning or the end
8017 * of the buffer, then seek instead of write */
8018 if ((n > run_length) ||
8019 (n > 0 && q == p) ||
8020 (n > 0 && q + n >= e)) {
8022 l = write(fd, w, q - w);
8029 if (lseek(fd, n, SEEK_CUR) == (off_t) -1)
8041 l = write(fd, w, q - w);
8048 return q - (const uint8_t*) p;
8051 void sigkill_wait(pid_t *pid) {
8057 if (kill(*pid, SIGKILL) > 0)
8058 (void) wait_for_terminate(*pid, NULL);
8061 int syslog_parse_priority(const char **p, int *priority, bool with_facility) {
8062 int a = 0, b = 0, c = 0;
8072 if (!strchr(*p, '>'))
8075 if ((*p)[2] == '>') {
8076 c = undecchar((*p)[1]);
8078 } else if ((*p)[3] == '>') {
8079 b = undecchar((*p)[1]);
8080 c = undecchar((*p)[2]);
8082 } else if ((*p)[4] == '>') {
8083 a = undecchar((*p)[1]);
8084 b = undecchar((*p)[2]);
8085 c = undecchar((*p)[3]);
8090 if (a < 0 || b < 0 || c < 0 ||
8091 (!with_facility && (a || b || c > 7)))
8095 *priority = a*100 + b*10 + c;
8097 *priority = (*priority & LOG_FACMASK) | c;
8103 ssize_t string_table_lookup(const char * const *table, size_t len, const char *key) {
8109 for (i = 0; i < len; ++i)
8110 if (streq_ptr(table[i], key))
8116 void cmsg_close_all(struct msghdr *mh) {
8117 struct cmsghdr *cmsg;
8121 for (cmsg = CMSG_FIRSTHDR(mh); cmsg; cmsg = CMSG_NXTHDR(mh, cmsg))
8122 if (cmsg->cmsg_level == SOL_SOCKET && cmsg->cmsg_type == SCM_RIGHTS)
8123 close_many((int*) CMSG_DATA(cmsg), (cmsg->cmsg_len - CMSG_LEN(0)) / sizeof(int));
8126 int rename_noreplace(int olddirfd, const char *oldpath, int newdirfd, const char *newpath) {
8130 ret = renameat2(olddirfd, oldpath, newdirfd, newpath, RENAME_NOREPLACE);
8134 /* Even though renameat2() exists since Linux 3.15, btrfs added
8135 * support for it later. If it is not implemented, fallback to another
8137 if (errno != EINVAL)
8140 /* The link()/unlink() fallback does not work on directories. But
8141 * renameat() without RENAME_NOREPLACE gives the same semantics on
8142 * directories, except when newpath is an *empty* directory. This is
8144 ret = fstatat(olddirfd, oldpath, &buf, AT_SYMLINK_NOFOLLOW);
8145 if (ret >= 0 && S_ISDIR(buf.st_mode)) {
8146 ret = renameat(olddirfd, oldpath, newdirfd, newpath);
8147 return ret >= 0 ? 0 : -errno;
8150 /* If it is not a directory, use the link()/unlink() fallback. */
8151 ret = linkat(olddirfd, oldpath, newdirfd, newpath, 0);
8155 ret = unlinkat(olddirfd, oldpath, 0);
8157 /* backup errno before the following unlinkat() alters it */
8159 (void) unlinkat(newdirfd, newpath, 0);