1 /*-*- Mode: C; c-basic-offset: 8; indent-tabs-mode: nil -*-*/
4 This file is part of systemd.
6 Copyright 2010 Lennart Poettering
8 systemd is free software; you can redistribute it and/or modify it
9 under the terms of the GNU Lesser General Public License as published by
10 the Free Software Foundation; either version 2.1 of the License, or
11 (at your option) any later version.
13 systemd is distributed in the hope that it will be useful, but
14 WITHOUT ANY WARRANTY; without even the implied warranty of
15 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
16 Lesser General Public License for more details.
18 You should have received a copy of the GNU Lesser General Public License
19 along with systemd; If not, see <http://www.gnu.org/licenses/>.
32 #include <sys/resource.h>
33 #include <linux/sched.h>
34 #include <sys/types.h>
38 #include <sys/ioctl.h>
40 #include <linux/tiocl.h>
45 #include <sys/prctl.h>
46 #include <sys/utsname.h>
48 #include <netinet/ip.h>
56 #include <sys/mount.h>
57 #include <linux/magic.h>
61 #include <sys/personality.h>
62 #include <sys/xattr.h>
63 #include <sys/statvfs.h>
67 /* When we include libgen.h because we need dirname() we immediately
68 * undefine basename() since libgen.h defines it as a macro to the XDG
69 * version which is really broken. */
73 #ifdef HAVE_SYS_AUXV_H
85 #include "path-util.h"
86 #include "exit-status.h"
90 #include "device-nodes.h"
95 #include "sparse-endian.h"
97 /* Put this test here for a lack of better place */
98 assert_cc(EAGAIN == EWOULDBLOCK);
101 char **saved_argv = NULL;
103 static volatile unsigned cached_columns = 0;
104 static volatile unsigned cached_lines = 0;
106 size_t page_size(void) {
107 static thread_local size_t pgsz = 0;
110 if (_likely_(pgsz > 0))
113 r = sysconf(_SC_PAGESIZE);
120 bool streq_ptr(const char *a, const char *b) {
122 /* Like streq(), but tries to make sense of NULL pointers */
133 char* endswith(const char *s, const char *postfix) {
140 pl = strlen(postfix);
143 return (char*) s + sl;
148 if (memcmp(s + sl - pl, postfix, pl) != 0)
151 return (char*) s + sl - pl;
154 char* first_word(const char *s, const char *word) {
161 /* Checks if the string starts with the specified word, either
162 * followed by NUL or by whitespace. Returns a pointer to the
163 * NUL or the first character after the whitespace. */
174 if (memcmp(s, word, wl) != 0)
181 if (!strchr(WHITESPACE, *p))
184 p += strspn(p, WHITESPACE);
188 static size_t cescape_char(char c, char *buf) {
189 char * buf_old = buf;
235 /* For special chars we prefer octal over
236 * hexadecimal encoding, simply because glib's
237 * g_strescape() does the same */
238 if ((c < ' ') || (c >= 127)) {
240 *(buf++) = octchar((unsigned char) c >> 6);
241 *(buf++) = octchar((unsigned char) c >> 3);
242 *(buf++) = octchar((unsigned char) c);
248 return buf - buf_old;
251 int close_nointr(int fd) {
258 * Just ignore EINTR; a retry loop is the wrong thing to do on
261 * http://lkml.indiana.edu/hypermail/linux/kernel/0509.1/0877.html
262 * https://bugzilla.gnome.org/show_bug.cgi?id=682819
263 * http://utcc.utoronto.ca/~cks/space/blog/unix/CloseEINTR
264 * https://sites.google.com/site/michaelsafyan/software-engineering/checkforeintrwheninvokingclosethinkagain
272 int safe_close(int fd) {
275 * Like close_nointr() but cannot fail. Guarantees errno is
276 * unchanged. Is a NOP with negative fds passed, and returns
277 * -1, so that it can be used in this syntax:
279 * fd = safe_close(fd);
285 /* The kernel might return pretty much any error code
286 * via close(), but the fd will be closed anyway. The
287 * only condition we want to check for here is whether
288 * the fd was invalid at all... */
290 assert_se(close_nointr(fd) != -EBADF);
296 void close_many(const int fds[], unsigned n_fd) {
299 assert(fds || n_fd <= 0);
301 for (i = 0; i < n_fd; i++)
305 int unlink_noerrno(const char *path) {
316 int parse_boolean(const char *v) {
319 if (streq(v, "1") || strcaseeq(v, "yes") || strcaseeq(v, "y") || strcaseeq(v, "true") || strcaseeq(v, "t") || strcaseeq(v, "on"))
321 else if (streq(v, "0") || strcaseeq(v, "no") || strcaseeq(v, "n") || strcaseeq(v, "false") || strcaseeq(v, "f") || strcaseeq(v, "off"))
327 int parse_pid(const char *s, pid_t* ret_pid) {
328 unsigned long ul = 0;
335 r = safe_atolu(s, &ul);
341 if ((unsigned long) pid != ul)
351 int parse_uid(const char *s, uid_t* ret_uid) {
352 unsigned long ul = 0;
359 r = safe_atolu(s, &ul);
365 if ((unsigned long) uid != ul)
368 /* Some libc APIs use UID_INVALID as special placeholder */
369 if (uid == (uid_t) 0xFFFFFFFF)
372 /* A long time ago UIDs where 16bit, hence explicitly avoid the 16bit -1 too */
373 if (uid == (uid_t) 0xFFFF)
380 int safe_atou(const char *s, unsigned *ret_u) {
388 l = strtoul(s, &x, 0);
390 if (!x || x == s || *x || errno)
391 return errno > 0 ? -errno : -EINVAL;
393 if ((unsigned long) (unsigned) l != l)
396 *ret_u = (unsigned) l;
400 int safe_atoi(const char *s, int *ret_i) {
408 l = strtol(s, &x, 0);
410 if (!x || x == s || *x || errno)
411 return errno > 0 ? -errno : -EINVAL;
413 if ((long) (int) l != l)
420 int safe_atou8(const char *s, uint8_t *ret) {
428 l = strtoul(s, &x, 0);
430 if (!x || x == s || *x || errno)
431 return errno > 0 ? -errno : -EINVAL;
433 if ((unsigned long) (uint8_t) l != l)
440 int safe_atou16(const char *s, uint16_t *ret) {
448 l = strtoul(s, &x, 0);
450 if (!x || x == s || *x || errno)
451 return errno > 0 ? -errno : -EINVAL;
453 if ((unsigned long) (uint16_t) l != l)
460 int safe_atoi16(const char *s, int16_t *ret) {
468 l = strtol(s, &x, 0);
470 if (!x || x == s || *x || errno)
471 return errno > 0 ? -errno : -EINVAL;
473 if ((long) (int16_t) l != l)
480 int safe_atollu(const char *s, long long unsigned *ret_llu) {
482 unsigned long long l;
488 l = strtoull(s, &x, 0);
490 if (!x || x == s || *x || errno)
491 return errno ? -errno : -EINVAL;
497 int safe_atolli(const char *s, long long int *ret_lli) {
505 l = strtoll(s, &x, 0);
507 if (!x || x == s || *x || errno)
508 return errno ? -errno : -EINVAL;
514 int safe_atod(const char *s, double *ret_d) {
522 loc = newlocale(LC_NUMERIC_MASK, "C", (locale_t) 0);
523 if (loc == (locale_t) 0)
527 d = strtod_l(s, &x, loc);
529 if (!x || x == s || *x || errno) {
531 return errno ? -errno : -EINVAL;
539 static size_t strcspn_escaped(const char *s, const char *reject) {
540 bool escaped = false;
543 for (n=0; s[n]; n++) {
546 else if (s[n] == '\\')
548 else if (strchr(reject, s[n]))
552 /* if s ends in \, return index of previous char */
556 /* Split a string into words. */
557 const char* split(const char **state, size_t *l, const char *separator, bool quoted) {
563 assert(**state == '\0');
567 current += strspn(current, separator);
573 if (quoted && strchr("\'\"", *current)) {
574 char quotechars[2] = {*current, '\0'};
576 *l = strcspn_escaped(current + 1, quotechars);
577 if (current[*l + 1] == '\0' ||
578 (current[*l + 2] && !strchr(separator, current[*l + 2]))) {
579 /* right quote missing or garbage at the end */
583 assert(current[*l + 1] == quotechars[0]);
584 *state = current++ + *l + 2;
586 *l = strcspn_escaped(current, separator);
587 if (current[*l] && !strchr(separator, current[*l])) {
588 /* unfinished escape */
592 *state = current + *l;
594 *l = strcspn(current, separator);
595 *state = current + *l;
601 int get_parent_of_pid(pid_t pid, pid_t *_ppid) {
603 _cleanup_free_ char *line = NULL;
615 p = procfs_file_alloca(pid, "stat");
616 r = read_one_line_file(p, &line);
620 /* Let's skip the pid and comm fields. The latter is enclosed
621 * in () but does not escape any () in its value, so let's
622 * skip over it manually */
624 p = strrchr(line, ')');
636 if ((long unsigned) (pid_t) ppid != ppid)
639 *_ppid = (pid_t) ppid;
644 int fchmod_umask(int fd, mode_t m) {
649 r = fchmod(fd, m & (~u)) < 0 ? -errno : 0;
655 char *truncate_nl(char *s) {
658 s[strcspn(s, NEWLINE)] = 0;
662 int get_process_state(pid_t pid) {
666 _cleanup_free_ char *line = NULL;
670 p = procfs_file_alloca(pid, "stat");
671 r = read_one_line_file(p, &line);
675 p = strrchr(line, ')');
681 if (sscanf(p, " %c", &state) != 1)
684 return (unsigned char) state;
687 int get_process_comm(pid_t pid, char **name) {
694 p = procfs_file_alloca(pid, "comm");
696 r = read_one_line_file(p, name);
703 int get_process_cmdline(pid_t pid, size_t max_length, bool comm_fallback, char **line) {
704 _cleanup_fclose_ FILE *f = NULL;
712 p = procfs_file_alloca(pid, "cmdline");
718 if (max_length == 0) {
719 size_t len = 0, allocated = 0;
721 while ((c = getc(f)) != EOF) {
723 if (!GREEDY_REALLOC(r, allocated, len+2)) {
728 r[len++] = isprint(c) ? c : ' ';
738 r = new(char, max_length);
744 while ((c = getc(f)) != EOF) {
766 size_t n = MIN(left-1, 3U);
773 /* Kernel threads have no argv[] */
775 _cleanup_free_ char *t = NULL;
783 h = get_process_comm(pid, &t);
787 r = strjoin("[", t, "]", NULL);
796 int is_kernel_thread(pid_t pid) {
808 p = procfs_file_alloca(pid, "cmdline");
813 count = fread(&c, 1, 1, f);
817 /* Kernel threads have an empty cmdline */
820 return eof ? 1 : -errno;
825 int get_process_capeff(pid_t pid, char **capeff) {
831 p = procfs_file_alloca(pid, "status");
833 return get_status_field(p, "\nCapEff:", capeff);
836 static int get_process_link_contents(const char *proc_file, char **name) {
842 r = readlink_malloc(proc_file, name);
844 return r == -ENOENT ? -ESRCH : r;
849 int get_process_exe(pid_t pid, char **name) {
856 p = procfs_file_alloca(pid, "exe");
857 r = get_process_link_contents(p, name);
861 d = endswith(*name, " (deleted)");
868 static int get_process_id(pid_t pid, const char *field, uid_t *uid) {
869 _cleanup_fclose_ FILE *f = NULL;
879 p = procfs_file_alloca(pid, "status");
884 FOREACH_LINE(line, f, return -errno) {
889 if (startswith(l, field)) {
891 l += strspn(l, WHITESPACE);
893 l[strcspn(l, WHITESPACE)] = 0;
895 return parse_uid(l, uid);
902 int get_process_uid(pid_t pid, uid_t *uid) {
903 return get_process_id(pid, "Uid:", uid);
906 int get_process_gid(pid_t pid, gid_t *gid) {
907 assert_cc(sizeof(uid_t) == sizeof(gid_t));
908 return get_process_id(pid, "Gid:", gid);
911 int get_process_cwd(pid_t pid, char **cwd) {
916 p = procfs_file_alloca(pid, "cwd");
918 return get_process_link_contents(p, cwd);
921 int get_process_root(pid_t pid, char **root) {
926 p = procfs_file_alloca(pid, "root");
928 return get_process_link_contents(p, root);
931 int get_process_environ(pid_t pid, char **env) {
932 _cleanup_fclose_ FILE *f = NULL;
933 _cleanup_free_ char *outcome = NULL;
936 size_t allocated = 0, sz = 0;
941 p = procfs_file_alloca(pid, "environ");
947 while ((c = fgetc(f)) != EOF) {
948 if (!GREEDY_REALLOC(outcome, allocated, sz + 5))
952 outcome[sz++] = '\n';
954 sz += cescape_char(c, outcome + sz);
964 char *strnappend(const char *s, const char *suffix, size_t b) {
972 return strndup(suffix, b);
981 if (b > ((size_t) -1) - a)
984 r = new(char, a+b+1);
989 memcpy(r+a, suffix, b);
995 char *strappend(const char *s, const char *suffix) {
996 return strnappend(s, suffix, suffix ? strlen(suffix) : 0);
999 int readlinkat_malloc(int fd, const char *p, char **ret) {
1014 n = readlinkat(fd, p, c, l-1);
1021 if ((size_t) n < l-1) {
1032 int readlink_malloc(const char *p, char **ret) {
1033 return readlinkat_malloc(AT_FDCWD, p, ret);
1036 int readlink_value(const char *p, char **ret) {
1037 _cleanup_free_ char *link = NULL;
1041 r = readlink_malloc(p, &link);
1045 value = basename(link);
1049 value = strdup(value);
1058 int readlink_and_make_absolute(const char *p, char **r) {
1059 _cleanup_free_ char *target = NULL;
1066 j = readlink_malloc(p, &target);
1070 k = file_in_same_dir(p, target);
1078 int readlink_and_canonicalize(const char *p, char **r) {
1085 j = readlink_and_make_absolute(p, &t);
1089 s = canonicalize_file_name(t);
1096 path_kill_slashes(*r);
1101 int reset_all_signal_handlers(void) {
1104 for (sig = 1; sig < _NSIG; sig++) {
1105 struct sigaction sa = {
1106 .sa_handler = SIG_DFL,
1107 .sa_flags = SA_RESTART,
1110 /* These two cannot be caught... */
1111 if (sig == SIGKILL || sig == SIGSTOP)
1114 /* On Linux the first two RT signals are reserved by
1115 * glibc, and sigaction() will return EINVAL for them. */
1116 if ((sigaction(sig, &sa, NULL) < 0))
1117 if (errno != EINVAL && r == 0)
1124 int reset_signal_mask(void) {
1127 if (sigemptyset(&ss) < 0)
1130 if (sigprocmask(SIG_SETMASK, &ss, NULL) < 0)
1136 char *strstrip(char *s) {
1139 /* Drops trailing whitespace. Modifies the string in
1140 * place. Returns pointer to first non-space character */
1142 s += strspn(s, WHITESPACE);
1144 for (e = strchr(s, 0); e > s; e --)
1145 if (!strchr(WHITESPACE, e[-1]))
1153 char *delete_chars(char *s, const char *bad) {
1156 /* Drops all whitespace, regardless where in the string */
1158 for (f = s, t = s; *f; f++) {
1159 if (strchr(bad, *f))
1170 char *file_in_same_dir(const char *path, const char *filename) {
1177 /* This removes the last component of path and appends
1178 * filename, unless the latter is absolute anyway or the
1181 if (path_is_absolute(filename))
1182 return strdup(filename);
1184 e = strrchr(path, '/');
1186 return strdup(filename);
1188 k = strlen(filename);
1189 ret = new(char, (e + 1 - path) + k + 1);
1193 memcpy(mempcpy(ret, path, e + 1 - path), filename, k + 1);
1197 int rmdir_parents(const char *path, const char *stop) {
1206 /* Skip trailing slashes */
1207 while (l > 0 && path[l-1] == '/')
1213 /* Skip last component */
1214 while (l > 0 && path[l-1] != '/')
1217 /* Skip trailing slashes */
1218 while (l > 0 && path[l-1] == '/')
1224 if (!(t = strndup(path, l)))
1227 if (path_startswith(stop, t)) {
1236 if (errno != ENOENT)
1243 char hexchar(int x) {
1244 static const char table[16] = "0123456789abcdef";
1246 return table[x & 15];
1249 int unhexchar(char c) {
1251 if (c >= '0' && c <= '9')
1254 if (c >= 'a' && c <= 'f')
1255 return c - 'a' + 10;
1257 if (c >= 'A' && c <= 'F')
1258 return c - 'A' + 10;
1263 char *hexmem(const void *p, size_t l) {
1267 z = r = malloc(l * 2 + 1);
1271 for (x = p; x < (const uint8_t*) p + l; x++) {
1272 *(z++) = hexchar(*x >> 4);
1273 *(z++) = hexchar(*x & 15);
1280 void *unhexmem(const char *p, size_t l) {
1286 z = r = malloc((l + 1) / 2 + 1);
1290 for (x = p; x < p + l; x += 2) {
1293 a = unhexchar(x[0]);
1295 b = unhexchar(x[1]);
1299 *(z++) = (uint8_t) a << 4 | (uint8_t) b;
1306 char octchar(int x) {
1307 return '0' + (x & 7);
1310 int unoctchar(char c) {
1312 if (c >= '0' && c <= '7')
1318 char decchar(int x) {
1319 return '0' + (x % 10);
1322 int undecchar(char c) {
1324 if (c >= '0' && c <= '9')
1330 char *cescape(const char *s) {
1336 /* Does C style string escaping. */
1338 r = new(char, strlen(s)*4 + 1);
1342 for (f = s, t = r; *f; f++)
1343 t += cescape_char(*f, t);
1350 char *cunescape_length_with_prefix(const char *s, size_t length, const char *prefix) {
1357 /* Undoes C style string escaping, and optionally prefixes it. */
1359 pl = prefix ? strlen(prefix) : 0;
1361 r = new(char, pl+length+1);
1366 memcpy(r, prefix, pl);
1368 for (f = s, t = r + pl; f < s + length; f++) {
1369 size_t remaining = s + length - f;
1370 assert(remaining > 0);
1372 if (*f != '\\') { /* a literal literal */
1377 if (--remaining == 0) { /* copy trailing backslash verbatim */
1418 /* This is an extension of the XDG syntax files */
1423 /* hexadecimal encoding */
1426 if (remaining >= 2) {
1427 a = unhexchar(f[1]);
1428 b = unhexchar(f[2]);
1431 if (a < 0 || b < 0 || (a == 0 && b == 0)) {
1432 /* Invalid escape code, let's take it literal then */
1436 *(t++) = (char) ((a << 4) | b);
1451 /* octal encoding */
1452 int a = -1, b = -1, c = -1;
1454 if (remaining >= 3) {
1455 a = unoctchar(f[0]);
1456 b = unoctchar(f[1]);
1457 c = unoctchar(f[2]);
1460 if (a < 0 || b < 0 || c < 0 || (a == 0 && b == 0 && c == 0)) {
1461 /* Invalid escape code, let's take it literal then */
1465 *(t++) = (char) ((a << 6) | (b << 3) | c);
1473 /* Invalid escape code, let's take it literal then */
1484 char *cunescape_length(const char *s, size_t length) {
1485 return cunescape_length_with_prefix(s, length, NULL);
1488 char *cunescape(const char *s) {
1491 return cunescape_length(s, strlen(s));
1494 char *xescape(const char *s, const char *bad) {
1498 /* Escapes all chars in bad, in addition to \ and all special
1499 * chars, in \xFF style escaping. May be reversed with
1502 r = new(char, strlen(s) * 4 + 1);
1506 for (f = s, t = r; *f; f++) {
1508 if ((*f < ' ') || (*f >= 127) ||
1509 (*f == '\\') || strchr(bad, *f)) {
1512 *(t++) = hexchar(*f >> 4);
1513 *(t++) = hexchar(*f);
1523 char *ascii_strlower(char *t) {
1528 for (p = t; *p; p++)
1529 if (*p >= 'A' && *p <= 'Z')
1530 *p = *p - 'A' + 'a';
1535 _pure_ static bool hidden_file_allow_backup(const char *filename) {
1539 filename[0] == '.' ||
1540 streq(filename, "lost+found") ||
1541 streq(filename, "aquota.user") ||
1542 streq(filename, "aquota.group") ||
1543 endswith(filename, ".rpmnew") ||
1544 endswith(filename, ".rpmsave") ||
1545 endswith(filename, ".rpmorig") ||
1546 endswith(filename, ".dpkg-old") ||
1547 endswith(filename, ".dpkg-new") ||
1548 endswith(filename, ".dpkg-tmp") ||
1549 endswith(filename, ".dpkg-dist") ||
1550 endswith(filename, ".dpkg-bak") ||
1551 endswith(filename, ".dpkg-backup") ||
1552 endswith(filename, ".dpkg-remove") ||
1553 endswith(filename, ".swp");
1556 bool hidden_file(const char *filename) {
1559 if (endswith(filename, "~"))
1562 return hidden_file_allow_backup(filename);
1565 int fd_nonblock(int fd, bool nonblock) {
1570 flags = fcntl(fd, F_GETFL, 0);
1575 nflags = flags | O_NONBLOCK;
1577 nflags = flags & ~O_NONBLOCK;
1579 if (nflags == flags)
1582 if (fcntl(fd, F_SETFL, nflags) < 0)
1588 int fd_cloexec(int fd, bool cloexec) {
1593 flags = fcntl(fd, F_GETFD, 0);
1598 nflags = flags | FD_CLOEXEC;
1600 nflags = flags & ~FD_CLOEXEC;
1602 if (nflags == flags)
1605 if (fcntl(fd, F_SETFD, nflags) < 0)
1611 _pure_ static bool fd_in_set(int fd, const int fdset[], unsigned n_fdset) {
1614 assert(n_fdset == 0 || fdset);
1616 for (i = 0; i < n_fdset; i++)
1623 int close_all_fds(const int except[], unsigned n_except) {
1624 _cleanup_closedir_ DIR *d = NULL;
1628 assert(n_except == 0 || except);
1630 d = opendir("/proc/self/fd");
1635 /* When /proc isn't available (for example in chroots)
1636 * the fallback is brute forcing through the fd
1639 assert_se(getrlimit(RLIMIT_NOFILE, &rl) >= 0);
1640 for (fd = 3; fd < (int) rl.rlim_max; fd ++) {
1642 if (fd_in_set(fd, except, n_except))
1645 if (close_nointr(fd) < 0)
1646 if (errno != EBADF && r == 0)
1653 while ((de = readdir(d))) {
1656 if (hidden_file(de->d_name))
1659 if (safe_atoi(de->d_name, &fd) < 0)
1660 /* Let's better ignore this, just in case */
1669 if (fd_in_set(fd, except, n_except))
1672 if (close_nointr(fd) < 0) {
1673 /* Valgrind has its own FD and doesn't want to have it closed */
1674 if (errno != EBADF && r == 0)
1682 bool chars_intersect(const char *a, const char *b) {
1685 /* Returns true if any of the chars in a are in b. */
1686 for (p = a; *p; p++)
1693 bool fstype_is_network(const char *fstype) {
1694 static const char table[] =
1709 x = startswith(fstype, "fuse.");
1713 return nulstr_contains(table, fstype);
1717 _cleanup_close_ int fd;
1719 fd = open_terminal("/dev/tty0", O_RDWR|O_NOCTTY|O_CLOEXEC);
1725 TIOCL_GETKMSGREDIRECT,
1729 if (ioctl(fd, TIOCLINUX, tiocl) < 0)
1732 vt = tiocl[0] <= 0 ? 1 : tiocl[0];
1735 if (ioctl(fd, VT_ACTIVATE, vt) < 0)
1741 int read_one_char(FILE *f, char *ret, usec_t t, bool *need_nl) {
1742 struct termios old_termios, new_termios;
1743 char c, line[LINE_MAX];
1748 if (tcgetattr(fileno(f), &old_termios) >= 0) {
1749 new_termios = old_termios;
1751 new_termios.c_lflag &= ~ICANON;
1752 new_termios.c_cc[VMIN] = 1;
1753 new_termios.c_cc[VTIME] = 0;
1755 if (tcsetattr(fileno(f), TCSADRAIN, &new_termios) >= 0) {
1758 if (t != USEC_INFINITY) {
1759 if (fd_wait_for_event(fileno(f), POLLIN, t) <= 0) {
1760 tcsetattr(fileno(f), TCSADRAIN, &old_termios);
1765 k = fread(&c, 1, 1, f);
1767 tcsetattr(fileno(f), TCSADRAIN, &old_termios);
1773 *need_nl = c != '\n';
1780 if (t != USEC_INFINITY) {
1781 if (fd_wait_for_event(fileno(f), POLLIN, t) <= 0)
1786 if (!fgets(line, sizeof(line), f))
1787 return errno ? -errno : -EIO;
1791 if (strlen(line) != 1)
1801 int ask_char(char *ret, const char *replies, const char *text, ...) {
1811 bool need_nl = true;
1814 fputs(ANSI_HIGHLIGHT_ON, stdout);
1821 fputs(ANSI_HIGHLIGHT_OFF, stdout);
1825 r = read_one_char(stdin, &c, USEC_INFINITY, &need_nl);
1828 if (r == -EBADMSG) {
1829 puts("Bad input, please try again.");
1840 if (strchr(replies, c)) {
1845 puts("Read unexpected character, please try again.");
1849 int ask_string(char **ret, const char *text, ...) {
1854 char line[LINE_MAX];
1858 fputs(ANSI_HIGHLIGHT_ON, stdout);
1865 fputs(ANSI_HIGHLIGHT_OFF, stdout);
1870 if (!fgets(line, sizeof(line), stdin))
1871 return errno ? -errno : -EIO;
1873 if (!endswith(line, "\n"))
1892 int reset_terminal_fd(int fd, bool switch_to_text) {
1893 struct termios termios;
1896 /* Set terminal to some sane defaults */
1900 /* We leave locked terminal attributes untouched, so that
1901 * Plymouth may set whatever it wants to set, and we don't
1902 * interfere with that. */
1904 /* Disable exclusive mode, just in case */
1905 ioctl(fd, TIOCNXCL);
1907 /* Switch to text mode */
1909 ioctl(fd, KDSETMODE, KD_TEXT);
1911 /* Enable console unicode mode */
1912 ioctl(fd, KDSKBMODE, K_UNICODE);
1914 if (tcgetattr(fd, &termios) < 0) {
1919 /* We only reset the stuff that matters to the software. How
1920 * hardware is set up we don't touch assuming that somebody
1921 * else will do that for us */
1923 termios.c_iflag &= ~(IGNBRK | BRKINT | ISTRIP | INLCR | IGNCR | IUCLC);
1924 termios.c_iflag |= ICRNL | IMAXBEL | IUTF8;
1925 termios.c_oflag |= ONLCR;
1926 termios.c_cflag |= CREAD;
1927 termios.c_lflag = ISIG | ICANON | IEXTEN | ECHO | ECHOE | ECHOK | ECHOCTL | ECHOPRT | ECHOKE;
1929 termios.c_cc[VINTR] = 03; /* ^C */
1930 termios.c_cc[VQUIT] = 034; /* ^\ */
1931 termios.c_cc[VERASE] = 0177;
1932 termios.c_cc[VKILL] = 025; /* ^X */
1933 termios.c_cc[VEOF] = 04; /* ^D */
1934 termios.c_cc[VSTART] = 021; /* ^Q */
1935 termios.c_cc[VSTOP] = 023; /* ^S */
1936 termios.c_cc[VSUSP] = 032; /* ^Z */
1937 termios.c_cc[VLNEXT] = 026; /* ^V */
1938 termios.c_cc[VWERASE] = 027; /* ^W */
1939 termios.c_cc[VREPRINT] = 022; /* ^R */
1940 termios.c_cc[VEOL] = 0;
1941 termios.c_cc[VEOL2] = 0;
1943 termios.c_cc[VTIME] = 0;
1944 termios.c_cc[VMIN] = 1;
1946 if (tcsetattr(fd, TCSANOW, &termios) < 0)
1950 /* Just in case, flush all crap out */
1951 tcflush(fd, TCIOFLUSH);
1956 int reset_terminal(const char *name) {
1957 _cleanup_close_ int fd = -1;
1959 fd = open_terminal(name, O_RDWR|O_NOCTTY|O_CLOEXEC);
1963 return reset_terminal_fd(fd, true);
1966 int open_terminal(const char *name, int mode) {
1971 * If a TTY is in the process of being closed opening it might
1972 * cause EIO. This is horribly awful, but unlikely to be
1973 * changed in the kernel. Hence we work around this problem by
1974 * retrying a couple of times.
1976 * https://bugs.launchpad.net/ubuntu/+source/linux/+bug/554172/comments/245
1979 assert(!(mode & O_CREAT));
1982 fd = open(name, mode, 0);
1989 /* Max 1s in total */
1993 usleep(50 * USEC_PER_MSEC);
2011 int flush_fd(int fd) {
2012 struct pollfd pollfd = {
2022 r = poll(&pollfd, 1, 0);
2032 l = read(fd, buf, sizeof(buf));
2038 if (errno == EAGAIN)
2047 int acquire_terminal(
2051 bool ignore_tiocstty_eperm,
2054 int fd = -1, notify = -1, r = 0, wd = -1;
2059 /* We use inotify to be notified when the tty is closed. We
2060 * create the watch before checking if we can actually acquire
2061 * it, so that we don't lose any event.
2063 * Note: strictly speaking this actually watches for the
2064 * device being closed, it does *not* really watch whether a
2065 * tty loses its controlling process. However, unless some
2066 * rogue process uses TIOCNOTTY on /dev/tty *after* closing
2067 * its tty otherwise this will not become a problem. As long
2068 * as the administrator makes sure not configure any service
2069 * on the same tty as an untrusted user this should not be a
2070 * problem. (Which he probably should not do anyway.) */
2072 if (timeout != USEC_INFINITY)
2073 ts = now(CLOCK_MONOTONIC);
2075 if (!fail && !force) {
2076 notify = inotify_init1(IN_CLOEXEC | (timeout != USEC_INFINITY ? IN_NONBLOCK : 0));
2082 wd = inotify_add_watch(notify, name, IN_CLOSE);
2090 struct sigaction sa_old, sa_new = {
2091 .sa_handler = SIG_IGN,
2092 .sa_flags = SA_RESTART,
2096 r = flush_fd(notify);
2101 /* We pass here O_NOCTTY only so that we can check the return
2102 * value TIOCSCTTY and have a reliable way to figure out if we
2103 * successfully became the controlling process of the tty */
2104 fd = open_terminal(name, O_RDWR|O_NOCTTY|O_CLOEXEC);
2108 /* Temporarily ignore SIGHUP, so that we don't get SIGHUP'ed
2109 * if we already own the tty. */
2110 assert_se(sigaction(SIGHUP, &sa_new, &sa_old) == 0);
2112 /* First, try to get the tty */
2113 if (ioctl(fd, TIOCSCTTY, force) < 0)
2116 assert_se(sigaction(SIGHUP, &sa_old, NULL) == 0);
2118 /* Sometimes it makes sense to ignore TIOCSCTTY
2119 * returning EPERM, i.e. when very likely we already
2120 * are have this controlling terminal. */
2121 if (r < 0 && r == -EPERM && ignore_tiocstty_eperm)
2124 if (r < 0 && (force || fail || r != -EPERM)) {
2133 assert(notify >= 0);
2136 union inotify_event_buffer buffer;
2137 struct inotify_event *e;
2140 if (timeout != USEC_INFINITY) {
2143 n = now(CLOCK_MONOTONIC);
2144 if (ts + timeout < n) {
2149 r = fd_wait_for_event(fd, POLLIN, ts + timeout - n);
2159 l = read(notify, &buffer, sizeof(buffer));
2161 if (errno == EINTR || errno == EAGAIN)
2168 FOREACH_INOTIFY_EVENT(e, buffer, l) {
2169 if (e->wd != wd || !(e->mask & IN_CLOSE)) {
2178 /* We close the tty fd here since if the old session
2179 * ended our handle will be dead. It's important that
2180 * we do this after sleeping, so that we don't enter
2181 * an endless loop. */
2182 fd = safe_close(fd);
2187 r = reset_terminal_fd(fd, true);
2189 log_warning_errno(r, "Failed to reset terminal: %m");
2200 int release_terminal(void) {
2201 static const struct sigaction sa_new = {
2202 .sa_handler = SIG_IGN,
2203 .sa_flags = SA_RESTART,
2206 _cleanup_close_ int fd = -1;
2207 struct sigaction sa_old;
2210 fd = open("/dev/tty", O_RDWR|O_NOCTTY|O_NDELAY|O_CLOEXEC);
2214 /* Temporarily ignore SIGHUP, so that we don't get SIGHUP'ed
2215 * by our own TIOCNOTTY */
2216 assert_se(sigaction(SIGHUP, &sa_new, &sa_old) == 0);
2218 if (ioctl(fd, TIOCNOTTY) < 0)
2221 assert_se(sigaction(SIGHUP, &sa_old, NULL) == 0);
2226 int sigaction_many(const struct sigaction *sa, ...) {
2231 while ((sig = va_arg(ap, int)) > 0)
2232 if (sigaction(sig, sa, NULL) < 0)
2239 int ignore_signals(int sig, ...) {
2240 struct sigaction sa = {
2241 .sa_handler = SIG_IGN,
2242 .sa_flags = SA_RESTART,
2247 if (sigaction(sig, &sa, NULL) < 0)
2251 while ((sig = va_arg(ap, int)) > 0)
2252 if (sigaction(sig, &sa, NULL) < 0)
2259 int default_signals(int sig, ...) {
2260 struct sigaction sa = {
2261 .sa_handler = SIG_DFL,
2262 .sa_flags = SA_RESTART,
2267 if (sigaction(sig, &sa, NULL) < 0)
2271 while ((sig = va_arg(ap, int)) > 0)
2272 if (sigaction(sig, &sa, NULL) < 0)
2279 void safe_close_pair(int p[]) {
2283 /* Special case pairs which use the same fd in both
2285 p[0] = p[1] = safe_close(p[0]);
2289 p[0] = safe_close(p[0]);
2290 p[1] = safe_close(p[1]);
2293 ssize_t loop_read(int fd, void *buf, size_t nbytes, bool do_poll) {
2300 while (nbytes > 0) {
2303 k = read(fd, p, nbytes);
2308 if (errno == EAGAIN && do_poll) {
2310 /* We knowingly ignore any return value here,
2311 * and expect that any error/EOF is reported
2314 fd_wait_for_event(fd, POLLIN, USEC_INFINITY);
2318 return n > 0 ? n : -errno;
2332 int loop_read_exact(int fd, void *buf, size_t nbytes, bool do_poll) {
2335 n = loop_read(fd, buf, nbytes, do_poll);
2338 if ((size_t) n != nbytes)
2343 int loop_write(int fd, const void *buf, size_t nbytes, bool do_poll) {
2344 const uint8_t *p = buf;
2351 while (nbytes > 0) {
2354 k = write(fd, p, nbytes);
2359 if (errno == EAGAIN && do_poll) {
2360 /* We knowingly ignore any return value here,
2361 * and expect that any error/EOF is reported
2364 fd_wait_for_event(fd, POLLOUT, USEC_INFINITY);
2371 if (k == 0) /* Can't really happen */
2381 int parse_size(const char *t, off_t base, off_t *size) {
2383 /* Soo, sometimes we want to parse IEC binary suffxies, and
2384 * sometimes SI decimal suffixes. This function can parse
2385 * both. Which one is the right way depends on the
2386 * context. Wikipedia suggests that SI is customary for
2387 * hardrware metrics and network speeds, while IEC is
2388 * customary for most data sizes used by software and volatile
2389 * (RAM) memory. Hence be careful which one you pick!
2391 * In either case we use just K, M, G as suffix, and not Ki,
2392 * Mi, Gi or so (as IEC would suggest). That's because that's
2393 * frickin' ugly. But this means you really need to make sure
2394 * to document which base you are parsing when you use this
2399 unsigned long long factor;
2402 static const struct table iec[] = {
2403 { "E", 1024ULL*1024ULL*1024ULL*1024ULL*1024ULL*1024ULL },
2404 { "P", 1024ULL*1024ULL*1024ULL*1024ULL*1024ULL },
2405 { "T", 1024ULL*1024ULL*1024ULL*1024ULL },
2406 { "G", 1024ULL*1024ULL*1024ULL },
2407 { "M", 1024ULL*1024ULL },
2413 static const struct table si[] = {
2414 { "E", 1000ULL*1000ULL*1000ULL*1000ULL*1000ULL*1000ULL },
2415 { "P", 1000ULL*1000ULL*1000ULL*1000ULL*1000ULL },
2416 { "T", 1000ULL*1000ULL*1000ULL*1000ULL },
2417 { "G", 1000ULL*1000ULL*1000ULL },
2418 { "M", 1000ULL*1000ULL },
2424 const struct table *table;
2426 unsigned long long r = 0;
2427 unsigned n_entries, start_pos = 0;
2430 assert(base == 1000 || base == 1024);
2435 n_entries = ELEMENTSOF(si);
2438 n_entries = ELEMENTSOF(iec);
2444 unsigned long long l2;
2450 l = strtoll(p, &e, 10);
2463 if (*e >= '0' && *e <= '9') {
2466 /* strotoull itself would accept space/+/- */
2467 l2 = strtoull(e, &e2, 10);
2469 if (errno == ERANGE)
2472 /* Ignore failure. E.g. 10.M is valid */
2479 e += strspn(e, WHITESPACE);
2481 for (i = start_pos; i < n_entries; i++)
2482 if (startswith(e, table[i].suffix)) {
2483 unsigned long long tmp;
2484 if ((unsigned long long) l + (frac > 0) > ULLONG_MAX / table[i].factor)
2486 tmp = l * table[i].factor + (unsigned long long) (frac * table[i].factor);
2487 if (tmp > ULLONG_MAX - r)
2491 if ((unsigned long long) (off_t) r != r)
2494 p = e + strlen(table[i].suffix);
2510 int make_stdio(int fd) {
2515 r = dup2(fd, STDIN_FILENO);
2516 s = dup2(fd, STDOUT_FILENO);
2517 t = dup2(fd, STDERR_FILENO);
2522 if (r < 0 || s < 0 || t < 0)
2525 /* Explicitly unset O_CLOEXEC, since if fd was < 3, then
2526 * dup2() was a NOP and the bit hence possibly set. */
2527 fd_cloexec(STDIN_FILENO, false);
2528 fd_cloexec(STDOUT_FILENO, false);
2529 fd_cloexec(STDERR_FILENO, false);
2534 int make_null_stdio(void) {
2537 null_fd = open("/dev/null", O_RDWR|O_NOCTTY);
2541 return make_stdio(null_fd);
2544 bool is_device_path(const char *path) {
2546 /* Returns true on paths that refer to a device, either in
2547 * sysfs or in /dev */
2550 path_startswith(path, "/dev/") ||
2551 path_startswith(path, "/sys/");
2554 int dir_is_empty(const char *path) {
2555 _cleanup_closedir_ DIR *d;
2566 if (!de && errno != 0)
2572 if (!hidden_file(de->d_name))
2577 char* dirname_malloc(const char *path) {
2578 char *d, *dir, *dir2;
2595 int dev_urandom(void *p, size_t n) {
2596 static int have_syscall = -1;
2598 _cleanup_close_ int fd = -1;
2601 /* Gathers some randomness from the kernel. This call will
2602 * never block, and will always return some data from the
2603 * kernel, regardless if the random pool is fully initialized
2604 * or not. It thus makes no guarantee for the quality of the
2605 * returned entropy, but is good enough for or usual usecases
2606 * of seeding the hash functions for hashtable */
2608 /* Use the getrandom() syscall unless we know we don't have
2609 * it, or when the requested size is too large for it. */
2610 if (have_syscall != 0 || (size_t) (int) n != n) {
2611 r = getrandom(p, n, GRND_NONBLOCK);
2613 have_syscall = true;
2618 if (errno == ENOSYS)
2619 /* we lack the syscall, continue with
2620 * reading from /dev/urandom */
2621 have_syscall = false;
2622 else if (errno == EAGAIN)
2623 /* not enough entropy for now. Let's
2624 * remember to use the syscall the
2625 * next time, again, but also read
2626 * from /dev/urandom for now, which
2627 * doesn't care about the current
2628 * amount of entropy. */
2629 have_syscall = true;
2633 /* too short read? */
2637 fd = open("/dev/urandom", O_RDONLY|O_CLOEXEC|O_NOCTTY);
2639 return errno == ENOENT ? -ENOSYS : -errno;
2641 return loop_read_exact(fd, p, n, true);
2644 void initialize_srand(void) {
2645 static bool srand_called = false;
2647 #ifdef HAVE_SYS_AUXV_H
2656 #ifdef HAVE_SYS_AUXV_H
2657 /* The kernel provides us with a bit of entropy in auxv, so
2658 * let's try to make use of that to seed the pseudo-random
2659 * generator. It's better than nothing... */
2661 auxv = (void*) getauxval(AT_RANDOM);
2663 x ^= *(unsigned*) auxv;
2666 x ^= (unsigned) now(CLOCK_REALTIME);
2667 x ^= (unsigned) gettid();
2670 srand_called = true;
2673 void random_bytes(void *p, size_t n) {
2677 r = dev_urandom(p, n);
2681 /* If some idiot made /dev/urandom unavailable to us, he'll
2682 * get a PRNG instead. */
2686 for (q = p; q < (uint8_t*) p + n; q ++)
2690 void rename_process(const char name[8]) {
2693 /* This is a like a poor man's setproctitle(). It changes the
2694 * comm field, argv[0], and also the glibc's internally used
2695 * name of the process. For the first one a limit of 16 chars
2696 * applies, to the second one usually one of 10 (i.e. length
2697 * of "/sbin/init"), to the third one one of 7 (i.e. length of
2698 * "systemd"). If you pass a longer string it will be
2701 prctl(PR_SET_NAME, name);
2703 if (program_invocation_name)
2704 strncpy(program_invocation_name, name, strlen(program_invocation_name));
2706 if (saved_argc > 0) {
2710 strncpy(saved_argv[0], name, strlen(saved_argv[0]));
2712 for (i = 1; i < saved_argc; i++) {
2716 memzero(saved_argv[i], strlen(saved_argv[i]));
2721 void sigset_add_many(sigset_t *ss, ...) {
2728 while ((sig = va_arg(ap, int)) > 0)
2729 assert_se(sigaddset(ss, sig) == 0);
2733 int sigprocmask_many(int how, ...) {
2738 assert_se(sigemptyset(&ss) == 0);
2741 while ((sig = va_arg(ap, int)) > 0)
2742 assert_se(sigaddset(&ss, sig) == 0);
2745 if (sigprocmask(how, &ss, NULL) < 0)
2751 char* gethostname_malloc(void) {
2754 assert_se(uname(&u) >= 0);
2756 if (!isempty(u.nodename) && !streq(u.nodename, "(none)"))
2757 return strdup(u.nodename);
2759 return strdup(u.sysname);
2762 bool hostname_is_set(void) {
2765 assert_se(uname(&u) >= 0);
2767 return !isempty(u.nodename) && !streq(u.nodename, "(none)");
2770 char *lookup_uid(uid_t uid) {
2773 _cleanup_free_ char *buf = NULL;
2774 struct passwd pwbuf, *pw = NULL;
2776 /* Shortcut things to avoid NSS lookups */
2778 return strdup("root");
2780 bufsize = sysconf(_SC_GETPW_R_SIZE_MAX);
2784 buf = malloc(bufsize);
2788 if (getpwuid_r(uid, &pwbuf, buf, bufsize, &pw) == 0 && pw)
2789 return strdup(pw->pw_name);
2791 if (asprintf(&name, UID_FMT, uid) < 0)
2797 char* getlogname_malloc(void) {
2801 if (isatty(STDIN_FILENO) && fstat(STDIN_FILENO, &st) >= 0)
2806 return lookup_uid(uid);
2809 char *getusername_malloc(void) {
2816 return lookup_uid(getuid());
2819 int getttyname_malloc(int fd, char **ret) {
2829 r = ttyname_r(fd, path, sizeof(path));
2834 p = startswith(path, "/dev/");
2835 c = strdup(p ?: path);
2852 int getttyname_harder(int fd, char **r) {
2856 k = getttyname_malloc(fd, &s);
2860 if (streq(s, "tty")) {
2862 return get_ctty(0, NULL, r);
2869 int get_ctty_devnr(pid_t pid, dev_t *d) {
2871 _cleanup_free_ char *line = NULL;
2873 unsigned long ttynr;
2877 p = procfs_file_alloca(pid, "stat");
2878 r = read_one_line_file(p, &line);
2882 p = strrchr(line, ')');
2892 "%*d " /* session */
2897 if (major(ttynr) == 0 && minor(ttynr) == 0)
2906 int get_ctty(pid_t pid, dev_t *_devnr, char **r) {
2907 char fn[sizeof("/dev/char/")-1 + 2*DECIMAL_STR_MAX(unsigned) + 1 + 1], *b = NULL;
2908 _cleanup_free_ char *s = NULL;
2915 k = get_ctty_devnr(pid, &devnr);
2919 sprintf(fn, "/dev/char/%u:%u", major(devnr), minor(devnr));
2921 k = readlink_malloc(fn, &s);
2927 /* This is an ugly hack */
2928 if (major(devnr) == 136) {
2929 if (asprintf(&b, "pts/%u", minor(devnr)) < 0)
2932 /* Probably something like the ptys which have no
2933 * symlink in /dev/char. Let's return something
2934 * vaguely useful. */
2941 if (startswith(s, "/dev/"))
2943 else if (startswith(s, "../"))
2960 int rm_rf_children_dangerous(int fd, bool only_dirs, bool honour_sticky, struct stat *root_dev) {
2961 _cleanup_closedir_ DIR *d = NULL;
2966 /* This returns the first error we run into, but nevertheless
2967 * tries to go on. This closes the passed fd. */
2973 return errno == ENOENT ? 0 : -errno;
2978 bool is_dir, keep_around;
2985 if (errno != 0 && ret == 0)
2990 if (streq(de->d_name, ".") || streq(de->d_name, ".."))
2993 if (de->d_type == DT_UNKNOWN ||
2995 (de->d_type == DT_DIR && root_dev)) {
2996 if (fstatat(fd, de->d_name, &st, AT_SYMLINK_NOFOLLOW) < 0) {
2997 if (ret == 0 && errno != ENOENT)
3002 is_dir = S_ISDIR(st.st_mode);
3005 (st.st_uid == 0 || st.st_uid == getuid()) &&
3006 (st.st_mode & S_ISVTX);
3008 is_dir = de->d_type == DT_DIR;
3009 keep_around = false;
3015 /* if root_dev is set, remove subdirectories only, if device is same as dir */
3016 if (root_dev && st.st_dev != root_dev->st_dev)
3019 subdir_fd = openat(fd, de->d_name,
3020 O_RDONLY|O_NONBLOCK|O_DIRECTORY|O_CLOEXEC|O_NOFOLLOW|O_NOATIME);
3021 if (subdir_fd < 0) {
3022 if (ret == 0 && errno != ENOENT)
3027 r = rm_rf_children_dangerous(subdir_fd, only_dirs, honour_sticky, root_dev);
3028 if (r < 0 && ret == 0)
3032 if (unlinkat(fd, de->d_name, AT_REMOVEDIR) < 0) {
3033 if (ret == 0 && errno != ENOENT)
3037 } else if (!only_dirs && !keep_around) {
3039 if (unlinkat(fd, de->d_name, 0) < 0) {
3040 if (ret == 0 && errno != ENOENT)
3047 _pure_ static int is_temporary_fs(struct statfs *s) {
3050 return F_TYPE_EQUAL(s->f_type, TMPFS_MAGIC) ||
3051 F_TYPE_EQUAL(s->f_type, RAMFS_MAGIC);
3054 int is_fd_on_temporary_fs(int fd) {
3057 if (fstatfs(fd, &s) < 0)
3060 return is_temporary_fs(&s);
3063 int rm_rf_children(int fd, bool only_dirs, bool honour_sticky, struct stat *root_dev) {
3068 if (fstatfs(fd, &s) < 0) {
3073 /* We refuse to clean disk file systems with this call. This
3074 * is extra paranoia just to be sure we never ever remove
3076 if (!is_temporary_fs(&s)) {
3077 log_error("Attempted to remove disk file system, and we can't allow that.");
3082 return rm_rf_children_dangerous(fd, only_dirs, honour_sticky, root_dev);
3085 static int file_is_priv_sticky(const char *p) {
3090 if (lstat(p, &st) < 0)
3094 (st.st_uid == 0 || st.st_uid == getuid()) &&
3095 (st.st_mode & S_ISVTX);
3098 static int rm_rf_internal(const char *path, bool only_dirs, bool delete_root, bool honour_sticky, bool dangerous) {
3104 /* We refuse to clean the root file system with this
3105 * call. This is extra paranoia to never cause a really
3106 * seriously broken system. */
3107 if (path_equal(path, "/")) {
3108 log_error("Attempted to remove entire root file system, and we can't allow that.");
3112 fd = open(path, O_RDONLY|O_NONBLOCK|O_DIRECTORY|O_CLOEXEC|O_NOFOLLOW|O_NOATIME);
3115 if (errno != ENOTDIR && errno != ELOOP)
3119 if (statfs(path, &s) < 0)
3122 if (!is_temporary_fs(&s)) {
3123 log_error("Attempted to remove disk file system, and we can't allow that.");
3128 if (delete_root && !only_dirs)
3129 if (unlink(path) < 0 && errno != ENOENT)
3136 if (fstatfs(fd, &s) < 0) {
3141 if (!is_temporary_fs(&s)) {
3142 log_error("Attempted to remove disk file system, and we can't allow that.");
3148 r = rm_rf_children_dangerous(fd, only_dirs, honour_sticky, NULL);
3151 if (honour_sticky && file_is_priv_sticky(path) > 0)
3154 if (rmdir(path) < 0 && errno != ENOENT) {
3163 int rm_rf(const char *path, bool only_dirs, bool delete_root, bool honour_sticky) {
3164 return rm_rf_internal(path, only_dirs, delete_root, honour_sticky, false);
3167 int rm_rf_dangerous(const char *path, bool only_dirs, bool delete_root, bool honour_sticky) {
3168 return rm_rf_internal(path, only_dirs, delete_root, honour_sticky, true);
3171 int chmod_and_chown(const char *path, mode_t mode, uid_t uid, gid_t gid) {
3174 /* Under the assumption that we are running privileged we
3175 * first change the access mode and only then hand out
3176 * ownership to avoid a window where access is too open. */
3178 if (mode != MODE_INVALID)
3179 if (chmod(path, mode) < 0)
3182 if (uid != UID_INVALID || gid != GID_INVALID)
3183 if (chown(path, uid, gid) < 0)
3189 int fchmod_and_fchown(int fd, mode_t mode, uid_t uid, gid_t gid) {
3192 /* Under the assumption that we are running privileged we
3193 * first change the access mode and only then hand out
3194 * ownership to avoid a window where access is too open. */
3196 if (mode != MODE_INVALID)
3197 if (fchmod(fd, mode) < 0)
3200 if (uid != UID_INVALID || gid != GID_INVALID)
3201 if (fchown(fd, uid, gid) < 0)
3207 cpu_set_t* cpu_set_malloc(unsigned *ncpus) {
3211 /* Allocates the cpuset in the right size */
3214 if (!(r = CPU_ALLOC(n)))
3217 if (sched_getaffinity(0, CPU_ALLOC_SIZE(n), r) >= 0) {
3218 CPU_ZERO_S(CPU_ALLOC_SIZE(n), r);
3228 if (errno != EINVAL)
3235 int status_vprintf(const char *status, bool ellipse, bool ephemeral, const char *format, va_list ap) {
3236 static const char status_indent[] = " "; /* "[" STATUS "] " */
3237 _cleanup_free_ char *s = NULL;
3238 _cleanup_close_ int fd = -1;
3239 struct iovec iovec[6] = {};
3241 static bool prev_ephemeral;
3245 /* This is independent of logging, as status messages are
3246 * optional and go exclusively to the console. */
3248 if (vasprintf(&s, format, ap) < 0)
3251 fd = open_terminal("/dev/console", O_WRONLY|O_NOCTTY|O_CLOEXEC);
3264 sl = status ? sizeof(status_indent)-1 : 0;
3270 e = ellipsize(s, emax, 50);
3278 IOVEC_SET_STRING(iovec[n++], "\r" ANSI_ERASE_TO_END_OF_LINE);
3279 prev_ephemeral = ephemeral;
3282 if (!isempty(status)) {
3283 IOVEC_SET_STRING(iovec[n++], "[");
3284 IOVEC_SET_STRING(iovec[n++], status);
3285 IOVEC_SET_STRING(iovec[n++], "] ");
3287 IOVEC_SET_STRING(iovec[n++], status_indent);
3290 IOVEC_SET_STRING(iovec[n++], s);
3292 IOVEC_SET_STRING(iovec[n++], "\n");
3294 if (writev(fd, iovec, n) < 0)
3300 int status_printf(const char *status, bool ellipse, bool ephemeral, const char *format, ...) {
3306 va_start(ap, format);
3307 r = status_vprintf(status, ellipse, ephemeral, format, ap);
3313 char *replace_env(const char *format, char **env) {
3320 const char *e, *word = format;
3325 for (e = format; *e; e ++) {
3336 k = strnappend(r, word, e-word-1);
3346 } else if (*e == '$') {
3347 k = strnappend(r, word, e-word);
3364 t = strempty(strv_env_get_n(env, word+2, e-word-2));
3366 k = strappend(r, t);
3380 k = strnappend(r, word, e-word);
3392 char **replace_env_argv(char **argv, char **env) {
3394 unsigned k = 0, l = 0;
3396 l = strv_length(argv);
3398 ret = new(char*, l+1);
3402 STRV_FOREACH(i, argv) {
3404 /* If $FOO appears as single word, replace it by the split up variable */
3405 if ((*i)[0] == '$' && (*i)[1] != '{') {
3410 e = strv_env_get(env, *i+1);
3414 r = strv_split_quoted(&m, e, true);
3426 w = realloc(ret, sizeof(char*) * (l+1));
3436 memcpy(ret + k, m, q * sizeof(char*));
3444 /* If ${FOO} appears as part of a word, replace it by the variable as-is */
3445 ret[k] = replace_env(*i, env);
3457 int fd_columns(int fd) {
3458 struct winsize ws = {};
3460 if (ioctl(fd, TIOCGWINSZ, &ws) < 0)
3469 unsigned columns(void) {
3473 if (_likely_(cached_columns > 0))
3474 return cached_columns;
3477 e = getenv("COLUMNS");
3479 (void) safe_atoi(e, &c);
3482 c = fd_columns(STDOUT_FILENO);
3488 return cached_columns;
3491 int fd_lines(int fd) {
3492 struct winsize ws = {};
3494 if (ioctl(fd, TIOCGWINSZ, &ws) < 0)
3503 unsigned lines(void) {
3507 if (_likely_(cached_lines > 0))
3508 return cached_lines;
3511 e = getenv("LINES");
3513 (void) safe_atoi(e, &l);
3516 l = fd_lines(STDOUT_FILENO);
3522 return cached_lines;
3525 /* intended to be used as a SIGWINCH sighandler */
3526 void columns_lines_cache_reset(int signum) {
3532 static int cached_on_tty = -1;
3534 if (_unlikely_(cached_on_tty < 0))
3535 cached_on_tty = isatty(STDOUT_FILENO) > 0;
3537 return cached_on_tty;
3540 int files_same(const char *filea, const char *fileb) {
3543 if (stat(filea, &a) < 0)
3546 if (stat(fileb, &b) < 0)
3549 return a.st_dev == b.st_dev &&
3550 a.st_ino == b.st_ino;
3553 int running_in_chroot(void) {
3556 ret = files_same("/proc/1/root", "/");
3563 static char *ascii_ellipsize_mem(const char *s, size_t old_length, size_t new_length, unsigned percent) {
3568 assert(percent <= 100);
3569 assert(new_length >= 3);
3571 if (old_length <= 3 || old_length <= new_length)
3572 return strndup(s, old_length);
3574 r = new0(char, new_length+1);
3578 x = (new_length * percent) / 100;
3580 if (x > new_length - 3)
3588 s + old_length - (new_length - x - 3),
3589 new_length - x - 3);
3594 char *ellipsize_mem(const char *s, size_t old_length, size_t new_length, unsigned percent) {
3598 unsigned k, len, len2;
3601 assert(percent <= 100);
3602 assert(new_length >= 3);
3604 /* if no multibyte characters use ascii_ellipsize_mem for speed */
3605 if (ascii_is_valid(s))
3606 return ascii_ellipsize_mem(s, old_length, new_length, percent);
3608 if (old_length <= 3 || old_length <= new_length)
3609 return strndup(s, old_length);
3611 x = (new_length * percent) / 100;
3613 if (x > new_length - 3)
3617 for (i = s; k < x && i < s + old_length; i = utf8_next_char(i)) {
3620 c = utf8_encoded_to_unichar(i);
3623 k += unichar_iswide(c) ? 2 : 1;
3626 if (k > x) /* last character was wide and went over quota */
3629 for (j = s + old_length; k < new_length && j > i; ) {
3632 j = utf8_prev_char(j);
3633 c = utf8_encoded_to_unichar(j);
3636 k += unichar_iswide(c) ? 2 : 1;
3640 /* we don't actually need to ellipsize */
3642 return memdup(s, old_length + 1);
3644 /* make space for ellipsis */
3645 j = utf8_next_char(j);
3648 len2 = s + old_length - j;
3649 e = new(char, len + 3 + len2 + 1);
3654 printf("old_length=%zu new_length=%zu x=%zu len=%u len2=%u k=%u\n",
3655 old_length, new_length, x, len, len2, k);
3659 e[len] = 0xe2; /* tri-dot ellipsis: … */
3663 memcpy(e + len + 3, j, len2 + 1);
3668 char *ellipsize(const char *s, size_t length, unsigned percent) {
3669 return ellipsize_mem(s, strlen(s), length, percent);
3672 int touch_file(const char *path, bool parents, usec_t stamp, uid_t uid, gid_t gid, mode_t mode) {
3673 _cleanup_close_ int fd;
3679 mkdir_parents(path, 0755);
3681 fd = open(path, O_WRONLY|O_CREAT|O_CLOEXEC|O_NOCTTY, mode > 0 ? mode : 0644);
3686 r = fchmod(fd, mode);
3691 if (uid != UID_INVALID || gid != GID_INVALID) {
3692 r = fchown(fd, uid, gid);
3697 if (stamp != USEC_INFINITY) {
3698 struct timespec ts[2];
3700 timespec_store(&ts[0], stamp);
3702 r = futimens(fd, ts);
3704 r = futimens(fd, NULL);
3711 int touch(const char *path) {
3712 return touch_file(path, false, USEC_INFINITY, UID_INVALID, GID_INVALID, 0);
3715 char *unquote(const char *s, const char* quotes) {
3719 /* This is rather stupid, simply removes the heading and
3720 * trailing quotes if there is one. Doesn't care about
3721 * escaping or anything. We should make this smarter one
3728 if (strchr(quotes, s[0]) && s[l-1] == s[0])
3729 return strndup(s+1, l-2);
3734 char *normalize_env_assignment(const char *s) {
3735 _cleanup_free_ char *value = NULL;
3739 eq = strchr(s, '=');
3749 memmove(r, t, strlen(t) + 1);
3754 name = strndupa(s, eq - s);
3755 p = strdupa(eq + 1);
3757 value = unquote(strstrip(p), QUOTES);
3761 return strjoin(strstrip(name), "=", value, NULL);
3764 int wait_for_terminate(pid_t pid, siginfo_t *status) {
3775 if (waitid(P_PID, pid, status, WEXITED) < 0) {
3789 * < 0 : wait_for_terminate() failed to get the state of the
3790 * process, the process was terminated by a signal, or
3791 * failed for an unknown reason.
3792 * >=0 : The process terminated normally, and its exit code is
3795 * That is, success is indicated by a return value of zero, and an
3796 * error is indicated by a non-zero value.
3798 * A warning is emitted if the process terminates abnormally,
3799 * and also if it returns non-zero unless check_exit_code is true.
3801 int wait_for_terminate_and_warn(const char *name, pid_t pid, bool check_exit_code) {
3808 r = wait_for_terminate(pid, &status);
3810 return log_warning_errno(r, "Failed to wait for %s: %m", name);
3812 if (status.si_code == CLD_EXITED) {
3813 if (status.si_status != 0)
3814 log_full(check_exit_code ? LOG_WARNING : LOG_DEBUG,
3815 "%s failed with error code %i.", name, status.si_status);
3817 log_debug("%s succeeded.", name);
3819 return status.si_status;
3820 } else if (status.si_code == CLD_KILLED ||
3821 status.si_code == CLD_DUMPED) {
3823 log_warning("%s terminated by signal %s.", name, signal_to_string(status.si_status));
3827 log_warning("%s failed due to unknown reason.", name);
3831 noreturn void freeze(void) {
3833 /* Make sure nobody waits for us on a socket anymore */
3834 close_all_fds(NULL, 0);
3842 bool null_or_empty(struct stat *st) {
3845 if (S_ISREG(st->st_mode) && st->st_size <= 0)
3848 if (S_ISCHR(st->st_mode) || S_ISBLK(st->st_mode))
3854 int null_or_empty_path(const char *fn) {
3859 if (stat(fn, &st) < 0)
3862 return null_or_empty(&st);
3865 int null_or_empty_fd(int fd) {
3870 if (fstat(fd, &st) < 0)
3873 return null_or_empty(&st);
3876 DIR *xopendirat(int fd, const char *name, int flags) {
3880 assert(!(flags & O_CREAT));
3882 nfd = openat(fd, name, O_RDONLY|O_NONBLOCK|O_DIRECTORY|O_CLOEXEC|flags, 0);
3895 int signal_from_string_try_harder(const char *s) {
3899 signo = signal_from_string(s);
3901 if (startswith(s, "SIG"))
3902 return signal_from_string(s+3);
3907 static char *tag_to_udev_node(const char *tagvalue, const char *by) {
3908 _cleanup_free_ char *t = NULL, *u = NULL;
3911 u = unquote(tagvalue, "\"\'");
3915 enc_len = strlen(u) * 4 + 1;
3916 t = new(char, enc_len);
3920 if (encode_devnode_name(u, t, enc_len) < 0)
3923 return strjoin("/dev/disk/by-", by, "/", t, NULL);
3926 char *fstab_node_to_udev_node(const char *p) {
3929 if (startswith(p, "LABEL="))
3930 return tag_to_udev_node(p+6, "label");
3932 if (startswith(p, "UUID="))
3933 return tag_to_udev_node(p+5, "uuid");
3935 if (startswith(p, "PARTUUID="))
3936 return tag_to_udev_node(p+9, "partuuid");
3938 if (startswith(p, "PARTLABEL="))
3939 return tag_to_udev_node(p+10, "partlabel");
3944 bool tty_is_vc(const char *tty) {
3947 return vtnr_from_tty(tty) >= 0;
3950 bool tty_is_console(const char *tty) {
3953 if (startswith(tty, "/dev/"))
3956 return streq(tty, "console");
3959 int vtnr_from_tty(const char *tty) {
3964 if (startswith(tty, "/dev/"))
3967 if (!startswith(tty, "tty") )
3970 if (tty[3] < '0' || tty[3] > '9')
3973 r = safe_atoi(tty+3, &i);
3977 if (i < 0 || i > 63)
3983 char *resolve_dev_console(char **active) {
3986 /* Resolve where /dev/console is pointing to, if /sys is actually ours
3987 * (i.e. not read-only-mounted which is a sign for container setups) */
3989 if (path_is_read_only_fs("/sys") > 0)
3992 if (read_one_line_file("/sys/class/tty/console/active", active) < 0)
3995 /* If multiple log outputs are configured the last one is what
3996 * /dev/console points to */
3997 tty = strrchr(*active, ' ');
4003 if (streq(tty, "tty0")) {
4006 /* Get the active VC (e.g. tty1) */
4007 if (read_one_line_file("/sys/class/tty/tty0/active", &tmp) >= 0) {
4009 tty = *active = tmp;
4016 bool tty_is_vc_resolve(const char *tty) {
4017 _cleanup_free_ char *active = NULL;
4021 if (startswith(tty, "/dev/"))
4024 if (streq(tty, "console")) {
4025 tty = resolve_dev_console(&active);
4030 return tty_is_vc(tty);
4033 const char *default_term_for_tty(const char *tty) {
4036 return tty_is_vc_resolve(tty) ? "TERM=linux" : "TERM=vt220";
4039 bool dirent_is_file(const struct dirent *de) {
4042 if (hidden_file(de->d_name))
4045 if (de->d_type != DT_REG &&
4046 de->d_type != DT_LNK &&
4047 de->d_type != DT_UNKNOWN)
4053 bool dirent_is_file_with_suffix(const struct dirent *de, const char *suffix) {
4056 if (de->d_type != DT_REG &&
4057 de->d_type != DT_LNK &&
4058 de->d_type != DT_UNKNOWN)
4061 if (hidden_file_allow_backup(de->d_name))
4064 return endswith(de->d_name, suffix);
4067 static int do_execute(char **directories, usec_t timeout, char *argv[]) {
4068 _cleanup_hashmap_free_free_ Hashmap *pids = NULL;
4069 _cleanup_set_free_free_ Set *seen = NULL;
4072 /* We fork this all off from a child process so that we can
4073 * somewhat cleanly make use of SIGALRM to set a time limit */
4075 reset_all_signal_handlers();
4076 reset_signal_mask();
4078 assert_se(prctl(PR_SET_PDEATHSIG, SIGTERM) == 0);
4080 pids = hashmap_new(NULL);
4084 seen = set_new(&string_hash_ops);
4088 STRV_FOREACH(directory, directories) {
4089 _cleanup_closedir_ DIR *d;
4092 d = opendir(*directory);
4094 if (errno == ENOENT)
4097 return log_error_errno(errno, "Failed to open directory %s: %m", *directory);
4100 FOREACH_DIRENT(de, d, break) {
4101 _cleanup_free_ char *path = NULL;
4105 if (!dirent_is_file(de))
4108 if (set_contains(seen, de->d_name)) {
4109 log_debug("%1$s/%2$s skipped (%2$s was already seen).", *directory, de->d_name);
4113 r = set_put_strdup(seen, de->d_name);
4117 path = strjoin(*directory, "/", de->d_name, NULL);
4121 if (null_or_empty_path(path)) {
4122 log_debug("%s is empty (a mask).", path);
4128 log_error_errno(errno, "Failed to fork: %m");
4130 } else if (pid == 0) {
4133 assert_se(prctl(PR_SET_PDEATHSIG, SIGTERM) == 0);
4143 return log_error_errno(errno, "Failed to execute %s: %m", path);
4146 log_debug("Spawned %s as " PID_FMT ".", path, pid);
4148 r = hashmap_put(pids, UINT_TO_PTR(pid), path);
4155 /* Abort execution of this process after the timout. We simply
4156 * rely on SIGALRM as default action terminating the process,
4157 * and turn on alarm(). */
4159 if (timeout != USEC_INFINITY)
4160 alarm((timeout + USEC_PER_SEC - 1) / USEC_PER_SEC);
4162 while (!hashmap_isempty(pids)) {
4163 _cleanup_free_ char *path = NULL;
4166 pid = PTR_TO_UINT(hashmap_first_key(pids));
4169 path = hashmap_remove(pids, UINT_TO_PTR(pid));
4172 wait_for_terminate_and_warn(path, pid, true);
4178 void execute_directories(const char* const* directories, usec_t timeout, char *argv[]) {
4182 char **dirs = (char**) directories;
4184 assert(!strv_isempty(dirs));
4186 name = basename(dirs[0]);
4187 assert(!isempty(name));
4189 /* Executes all binaries in the directories in parallel and waits
4190 * for them to finish. Optionally a timeout is applied. If a file
4191 * with the same name exists in more than one directory, the
4192 * earliest one wins. */
4194 executor_pid = fork();
4195 if (executor_pid < 0) {
4196 log_error_errno(errno, "Failed to fork: %m");
4199 } else if (executor_pid == 0) {
4200 r = do_execute(dirs, timeout, argv);
4201 _exit(r < 0 ? EXIT_FAILURE : EXIT_SUCCESS);
4204 wait_for_terminate_and_warn(name, executor_pid, true);
4207 int kill_and_sigcont(pid_t pid, int sig) {
4210 r = kill(pid, sig) < 0 ? -errno : 0;
4218 bool nulstr_contains(const char*nulstr, const char *needle) {
4224 NULSTR_FOREACH(i, nulstr)
4225 if (streq(i, needle))
4231 bool plymouth_running(void) {
4232 return access("/run/plymouth/pid", F_OK) >= 0;
4235 char* strshorten(char *s, size_t l) {
4244 static bool hostname_valid_char(char c) {
4246 (c >= 'a' && c <= 'z') ||
4247 (c >= 'A' && c <= 'Z') ||
4248 (c >= '0' && c <= '9') ||
4254 bool hostname_is_valid(const char *s) {
4261 /* Doesn't accept empty hostnames, hostnames with trailing or
4262 * leading dots, and hostnames with multiple dots in a
4263 * sequence. Also ensures that the length stays below
4266 for (p = s, dot = true; *p; p++) {
4273 if (!hostname_valid_char(*p))
4283 if (p-s > HOST_NAME_MAX)
4289 char* hostname_cleanup(char *s, bool lowercase) {
4293 for (p = s, d = s, dot = true; *p; p++) {
4300 } else if (hostname_valid_char(*p)) {
4301 *(d++) = lowercase ? tolower(*p) : *p;
4312 strshorten(s, HOST_NAME_MAX);
4317 bool machine_name_is_valid(const char *s) {
4319 if (!hostname_is_valid(s))
4322 /* Machine names should be useful hostnames, but also be
4323 * useful in unit names, hence we enforce a stricter length
4332 int pipe_eof(int fd) {
4333 struct pollfd pollfd = {
4335 .events = POLLIN|POLLHUP,
4340 r = poll(&pollfd, 1, 0);
4347 return pollfd.revents & POLLHUP;
4350 int fd_wait_for_event(int fd, int event, usec_t t) {
4352 struct pollfd pollfd = {
4360 r = ppoll(&pollfd, 1, t == USEC_INFINITY ? NULL : timespec_store(&ts, t), NULL);
4367 return pollfd.revents;
4370 int fopen_temporary(const char *path, FILE **_f, char **_temp_path) {
4379 r = tempfn_xxxxxx(path, &t);
4383 fd = mkostemp_safe(t, O_WRONLY|O_CLOEXEC);
4389 f = fdopen(fd, "we");
4402 int terminal_vhangup_fd(int fd) {
4405 if (ioctl(fd, TIOCVHANGUP) < 0)
4411 int terminal_vhangup(const char *name) {
4412 _cleanup_close_ int fd;
4414 fd = open_terminal(name, O_RDWR|O_NOCTTY|O_CLOEXEC);
4418 return terminal_vhangup_fd(fd);
4421 int vt_disallocate(const char *name) {
4425 /* Deallocate the VT if possible. If not possible
4426 * (i.e. because it is the active one), at least clear it
4427 * entirely (including the scrollback buffer) */
4429 if (!startswith(name, "/dev/"))
4432 if (!tty_is_vc(name)) {
4433 /* So this is not a VT. I guess we cannot deallocate
4434 * it then. But let's at least clear the screen */
4436 fd = open_terminal(name, O_RDWR|O_NOCTTY|O_CLOEXEC);
4441 "\033[r" /* clear scrolling region */
4442 "\033[H" /* move home */
4443 "\033[2J", /* clear screen */
4450 if (!startswith(name, "/dev/tty"))
4453 r = safe_atou(name+8, &u);
4460 /* Try to deallocate */
4461 fd = open_terminal("/dev/tty0", O_RDWR|O_NOCTTY|O_CLOEXEC);
4465 r = ioctl(fd, VT_DISALLOCATE, u);
4474 /* Couldn't deallocate, so let's clear it fully with
4476 fd = open_terminal(name, O_RDWR|O_NOCTTY|O_CLOEXEC);
4481 "\033[r" /* clear scrolling region */
4482 "\033[H" /* move home */
4483 "\033[3J", /* clear screen including scrollback, requires Linux 2.6.40 */
4490 int symlink_atomic(const char *from, const char *to) {
4491 _cleanup_free_ char *t = NULL;
4497 r = tempfn_random(to, &t);
4501 if (symlink(from, t) < 0)
4504 if (rename(t, to) < 0) {
4512 int mknod_atomic(const char *path, mode_t mode, dev_t dev) {
4513 _cleanup_free_ char *t = NULL;
4518 r = tempfn_random(path, &t);
4522 if (mknod(t, mode, dev) < 0)
4525 if (rename(t, path) < 0) {
4533 int mkfifo_atomic(const char *path, mode_t mode) {
4534 _cleanup_free_ char *t = NULL;
4539 r = tempfn_random(path, &t);
4543 if (mkfifo(t, mode) < 0)
4546 if (rename(t, path) < 0) {
4554 bool display_is_local(const char *display) {
4558 display[0] == ':' &&
4559 display[1] >= '0' &&
4563 int socket_from_display(const char *display, char **path) {
4570 if (!display_is_local(display))
4573 k = strspn(display+1, "0123456789");
4575 f = new(char, strlen("/tmp/.X11-unix/X") + k + 1);
4579 c = stpcpy(f, "/tmp/.X11-unix/X");
4580 memcpy(c, display+1, k);
4589 const char **username,
4590 uid_t *uid, gid_t *gid,
4592 const char **shell) {
4600 /* We enforce some special rules for uid=0: in order to avoid
4601 * NSS lookups for root we hardcode its data. */
4603 if (streq(*username, "root") || streq(*username, "0")) {
4621 if (parse_uid(*username, &u) >= 0) {
4625 /* If there are multiple users with the same id, make
4626 * sure to leave $USER to the configured value instead
4627 * of the first occurrence in the database. However if
4628 * the uid was configured by a numeric uid, then let's
4629 * pick the real username from /etc/passwd. */
4631 *username = p->pw_name;
4634 p = getpwnam(*username);
4638 return errno > 0 ? -errno : -ESRCH;
4650 *shell = p->pw_shell;
4655 char* uid_to_name(uid_t uid) {
4660 return strdup("root");
4664 return strdup(p->pw_name);
4666 if (asprintf(&r, UID_FMT, uid) < 0)
4672 char* gid_to_name(gid_t gid) {
4677 return strdup("root");
4681 return strdup(p->gr_name);
4683 if (asprintf(&r, GID_FMT, gid) < 0)
4689 int get_group_creds(const char **groupname, gid_t *gid) {
4695 /* We enforce some special rules for gid=0: in order to avoid
4696 * NSS lookups for root we hardcode its data. */
4698 if (streq(*groupname, "root") || streq(*groupname, "0")) {
4699 *groupname = "root";
4707 if (parse_gid(*groupname, &id) >= 0) {
4712 *groupname = g->gr_name;
4715 g = getgrnam(*groupname);
4719 return errno > 0 ? -errno : -ESRCH;
4727 int in_gid(gid_t gid) {
4729 int ngroups_max, r, i;
4731 if (getgid() == gid)
4734 if (getegid() == gid)
4737 ngroups_max = sysconf(_SC_NGROUPS_MAX);
4738 assert(ngroups_max > 0);
4740 gids = alloca(sizeof(gid_t) * ngroups_max);
4742 r = getgroups(ngroups_max, gids);
4746 for (i = 0; i < r; i++)
4753 int in_group(const char *name) {
4757 r = get_group_creds(&name, &gid);
4764 int glob_exists(const char *path) {
4765 _cleanup_globfree_ glob_t g = {};
4771 k = glob(path, GLOB_NOSORT|GLOB_BRACE, NULL, &g);
4773 if (k == GLOB_NOMATCH)
4775 else if (k == GLOB_NOSPACE)
4778 return !strv_isempty(g.gl_pathv);
4780 return errno ? -errno : -EIO;
4783 int glob_extend(char ***strv, const char *path) {
4784 _cleanup_globfree_ glob_t g = {};
4789 k = glob(path, GLOB_NOSORT|GLOB_BRACE, NULL, &g);
4791 if (k == GLOB_NOMATCH)
4793 else if (k == GLOB_NOSPACE)
4795 else if (k != 0 || strv_isempty(g.gl_pathv))
4796 return errno ? -errno : -EIO;
4798 STRV_FOREACH(p, g.gl_pathv) {
4799 k = strv_extend(strv, *p);
4807 int dirent_ensure_type(DIR *d, struct dirent *de) {
4813 if (de->d_type != DT_UNKNOWN)
4816 if (fstatat(dirfd(d), de->d_name, &st, AT_SYMLINK_NOFOLLOW) < 0)
4820 S_ISREG(st.st_mode) ? DT_REG :
4821 S_ISDIR(st.st_mode) ? DT_DIR :
4822 S_ISLNK(st.st_mode) ? DT_LNK :
4823 S_ISFIFO(st.st_mode) ? DT_FIFO :
4824 S_ISSOCK(st.st_mode) ? DT_SOCK :
4825 S_ISCHR(st.st_mode) ? DT_CHR :
4826 S_ISBLK(st.st_mode) ? DT_BLK :
4832 int get_files_in_directory(const char *path, char ***list) {
4833 _cleanup_closedir_ DIR *d = NULL;
4834 size_t bufsize = 0, n = 0;
4835 _cleanup_strv_free_ char **l = NULL;
4839 /* Returns all files in a directory in *list, and the number
4840 * of files as return value. If list is NULL returns only the
4852 if (!de && errno != 0)
4857 dirent_ensure_type(d, de);
4859 if (!dirent_is_file(de))
4863 /* one extra slot is needed for the terminating NULL */
4864 if (!GREEDY_REALLOC(l, bufsize, n + 2))
4867 l[n] = strdup(de->d_name);
4878 l = NULL; /* avoid freeing */
4884 char *strjoin(const char *x, ...) {
4898 t = va_arg(ap, const char *);
4903 if (n > ((size_t) -1) - l) {
4927 t = va_arg(ap, const char *);
4941 bool is_main_thread(void) {
4942 static thread_local int cached = 0;
4944 if (_unlikely_(cached == 0))
4945 cached = getpid() == gettid() ? 1 : -1;
4950 int block_get_whole_disk(dev_t d, dev_t *ret) {
4957 /* If it has a queue this is good enough for us */
4958 if (asprintf(&p, "/sys/dev/block/%u:%u/queue", major(d), minor(d)) < 0)
4961 r = access(p, F_OK);
4969 /* If it is a partition find the originating device */
4970 if (asprintf(&p, "/sys/dev/block/%u:%u/partition", major(d), minor(d)) < 0)
4973 r = access(p, F_OK);
4979 /* Get parent dev_t */
4980 if (asprintf(&p, "/sys/dev/block/%u:%u/../dev", major(d), minor(d)) < 0)
4983 r = read_one_line_file(p, &s);
4989 r = sscanf(s, "%u:%u", &m, &n);
4995 /* Only return this if it is really good enough for us. */
4996 if (asprintf(&p, "/sys/dev/block/%u:%u/queue", m, n) < 0)
4999 r = access(p, F_OK);
5003 *ret = makedev(m, n);
5010 static const char *const ioprio_class_table[] = {
5011 [IOPRIO_CLASS_NONE] = "none",
5012 [IOPRIO_CLASS_RT] = "realtime",
5013 [IOPRIO_CLASS_BE] = "best-effort",
5014 [IOPRIO_CLASS_IDLE] = "idle"
5017 DEFINE_STRING_TABLE_LOOKUP_WITH_FALLBACK(ioprio_class, int, INT_MAX);
5019 static const char *const sigchld_code_table[] = {
5020 [CLD_EXITED] = "exited",
5021 [CLD_KILLED] = "killed",
5022 [CLD_DUMPED] = "dumped",
5023 [CLD_TRAPPED] = "trapped",
5024 [CLD_STOPPED] = "stopped",
5025 [CLD_CONTINUED] = "continued",
5028 DEFINE_STRING_TABLE_LOOKUP(sigchld_code, int);
5030 static const char *const log_facility_unshifted_table[LOG_NFACILITIES] = {
5031 [LOG_FAC(LOG_KERN)] = "kern",
5032 [LOG_FAC(LOG_USER)] = "user",
5033 [LOG_FAC(LOG_MAIL)] = "mail",
5034 [LOG_FAC(LOG_DAEMON)] = "daemon",
5035 [LOG_FAC(LOG_AUTH)] = "auth",
5036 [LOG_FAC(LOG_SYSLOG)] = "syslog",
5037 [LOG_FAC(LOG_LPR)] = "lpr",
5038 [LOG_FAC(LOG_NEWS)] = "news",
5039 [LOG_FAC(LOG_UUCP)] = "uucp",
5040 [LOG_FAC(LOG_CRON)] = "cron",
5041 [LOG_FAC(LOG_AUTHPRIV)] = "authpriv",
5042 [LOG_FAC(LOG_FTP)] = "ftp",
5043 [LOG_FAC(LOG_LOCAL0)] = "local0",
5044 [LOG_FAC(LOG_LOCAL1)] = "local1",
5045 [LOG_FAC(LOG_LOCAL2)] = "local2",
5046 [LOG_FAC(LOG_LOCAL3)] = "local3",
5047 [LOG_FAC(LOG_LOCAL4)] = "local4",
5048 [LOG_FAC(LOG_LOCAL5)] = "local5",
5049 [LOG_FAC(LOG_LOCAL6)] = "local6",
5050 [LOG_FAC(LOG_LOCAL7)] = "local7"
5053 DEFINE_STRING_TABLE_LOOKUP_WITH_FALLBACK(log_facility_unshifted, int, LOG_FAC(~0));
5055 static const char *const log_level_table[] = {
5056 [LOG_EMERG] = "emerg",
5057 [LOG_ALERT] = "alert",
5058 [LOG_CRIT] = "crit",
5060 [LOG_WARNING] = "warning",
5061 [LOG_NOTICE] = "notice",
5062 [LOG_INFO] = "info",
5063 [LOG_DEBUG] = "debug"
5066 DEFINE_STRING_TABLE_LOOKUP_WITH_FALLBACK(log_level, int, LOG_DEBUG);
5068 static const char* const sched_policy_table[] = {
5069 [SCHED_OTHER] = "other",
5070 [SCHED_BATCH] = "batch",
5071 [SCHED_IDLE] = "idle",
5072 [SCHED_FIFO] = "fifo",
5076 DEFINE_STRING_TABLE_LOOKUP_WITH_FALLBACK(sched_policy, int, INT_MAX);
5078 static const char* const rlimit_table[_RLIMIT_MAX] = {
5079 [RLIMIT_CPU] = "LimitCPU",
5080 [RLIMIT_FSIZE] = "LimitFSIZE",
5081 [RLIMIT_DATA] = "LimitDATA",
5082 [RLIMIT_STACK] = "LimitSTACK",
5083 [RLIMIT_CORE] = "LimitCORE",
5084 [RLIMIT_RSS] = "LimitRSS",
5085 [RLIMIT_NOFILE] = "LimitNOFILE",
5086 [RLIMIT_AS] = "LimitAS",
5087 [RLIMIT_NPROC] = "LimitNPROC",
5088 [RLIMIT_MEMLOCK] = "LimitMEMLOCK",
5089 [RLIMIT_LOCKS] = "LimitLOCKS",
5090 [RLIMIT_SIGPENDING] = "LimitSIGPENDING",
5091 [RLIMIT_MSGQUEUE] = "LimitMSGQUEUE",
5092 [RLIMIT_NICE] = "LimitNICE",
5093 [RLIMIT_RTPRIO] = "LimitRTPRIO",
5094 [RLIMIT_RTTIME] = "LimitRTTIME"
5097 DEFINE_STRING_TABLE_LOOKUP(rlimit, int);
5099 static const char* const ip_tos_table[] = {
5100 [IPTOS_LOWDELAY] = "low-delay",
5101 [IPTOS_THROUGHPUT] = "throughput",
5102 [IPTOS_RELIABILITY] = "reliability",
5103 [IPTOS_LOWCOST] = "low-cost",
5106 DEFINE_STRING_TABLE_LOOKUP_WITH_FALLBACK(ip_tos, int, 0xff);
5108 static const char *const __signal_table[] = {
5125 [SIGSTKFLT] = "STKFLT", /* Linux on SPARC doesn't know SIGSTKFLT */
5136 [SIGVTALRM] = "VTALRM",
5138 [SIGWINCH] = "WINCH",
5144 DEFINE_PRIVATE_STRING_TABLE_LOOKUP(__signal, int);
5146 const char *signal_to_string(int signo) {
5147 static thread_local char buf[sizeof("RTMIN+")-1 + DECIMAL_STR_MAX(int) + 1];
5150 name = __signal_to_string(signo);
5154 if (signo >= SIGRTMIN && signo <= SIGRTMAX)
5155 snprintf(buf, sizeof(buf), "RTMIN+%d", signo - SIGRTMIN);
5157 snprintf(buf, sizeof(buf), "%d", signo);
5162 int signal_from_string(const char *s) {
5167 signo = __signal_from_string(s);
5171 if (startswith(s, "RTMIN+")) {
5175 if (safe_atou(s, &u) >= 0) {
5176 signo = (int) u + offset;
5177 if (signo > 0 && signo < _NSIG)
5183 bool kexec_loaded(void) {
5184 bool loaded = false;
5187 if (read_one_line_file("/sys/kernel/kexec_loaded", &s) >= 0) {
5195 int prot_from_flags(int flags) {
5197 switch (flags & O_ACCMODE) {
5206 return PROT_READ|PROT_WRITE;
5213 char *format_bytes(char *buf, size_t l, off_t t) {
5216 static const struct {
5220 { "E", 1024ULL*1024ULL*1024ULL*1024ULL*1024ULL*1024ULL },
5221 { "P", 1024ULL*1024ULL*1024ULL*1024ULL*1024ULL },
5222 { "T", 1024ULL*1024ULL*1024ULL*1024ULL },
5223 { "G", 1024ULL*1024ULL*1024ULL },
5224 { "M", 1024ULL*1024ULL },
5228 if (t == (off_t) -1)
5231 for (i = 0; i < ELEMENTSOF(table); i++) {
5233 if (t >= table[i].factor) {
5236 (unsigned long long) (t / table[i].factor),
5237 (unsigned long long) (((t*10ULL) / table[i].factor) % 10ULL),
5244 snprintf(buf, l, "%lluB", (unsigned long long) t);
5252 void* memdup(const void *p, size_t l) {
5265 int fd_inc_sndbuf(int fd, size_t n) {
5267 socklen_t l = sizeof(value);
5269 r = getsockopt(fd, SOL_SOCKET, SO_SNDBUF, &value, &l);
5270 if (r >= 0 && l == sizeof(value) && (size_t) value >= n*2)
5273 /* If we have the privileges we will ignore the kernel limit. */
5276 if (setsockopt(fd, SOL_SOCKET, SO_SNDBUFFORCE, &value, sizeof(value)) < 0)
5277 if (setsockopt(fd, SOL_SOCKET, SO_SNDBUF, &value, sizeof(value)) < 0)
5283 int fd_inc_rcvbuf(int fd, size_t n) {
5285 socklen_t l = sizeof(value);
5287 r = getsockopt(fd, SOL_SOCKET, SO_RCVBUF, &value, &l);
5288 if (r >= 0 && l == sizeof(value) && (size_t) value >= n*2)
5291 /* If we have the privileges we will ignore the kernel limit. */
5294 if (setsockopt(fd, SOL_SOCKET, SO_RCVBUFFORCE, &value, sizeof(value)) < 0)
5295 if (setsockopt(fd, SOL_SOCKET, SO_RCVBUF, &value, sizeof(value)) < 0)
5300 int fork_agent(pid_t *pid, const int except[], unsigned n_except, const char *path, ...) {
5301 bool stdout_is_tty, stderr_is_tty;
5302 pid_t parent_pid, agent_pid;
5303 sigset_t ss, saved_ss;
5311 /* Spawns a temporary TTY agent, making sure it goes away when
5314 parent_pid = getpid();
5316 /* First we temporarily block all signals, so that the new
5317 * child has them blocked initially. This way, we can be sure
5318 * that SIGTERMs are not lost we might send to the agent. */
5319 assert_se(sigfillset(&ss) >= 0);
5320 assert_se(sigprocmask(SIG_SETMASK, &ss, &saved_ss) >= 0);
5323 if (agent_pid < 0) {
5324 assert_se(sigprocmask(SIG_SETMASK, &saved_ss, NULL) >= 0);
5328 if (agent_pid != 0) {
5329 assert_se(sigprocmask(SIG_SETMASK, &saved_ss, NULL) >= 0);
5336 * Make sure the agent goes away when the parent dies */
5337 if (prctl(PR_SET_PDEATHSIG, SIGTERM) < 0)
5338 _exit(EXIT_FAILURE);
5340 /* Make sure we actually can kill the agent, if we need to, in
5341 * case somebody invoked us from a shell script that trapped
5342 * SIGTERM or so... */
5343 reset_all_signal_handlers();
5344 reset_signal_mask();
5346 /* Check whether our parent died before we were able
5347 * to set the death signal and unblock the signals */
5348 if (getppid() != parent_pid)
5349 _exit(EXIT_SUCCESS);
5351 /* Don't leak fds to the agent */
5352 close_all_fds(except, n_except);
5354 stdout_is_tty = isatty(STDOUT_FILENO);
5355 stderr_is_tty = isatty(STDERR_FILENO);
5357 if (!stdout_is_tty || !stderr_is_tty) {
5360 /* Detach from stdout/stderr. and reopen
5361 * /dev/tty for them. This is important to
5362 * ensure that when systemctl is started via
5363 * popen() or a similar call that expects to
5364 * read EOF we actually do generate EOF and
5365 * not delay this indefinitely by because we
5366 * keep an unused copy of stdin around. */
5367 fd = open("/dev/tty", O_WRONLY);
5369 log_error_errno(errno, "Failed to open /dev/tty: %m");
5370 _exit(EXIT_FAILURE);
5374 dup2(fd, STDOUT_FILENO);
5377 dup2(fd, STDERR_FILENO);
5383 /* Count arguments */
5385 for (n = 0; va_arg(ap, char*); n++)
5390 l = alloca(sizeof(char *) * (n + 1));
5392 /* Fill in arguments */
5394 for (i = 0; i <= n; i++)
5395 l[i] = va_arg(ap, char*);
5399 _exit(EXIT_FAILURE);
5402 int setrlimit_closest(int resource, const struct rlimit *rlim) {
5403 struct rlimit highest, fixed;
5407 if (setrlimit(resource, rlim) >= 0)
5413 /* So we failed to set the desired setrlimit, then let's try
5414 * to get as close as we can */
5415 assert_se(getrlimit(resource, &highest) == 0);
5417 fixed.rlim_cur = MIN(rlim->rlim_cur, highest.rlim_max);
5418 fixed.rlim_max = MIN(rlim->rlim_max, highest.rlim_max);
5420 if (setrlimit(resource, &fixed) < 0)
5426 int getenv_for_pid(pid_t pid, const char *field, char **_value) {
5427 _cleanup_fclose_ FILE *f = NULL;
5438 path = procfs_file_alloca(pid, "environ");
5440 f = fopen(path, "re");
5448 char line[LINE_MAX];
5451 for (i = 0; i < sizeof(line)-1; i++) {
5455 if (_unlikely_(c == EOF)) {
5465 if (memcmp(line, field, l) == 0 && line[l] == '=') {
5466 value = strdup(line + l + 1);
5480 bool http_etag_is_valid(const char *etag) {
5484 if (!endswith(etag, "\""))
5487 if (!startswith(etag, "\"") && !startswith(etag, "W/\""))
5493 bool http_url_is_valid(const char *url) {
5499 p = startswith(url, "http://");
5501 p = startswith(url, "https://");
5508 return ascii_is_valid(p);
5511 bool documentation_url_is_valid(const char *url) {
5517 if (http_url_is_valid(url))
5520 p = startswith(url, "file:/");
5522 p = startswith(url, "info:");
5524 p = startswith(url, "man:");
5529 return ascii_is_valid(p);
5532 bool in_initrd(void) {
5533 static int saved = -1;
5539 /* We make two checks here:
5541 * 1. the flag file /etc/initrd-release must exist
5542 * 2. the root file system must be a memory file system
5544 * The second check is extra paranoia, since misdetecting an
5545 * initrd can have bad bad consequences due the initrd
5546 * emptying when transititioning to the main systemd.
5549 saved = access("/etc/initrd-release", F_OK) >= 0 &&
5550 statfs("/", &s) >= 0 &&
5551 is_temporary_fs(&s);
5556 void warn_melody(void) {
5557 _cleanup_close_ int fd = -1;
5559 fd = open("/dev/console", O_WRONLY|O_CLOEXEC|O_NOCTTY);
5563 /* Yeah, this is synchronous. Kinda sucks. But well... */
5565 ioctl(fd, KIOCSOUND, (int)(1193180/440));
5566 usleep(125*USEC_PER_MSEC);
5568 ioctl(fd, KIOCSOUND, (int)(1193180/220));
5569 usleep(125*USEC_PER_MSEC);
5571 ioctl(fd, KIOCSOUND, (int)(1193180/220));
5572 usleep(125*USEC_PER_MSEC);
5574 ioctl(fd, KIOCSOUND, 0);
5577 int make_console_stdio(void) {
5580 /* Make /dev/console the controlling terminal and stdin/stdout/stderr */
5582 fd = acquire_terminal("/dev/console", false, true, true, USEC_INFINITY);
5584 return log_error_errno(fd, "Failed to acquire terminal: %m");
5588 return log_error_errno(r, "Failed to duplicate terminal fd: %m");
5593 int get_home_dir(char **_h) {
5601 /* Take the user specified one */
5602 e = secure_getenv("HOME");
5603 if (e && path_is_absolute(e)) {
5612 /* Hardcode home directory for root to avoid NSS */
5615 h = strdup("/root");
5623 /* Check the database... */
5627 return errno > 0 ? -errno : -ESRCH;
5629 if (!path_is_absolute(p->pw_dir))
5632 h = strdup(p->pw_dir);
5640 int get_shell(char **_s) {
5648 /* Take the user specified one */
5649 e = getenv("SHELL");
5659 /* Hardcode home directory for root to avoid NSS */
5662 s = strdup("/bin/sh");
5670 /* Check the database... */
5674 return errno > 0 ? -errno : -ESRCH;
5676 if (!path_is_absolute(p->pw_shell))
5679 s = strdup(p->pw_shell);
5687 bool filename_is_valid(const char *p) {
5701 if (strlen(p) > FILENAME_MAX)
5707 bool string_is_safe(const char *p) {
5713 for (t = p; *t; t++) {
5714 if (*t > 0 && *t < ' ')
5717 if (strchr("\\\"\'\0x7f", *t))
5725 * Check if a string contains control characters. If 'ok' is non-NULL
5726 * it may be a string containing additional CCs to be considered OK.
5728 bool string_has_cc(const char *p, const char *ok) {
5733 for (t = p; *t; t++) {
5734 if (ok && strchr(ok, *t))
5737 if (*t > 0 && *t < ' ')
5747 bool path_is_safe(const char *p) {
5752 if (streq(p, "..") || startswith(p, "../") || endswith(p, "/..") || strstr(p, "/../"))
5755 if (strlen(p) > PATH_MAX)
5758 /* The following two checks are not really dangerous, but hey, they still are confusing */
5759 if (streq(p, ".") || startswith(p, "./") || endswith(p, "/.") || strstr(p, "/./"))
5762 if (strstr(p, "//"))
5768 /* hey glibc, APIs with callbacks without a user pointer are so useless */
5769 void *xbsearch_r(const void *key, const void *base, size_t nmemb, size_t size,
5770 int (*compar) (const void *, const void *, void *), void *arg) {
5779 p = (void *)(((const char *) base) + (idx * size));
5780 comparison = compar(key, p, arg);
5783 else if (comparison > 0)
5791 void init_gettext(void) {
5792 setlocale(LC_ALL, "");
5793 textdomain(GETTEXT_PACKAGE);
5796 bool is_locale_utf8(void) {
5798 static int cached_answer = -1;
5800 if (cached_answer >= 0)
5803 if (!setlocale(LC_ALL, "")) {
5804 cached_answer = true;
5808 set = nl_langinfo(CODESET);
5810 cached_answer = true;
5814 if (streq(set, "UTF-8")) {
5815 cached_answer = true;
5819 /* For LC_CTYPE=="C" return true, because CTYPE is effectly
5820 * unset and everything can do to UTF-8 nowadays. */
5821 set = setlocale(LC_CTYPE, NULL);
5823 cached_answer = true;
5827 /* Check result, but ignore the result if C was set
5831 !getenv("LC_ALL") &&
5832 !getenv("LC_CTYPE") &&
5836 return (bool) cached_answer;
5839 const char *draw_special_char(DrawSpecialChar ch) {
5840 static const char *draw_table[2][_DRAW_SPECIAL_CHAR_MAX] = {
5843 [DRAW_TREE_VERTICAL] = "\342\224\202 ", /* │ */
5844 [DRAW_TREE_BRANCH] = "\342\224\234\342\224\200", /* ├─ */
5845 [DRAW_TREE_RIGHT] = "\342\224\224\342\224\200", /* └─ */
5846 [DRAW_TREE_SPACE] = " ", /* */
5847 [DRAW_TRIANGULAR_BULLET] = "\342\200\243", /* ‣ */
5848 [DRAW_BLACK_CIRCLE] = "\342\227\217", /* ● */
5849 [DRAW_ARROW] = "\342\206\222", /* → */
5850 [DRAW_DASH] = "\342\200\223", /* – */
5853 /* ASCII fallback */ {
5854 [DRAW_TREE_VERTICAL] = "| ",
5855 [DRAW_TREE_BRANCH] = "|-",
5856 [DRAW_TREE_RIGHT] = "`-",
5857 [DRAW_TREE_SPACE] = " ",
5858 [DRAW_TRIANGULAR_BULLET] = ">",
5859 [DRAW_BLACK_CIRCLE] = "*",
5860 [DRAW_ARROW] = "->",
5865 return draw_table[!is_locale_utf8()][ch];
5868 char *strreplace(const char *text, const char *old_string, const char *new_string) {
5871 size_t l, old_len, new_len;
5877 old_len = strlen(old_string);
5878 new_len = strlen(new_string);
5891 if (!startswith(f, old_string)) {
5897 nl = l - old_len + new_len;
5898 a = realloc(r, nl + 1);
5906 t = stpcpy(t, new_string);
5918 char *strip_tab_ansi(char **ibuf, size_t *_isz) {
5919 const char *i, *begin = NULL;
5924 } state = STATE_OTHER;
5926 size_t osz = 0, isz;
5932 /* Strips ANSI color and replaces TABs by 8 spaces */
5934 isz = _isz ? *_isz : strlen(*ibuf);
5936 f = open_memstream(&obuf, &osz);
5940 for (i = *ibuf; i < *ibuf + isz + 1; i++) {
5945 if (i >= *ibuf + isz) /* EOT */
5947 else if (*i == '\x1B')
5948 state = STATE_ESCAPE;
5949 else if (*i == '\t')
5956 if (i >= *ibuf + isz) { /* EOT */
5959 } else if (*i == '[') {
5960 state = STATE_BRACKET;
5965 state = STATE_OTHER;
5972 if (i >= *ibuf + isz || /* EOT */
5973 (!(*i >= '0' && *i <= '9') && *i != ';' && *i != 'm')) {
5976 state = STATE_OTHER;
5978 } else if (*i == 'm')
5979 state = STATE_OTHER;
6001 int on_ac_power(void) {
6002 bool found_offline = false, found_online = false;
6003 _cleanup_closedir_ DIR *d = NULL;
6005 d = opendir("/sys/class/power_supply");
6007 return errno == ENOENT ? true : -errno;
6011 _cleanup_close_ int fd = -1, device = -1;
6017 if (!de && errno != 0)
6023 if (hidden_file(de->d_name))
6026 device = openat(dirfd(d), de->d_name, O_DIRECTORY|O_RDONLY|O_CLOEXEC|O_NOCTTY);
6028 if (errno == ENOENT || errno == ENOTDIR)
6034 fd = openat(device, "type", O_RDONLY|O_CLOEXEC|O_NOCTTY);
6036 if (errno == ENOENT)
6042 n = read(fd, contents, sizeof(contents));
6046 if (n != 6 || memcmp(contents, "Mains\n", 6))
6050 fd = openat(device, "online", O_RDONLY|O_CLOEXEC|O_NOCTTY);
6052 if (errno == ENOENT)
6058 n = read(fd, contents, sizeof(contents));
6062 if (n != 2 || contents[1] != '\n')
6065 if (contents[0] == '1') {
6066 found_online = true;
6068 } else if (contents[0] == '0')
6069 found_offline = true;
6074 return found_online || !found_offline;
6077 static int search_and_fopen_internal(const char *path, const char *mode, const char *root, char **search, FILE **_f) {
6084 if (!path_strv_resolve_uniq(search, root))
6087 STRV_FOREACH(i, search) {
6088 _cleanup_free_ char *p = NULL;
6092 p = strjoin(root, *i, "/", path, NULL);
6094 p = strjoin(*i, "/", path, NULL);
6104 if (errno != ENOENT)
6111 int search_and_fopen(const char *path, const char *mode, const char *root, const char **search, FILE **_f) {
6112 _cleanup_strv_free_ char **copy = NULL;
6118 if (path_is_absolute(path)) {
6121 f = fopen(path, mode);
6130 copy = strv_copy((char**) search);
6134 return search_and_fopen_internal(path, mode, root, copy, _f);
6137 int search_and_fopen_nulstr(const char *path, const char *mode, const char *root, const char *search, FILE **_f) {
6138 _cleanup_strv_free_ char **s = NULL;
6140 if (path_is_absolute(path)) {
6143 f = fopen(path, mode);
6152 s = strv_split_nulstr(search);
6156 return search_and_fopen_internal(path, mode, root, s, _f);
6159 char *strextend(char **x, ...) {
6166 l = f = *x ? strlen(*x) : 0;
6173 t = va_arg(ap, const char *);
6178 if (n > ((size_t) -1) - l) {
6187 r = realloc(*x, l+1);
6197 t = va_arg(ap, const char *);
6211 char *strrep(const char *s, unsigned n) {
6219 p = r = malloc(l * n + 1);
6223 for (i = 0; i < n; i++)
6230 void* greedy_realloc(void **p, size_t *allocated, size_t need, size_t size) {
6237 if (*allocated >= need)
6240 newalloc = MAX(need * 2, 64u / size);
6241 a = newalloc * size;
6243 /* check for overflows */
6244 if (a < size * need)
6252 *allocated = newalloc;
6256 void* greedy_realloc0(void **p, size_t *allocated, size_t need, size_t size) {
6265 q = greedy_realloc(p, allocated, need, size);
6269 if (*allocated > prev)
6270 memzero(q + prev * size, (*allocated - prev) * size);
6275 bool id128_is_valid(const char *s) {
6281 /* Simple formatted 128bit hex string */
6283 for (i = 0; i < l; i++) {
6286 if (!(c >= '0' && c <= '9') &&
6287 !(c >= 'a' && c <= 'z') &&
6288 !(c >= 'A' && c <= 'Z'))
6292 } else if (l == 36) {
6294 /* Formatted UUID */
6296 for (i = 0; i < l; i++) {
6299 if ((i == 8 || i == 13 || i == 18 || i == 23)) {
6303 if (!(c >= '0' && c <= '9') &&
6304 !(c >= 'a' && c <= 'z') &&
6305 !(c >= 'A' && c <= 'Z'))
6316 int split_pair(const char *s, const char *sep, char **l, char **r) {
6331 a = strndup(s, x - s);
6335 b = strdup(x + strlen(sep));
6347 int shall_restore_state(void) {
6348 _cleanup_free_ char *value = NULL;
6351 r = get_proc_cmdline_key("systemd.restore_state=", &value);
6357 return parse_boolean(value) != 0;
6360 int proc_cmdline(char **ret) {
6363 if (detect_container(NULL) > 0)
6364 return get_process_cmdline(1, 0, false, ret);
6366 return read_one_line_file("/proc/cmdline", ret);
6369 int parse_proc_cmdline(int (*parse_item)(const char *key, const char *value)) {
6370 _cleanup_free_ char *line = NULL;
6376 r = proc_cmdline(&line);
6382 _cleanup_free_ char *word = NULL;
6385 r = unquote_first_word(&p, &word, true);
6391 /* Filter out arguments that are intended only for the
6393 if (!in_initrd() && startswith(word, "rd."))
6396 value = strchr(word, '=');
6400 r = parse_item(word, value);
6408 int get_proc_cmdline_key(const char *key, char **value) {
6409 _cleanup_free_ char *line = NULL, *ret = NULL;
6416 r = proc_cmdline(&line);
6422 _cleanup_free_ char *word = NULL;
6425 r = unquote_first_word(&p, &word, true);
6431 /* Filter out arguments that are intended only for the
6433 if (!in_initrd() && startswith(word, "rd."))
6437 e = startswith(word, key);
6441 r = free_and_strdup(&ret, e);
6447 if (streq(word, key))
6461 int container_get_leader(const char *machine, pid_t *pid) {
6462 _cleanup_free_ char *s = NULL, *class = NULL;
6470 p = strjoina("/run/systemd/machines/", machine);
6471 r = parse_env_file(p, NEWLINE, "LEADER", &s, "CLASS", &class, NULL);
6479 if (!streq_ptr(class, "container"))
6482 r = parse_pid(s, &leader);
6492 int namespace_open(pid_t pid, int *pidns_fd, int *mntns_fd, int *netns_fd, int *root_fd) {
6493 _cleanup_close_ int pidnsfd = -1, mntnsfd = -1, netnsfd = -1;
6501 mntns = procfs_file_alloca(pid, "ns/mnt");
6502 mntnsfd = open(mntns, O_RDONLY|O_NOCTTY|O_CLOEXEC);
6510 pidns = procfs_file_alloca(pid, "ns/pid");
6511 pidnsfd = open(pidns, O_RDONLY|O_NOCTTY|O_CLOEXEC);
6519 netns = procfs_file_alloca(pid, "ns/net");
6520 netnsfd = open(netns, O_RDONLY|O_NOCTTY|O_CLOEXEC);
6528 root = procfs_file_alloca(pid, "root");
6529 rfd = open(root, O_RDONLY|O_NOCTTY|O_CLOEXEC|O_DIRECTORY);
6535 *pidns_fd = pidnsfd;
6538 *mntns_fd = mntnsfd;
6541 *netns_fd = netnsfd;
6546 pidnsfd = mntnsfd = netnsfd = -1;
6551 int namespace_enter(int pidns_fd, int mntns_fd, int netns_fd, int root_fd) {
6554 if (setns(pidns_fd, CLONE_NEWPID) < 0)
6558 if (setns(mntns_fd, CLONE_NEWNS) < 0)
6562 if (setns(netns_fd, CLONE_NEWNET) < 0)
6566 if (fchdir(root_fd) < 0)
6569 if (chroot(".") < 0)
6573 if (setresgid(0, 0, 0) < 0)
6576 if (setgroups(0, NULL) < 0)
6579 if (setresuid(0, 0, 0) < 0)
6585 bool pid_is_unwaited(pid_t pid) {
6586 /* Checks whether a PID is still valid at all, including a zombie */
6591 if (kill(pid, 0) >= 0)
6594 return errno != ESRCH;
6597 bool pid_is_alive(pid_t pid) {
6600 /* Checks whether a PID is still valid and not a zombie */
6605 r = get_process_state(pid);
6606 if (r == -ENOENT || r == 'Z')
6612 int getpeercred(int fd, struct ucred *ucred) {
6613 socklen_t n = sizeof(struct ucred);
6620 r = getsockopt(fd, SOL_SOCKET, SO_PEERCRED, &u, &n);
6624 if (n != sizeof(struct ucred))
6627 /* Check if the data is actually useful and not suppressed due
6628 * to namespacing issues */
6631 if (u.uid == UID_INVALID)
6633 if (u.gid == GID_INVALID)
6640 int getpeersec(int fd, char **ret) {
6652 r = getsockopt(fd, SOL_SOCKET, SO_PEERSEC, s, &n);
6656 if (errno != ERANGE)
6663 r = getsockopt(fd, SOL_SOCKET, SO_PEERSEC, s, &n);
6679 /* This is much like like mkostemp() but is subject to umask(). */
6680 int mkostemp_safe(char *pattern, int flags) {
6681 _cleanup_umask_ mode_t u;
6688 fd = mkostemp(pattern, flags);
6695 int open_tmpfile(const char *path, int flags) {
6702 /* Try O_TMPFILE first, if it is supported */
6703 fd = open(path, flags|O_TMPFILE, S_IRUSR|S_IWUSR);
6708 /* Fall back to unguessable name + unlinking */
6709 p = strjoina(path, "/systemd-tmp-XXXXXX");
6711 fd = mkostemp_safe(p, flags);
6719 int fd_warn_permissions(const char *path, int fd) {
6722 if (fstat(fd, &st) < 0)
6725 if (st.st_mode & 0111)
6726 log_warning("Configuration file %s is marked executable. Please remove executable permission bits. Proceeding anyway.", path);
6728 if (st.st_mode & 0002)
6729 log_warning("Configuration file %s is marked world-writable. Please remove world writability permission bits. Proceeding anyway.", path);
6731 if (getpid() == 1 && (st.st_mode & 0044) != 0044)
6732 log_warning("Configuration file %s is marked world-inaccessible. This has no effect as configuration data is accessible via APIs without restrictions. Proceeding anyway.", path);
6737 unsigned long personality_from_string(const char *p) {
6739 /* Parse a personality specifier. We introduce our own
6740 * identifiers that indicate specific ABIs, rather than just
6741 * hints regarding the register size, since we want to keep
6742 * things open for multiple locally supported ABIs for the
6743 * same register size. We try to reuse the ABI identifiers
6744 * used by libseccomp. */
6746 #if defined(__x86_64__)
6748 if (streq(p, "x86"))
6751 if (streq(p, "x86-64"))
6754 #elif defined(__i386__)
6756 if (streq(p, "x86"))
6760 /* personality(7) documents that 0xffffffffUL is used for
6761 * querying the current personality, hence let's use that here
6762 * as error indicator. */
6763 return 0xffffffffUL;
6766 const char* personality_to_string(unsigned long p) {
6768 #if defined(__x86_64__)
6770 if (p == PER_LINUX32)
6776 #elif defined(__i386__)
6785 uint64_t physical_memory(void) {
6788 /* We return this as uint64_t in case we are running as 32bit
6789 * process on a 64bit kernel with huge amounts of memory */
6791 mem = sysconf(_SC_PHYS_PAGES);
6794 return (uint64_t) mem * (uint64_t) page_size();
6797 void hexdump(FILE *f, const void *p, size_t s) {
6798 const uint8_t *b = p;
6801 assert(s == 0 || b);
6806 fprintf(f, "%04x ", n);
6808 for (i = 0; i < 16; i++) {
6813 fprintf(f, "%02x ", b[i]);
6821 for (i = 0; i < 16; i++) {
6826 fputc(isprint(b[i]) ? (char) b[i] : '.', f);
6840 int update_reboot_param_file(const char *param) {
6845 r = write_string_file(REBOOT_PARAM_FILE, param);
6847 log_error("Failed to write reboot param to "
6848 REBOOT_PARAM_FILE": %s", strerror(-r));
6850 unlink(REBOOT_PARAM_FILE);
6855 int umount_recursive(const char *prefix, int flags) {
6859 /* Try to umount everything recursively below a
6860 * directory. Also, take care of stacked mounts, and keep
6861 * unmounting them until they are gone. */
6864 _cleanup_fclose_ FILE *proc_self_mountinfo = NULL;
6869 proc_self_mountinfo = fopen("/proc/self/mountinfo", "re");
6870 if (!proc_self_mountinfo)
6874 _cleanup_free_ char *path = NULL, *p = NULL;
6877 k = fscanf(proc_self_mountinfo,
6878 "%*s " /* (1) mount id */
6879 "%*s " /* (2) parent id */
6880 "%*s " /* (3) major:minor */
6881 "%*s " /* (4) root */
6882 "%ms " /* (5) mount point */
6883 "%*s" /* (6) mount options */
6884 "%*[^-]" /* (7) optional fields */
6885 "- " /* (8) separator */
6886 "%*s " /* (9) file system type */
6887 "%*s" /* (10) mount source */
6888 "%*s" /* (11) mount options 2 */
6889 "%*[^\n]", /* some rubbish at the end */
6898 p = cunescape(path);
6902 if (!path_startswith(p, prefix))
6905 if (umount2(p, flags) < 0) {
6921 static int get_mount_flags(const char *path, unsigned long *flags) {
6924 if (statvfs(path, &buf) < 0)
6926 *flags = buf.f_flag;
6930 int bind_remount_recursive(const char *prefix, bool ro) {
6931 _cleanup_set_free_free_ Set *done = NULL;
6932 _cleanup_free_ char *cleaned = NULL;
6935 /* Recursively remount a directory (and all its submounts)
6936 * read-only or read-write. If the directory is already
6937 * mounted, we reuse the mount and simply mark it
6938 * MS_BIND|MS_RDONLY (or remove the MS_RDONLY for read-write
6939 * operation). If it isn't we first make it one. Afterwards we
6940 * apply MS_BIND|MS_RDONLY (or remove MS_RDONLY) to all
6941 * submounts we can access, too. When mounts are stacked on
6942 * the same mount point we only care for each individual
6943 * "top-level" mount on each point, as we cannot
6944 * influence/access the underlying mounts anyway. We do not
6945 * have any effect on future submounts that might get
6946 * propagated, they migt be writable. This includes future
6947 * submounts that have been triggered via autofs. */
6949 cleaned = strdup(prefix);
6953 path_kill_slashes(cleaned);
6955 done = set_new(&string_hash_ops);
6960 _cleanup_fclose_ FILE *proc_self_mountinfo = NULL;
6961 _cleanup_set_free_free_ Set *todo = NULL;
6962 bool top_autofs = false;
6964 unsigned long orig_flags;
6966 todo = set_new(&string_hash_ops);
6970 proc_self_mountinfo = fopen("/proc/self/mountinfo", "re");
6971 if (!proc_self_mountinfo)
6975 _cleanup_free_ char *path = NULL, *p = NULL, *type = NULL;
6978 k = fscanf(proc_self_mountinfo,
6979 "%*s " /* (1) mount id */
6980 "%*s " /* (2) parent id */
6981 "%*s " /* (3) major:minor */
6982 "%*s " /* (4) root */
6983 "%ms " /* (5) mount point */
6984 "%*s" /* (6) mount options (superblock) */
6985 "%*[^-]" /* (7) optional fields */
6986 "- " /* (8) separator */
6987 "%ms " /* (9) file system type */
6988 "%*s" /* (10) mount source */
6989 "%*s" /* (11) mount options (bind mount) */
6990 "%*[^\n]", /* some rubbish at the end */
7000 p = cunescape(path);
7004 /* Let's ignore autofs mounts. If they aren't
7005 * triggered yet, we want to avoid triggering
7006 * them, as we don't make any guarantees for
7007 * future submounts anyway. If they are
7008 * already triggered, then we will find
7009 * another entry for this. */
7010 if (streq(type, "autofs")) {
7011 top_autofs = top_autofs || path_equal(cleaned, p);
7015 if (path_startswith(p, cleaned) &&
7016 !set_contains(done, p)) {
7018 r = set_consume(todo, p);
7028 /* If we have no submounts to process anymore and if
7029 * the root is either already done, or an autofs, we
7031 if (set_isempty(todo) &&
7032 (top_autofs || set_contains(done, cleaned)))
7035 if (!set_contains(done, cleaned) &&
7036 !set_contains(todo, cleaned)) {
7037 /* The prefix directory itself is not yet a
7038 * mount, make it one. */
7039 if (mount(cleaned, cleaned, NULL, MS_BIND|MS_REC, NULL) < 0)
7043 (void) get_mount_flags(cleaned, &orig_flags);
7044 orig_flags &= ~MS_RDONLY;
7046 if (mount(NULL, prefix, NULL, orig_flags|MS_BIND|MS_REMOUNT|(ro ? MS_RDONLY : 0), NULL) < 0)
7049 x = strdup(cleaned);
7053 r = set_consume(done, x);
7058 while ((x = set_steal_first(todo))) {
7060 r = set_consume(done, x);
7066 /* Try to reuse the original flag set, but
7067 * don't care for errors, in case of
7068 * obstructed mounts */
7070 (void) get_mount_flags(x, &orig_flags);
7071 orig_flags &= ~MS_RDONLY;
7073 if (mount(NULL, x, NULL, orig_flags|MS_BIND|MS_REMOUNT|(ro ? MS_RDONLY : 0), NULL) < 0) {
7075 /* Deal with mount points that are
7076 * obstructed by a later mount */
7078 if (errno != ENOENT)
7086 int fflush_and_check(FILE *f) {
7093 return errno ? -errno : -EIO;
7098 int tempfn_xxxxxx(const char *p, char **ret) {
7110 * /foo/bar/.#waldoXXXXXX
7114 if (!filename_is_valid(fn))
7117 t = new(char, strlen(p) + 2 + 6 + 1);
7121 strcpy(stpcpy(stpcpy(mempcpy(t, p, fn - p), ".#"), fn), "XXXXXX");
7123 *ret = path_kill_slashes(t);
7127 int tempfn_random(const char *p, char **ret) {
7141 * /foo/bar/.#waldobaa2a261115984a9
7145 if (!filename_is_valid(fn))
7148 t = new(char, strlen(p) + 2 + 16 + 1);
7152 x = stpcpy(stpcpy(mempcpy(t, p, fn - p), ".#"), fn);
7155 for (i = 0; i < 16; i++) {
7156 *(x++) = hexchar(u & 0xF);
7162 *ret = path_kill_slashes(t);
7166 int tempfn_random_child(const char *p, char **ret) {
7177 * /foo/bar/waldo/.#3c2b6219aa75d7d0
7180 t = new(char, strlen(p) + 3 + 16 + 1);
7184 x = stpcpy(stpcpy(t, p), "/.#");
7187 for (i = 0; i < 16; i++) {
7188 *(x++) = hexchar(u & 0xF);
7194 *ret = path_kill_slashes(t);
7198 /* make sure the hostname is not "localhost" */
7199 bool is_localhost(const char *hostname) {
7202 /* This tries to identify local host and domain names
7203 * described in RFC6761 plus the redhatism of .localdomain */
7205 return streq(hostname, "localhost") ||
7206 streq(hostname, "localhost.") ||
7207 streq(hostname, "localdomain.") ||
7208 streq(hostname, "localdomain") ||
7209 endswith(hostname, ".localhost") ||
7210 endswith(hostname, ".localhost.") ||
7211 endswith(hostname, ".localdomain") ||
7212 endswith(hostname, ".localdomain.");
7215 int take_password_lock(const char *root) {
7217 struct flock flock = {
7219 .l_whence = SEEK_SET,
7227 /* This is roughly the same as lckpwdf(), but not as awful. We
7228 * don't want to use alarm() and signals, hence we implement
7229 * our own trivial version of this.
7231 * Note that shadow-utils also takes per-database locks in
7232 * addition to lckpwdf(). However, we don't given that they
7233 * are redundant as they they invoke lckpwdf() first and keep
7234 * it during everything they do. The per-database locks are
7235 * awfully racy, and thus we just won't do them. */
7238 path = strjoina(root, "/etc/.pwd.lock");
7240 path = "/etc/.pwd.lock";
7242 fd = open(path, O_WRONLY|O_CREAT|O_CLOEXEC|O_NOCTTY|O_NOFOLLOW, 0600);
7246 r = fcntl(fd, F_SETLKW, &flock);
7255 int is_symlink(const char *path) {
7258 if (lstat(path, &info) < 0)
7261 return !!S_ISLNK(info.st_mode);
7264 int is_dir(const char* path, bool follow) {
7269 r = stat(path, &st);
7271 r = lstat(path, &st);
7275 return !!S_ISDIR(st.st_mode);
7278 int unquote_first_word(const char **p, char **ret, bool relax) {
7279 _cleanup_free_ char *s = NULL;
7280 size_t allocated = 0, sz = 0;
7287 SINGLE_QUOTE_ESCAPE,
7289 DOUBLE_QUOTE_ESCAPE,
7297 /* Parses the first word of a string, and returns it in
7298 * *ret. Removes all quotes in the process. When parsing fails
7299 * (because of an uneven number of quotes or similar), leaves
7300 * the pointer *p at the first invalid character. */
7310 else if (strchr(WHITESPACE, c))
7320 state = SINGLE_QUOTE;
7322 state = VALUE_ESCAPE;
7324 state = DOUBLE_QUOTE;
7325 else if (strchr(WHITESPACE, c))
7328 if (!GREEDY_REALLOC(s, allocated, sz+2))
7343 if (!GREEDY_REALLOC(s, allocated, sz+2))
7356 } else if (c == '\'')
7359 state = SINGLE_QUOTE_ESCAPE;
7361 if (!GREEDY_REALLOC(s, allocated, sz+2))
7369 case SINGLE_QUOTE_ESCAPE:
7376 if (!GREEDY_REALLOC(s, allocated, sz+2))
7380 state = SINGLE_QUOTE;
7389 state = DOUBLE_QUOTE_ESCAPE;
7391 if (!GREEDY_REALLOC(s, allocated, sz+2))
7399 case DOUBLE_QUOTE_ESCAPE:
7406 if (!GREEDY_REALLOC(s, allocated, sz+2))
7410 state = DOUBLE_QUOTE;
7416 if (!strchr(WHITESPACE, c))
7438 int unquote_many_words(const char **p, ...) {
7443 /* Parses a number of words from a string, stripping any
7444 * quotes if necessary. */
7448 /* Count how many words are expected */
7451 if (!va_arg(ap, char **))
7460 /* Read all words into a temporary array */
7461 l = newa0(char*, n);
7462 for (c = 0; c < n; c++) {
7464 r = unquote_first_word(p, &l[c], false);
7468 for (j = 0; j < c; j++)
7478 /* If we managed to parse all words, return them in the passed
7481 for (i = 0; i < n; i++) {
7484 v = va_arg(ap, char **);
7494 int free_and_strdup(char **p, const char *s) {
7499 /* Replaces a string pointer with an strdup()ed new string,
7500 * possibly freeing the old one. */
7515 int sethostname_idempotent(const char *s) {
7517 char buf[HOST_NAME_MAX + 1] = {};
7521 r = gethostname(buf, sizeof(buf));
7528 r = sethostname(s, strlen(s));
7535 int ptsname_malloc(int fd, char **ret) {
7548 if (ptsname_r(fd, c, l) == 0) {
7552 if (errno != ERANGE) {
7562 int openpt_in_namespace(pid_t pid, int flags) {
7563 _cleanup_close_ int pidnsfd = -1, mntnsfd = -1, rootfd = -1;
7564 _cleanup_close_pair_ int pair[2] = { -1, -1 };
7566 struct cmsghdr cmsghdr;
7567 uint8_t buf[CMSG_SPACE(sizeof(int))];
7569 struct msghdr mh = {
7570 .msg_control = &control,
7571 .msg_controllen = sizeof(control),
7573 struct cmsghdr *cmsg;
7580 r = namespace_open(pid, &pidnsfd, &mntnsfd, NULL, &rootfd);
7584 if (socketpair(AF_UNIX, SOCK_DGRAM, 0, pair) < 0)
7594 pair[0] = safe_close(pair[0]);
7596 r = namespace_enter(pidnsfd, mntnsfd, -1, rootfd);
7598 _exit(EXIT_FAILURE);
7600 master = posix_openpt(flags);
7602 _exit(EXIT_FAILURE);
7604 cmsg = CMSG_FIRSTHDR(&mh);
7605 cmsg->cmsg_level = SOL_SOCKET;
7606 cmsg->cmsg_type = SCM_RIGHTS;
7607 cmsg->cmsg_len = CMSG_LEN(sizeof(int));
7608 memcpy(CMSG_DATA(cmsg), &master, sizeof(int));
7610 mh.msg_controllen = cmsg->cmsg_len;
7612 if (sendmsg(pair[1], &mh, MSG_NOSIGNAL) < 0)
7613 _exit(EXIT_FAILURE);
7615 _exit(EXIT_SUCCESS);
7618 pair[1] = safe_close(pair[1]);
7620 r = wait_for_terminate(child, &si);
7623 if (si.si_code != CLD_EXITED || si.si_status != EXIT_SUCCESS)
7626 if (recvmsg(pair[0], &mh, MSG_NOSIGNAL|MSG_CMSG_CLOEXEC) < 0)
7629 for (cmsg = CMSG_FIRSTHDR(&mh); cmsg; cmsg = CMSG_NXTHDR(&mh, cmsg))
7630 if (cmsg->cmsg_level == SOL_SOCKET && cmsg->cmsg_type == SCM_RIGHTS) {
7634 fds = (int*) CMSG_DATA(cmsg);
7635 n_fds = (cmsg->cmsg_len - CMSG_LEN(0)) / sizeof(int);
7638 close_many(fds, n_fds);
7648 ssize_t fgetxattrat_fake(int dirfd, const char *filename, const char *attribute, void *value, size_t size, int flags) {
7649 _cleanup_close_ int fd = -1;
7652 /* The kernel doesn't have a fgetxattrat() command, hence let's emulate one */
7654 fd = openat(dirfd, filename, O_RDONLY|O_CLOEXEC|O_NOCTTY|O_NOATIME|(flags & AT_SYMLINK_NOFOLLOW ? O_NOFOLLOW : 0));
7658 l = fgetxattr(fd, attribute, value, size);
7665 static int parse_crtime(le64_t le, usec_t *usec) {
7671 if (u == 0 || u == (uint64_t) -1)
7678 int fd_getcrtime(int fd, usec_t *usec) {
7685 /* Until Linux gets a real concept of birthtime/creation time,
7686 * let's fake one with xattrs */
7688 n = fgetxattr(fd, "user.crtime_usec", &le, sizeof(le));
7691 if (n != sizeof(le))
7694 return parse_crtime(le, usec);
7697 int fd_getcrtime_at(int dirfd, const char *name, usec_t *usec, int flags) {
7701 n = fgetxattrat_fake(dirfd, name, "user.crtime_usec", &le, sizeof(le), flags);
7704 if (n != sizeof(le))
7707 return parse_crtime(le, usec);
7710 int path_getcrtime(const char *p, usec_t *usec) {
7717 n = getxattr(p, "user.crtime_usec", &le, sizeof(le));
7720 if (n != sizeof(le))
7723 return parse_crtime(le, usec);
7726 int fd_setcrtime(int fd, usec_t usec) {
7732 usec = now(CLOCK_REALTIME);
7734 le = htole64((uint64_t) usec);
7735 if (fsetxattr(fd, "user.crtime_usec", &le, sizeof(le), 0) < 0)
7741 int same_fd(int a, int b) {
7742 struct stat sta, stb;
7749 /* Compares two file descriptors. Note that semantics are
7750 * quite different depending on whether we have kcmp() or we
7751 * don't. If we have kcmp() this will only return true for
7752 * dup()ed file descriptors, but not otherwise. If we don't
7753 * have kcmp() this will also return true for two fds of the same
7754 * file, created by separate open() calls. Since we use this
7755 * call mostly for filtering out duplicates in the fd store
7756 * this difference hopefully doesn't matter too much. */
7761 /* Try to use kcmp() if we have it. */
7763 r = kcmp(pid, pid, KCMP_FILE, a, b);
7768 if (errno != ENOSYS)
7771 /* We don't have kcmp(), use fstat() instead. */
7772 if (fstat(a, &sta) < 0)
7775 if (fstat(b, &stb) < 0)
7778 if ((sta.st_mode & S_IFMT) != (stb.st_mode & S_IFMT))
7781 /* We consider all device fds different, since two device fds
7782 * might refer to quite different device contexts even though
7783 * they share the same inode and backing dev_t. */
7785 if (S_ISCHR(sta.st_mode) || S_ISBLK(sta.st_mode))
7788 if (sta.st_dev != stb.st_dev || sta.st_ino != stb.st_ino)
7791 /* The fds refer to the same inode on disk, let's also check
7792 * if they have the same fd flags. This is useful to
7793 * distuingish the read and write side of a pipe created with
7795 fa = fcntl(a, F_GETFL);
7799 fb = fcntl(b, F_GETFL);
7806 int chattr_fd(int fd, bool b, unsigned mask) {
7807 unsigned old_attr, new_attr;
7814 if (ioctl(fd, FS_IOC_GETFLAGS, &old_attr) < 0)
7818 new_attr = old_attr | mask;
7820 new_attr = old_attr & ~mask;
7822 if (new_attr == old_attr)
7825 if (ioctl(fd, FS_IOC_SETFLAGS, &new_attr) < 0)
7831 int chattr_path(const char *p, bool b, unsigned mask) {
7832 _cleanup_close_ int fd = -1;
7839 fd = open(p, O_RDONLY|O_CLOEXEC|O_NOCTTY|O_NOFOLLOW);
7843 return chattr_fd(fd, b, mask);
7846 int change_attr_fd(int fd, unsigned value, unsigned mask) {
7847 unsigned old_attr, new_attr;
7854 if (ioctl(fd, FS_IOC_GETFLAGS, &old_attr) < 0)
7857 new_attr = (old_attr & ~mask) |(value & mask);
7859 if (new_attr == old_attr)
7862 if (ioctl(fd, FS_IOC_SETFLAGS, &new_attr) < 0)
7868 int read_attr_fd(int fd, unsigned *ret) {
7871 if (ioctl(fd, FS_IOC_GETFLAGS, ret) < 0)
7877 int read_attr_path(const char *p, unsigned *ret) {
7878 _cleanup_close_ int fd = -1;
7883 fd = open(p, O_RDONLY|O_CLOEXEC|O_NOCTTY|O_NOFOLLOW);
7887 return read_attr_fd(fd, ret);
7890 int make_lock_file(const char *p, int operation, LockFile *ret) {
7891 _cleanup_close_ int fd = -1;
7892 _cleanup_free_ char *t = NULL;
7896 * We use UNPOSIX locks if they are available. They have nice
7897 * semantics, and are mostly compatible with NFS. However,
7898 * they are only available on new kernels. When we detect we
7899 * are running on an older kernel, then we fall back to good
7900 * old BSD locks. They also have nice semantics, but are
7901 * slightly problematic on NFS, where they are upgraded to
7902 * POSIX locks, even though locally they are orthogonal to
7912 .l_type = (operation & ~LOCK_NB) == LOCK_EX ? F_WRLCK : F_RDLCK,
7913 .l_whence = SEEK_SET,
7917 fd = open(p, O_CREAT|O_RDWR|O_NOFOLLOW|O_CLOEXEC|O_NOCTTY, 0600);
7921 r = fcntl(fd, (operation & LOCK_NB) ? F_OFD_SETLK : F_OFD_SETLKW, &fl);
7924 /* If the kernel is too old, use good old BSD locks */
7925 if (errno == EINVAL)
7926 r = flock(fd, operation);
7929 return errno == EAGAIN ? -EBUSY : -errno;
7932 /* If we acquired the lock, let's check if the file
7933 * still exists in the file system. If not, then the
7934 * previous exclusive owner removed it and then closed
7935 * it. In such a case our acquired lock is worthless,
7936 * hence try again. */
7941 if (st.st_nlink > 0)
7944 fd = safe_close(fd);
7949 ret->operation = operation;
7957 int make_lock_file_for(const char *p, int operation, LockFile *ret) {
7965 if (!filename_is_valid(fn))
7968 t = newa(char, strlen(p) + 2 + 4 + 1);
7969 stpcpy(stpcpy(stpcpy(mempcpy(t, p, fn - p), ".#"), fn), ".lck");
7971 return make_lock_file(t, operation, ret);
7974 void release_lock_file(LockFile *f) {
7982 /* If we are the exclusive owner we can safely delete
7983 * the lock file itself. If we are not the exclusive
7984 * owner, we can try becoming it. */
7987 (f->operation & ~LOCK_NB) == LOCK_SH) {
7988 static const struct flock fl = {
7990 .l_whence = SEEK_SET,
7993 r = fcntl(f->fd, F_OFD_SETLK, &fl);
7994 if (r < 0 && errno == EINVAL)
7995 r = flock(f->fd, LOCK_EX|LOCK_NB);
7998 f->operation = LOCK_EX|LOCK_NB;
8001 if ((f->operation & ~LOCK_NB) == LOCK_EX)
8002 unlink_noerrno(f->path);
8008 f->fd = safe_close(f->fd);
8012 static size_t nul_length(const uint8_t *p, size_t sz) {
8027 ssize_t sparse_write(int fd, const void *p, size_t sz, size_t run_length) {
8028 const uint8_t *q, *w, *e;
8036 n = nul_length(q, e - q);
8038 /* If there are more than the specified run length of
8039 * NUL bytes, or if this is the beginning or the end
8040 * of the buffer, then seek instead of write */
8041 if ((n > run_length) ||
8042 (n > 0 && q == p) ||
8043 (n > 0 && q + n >= e)) {
8045 l = write(fd, w, q - w);
8052 if (lseek(fd, n, SEEK_CUR) == (off_t) -1)
8064 l = write(fd, w, q - w);
8071 return q - (const uint8_t*) p;
8074 void sigkill_wait(pid_t *pid) {
8080 if (kill(*pid, SIGKILL) > 0)
8081 (void) wait_for_terminate(*pid, NULL);
8084 int syslog_parse_priority(const char **p, int *priority, bool with_facility) {
8085 int a = 0, b = 0, c = 0;
8095 if (!strchr(*p, '>'))
8098 if ((*p)[2] == '>') {
8099 c = undecchar((*p)[1]);
8101 } else if ((*p)[3] == '>') {
8102 b = undecchar((*p)[1]);
8103 c = undecchar((*p)[2]);
8105 } else if ((*p)[4] == '>') {
8106 a = undecchar((*p)[1]);
8107 b = undecchar((*p)[2]);
8108 c = undecchar((*p)[3]);
8113 if (a < 0 || b < 0 || c < 0 ||
8114 (!with_facility && (a || b || c > 7)))
8118 *priority = a*100 + b*10 + c;
8120 *priority = (*priority & LOG_FACMASK) | c;
8126 ssize_t string_table_lookup(const char * const *table, size_t len, const char *key) {
8132 for (i = 0; i < len; ++i)
8133 if (streq_ptr(table[i], key))
8139 void cmsg_close_all(struct msghdr *mh) {
8140 struct cmsghdr *cmsg;
8144 for (cmsg = CMSG_FIRSTHDR(mh); cmsg; cmsg = CMSG_NXTHDR(mh, cmsg))
8145 if (cmsg->cmsg_level == SOL_SOCKET && cmsg->cmsg_type == SCM_RIGHTS)
8146 close_many((int*) CMSG_DATA(cmsg), (cmsg->cmsg_len - CMSG_LEN(0)) / sizeof(int));
8149 int rename_noreplace(int olddirfd, const char *oldpath, int newdirfd, const char *newpath) {
8153 ret = renameat2(olddirfd, oldpath, newdirfd, newpath, RENAME_NOREPLACE);
8157 /* Even though renameat2() exists since Linux 3.15, btrfs added
8158 * support for it later. If it is not implemented, fallback to another
8160 if (errno != EINVAL)
8163 /* The link()/unlink() fallback does not work on directories. But
8164 * renameat() without RENAME_NOREPLACE gives the same semantics on
8165 * directories, except when newpath is an *empty* directory. This is
8167 ret = fstatat(olddirfd, oldpath, &buf, AT_SYMLINK_NOFOLLOW);
8168 if (ret >= 0 && S_ISDIR(buf.st_mode)) {
8169 ret = renameat(olddirfd, oldpath, newdirfd, newpath);
8170 return ret >= 0 ? 0 : -errno;
8173 /* If it is not a directory, use the link()/unlink() fallback. */
8174 ret = linkat(olddirfd, oldpath, newdirfd, newpath, 0);
8178 ret = unlinkat(olddirfd, oldpath, 0);
8180 /* backup errno before the following unlinkat() alters it */
8182 (void) unlinkat(newdirfd, newpath, 0);