1 /*-*- Mode: C; c-basic-offset: 8; indent-tabs-mode: nil -*-*/
4 This file is part of systemd.
6 Copyright 2010 Lennart Poettering
8 systemd is free software; you can redistribute it and/or modify it
9 under the terms of the GNU Lesser General Public License as published by
10 the Free Software Foundation; either version 2.1 of the License, or
11 (at your option) any later version.
13 systemd is distributed in the hope that it will be useful, but
14 WITHOUT ANY WARRANTY; without even the implied warranty of
15 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
16 Lesser General Public License for more details.
18 You should have received a copy of the GNU Lesser General Public License
19 along with systemd; If not, see <http://www.gnu.org/licenses/>.
32 #include <sys/resource.h>
33 #include <linux/sched.h>
34 #include <sys/types.h>
38 #include <sys/ioctl.h>
40 #include <linux/tiocl.h>
45 #include <sys/prctl.h>
46 #include <sys/utsname.h>
48 #include <netinet/ip.h>
56 #include <sys/mount.h>
57 #include <linux/magic.h>
61 #include <sys/personality.h>
62 #include <sys/xattr.h>
63 #include <sys/statvfs.h>
67 /* When we include libgen.h because we need dirname() we immediately
68 * undefine basename() since libgen.h defines it as a macro to the XDG
69 * version which is really broken. */
73 #ifdef HAVE_SYS_AUXV_H
85 #include "path-util.h"
86 #include "exit-status.h"
90 #include "device-nodes.h"
95 #include "sparse-endian.h"
97 /* Put this test here for lack of a better place */
98 assert_cc(EAGAIN == EWOULDBLOCK);
101 char **saved_argv = NULL;
103 static volatile unsigned cached_columns = 0;
104 static volatile unsigned cached_lines = 0;
106 size_t page_size(void) {
107 static thread_local size_t pgsz = 0;
110 if (_likely_(pgsz > 0))
113 r = sysconf(_SC_PAGESIZE);
120 bool streq_ptr(const char *a, const char *b) {
122 /* Like streq(), but tries to make sense of NULL pointers */
133 char* endswith(const char *s, const char *postfix) {
140 pl = strlen(postfix);
143 return (char*) s + sl;
148 if (memcmp(s + sl - pl, postfix, pl) != 0)
151 return (char*) s + sl - pl;
154 char* first_word(const char *s, const char *word) {
161 /* Checks if the string starts with the specified word, either
162 * followed by NUL or by whitespace. Returns a pointer to the
163 * NUL or the first character after the whitespace. */
174 if (memcmp(s, word, wl) != 0)
181 if (!strchr(WHITESPACE, *p))
184 p += strspn(p, WHITESPACE);
188 static size_t cescape_char(char c, char *buf) {
189 char * buf_old = buf;
235 /* For special chars we prefer octal over
236 * hexadecimal encoding, simply because glib's
237 * g_strescape() does the same */
238 if ((c < ' ') || (c >= 127)) {
240 *(buf++) = octchar((unsigned char) c >> 6);
241 *(buf++) = octchar((unsigned char) c >> 3);
242 *(buf++) = octchar((unsigned char) c);
248 return buf - buf_old;
251 int close_nointr(int fd) {
258 * Just ignore EINTR; a retry loop is the wrong thing to do on
261 * http://lkml.indiana.edu/hypermail/linux/kernel/0509.1/0877.html
262 * https://bugzilla.gnome.org/show_bug.cgi?id=682819
263 * http://utcc.utoronto.ca/~cks/space/blog/unix/CloseEINTR
264 * https://sites.google.com/site/michaelsafyan/software-engineering/checkforeintrwheninvokingclosethinkagain
272 int safe_close(int fd) {
275 * Like close_nointr() but cannot fail. Guarantees errno is
276 * unchanged. Is a NOP with negative fds passed, and returns
277 * -1, so that it can be used in this syntax:
279 * fd = safe_close(fd);
285 /* The kernel might return pretty much any error code
286 * via close(), but the fd will be closed anyway. The
287 * only condition we want to check for here is whether
288 * the fd was invalid at all... */
290 assert_se(close_nointr(fd) != -EBADF);
296 void close_many(const int fds[], unsigned n_fd) {
299 assert(fds || n_fd <= 0);
301 for (i = 0; i < n_fd; i++)
305 int unlink_noerrno(const char *path) {
316 int parse_boolean(const char *v) {
319 if (streq(v, "1") || strcaseeq(v, "yes") || strcaseeq(v, "y") || strcaseeq(v, "true") || strcaseeq(v, "t") || strcaseeq(v, "on"))
321 else if (streq(v, "0") || strcaseeq(v, "no") || strcaseeq(v, "n") || strcaseeq(v, "false") || strcaseeq(v, "f") || strcaseeq(v, "off"))
327 int parse_pid(const char *s, pid_t* ret_pid) {
328 unsigned long ul = 0;
335 r = safe_atolu(s, &ul);
341 if ((unsigned long) pid != ul)
351 int parse_uid(const char *s, uid_t* ret_uid) {
352 unsigned long ul = 0;
359 r = safe_atolu(s, &ul);
365 if ((unsigned long) uid != ul)
368 /* Some libc APIs use UID_INVALID as special placeholder */
369 if (uid == (uid_t) 0xFFFFFFFF)
372 /* A long time ago UIDs were 16bit, hence explicitly avoid the 16bit -1 too */
373 if (uid == (uid_t) 0xFFFF)
380 int safe_atou(const char *s, unsigned *ret_u) {
388 l = strtoul(s, &x, 0);
390 if (!x || x == s || *x || errno)
391 return errno > 0 ? -errno : -EINVAL;
393 if ((unsigned long) (unsigned) l != l)
396 *ret_u = (unsigned) l;
400 int safe_atoi(const char *s, int *ret_i) {
408 l = strtol(s, &x, 0);
410 if (!x || x == s || *x || errno)
411 return errno > 0 ? -errno : -EINVAL;
413 if ((long) (int) l != l)
420 int safe_atou8(const char *s, uint8_t *ret) {
428 l = strtoul(s, &x, 0);
430 if (!x || x == s || *x || errno)
431 return errno > 0 ? -errno : -EINVAL;
433 if ((unsigned long) (uint8_t) l != l)
440 int safe_atou16(const char *s, uint16_t *ret) {
448 l = strtoul(s, &x, 0);
450 if (!x || x == s || *x || errno)
451 return errno > 0 ? -errno : -EINVAL;
453 if ((unsigned long) (uint16_t) l != l)
460 int safe_atoi16(const char *s, int16_t *ret) {
468 l = strtol(s, &x, 0);
470 if (!x || x == s || *x || errno)
471 return errno > 0 ? -errno : -EINVAL;
473 if ((long) (int16_t) l != l)
480 int safe_atollu(const char *s, long long unsigned *ret_llu) {
482 unsigned long long l;
488 l = strtoull(s, &x, 0);
490 if (!x || x == s || *x || errno)
491 return errno ? -errno : -EINVAL;
497 int safe_atolli(const char *s, long long int *ret_lli) {
505 l = strtoll(s, &x, 0);
507 if (!x || x == s || *x || errno)
508 return errno ? -errno : -EINVAL;
514 int safe_atod(const char *s, double *ret_d) {
522 loc = newlocale(LC_NUMERIC_MASK, "C", (locale_t) 0);
523 if (loc == (locale_t) 0)
527 d = strtod_l(s, &x, loc);
529 if (!x || x == s || *x || errno) {
531 return errno ? -errno : -EINVAL;
539 static size_t strcspn_escaped(const char *s, const char *reject) {
540 bool escaped = false;
543 for (n=0; s[n]; n++) {
546 else if (s[n] == '\\')
548 else if (strchr(reject, s[n]))
552 /* if s ends in \, return index of previous char */
556 /* Split a string into words. */
557 const char* split(const char **state, size_t *l, const char *separator, bool quoted) {
563 assert(**state == '\0');
567 current += strspn(current, separator);
573 if (quoted && strchr("\'\"", *current)) {
574 char quotechars[2] = {*current, '\0'};
576 *l = strcspn_escaped(current + 1, quotechars);
577 if (current[*l + 1] == '\0' ||
578 (current[*l + 2] && !strchr(separator, current[*l + 2]))) {
579 /* right quote missing or garbage at the end */
583 assert(current[*l + 1] == quotechars[0]);
584 *state = current++ + *l + 2;
586 *l = strcspn_escaped(current, separator);
587 if (current[*l] && !strchr(separator, current[*l])) {
588 /* unfinished escape */
592 *state = current + *l;
594 *l = strcspn(current, separator);
595 *state = current + *l;
601 int get_parent_of_pid(pid_t pid, pid_t *_ppid) {
603 _cleanup_free_ char *line = NULL;
615 p = procfs_file_alloca(pid, "stat");
616 r = read_one_line_file(p, &line);
620 /* Let's skip the pid and comm fields. The latter is enclosed
621 * in () but does not escape any () in its value, so let's
622 * skip over it manually */
624 p = strrchr(line, ')');
636 if ((long unsigned) (pid_t) ppid != ppid)
639 *_ppid = (pid_t) ppid;
644 int fchmod_umask(int fd, mode_t m) {
649 r = fchmod(fd, m & (~u)) < 0 ? -errno : 0;
655 char *truncate_nl(char *s) {
658 s[strcspn(s, NEWLINE)] = 0;
662 int get_process_state(pid_t pid) {
666 _cleanup_free_ char *line = NULL;
670 p = procfs_file_alloca(pid, "stat");
671 r = read_one_line_file(p, &line);
675 p = strrchr(line, ')');
681 if (sscanf(p, " %c", &state) != 1)
684 return (unsigned char) state;
687 int get_process_comm(pid_t pid, char **name) {
694 p = procfs_file_alloca(pid, "comm");
696 r = read_one_line_file(p, name);
703 int get_process_cmdline(pid_t pid, size_t max_length, bool comm_fallback, char **line) {
704 _cleanup_fclose_ FILE *f = NULL;
712 p = procfs_file_alloca(pid, "cmdline");
718 if (max_length == 0) {
719 size_t len = 0, allocated = 0;
721 while ((c = getc(f)) != EOF) {
723 if (!GREEDY_REALLOC(r, allocated, len+2)) {
728 r[len++] = isprint(c) ? c : ' ';
738 r = new(char, max_length);
744 while ((c = getc(f)) != EOF) {
766 size_t n = MIN(left-1, 3U);
773 /* Kernel threads have no argv[] */
775 _cleanup_free_ char *t = NULL;
783 h = get_process_comm(pid, &t);
787 r = strjoin("[", t, "]", NULL);
796 int is_kernel_thread(pid_t pid) {
808 p = procfs_file_alloca(pid, "cmdline");
813 count = fread(&c, 1, 1, f);
817 /* Kernel threads have an empty cmdline */
820 return eof ? 1 : -errno;
825 int get_process_capeff(pid_t pid, char **capeff) {
831 p = procfs_file_alloca(pid, "status");
833 return get_status_field(p, "\nCapEff:", capeff);
836 static int get_process_link_contents(const char *proc_file, char **name) {
842 r = readlink_malloc(proc_file, name);
844 return r == -ENOENT ? -ESRCH : r;
849 int get_process_exe(pid_t pid, char **name) {
856 p = procfs_file_alloca(pid, "exe");
857 r = get_process_link_contents(p, name);
861 d = endswith(*name, " (deleted)");
868 static int get_process_id(pid_t pid, const char *field, uid_t *uid) {
869 _cleanup_fclose_ FILE *f = NULL;
879 p = procfs_file_alloca(pid, "status");
884 FOREACH_LINE(line, f, return -errno) {
889 if (startswith(l, field)) {
891 l += strspn(l, WHITESPACE);
893 l[strcspn(l, WHITESPACE)] = 0;
895 return parse_uid(l, uid);
902 int get_process_uid(pid_t pid, uid_t *uid) {
903 return get_process_id(pid, "Uid:", uid);
906 int get_process_gid(pid_t pid, gid_t *gid) {
907 assert_cc(sizeof(uid_t) == sizeof(gid_t));
908 return get_process_id(pid, "Gid:", gid);
911 int get_process_cwd(pid_t pid, char **cwd) {
916 p = procfs_file_alloca(pid, "cwd");
918 return get_process_link_contents(p, cwd);
921 int get_process_root(pid_t pid, char **root) {
926 p = procfs_file_alloca(pid, "root");
928 return get_process_link_contents(p, root);
931 int get_process_environ(pid_t pid, char **env) {
932 _cleanup_fclose_ FILE *f = NULL;
933 _cleanup_free_ char *outcome = NULL;
936 size_t allocated = 0, sz = 0;
941 p = procfs_file_alloca(pid, "environ");
947 while ((c = fgetc(f)) != EOF) {
948 if (!GREEDY_REALLOC(outcome, allocated, sz + 5))
952 outcome[sz++] = '\n';
954 sz += cescape_char(c, outcome + sz);
964 char *strnappend(const char *s, const char *suffix, size_t b) {
972 return strndup(suffix, b);
981 if (b > ((size_t) -1) - a)
984 r = new(char, a+b+1);
989 memcpy(r+a, suffix, b);
995 char *strappend(const char *s, const char *suffix) {
996 return strnappend(s, suffix, suffix ? strlen(suffix) : 0);
999 int readlinkat_malloc(int fd, const char *p, char **ret) {
1014 n = readlinkat(fd, p, c, l-1);
1021 if ((size_t) n < l-1) {
1032 int readlink_malloc(const char *p, char **ret) {
1033 return readlinkat_malloc(AT_FDCWD, p, ret);
1036 int readlink_value(const char *p, char **ret) {
1037 _cleanup_free_ char *link = NULL;
1041 r = readlink_malloc(p, &link);
1045 value = basename(link);
1049 value = strdup(value);
1058 int readlink_and_make_absolute(const char *p, char **r) {
1059 _cleanup_free_ char *target = NULL;
1066 j = readlink_malloc(p, &target);
1070 k = file_in_same_dir(p, target);
1078 int readlink_and_canonicalize(const char *p, char **r) {
1085 j = readlink_and_make_absolute(p, &t);
1089 s = canonicalize_file_name(t);
1096 path_kill_slashes(*r);
1101 int reset_all_signal_handlers(void) {
1104 for (sig = 1; sig < _NSIG; sig++) {
1105 struct sigaction sa = {
1106 .sa_handler = SIG_DFL,
1107 .sa_flags = SA_RESTART,
1110 /* These two cannot be caught... */
1111 if (sig == SIGKILL || sig == SIGSTOP)
1114 /* On Linux the first two RT signals are reserved by
1115 * glibc, and sigaction() will return EINVAL for them. */
1116 if ((sigaction(sig, &sa, NULL) < 0))
1117 if (errno != EINVAL && r == 0)
1124 int reset_signal_mask(void) {
1127 if (sigemptyset(&ss) < 0)
1130 if (sigprocmask(SIG_SETMASK, &ss, NULL) < 0)
1136 char *strstrip(char *s) {
1139 /* Drops leading and trailing whitespace. Modifies the string in
1140 * place. Returns pointer to first non-space character */
1142 s += strspn(s, WHITESPACE);
1144 for (e = strchr(s, 0); e > s; e --)
1145 if (!strchr(WHITESPACE, e[-1]))
1153 char *delete_chars(char *s, const char *bad) {
1156 /* Drops all characters listed in bad, regardless where in the string */
1158 for (f = s, t = s; *f; f++) {
1159 if (strchr(bad, *f))
1170 char *file_in_same_dir(const char *path, const char *filename) {
1177 /* This removes the last component of path and appends
1178 * filename, unless the latter is absolute anyway or the
1181 if (path_is_absolute(filename))
1182 return strdup(filename);
1184 e = strrchr(path, '/');
1186 return strdup(filename);
1188 k = strlen(filename);
1189 ret = new(char, (e + 1 - path) + k + 1);
1193 memcpy(mempcpy(ret, path, e + 1 - path), filename, k + 1);
1197 int rmdir_parents(const char *path, const char *stop) {
1206 /* Skip trailing slashes */
1207 while (l > 0 && path[l-1] == '/')
1213 /* Skip last component */
1214 while (l > 0 && path[l-1] != '/')
1217 /* Skip trailing slashes */
1218 while (l > 0 && path[l-1] == '/')
1224 if (!(t = strndup(path, l)))
1227 if (path_startswith(stop, t)) {
1236 if (errno != ENOENT)
1243 char hexchar(int x) {
1244 static const char table[16] = "0123456789abcdef";
1246 return table[x & 15];
1249 int unhexchar(char c) {
1251 if (c >= '0' && c <= '9')
1254 if (c >= 'a' && c <= 'f')
1255 return c - 'a' + 10;
1257 if (c >= 'A' && c <= 'F')
1258 return c - 'A' + 10;
1263 char *hexmem(const void *p, size_t l) {
1267 z = r = malloc(l * 2 + 1);
1271 for (x = p; x < (const uint8_t*) p + l; x++) {
1272 *(z++) = hexchar(*x >> 4);
1273 *(z++) = hexchar(*x & 15);
1280 void *unhexmem(const char *p, size_t l) {
1286 z = r = malloc((l + 1) / 2 + 1);
1290 for (x = p; x < p + l; x += 2) {
1293 a = unhexchar(x[0]);
1295 b = unhexchar(x[1]);
1299 *(z++) = (uint8_t) a << 4 | (uint8_t) b;
1306 char octchar(int x) {
1307 return '0' + (x & 7);
1310 int unoctchar(char c) {
1312 if (c >= '0' && c <= '7')
1318 char decchar(int x) {
1319 return '0' + (x % 10);
1322 int undecchar(char c) {
1324 if (c >= '0' && c <= '9')
1330 char *cescape(const char *s) {
1336 /* Does C style string escaping. */
1338 r = new(char, strlen(s)*4 + 1);
1342 for (f = s, t = r; *f; f++)
1343 t += cescape_char(*f, t);
1350 char *cunescape_length_with_prefix(const char *s, size_t length, const char *prefix) {
1357 /* Undoes C style string escaping, and optionally prefixes it. */
1359 pl = prefix ? strlen(prefix) : 0;
1361 r = new(char, pl+length+1);
1366 memcpy(r, prefix, pl);
1368 for (f = s, t = r + pl; f < s + length; f++) {
1369 size_t remaining = s + length - f;
1370 assert(remaining > 0);
1372 if (*f != '\\') { /* a literal literal */
1377 if (--remaining == 0) { /* copy trailing backslash verbatim */
1418 /* This is an extension of the XDG syntax files */
1423 /* hexadecimal encoding */
1426 if (remaining >= 2) {
1427 a = unhexchar(f[1]);
1428 b = unhexchar(f[2]);
1431 if (a < 0 || b < 0 || (a == 0 && b == 0)) {
1432 /* Invalid escape code, let's take it literal then */
1436 *(t++) = (char) ((a << 4) | b);
1451 /* octal encoding */
1452 int a = -1, b = -1, c = -1;
1454 if (remaining >= 3) {
1455 a = unoctchar(f[0]);
1456 b = unoctchar(f[1]);
1457 c = unoctchar(f[2]);
1460 if (a < 0 || b < 0 || c < 0 || (a == 0 && b == 0 && c == 0)) {
1461 /* Invalid escape code, let's take it literal then */
1465 *(t++) = (char) ((a << 6) | (b << 3) | c);
1473 /* Invalid escape code, let's take it literal then */
1484 char *cunescape_length(const char *s, size_t length) {
1485 return cunescape_length_with_prefix(s, length, NULL);
1488 char *cunescape(const char *s) {
1491 return cunescape_length(s, strlen(s));
1494 char *xescape(const char *s, const char *bad) {
1498 /* Escapes all chars in bad, in addition to \ and all special
1499 * chars, in \xFF style escaping. May be reversed with
1502 r = new(char, strlen(s) * 4 + 1);
1506 for (f = s, t = r; *f; f++) {
1508 if ((*f < ' ') || (*f >= 127) ||
1509 (*f == '\\') || strchr(bad, *f)) {
1512 *(t++) = hexchar(*f >> 4);
1513 *(t++) = hexchar(*f);
1523 char *ascii_strlower(char *t) {
1528 for (p = t; *p; p++)
1529 if (*p >= 'A' && *p <= 'Z')
1530 *p = *p - 'A' + 'a';
1535 _pure_ static bool hidden_file_allow_backup(const char *filename) {
1539 filename[0] == '.' ||
1540 streq(filename, "lost+found") ||
1541 streq(filename, "aquota.user") ||
1542 streq(filename, "aquota.group") ||
1543 endswith(filename, ".rpmnew") ||
1544 endswith(filename, ".rpmsave") ||
1545 endswith(filename, ".rpmorig") ||
1546 endswith(filename, ".dpkg-old") ||
1547 endswith(filename, ".dpkg-new") ||
1548 endswith(filename, ".dpkg-tmp") ||
1549 endswith(filename, ".dpkg-dist") ||
1550 endswith(filename, ".dpkg-bak") ||
1551 endswith(filename, ".dpkg-backup") ||
1552 endswith(filename, ".dpkg-remove") ||
1553 endswith(filename, ".swp");
1556 bool hidden_file(const char *filename) {
1559 if (endswith(filename, "~"))
1562 return hidden_file_allow_backup(filename);
1565 int fd_nonblock(int fd, bool nonblock) {
1570 flags = fcntl(fd, F_GETFL, 0);
1575 nflags = flags | O_NONBLOCK;
1577 nflags = flags & ~O_NONBLOCK;
1579 if (nflags == flags)
1582 if (fcntl(fd, F_SETFL, nflags) < 0)
1588 int fd_cloexec(int fd, bool cloexec) {
1593 flags = fcntl(fd, F_GETFD, 0);
1598 nflags = flags | FD_CLOEXEC;
1600 nflags = flags & ~FD_CLOEXEC;
1602 if (nflags == flags)
1605 if (fcntl(fd, F_SETFD, nflags) < 0)
1611 _pure_ static bool fd_in_set(int fd, const int fdset[], unsigned n_fdset) {
1614 assert(n_fdset == 0 || fdset);
1616 for (i = 0; i < n_fdset; i++)
1623 int close_all_fds(const int except[], unsigned n_except) {
1624 _cleanup_closedir_ DIR *d = NULL;
1628 assert(n_except == 0 || except);
1630 d = opendir("/proc/self/fd");
1635 /* When /proc isn't available (for example in chroots)
1636 * the fallback is brute forcing through the fd
1639 assert_se(getrlimit(RLIMIT_NOFILE, &rl) >= 0);
1640 for (fd = 3; fd < (int) rl.rlim_max; fd ++) {
1642 if (fd_in_set(fd, except, n_except))
1645 if (close_nointr(fd) < 0)
1646 if (errno != EBADF && r == 0)
1653 while ((de = readdir(d))) {
1656 if (hidden_file(de->d_name))
1659 if (safe_atoi(de->d_name, &fd) < 0)
1660 /* Let's better ignore this, just in case */
1669 if (fd_in_set(fd, except, n_except))
1672 if (close_nointr(fd) < 0) {
1673 /* Valgrind has its own FD and doesn't want to have it closed */
1674 if (errno != EBADF && r == 0)
1682 bool chars_intersect(const char *a, const char *b) {
1685 /* Returns true if any of the chars in a are in b. */
1686 for (p = a; *p; p++)
1693 bool fstype_is_network(const char *fstype) {
1694 static const char table[] =
1709 x = startswith(fstype, "fuse.");
1713 return nulstr_contains(table, fstype);
1716 bool fstype_is_deviceless(const char *fstype) {
1717 static const char table[] =
1741 return !isempty(fstype) && (
1742 nulstr_contains(table, fstype) || fstype_is_network(fstype));
1746 _cleanup_close_ int fd;
1748 fd = open_terminal("/dev/tty0", O_RDWR|O_NOCTTY|O_CLOEXEC);
1754 TIOCL_GETKMSGREDIRECT,
1758 if (ioctl(fd, TIOCLINUX, tiocl) < 0)
1761 vt = tiocl[0] <= 0 ? 1 : tiocl[0];
1764 if (ioctl(fd, VT_ACTIVATE, vt) < 0)
1770 int read_one_char(FILE *f, char *ret, usec_t t, bool *need_nl) {
1771 struct termios old_termios, new_termios;
1772 char c, line[LINE_MAX];
1777 if (tcgetattr(fileno(f), &old_termios) >= 0) {
1778 new_termios = old_termios;
1780 new_termios.c_lflag &= ~ICANON;
1781 new_termios.c_cc[VMIN] = 1;
1782 new_termios.c_cc[VTIME] = 0;
1784 if (tcsetattr(fileno(f), TCSADRAIN, &new_termios) >= 0) {
1787 if (t != USEC_INFINITY) {
1788 if (fd_wait_for_event(fileno(f), POLLIN, t) <= 0) {
1789 tcsetattr(fileno(f), TCSADRAIN, &old_termios);
1794 k = fread(&c, 1, 1, f);
1796 tcsetattr(fileno(f), TCSADRAIN, &old_termios);
1802 *need_nl = c != '\n';
1809 if (t != USEC_INFINITY) {
1810 if (fd_wait_for_event(fileno(f), POLLIN, t) <= 0)
1815 if (!fgets(line, sizeof(line), f))
1816 return errno ? -errno : -EIO;
1820 if (strlen(line) != 1)
1830 int ask_char(char *ret, const char *replies, const char *text, ...) {
1840 bool need_nl = true;
1843 fputs(ANSI_HIGHLIGHT_ON, stdout);
1850 fputs(ANSI_HIGHLIGHT_OFF, stdout);
1854 r = read_one_char(stdin, &c, USEC_INFINITY, &need_nl);
1857 if (r == -EBADMSG) {
1858 puts("Bad input, please try again.");
1869 if (strchr(replies, c)) {
1874 puts("Read unexpected character, please try again.");
1878 int ask_string(char **ret, const char *text, ...) {
1883 char line[LINE_MAX];
1887 fputs(ANSI_HIGHLIGHT_ON, stdout);
1894 fputs(ANSI_HIGHLIGHT_OFF, stdout);
1899 if (!fgets(line, sizeof(line), stdin))
1900 return errno ? -errno : -EIO;
1902 if (!endswith(line, "\n"))
/* Resets the terminal behind fd to sane defaults: issues the TIOCNXCL,
 * KDSETMODE and KDSKBMODE ioctls, rewrites the termios input/output/control/
 * local flags and the control characters, applies them with
 * tcsetattr(TCSANOW) and finally flushes pending I/O with tcflush().
 * NOTE(review): parts of this function are not visible here; how
 * switch_to_text gates the KDSETMODE call and which value is returned
 * should be confirmed against the full source. */
1921 int reset_terminal_fd(int fd, bool switch_to_text) {
1922 struct termios termios;
1925 /* Set terminal to some sane defaults */
1929 /* We leave locked terminal attributes untouched, so that
1930 * Plymouth may set whatever it wants to set, and we don't
1931 * interfere with that. */
1933 /* Disable exclusive mode, just in case */
1934 ioctl(fd, TIOCNXCL);
1936 /* Switch to text mode */
1938 ioctl(fd, KDSETMODE, KD_TEXT);
1940 /* Enable console unicode mode */
1941 ioctl(fd, KDSKBMODE, K_UNICODE);
1943 if (tcgetattr(fd, &termios) < 0) {
1948 /* We only reset the stuff that matters to the software. How
1949 * hardware is set up we don't touch assuming that somebody
1950 * else will do that for us */
1952 termios.c_iflag &= ~(IGNBRK | BRKINT | ISTRIP | INLCR | IGNCR | IUCLC);
1953 termios.c_iflag |= ICRNL | IMAXBEL | IUTF8;
1954 termios.c_oflag |= ONLCR;
1955 termios.c_cflag |= CREAD;
1956 termios.c_lflag = ISIG | ICANON | IEXTEN | ECHO | ECHOE | ECHOK | ECHOCTL | ECHOPRT | ECHOKE;
1958 termios.c_cc[VINTR] = 03; /* ^C */
1959 termios.c_cc[VQUIT] = 034; /* ^\ */
1960 termios.c_cc[VERASE] = 0177; /* ^? (DEL) */
1961 termios.c_cc[VKILL] = 025; /* ^U */
1962 termios.c_cc[VEOF] = 04; /* ^D */
1963 termios.c_cc[VSTART] = 021; /* ^Q */
1964 termios.c_cc[VSTOP] = 023; /* ^S */
1965 termios.c_cc[VSUSP] = 032; /* ^Z */
1966 termios.c_cc[VLNEXT] = 026; /* ^V */
1967 termios.c_cc[VWERASE] = 027; /* ^W */
1968 termios.c_cc[VREPRINT] = 022; /* ^R */
1969 termios.c_cc[VEOL] = 0;
1970 termios.c_cc[VEOL2] = 0;
1972 termios.c_cc[VTIME] = 0;
1973 termios.c_cc[VMIN] = 1;
1975 if (tcsetattr(fd, TCSANOW, &termios) < 0)
1979 /* Just in case, flush all crap out */
1980 tcflush(fd, TCIOFLUSH);
1985 int reset_terminal(const char *name) {
1986 _cleanup_close_ int fd = -1;
1988 fd = open_terminal(name, O_RDWR|O_NOCTTY|O_CLOEXEC);
1992 return reset_terminal_fd(fd, true);
1995 int open_terminal(const char *name, int mode) {
2000 * If a TTY is in the process of being closed opening it might
2001 * cause EIO. This is horribly awful, but unlikely to be
2002 * changed in the kernel. Hence we work around this problem by
2003 * retrying a couple of times.
2005 * https://bugs.launchpad.net/ubuntu/+source/linux/+bug/554172/comments/245
2008 assert(!(mode & O_CREAT));
2011 fd = open(name, mode, 0);
2018 /* Max 1s in total */
2022 usleep(50 * USEC_PER_MSEC);
2040 int flush_fd(int fd) {
2041 struct pollfd pollfd = {
2051 r = poll(&pollfd, 1, 0);
2061 l = read(fd, buf, sizeof(buf));
2067 if (errno == EAGAIN)
2076 int acquire_terminal(
2080 bool ignore_tiocstty_eperm,
2083 int fd = -1, notify = -1, r = 0, wd = -1;
2088 /* We use inotify to be notified when the tty is closed. We
2089 * create the watch before checking if we can actually acquire
2090 * it, so that we don't lose any event.
2092 * Note: strictly speaking this actually watches for the
2093 * device being closed, it does *not* really watch whether a
2094 * tty loses its controlling process. However, unless some
2095 * rogue process uses TIOCNOTTY on /dev/tty *after* closing
2096 * its tty otherwise this will not become a problem. As long
2097 * as the administrator makes sure not to configure any service
2098 * on the same tty as an untrusted user this should not be a
2099 * problem. (Which he probably should not do anyway.) */
2101 if (timeout != USEC_INFINITY)
2102 ts = now(CLOCK_MONOTONIC);
2104 if (!fail && !force) {
2105 notify = inotify_init1(IN_CLOEXEC | (timeout != USEC_INFINITY ? IN_NONBLOCK : 0));
2111 wd = inotify_add_watch(notify, name, IN_CLOSE);
2119 struct sigaction sa_old, sa_new = {
2120 .sa_handler = SIG_IGN,
2121 .sa_flags = SA_RESTART,
2125 r = flush_fd(notify);
2130 /* We pass here O_NOCTTY only so that we can check the return
2131 * value of TIOCSCTTY and have a reliable way to figure out if we
2132 * successfully became the controlling process of the tty */
2133 fd = open_terminal(name, O_RDWR|O_NOCTTY|O_CLOEXEC);
2137 /* Temporarily ignore SIGHUP, so that we don't get SIGHUP'ed
2138 * if we already own the tty. */
2139 assert_se(sigaction(SIGHUP, &sa_new, &sa_old) == 0);
2141 /* First, try to get the tty */
2142 if (ioctl(fd, TIOCSCTTY, force) < 0)
2145 assert_se(sigaction(SIGHUP, &sa_old, NULL) == 0);
2147 /* Sometimes it makes sense to ignore TIOCSCTTY
2148 * returning EPERM, i.e. when very likely we already
2149 * have this controlling terminal. */
2150 if (r < 0 && r == -EPERM && ignore_tiocstty_eperm)
2153 if (r < 0 && (force || fail || r != -EPERM)) {
2162 assert(notify >= 0);
2165 union inotify_event_buffer buffer;
2166 struct inotify_event *e;
2169 if (timeout != USEC_INFINITY) {
2172 n = now(CLOCK_MONOTONIC);
2173 if (ts + timeout < n) {
2178 r = fd_wait_for_event(fd, POLLIN, ts + timeout - n);
2188 l = read(notify, &buffer, sizeof(buffer));
2190 if (errno == EINTR || errno == EAGAIN)
2197 FOREACH_INOTIFY_EVENT(e, buffer, l) {
2198 if (e->wd != wd || !(e->mask & IN_CLOSE)) {
2207 /* We close the tty fd here since if the old session
2208 * ended our handle will be dead. It's important that
2209 * we do this after sleeping, so that we don't enter
2210 * an endless loop. */
2211 fd = safe_close(fd);
2216 r = reset_terminal_fd(fd, true);
2218 log_warning_errno(r, "Failed to reset terminal: %m");
2229 int release_terminal(void) {
2230 static const struct sigaction sa_new = {
2231 .sa_handler = SIG_IGN,
2232 .sa_flags = SA_RESTART,
2235 _cleanup_close_ int fd = -1;
2236 struct sigaction sa_old;
2239 fd = open("/dev/tty", O_RDWR|O_NOCTTY|O_NDELAY|O_CLOEXEC);
2243 /* Temporarily ignore SIGHUP, so that we don't get SIGHUP'ed
2244 * by our own TIOCNOTTY */
2245 assert_se(sigaction(SIGHUP, &sa_new, &sa_old) == 0);
2247 if (ioctl(fd, TIOCNOTTY) < 0)
2250 assert_se(sigaction(SIGHUP, &sa_old, NULL) == 0);
2255 int sigaction_many(const struct sigaction *sa, ...) {
2260 while ((sig = va_arg(ap, int)) > 0)
2261 if (sigaction(sig, sa, NULL) < 0)
2268 int ignore_signals(int sig, ...) {
2269 struct sigaction sa = {
2270 .sa_handler = SIG_IGN,
2271 .sa_flags = SA_RESTART,
2276 if (sigaction(sig, &sa, NULL) < 0)
2280 while ((sig = va_arg(ap, int)) > 0)
2281 if (sigaction(sig, &sa, NULL) < 0)
2288 int default_signals(int sig, ...) {
2289 struct sigaction sa = {
2290 .sa_handler = SIG_DFL,
2291 .sa_flags = SA_RESTART,
2296 if (sigaction(sig, &sa, NULL) < 0)
2300 while ((sig = va_arg(ap, int)) > 0)
2301 if (sigaction(sig, &sa, NULL) < 0)
2308 void safe_close_pair(int p[]) {
2312 /* Special case pairs which use the same fd in both
2314 p[0] = p[1] = safe_close(p[0]);
2318 p[0] = safe_close(p[0]);
2319 p[1] = safe_close(p[1]);
2322 ssize_t loop_read(int fd, void *buf, size_t nbytes, bool do_poll) {
2329 while (nbytes > 0) {
2332 k = read(fd, p, nbytes);
2337 if (errno == EAGAIN && do_poll) {
2339 /* We knowingly ignore any return value here,
2340 * and expect that any error/EOF is reported
2343 fd_wait_for_event(fd, POLLIN, USEC_INFINITY);
2347 return n > 0 ? n : -errno;
2361 int loop_read_exact(int fd, void *buf, size_t nbytes, bool do_poll) {
2364 n = loop_read(fd, buf, nbytes, do_poll);
2367 if ((size_t) n != nbytes)
2372 int loop_write(int fd, const void *buf, size_t nbytes, bool do_poll) {
2373 const uint8_t *p = buf;
2380 while (nbytes > 0) {
2383 k = write(fd, p, nbytes);
2388 if (errno == EAGAIN && do_poll) {
2389 /* We knowingly ignore any return value here,
2390 * and expect that any error/EOF is reported
2393 fd_wait_for_event(fd, POLLOUT, USEC_INFINITY);
2400 if (k == 0) /* Can't really happen */
2410 int parse_size(const char *t, off_t base, off_t *size) {
2412 /* So, sometimes we want to parse IEC binary suffixes, and
2413 * sometimes SI decimal suffixes. This function can parse
2414 * both. Which one is the right way depends on the
2415 * context. Wikipedia suggests that SI is customary for
2416 * hardware metrics and network speeds, while IEC is
2417 * customary for most data sizes used by software and volatile
2418 * (RAM) memory. Hence be careful which one you pick!
2420 * In either case we use just K, M, G as suffix, and not Ki,
2421 * Mi, Gi or so (as IEC would suggest). That's because that's
2422 * frickin' ugly. But this means you really need to make sure
2423 * to document which base you are parsing when you use this
2428 unsigned long long factor;
2431 static const struct table iec[] = {
2432 { "E", 1024ULL*1024ULL*1024ULL*1024ULL*1024ULL*1024ULL },
2433 { "P", 1024ULL*1024ULL*1024ULL*1024ULL*1024ULL },
2434 { "T", 1024ULL*1024ULL*1024ULL*1024ULL },
2435 { "G", 1024ULL*1024ULL*1024ULL },
2436 { "M", 1024ULL*1024ULL },
2442 static const struct table si[] = {
2443 { "E", 1000ULL*1000ULL*1000ULL*1000ULL*1000ULL*1000ULL },
2444 { "P", 1000ULL*1000ULL*1000ULL*1000ULL*1000ULL },
2445 { "T", 1000ULL*1000ULL*1000ULL*1000ULL },
2446 { "G", 1000ULL*1000ULL*1000ULL },
2447 { "M", 1000ULL*1000ULL },
2453 const struct table *table;
2455 unsigned long long r = 0;
2456 unsigned n_entries, start_pos = 0;
2459 assert(base == 1000 || base == 1024);
2464 n_entries = ELEMENTSOF(si);
2467 n_entries = ELEMENTSOF(iec);
2473 unsigned long long l2;
2479 l = strtoll(p, &e, 10);
2492 if (*e >= '0' && *e <= '9') {
2495 /* strtoull itself would accept space/+/- */
2496 l2 = strtoull(e, &e2, 10);
2498 if (errno == ERANGE)
2501 /* Ignore failure. E.g. 10.M is valid */
2508 e += strspn(e, WHITESPACE);
2510 for (i = start_pos; i < n_entries; i++)
2511 if (startswith(e, table[i].suffix)) {
2512 unsigned long long tmp;
2513 if ((unsigned long long) l + (frac > 0) > ULLONG_MAX / table[i].factor)
2515 tmp = l * table[i].factor + (unsigned long long) (frac * table[i].factor);
2516 if (tmp > ULLONG_MAX - r)
2520 if ((unsigned long long) (off_t) r != r)
2523 p = e + strlen(table[i].suffix);
2539 int make_stdio(int fd) {
2544 r = dup2(fd, STDIN_FILENO);
2545 s = dup2(fd, STDOUT_FILENO);
2546 t = dup2(fd, STDERR_FILENO);
2551 if (r < 0 || s < 0 || t < 0)
2554 /* Explicitly unset O_CLOEXEC, since if fd was < 3, then
2555 * dup2() was a NOP and the bit hence possibly set. */
2556 fd_cloexec(STDIN_FILENO, false);
2557 fd_cloexec(STDOUT_FILENO, false);
2558 fd_cloexec(STDERR_FILENO, false);
2563 int make_null_stdio(void) {
2566 null_fd = open("/dev/null", O_RDWR|O_NOCTTY);
2570 return make_stdio(null_fd);
2573 bool is_device_path(const char *path) {
2575 /* Returns true on paths that refer to a device, either in
2576 * sysfs or in /dev */
2579 path_startswith(path, "/dev/") ||
2580 path_startswith(path, "/sys/");
2583 int dir_is_empty(const char *path) {
2584 _cleanup_closedir_ DIR *d;
2595 if (!de && errno != 0)
2601 if (!hidden_file(de->d_name))
2606 char* dirname_malloc(const char *path) {
2607 char *d, *dir, *dir2;
/* Fills the n bytes at p with kernel randomness: tries getrandom() with
 * GRND_NONBLOCK first and otherwise reads from /dev/urandom via
 * loop_read_exact(). have_syscall caches across calls whether getrandom()
 * is known to be missing (0) or usable.
 * NOTE(review): several lines of this function are not visible here; the
 * exact success return value should be confirmed against the full source. */
2624 int dev_urandom(void *p, size_t n) {
2625 static int have_syscall = -1;
2627 _cleanup_close_ int fd = -1;
2630 /* Gathers some randomness from the kernel. This call will
2631 * never block, and will always return some data from the
2632 * kernel, regardless if the random pool is fully initialized
2633 * or not. It thus makes no guarantee for the quality of the
2634 * returned entropy, but is good enough for our usual use cases
2635 * of seeding the hash functions for hashtables */
2637 /* Use the getrandom() syscall unless we know we don't have
2638 * it, or when the requested size is too large for it. */
/* NOTE(review): the condition below also takes the getrandom() path when n
 * does NOT fit into an int ("|| ... != n"), which is the opposite of what
 * the comment above describes. Presumably it should read
 * "have_syscall != 0 && (size_t) (int) n == n" -- confirm and fix. */
2639 if (have_syscall != 0 || (size_t) (int) n != n) {
2640 r = getrandom(p, n, GRND_NONBLOCK);
2642 have_syscall = true;
2647 if (errno == ENOSYS)
2648 /* we lack the syscall, continue with
2649 * reading from /dev/urandom */
2650 have_syscall = false;
2651 else if (errno == EAGAIN)
2652 /* not enough entropy for now. Let's
2653 * remember to use the syscall the
2654 * next time, again, but also read
2655 * from /dev/urandom for now, which
2656 * doesn't care about the current
2657 * amount of entropy. */
2658 have_syscall = true;
2662 /* too short read? */
2666 fd = open("/dev/urandom", O_RDONLY|O_CLOEXEC|O_NOCTTY);
/* A missing /dev/urandom node (ENOENT) is reported as -ENOSYS, any other
 * errno is passed through negated. */
2668 return errno == ENOENT ? -ENOSYS : -errno;
2670 return loop_read_exact(fd, p, n, true);
/* Prepares a seed for the libc pseudo-random generator and records in
 * the static srand_called flag that this has happened. The seed x is
 * XOR-mixed from the first unsigned of the AT_RANDOM auxv data (only
 * with HAVE_SYS_AUXV_H), the realtime clock and the thread id. The
 * seeding call itself and the early-exit check are not visible in this
 * excerpt. */
2673 void initialize_srand(void) {
2674 static bool srand_called = false;
2676 #ifdef HAVE_SYS_AUXV_H
2685 #ifdef HAVE_SYS_AUXV_H
2686 /* The kernel provides us with a bit of entropy in auxv, so
2687 * let's try to make use of that to seed the pseudo-random
2688 * generator. It's better than nothing... */
2690 auxv = (void*) getauxval(AT_RANDOM);
2692 x ^= *(unsigned*) auxv;
2695 x ^= (unsigned) now(CLOCK_REALTIME);
2696 x ^= (unsigned) gettid();
2699 srand_called = true;
/* Fills the n bytes at p with random data. dev_urandom() is tried
 * first; the fallback announced by the comment below walks the buffer
 * one byte at a time (the per-byte assignment is not visible in this
 * excerpt). */
2702 void random_bytes(void *p, size_t n) {
2706 r = dev_urandom(p, n);
2710 /* If some idiot made /dev/urandom unavailable to us, he'll
2711 * get a PRNG instead. */
2715 for (q = p; q < (uint8_t*) p + n; q ++)
2719 void rename_process(const char name[8]) {
2722 /* This is like a poor man's setproctitle(). It changes the
2723 * comm field, argv[0], and also the glibc's internally used
2724 * name of the process. For the first one a limit of 16 chars
2725 * applies, to the second one usually one of 10 (i.e. length
2726 * of "/sbin/init"), to the third one one of 7 (i.e. length of
2727 * "systemd"). If you pass a longer string it will be
2730 prctl(PR_SET_NAME, name);
2732 if (program_invocation_name)
2733 strncpy(program_invocation_name, name, strlen(program_invocation_name));
2735 if (saved_argc > 0) {
2739 strncpy(saved_argv[0], name, strlen(saved_argv[0]));
2741 for (i = 1; i < saved_argc; i++) {
2745 memzero(saved_argv[i], strlen(saved_argv[i]));
/* Adds each signal number from the variadic list to *ss. Reading stops
 * at the first argument that is <= 0, so the list must end with such a
 * value. A failing sigaddset() trips assert_se(). */
2750 void sigset_add_many(sigset_t *ss, ...) {
2757 while ((sig = va_arg(ap, int)) > 0)
2758 assert_se(sigaddset(ss, sig) == 0);
/* Builds a signal set from the variadic list (terminated by a value
 * <= 0) starting from an empty set, and applies it with
 * sigprocmask(how, ...). The previous mask is not retrieved (NULL is
 * passed as old set). */
2762 int sigprocmask_many(int how, ...) {
2767 assert_se(sigemptyset(&ss) == 0);
2770 while ((sig = va_arg(ap, int)) > 0)
2771 assert_se(sigaddset(&ss, sig) == 0);
2774 if (sigprocmask(how, &ss, NULL) < 0)
/* Returns a strdup()ed copy of the node name reported by uname(). If
 * that name is empty or the literal "(none)", a copy of the sysname is
 * returned instead. The result may be NULL if strdup() fails; the
 * caller owns the returned string. */
2780 char* gethostname_malloc(void) {
2783 assert_se(uname(&u) >= 0);
2785 if (!isempty(u.nodename) && !streq(u.nodename, "(none)"))
2786 return strdup(u.nodename);
2788 return strdup(u.sysname);
/* True if uname() reports a node name that is neither empty nor the
 * literal "(none)". */
2791 bool hostname_is_set(void) {
2794 assert_se(uname(&u) >= 0);
2796 return !isempty(u.nodename) && !streq(u.nodename, "(none)");
/* Maps uid to a newly allocated string. Visible paths: a shortcut that
 * returns "root" without any lookup (its condition is not visible in
 * this excerpt; presumably uid 0), the pw_name found by getpwuid_r()
 * using a heap buffer sized from sysconf(_SC_GETPW_R_SIZE_MAX), and
 * otherwise the uid formatted with UID_FMT. */
2799 char *lookup_uid(uid_t uid) {
2802 _cleanup_free_ char *buf = NULL;
2803 struct passwd pwbuf, *pw = NULL;
2805 /* Shortcut things to avoid NSS lookups */
2807 return strdup("root");
2809 bufsize = sysconf(_SC_GETPW_R_SIZE_MAX);
2813 buf = malloc(bufsize);
2817 if (getpwuid_r(uid, &pwbuf, buf, bufsize, &pw) == 0 && pw)
2818 return strdup(pw->pw_name);
2820 if (asprintf(&name, UID_FMT, uid) < 0)
/* Returns the name for a uid via lookup_uid(). When stdin is a tty and
 * fstat() on it succeeds, the stat result takes part in choosing that
 * uid (presumably the tty owner; the assignments are not visible in
 * this excerpt). */
2826 char* getlogname_malloc(void) {
2830 if (isatty(STDIN_FILENO) && fstat(STDIN_FILENO, &st) >= 0)
2835 return lookup_uid(uid);
/* Visible path: returns lookup_uid() for the real uid of the calling
 * process. Lines between the signature and this return are not shown
 * in this excerpt. */
2838 char *getusername_malloc(void) {
2845 return lookup_uid(getuid());
/* Determines the tty name of fd with ttyname_r() and duplicates it,
 * dropping a leading "/dev/" if present. The copy is presumably handed
 * back through *ret (the assignment is not visible in this excerpt). */
2848 int getttyname_malloc(int fd, char **ret) {
2858 r = ttyname_r(fd, path, sizeof(path));
2863 p = startswith(path, "/dev/");
2864 c = strdup(p ?: path);
/* Like getttyname_malloc(), but if the name obtained is just "tty",
 * the terminal is resolved with get_ctty(0, NULL, r) instead. */
2881 int getttyname_harder(int fd, char **r) {
2885 k = getttyname_malloc(fd, &s);
2889 if (streq(s, "tty")) {
2891 return get_ctty(0, NULL, r);
/* Reads the single-line "stat" file of pid from procfs and parses
 * fields located after the last ')' in that line, among them the tty
 * number. A tty number whose major and minor are both 0 is handled as
 * a special case (presumably "no controlling terminal"; the return is
 * not visible in this excerpt). */
2898 int get_ctty_devnr(pid_t pid, dev_t *d) {
2900 _cleanup_free_ char *line = NULL;
2902 unsigned long ttynr;
2906 p = procfs_file_alloca(pid, "stat");
2907 r = read_one_line_file(p, &line);
2911 p = strrchr(line, ')');
2921 "%*d " /* session */
2926 if (major(ttynr) == 0 && minor(ttynr) == 0)
/* Resolves the controlling terminal of pid: obtains its device number
 * with get_ctty_devnr(), then reads the "/dev/char/MAJOR:MINOR"
 * symlink. For major 136 a "pts/MINOR" name is synthesized instead of
 * relying on the symlink. The link target is later examined for a
 * "/dev/" or "../" prefix (the handling is not visible in this
 * excerpt). fn is sized for the fixed prefix plus two decimal unsigned
 * values, the ':' separator and the terminating NUL. */
2935 int get_ctty(pid_t pid, dev_t *_devnr, char **r) {
2936 char fn[sizeof("/dev/char/")-1 + 2*DECIMAL_STR_MAX(unsigned) + 1 + 1], *b = NULL;
2937 _cleanup_free_ char *s = NULL;
2944 k = get_ctty_devnr(pid, &devnr);
2948 sprintf(fn, "/dev/char/%u:%u", major(devnr), minor(devnr));
2950 k = readlink_malloc(fn, &s);
2956 /* This is an ugly hack */
2957 if (major(devnr) == 136) {
2958 if (asprintf(&b, "pts/%u", minor(devnr)) < 0)
2961 /* Probably something like the ptys which have no
2962 * symlink in /dev/char. Let's return something
2963 * vaguely useful. */
2970 if (startswith(s, "/dev/"))
2972 else if (startswith(s, "../"))
/* Recursively removes the entries of the directory referred to by fd.
 *
 * only_dirs:     non-directory entries are only unlinked when this is
 *                false.
 * honour_sticky: passed down unchanged on recursion; together with the
 *                ownership/sticky-bit test below it feeds keep_around
 *                (the start of that expression is not visible in this
 *                excerpt).
 * root_dev:      if non-NULL, directory entries are stat'ed and a
 *                subdirectory whose st_dev differs from
 *                root_dev->st_dev is treated specially (presumably
 *                skipped).
 *
 * "." and ".." are always skipped. ENOENT from fstatat(), openat() and
 * unlinkat() is never recorded as an error. Only the first error is
 * kept in ret. */
2989 int rm_rf_children_dangerous(int fd, bool only_dirs, bool honour_sticky, struct stat *root_dev) {
2990 _cleanup_closedir_ DIR *d = NULL;
2995 /* This returns the first error we run into, but nevertheless
2996 * tries to go on. This closes the passed fd. */
3002 return errno == ENOENT ? 0 : -errno;
3007 bool is_dir, keep_around;
3014 if (errno != 0 && ret == 0)
3019 if (streq(de->d_name, ".") || streq(de->d_name, ".."))
3022 if (de->d_type == DT_UNKNOWN ||
3024 (de->d_type == DT_DIR && root_dev)) {
3025 if (fstatat(fd, de->d_name, &st, AT_SYMLINK_NOFOLLOW) < 0) {
3026 if (ret == 0 && errno != ENOENT)
3031 is_dir = S_ISDIR(st.st_mode);
3034 (st.st_uid == 0 || st.st_uid == getuid()) &&
3035 (st.st_mode & S_ISVTX);
3037 is_dir = de->d_type == DT_DIR;
3038 keep_around = false;
3044 /* if root_dev is set, remove subdirectories only, if device is same as dir */
3045 if (root_dev && st.st_dev != root_dev->st_dev)
3048 subdir_fd = openat(fd, de->d_name,
3049 O_RDONLY|O_NONBLOCK|O_DIRECTORY|O_CLOEXEC|O_NOFOLLOW|O_NOATIME);
3050 if (subdir_fd < 0) {
3051 if (ret == 0 && errno != ENOENT)
3056 r = rm_rf_children_dangerous(subdir_fd, only_dirs, honour_sticky, root_dev);
3057 if (r < 0 && ret == 0)
3061 if (unlinkat(fd, de->d_name, AT_REMOVEDIR) < 0) {
3062 if (ret == 0 && errno != ENOENT)
3066 } else if (!only_dirs && !keep_around) {
3068 if (unlinkat(fd, de->d_name, 0) < 0) {
3069 if (ret == 0 && errno != ENOENT)
/* Non-zero if the f_type in *s equals TMPFS_MAGIC or RAMFS_MAGIC. */
3076 _pure_ static int is_temporary_fs(struct statfs *s) {
3079 return F_TYPE_EQUAL(s->f_type, TMPFS_MAGIC) ||
3080 F_TYPE_EQUAL(s->f_type, RAMFS_MAGIC);
/* Runs fstatfs() on fd and returns the is_temporary_fs() verdict for
 * the result. The return value for an fstatfs() failure is not visible
 * in this excerpt. */
3083 int is_fd_on_temporary_fs(int fd) {
3086 if (fstatfs(fd, &s) < 0)
3089 return is_temporary_fs(&s);
/* Guarded front end for rm_rf_children_dangerous(): the file system of
 * fd is checked with fstatfs() + is_temporary_fs() first, and an error
 * is logged if it is not a temporary one. Parameters are passed through
 * unchanged. */
3092 int rm_rf_children(int fd, bool only_dirs, bool honour_sticky, struct stat *root_dev) {
3097 if (fstatfs(fd, &s) < 0) {
3102 /* We refuse to clean disk file systems with this call. This
3103 * is extra paranoia just to be sure we never ever remove
3105 if (!is_temporary_fs(&s)) {
3106 log_error("Attempted to remove disk file system, and we can't allow that.");
3111 return rm_rf_children_dangerous(fd, only_dirs, honour_sticky, root_dev);
/* lstat()s p (symlinks are not followed) and evaluates whether the
 * file is owned by root or by the calling user and has the sticky bit
 * (S_ISVTX) set. */
3114 static int file_is_priv_sticky(const char *p) {
3119 if (lstat(p, &st) < 0)
3123 (st.st_uid == 0 || st.st_uid == getuid()) &&
3124 (st.st_mode & S_ISVTX);
/* Common implementation behind rm_rf() and rm_rf_dangerous().
 *
 * Visible flow: "/" is always refused. path is opened as a directory
 * without following symlinks. If the open fails with ENOTDIR or ELOOP,
 * path is treated as a non-directory and unlink()ed when delete_root is
 * set and only_dirs is not. Otherwise the children are removed with
 * rm_rf_children_dangerous() (root_dev = NULL) and finally path itself
 * is rmdir()ed, unless honour_sticky is set and file_is_priv_sticky()
 * reports > 0. ENOENT from unlink()/rmdir() is tolerated.
 *
 * Both branches contain a tmpfs/ramfs check; how the dangerous flag
 * gates those checks is not visible in this excerpt. */
3127 static int rm_rf_internal(const char *path, bool only_dirs, bool delete_root, bool honour_sticky, bool dangerous) {
3133 /* We refuse to clean the root file system with this
3134 * call. This is extra paranoia to never cause a really
3135 * seriously broken system. */
3136 if (path_equal(path, "/")) {
3137 log_error("Attempted to remove entire root file system, and we can't allow that.");
3141 fd = open(path, O_RDONLY|O_NONBLOCK|O_DIRECTORY|O_CLOEXEC|O_NOFOLLOW|O_NOATIME);
3144 if (errno != ENOTDIR && errno != ELOOP)
3148 if (statfs(path, &s) < 0)
3151 if (!is_temporary_fs(&s)) {
3152 log_error("Attempted to remove disk file system, and we can't allow that.");
3157 if (delete_root && !only_dirs)
3158 if (unlink(path) < 0 && errno != ENOENT)
3165 if (fstatfs(fd, &s) < 0) {
3170 if (!is_temporary_fs(&s)) {
3171 log_error("Attempted to remove disk file system, and we can't allow that.");
3177 r = rm_rf_children_dangerous(fd, only_dirs, honour_sticky, NULL);
3180 if (honour_sticky && file_is_priv_sticky(path) > 0)
3183 if (rmdir(path) < 0 && errno != ENOENT) {
/* Calls rm_rf_internal() with dangerous = false; all other arguments
 * are passed through. */
3192 int rm_rf(const char *path, bool only_dirs, bool delete_root, bool honour_sticky) {
3193 return rm_rf_internal(path, only_dirs, delete_root, honour_sticky, false);
/* Calls rm_rf_internal() with dangerous = true; all other arguments
 * are passed through. */
3196 int rm_rf_dangerous(const char *path, bool only_dirs, bool delete_root, bool honour_sticky) {
3197 return rm_rf_internal(path, only_dirs, delete_root, honour_sticky, true);
/* Applies mode and ownership to path, in that order. chmod() is skipped
 * when mode is MODE_INVALID; chown() is skipped only when both uid and
 * gid are invalid (UID_INVALID / GID_INVALID). */
3200 int chmod_and_chown(const char *path, mode_t mode, uid_t uid, gid_t gid) {
3203 /* Under the assumption that we are running privileged we
3204 * first change the access mode and only then hand out
3205 * ownership to avoid a window where access is too open. */
3207 if (mode != MODE_INVALID)
3208 if (chmod(path, mode) < 0)
3211 if (uid != UID_INVALID || gid != GID_INVALID)
3212 if (chown(path, uid, gid) < 0)
/* File-descriptor variant of chmod_and_chown(): fchmod() unless mode is
 * MODE_INVALID, then fchown() unless both uid and gid are invalid. */
3218 int fchmod_and_fchown(int fd, mode_t mode, uid_t uid, gid_t gid) {
3221 /* Under the assumption that we are running privileged we
3222 * first change the access mode and only then hand out
3223 * ownership to avoid a window where access is too open. */
3225 if (mode != MODE_INVALID)
3226 if (fchmod(fd, mode) < 0)
3229 if (uid != UID_INVALID || gid != GID_INVALID)
3230 if (fchown(fd, uid, gid) < 0)
/* Allocates a CPU set with CPU_ALLOC(n). sched_getaffinity() on the
 * calling process serves as a probe for whether a set of that size is
 * accepted; on success the set is cleared with CPU_ZERO_S() before use.
 * A probe failure with an errno other than EINVAL is handled
 * separately (details not visible in this excerpt). */
3236 cpu_set_t* cpu_set_malloc(unsigned *ncpus) {
3240 /* Allocates the cpuset in the right size */
3243 if (!(r = CPU_ALLOC(n)))
3246 if (sched_getaffinity(0, CPU_ALLOC_SIZE(n), r) >= 0) {
3247 CPU_ZERO_S(CPU_ALLOC_SIZE(n), r);
3257 if (errno != EINVAL)
/* Formats a status message and writes it to /dev/console with a single
 * writev() call.
 *
 * status:    if non-empty, printed as "[status] " in front of the
 *            message; otherwise status_indent is emitted instead.
 * ellipse:   presumably enables shortening with ellipsize() (the
 *            condition is not visible in this excerpt).
 * ephemeral: remembered in the static prev_ephemeral for the next call.
 * format/ap: printf-style message, expanded with vasprintf().
 *
 * The iovec array holds at most six pieces: erase sequence, "[",
 * status, "] ", message, newline. */
3264 int status_vprintf(const char *status, bool ellipse, bool ephemeral, const char *format, va_list ap) {
3265 static const char status_indent[] = " "; /* "[" STATUS "] " */
3266 _cleanup_free_ char *s = NULL;
3267 _cleanup_close_ int fd = -1;
3268 struct iovec iovec[6] = {};
3270 static bool prev_ephemeral;
3274 /* This is independent of logging, as status messages are
3275 * optional and go exclusively to the console. */
3277 if (vasprintf(&s, format, ap) < 0)
3280 fd = open_terminal("/dev/console", O_WRONLY|O_NOCTTY|O_CLOEXEC);
3293 sl = status ? sizeof(status_indent)-1 : 0;
3299 e = ellipsize(s, emax, 50);
3307 IOVEC_SET_STRING(iovec[n++], "\r" ANSI_ERASE_TO_END_OF_LINE);
3308 prev_ephemeral = ephemeral;
3311 if (!isempty(status)) {
3312 IOVEC_SET_STRING(iovec[n++], "[");
3313 IOVEC_SET_STRING(iovec[n++], status);
3314 IOVEC_SET_STRING(iovec[n++], "] ");
3316 IOVEC_SET_STRING(iovec[n++], status_indent);
3319 IOVEC_SET_STRING(iovec[n++], s);
3321 IOVEC_SET_STRING(iovec[n++], "\n");
3323 if (writev(fd, iovec, n) < 0)
/* Variadic convenience wrapper: collects the arguments following format
 * into a va_list and forwards everything to status_vprintf(). */
3329 int status_printf(const char *status, bool ellipse, bool ephemeral, const char *format, ...) {
3335 va_start(ap, format);
3336 r = status_vprintf(status, ellipse, ephemeral, format, ap);
/* Builds a new string from format in which variable references are
 * replaced by values from env. The input is scanned character by
 * character; word marks the start of the piece currently being
 * collected. Literal pieces are appended with strnappend(). A variable
 * name is taken from word+2 with length e-word-2 (i.e. skipping two
 * leading characters), looked up with strv_env_get_n(), and a missing
 * variable expands to the empty string via strempty(). */
3342 char *replace_env(const char *format, char **env) {
3349 const char *e, *word = format;
3354 for (e = format; *e; e ++) {
3365 k = strnappend(r, word, e-word-1);
3375 } else if (*e == '$') {
3376 k = strnappend(r, word, e-word);
3393 t = strempty(strv_env_get_n(env, word+2, e-word-2));
3395 k = strappend(r, t);
3409 k = strnappend(r, word, e-word);
/* Returns a new string vector derived from argv with environment
 * references resolved against env. The result is first sized for the
 * length of argv plus a terminating slot. An argument of the form $FOO
 * (no brace) is replaced by the words obtained from splitting the
 * variable value with strv_split_quoted(), which requires growing the
 * vector. Every other argument goes through replace_env(). */
3421 char **replace_env_argv(char **argv, char **env) {
3423 unsigned k = 0, l = 0;
3425 l = strv_length(argv);
3427 ret = new(char*, l+1);
3431 STRV_FOREACH(i, argv) {
3433 /* If $FOO appears as single word, replace it by the split up variable */
3434 if ((*i)[0] == '$' && (*i)[1] != '{') {
3439 e = strv_env_get(env, *i+1);
3443 r = strv_split_quoted(&m, e, true);
3455 w = realloc(ret, sizeof(char*) * (l+1));
3465 memcpy(ret + k, m, q * sizeof(char*));
3473 /* If ${FOO} appears as part of a word, replace it by the variable as-is */
3474 ret[k] = replace_env(*i, env);
/* Queries the window size of the terminal behind fd with the
 * TIOCGWINSZ ioctl into a zero-initialized struct winsize. The values
 * returned on success and failure are not visible in this excerpt. */
3486 int fd_columns(int fd) {
3487 struct winsize ws = {};
3489 if (ioctl(fd, TIOCGWINSZ, &ws) < 0)
/* Returns the terminal width, cached in cached_columns after the first
 * call. Sources consulted when nothing is cached: the COLUMNS
 * environment variable (parsed with safe_atoi(), parse errors ignored)
 * and fd_columns() on stdout. The precedence and fallback logic between
 * them is not fully visible in this excerpt. */
3498 unsigned columns(void) {
3502 if (_likely_(cached_columns > 0))
3503 return cached_columns;
3506 e = getenv("COLUMNS");
3508 (void) safe_atoi(e, &c);
3511 c = fd_columns(STDOUT_FILENO);
3517 return cached_columns;
/* Queries the window size of the terminal behind fd with the
 * TIOCGWINSZ ioctl into a zero-initialized struct winsize. The values
 * returned on success and failure are not visible in this excerpt. */
3520 int fd_lines(int fd) {
3521 struct winsize ws = {};
3523 if (ioctl(fd, TIOCGWINSZ, &ws) < 0)
/* Returns the terminal height, cached in cached_lines after the first
 * call. Sources consulted when nothing is cached: the LINES environment
 * variable (parsed with safe_atoi(), parse errors ignored) and
 * fd_lines() on stdout. The precedence and fallback logic between them
 * is not fully visible in this excerpt. */
3532 unsigned lines(void) {
3536 if (_likely_(cached_lines > 0))
3537 return cached_lines;
3540 e = getenv("LINES");
3542 (void) safe_atoi(e, &l);
3545 l = fd_lines(STDOUT_FILENO);
3551 return cached_lines;
3554 /* intended to be used as a SIGWINCH sighandler */
3555 void columns_lines_cache_reset(int signum) {
3561 static int cached_on_tty = -1;
3563 if (_unlikely_(cached_on_tty < 0))
3564 cached_on_tty = isatty(STDOUT_FILENO) > 0;
3566 return cached_on_tty;
/* stat()s both paths (so symlinks are followed) and returns non-zero
 * if they have the same device and inode numbers, 0 if they differ.
 * The return value for a stat() failure is not visible in this
 * excerpt. */
3569 int files_same(const char *filea, const char *fileb) {
3572 if (stat(filea, &a) < 0)
3575 if (stat(fileb, &b) < 0)
3578 return a.st_dev == b.st_dev &&
3579 a.st_ino == b.st_ino;
/* Compares "/proc/1/root" with "/" using files_same(). How the result
 * is mapped to the return value is not visible in this excerpt. */
3582 int running_in_chroot(void) {
3585 ret = files_same("/proc/1/root", "/");
/* Byte-wise shortening of the first old_length bytes of s to new_length
 * bytes. Inputs of at most 3 bytes, or not longer than new_length, are
 * simply duplicated. Otherwise x = new_length * percent / 100 bytes
 * (capped so that 3 bytes remain) are taken from the head and
 * new_length - x - 3 bytes from the tail; the 3 bytes in between are
 * reserved (for the ellipsis; not visible in this excerpt).
 * Requires percent <= 100 and new_length >= 3. */
3592 static char *ascii_ellipsize_mem(const char *s, size_t old_length, size_t new_length, unsigned percent) {
3597 assert(percent <= 100);
3598 assert(new_length >= 3);
3600 if (old_length <= 3 || old_length <= new_length)
3601 return strndup(s, old_length);
3603 r = new0(char, new_length+1);
3607 x = (new_length * percent) / 100;
3609 if (x > new_length - 3)
3617 s + old_length - (new_length - x - 3),
3618 new_length - x - 3);
/* UTF-8 aware shortening of s (old_length bytes) to about new_length
 * display columns, keeping roughly percent % of the budget at the head.
 *
 * Input for which ascii_is_valid() succeeds is delegated to
 * ascii_ellipsize_mem(). Otherwise characters are counted from the
 * front (i) and from the back (j), a wide character counting as 2
 * columns, and the result is head + 3-byte ellipsis (first byte 0xe2)
 * + tail.
 *
 * NOTE(review): ascii_is_valid(s) is not given old_length, so s appears
 * to be assumed NUL-terminated here; confirm against callers.
 * NOTE(review): the printf() below looks like leftover debug output;
 * confirm it is disabled (e.g. commented out) in the full file. */
3623 char *ellipsize_mem(const char *s, size_t old_length, size_t new_length, unsigned percent) {
3627 unsigned k, len, len2;
3630 assert(percent <= 100);
3631 assert(new_length >= 3);
3633 /* if no multibyte characters use ascii_ellipsize_mem for speed */
3634 if (ascii_is_valid(s))
3635 return ascii_ellipsize_mem(s, old_length, new_length, percent);
3637 if (old_length <= 3 || old_length <= new_length)
3638 return strndup(s, old_length);
3640 x = (new_length * percent) / 100;
3642 if (x > new_length - 3)
3646 for (i = s; k < x && i < s + old_length; i = utf8_next_char(i)) {
3649 c = utf8_encoded_to_unichar(i);
3652 k += unichar_iswide(c) ? 2 : 1;
3655 if (k > x) /* last character was wide and went over quota */
3658 for (j = s + old_length; k < new_length && j > i; ) {
3661 j = utf8_prev_char(j);
3662 c = utf8_encoded_to_unichar(j);
3665 k += unichar_iswide(c) ? 2 : 1;
3669 /* we don't actually need to ellipsize */
3671 return memdup(s, old_length + 1);
3673 /* make space for ellipsis */
3674 j = utf8_next_char(j);
3677 len2 = s + old_length - j;
3678 e = new(char, len + 3 + len2 + 1);
3683 printf("old_length=%zu new_length=%zu x=%zu len=%u len2=%u k=%u\n",
3684 old_length, new_length, x, len, len2, k);
3688 e[len] = 0xe2; /* tri-dot ellipsis: … */
3692 memcpy(e + len + 3, j, len2 + 1);
/* ellipsize_mem() for a NUL-terminated string: the input length is
 * taken with strlen(s); length is the target length. */
3697 char *ellipsize(const char *s, size_t length, unsigned percent) {
3698 return ellipsize_mem(s, strlen(s), length, percent);
/* Creates path if it does not exist and updates its attributes.
 *
 * parents: parent directories are created with mkdir_parents(path,
 *          0755) (presumably only when set).
 * stamp:   USEC_INFINITY sets the timestamps to the current time
 *          (futimens() with NULL); any other value is stored into the
 *          timespec array passed to futimens().
 * uid/gid: fchown() is only called if at least one of them is valid.
 * mode:    used as creation mode when > 0, otherwise 0644 is used;
 *          also applied with fchmod().
 *
 * NOTE(review): fd has a cleanup attribute but no initializer here;
 * confirm no return path precedes its assignment. */
3701 int touch_file(const char *path, bool parents, usec_t stamp, uid_t uid, gid_t gid, mode_t mode) {
3702 _cleanup_close_ int fd;
3708 mkdir_parents(path, 0755);
3710 fd = open(path, O_WRONLY|O_CREAT|O_CLOEXEC|O_NOCTTY, mode > 0 ? mode : 0644);
3715 r = fchmod(fd, mode);
3720 if (uid != UID_INVALID || gid != GID_INVALID) {
3721 r = fchown(fd, uid, gid);
3726 if (stamp != USEC_INFINITY) {
3727 struct timespec ts[2];
3729 timespec_store(&ts[0], stamp);
3731 r = futimens(fd, ts);
3733 r = futimens(fd, NULL);
/* touch_file() with defaults: no parent creation, current time, and
 * ownership and mode left unspecified. */
3740 int touch(const char *path) {
3741 return touch_file(path, false, USEC_INFINITY, UID_INVALID, GID_INVALID, 0);
/* Returns a newly allocated copy of s without its enclosing quotes: if
 * the first character is contained in quotes and the last character is
 * the same character, both are dropped. Handling of other inputs is
 * not visible in this excerpt. */
3744 char *unquote(const char *s, const char* quotes) {
3748 /* This is rather stupid, simply removes the heading and
3749 * trailing quotes if there is one. Doesn't care about
3750 * escaping or anything. We should make this smarter one
3757 if (strchr(quotes, s[0]) && s[l-1] == s[0])
3758 return strndup(s+1, l-2);
/* Normalizes an assignment string. With an '=' present, the part before
 * it is taken as name and the part after it as value; the value is
 * whitespace-stripped and unquoted (QUOTES), the name is
 * whitespace-stripped, and a newly allocated "name=value" string is
 * returned. The branch for input without '=' is only partly visible in
 * this excerpt. */
3763 char *normalize_env_assignment(const char *s) {
3764 _cleanup_free_ char *value = NULL;
3768 eq = strchr(s, '=');
3778 memmove(r, t, strlen(t) + 1);
3783 name = strndupa(s, eq - s);
3784 p = strdupa(eq + 1);
3786 value = unquote(strstrip(p), QUOTES);
3790 return strjoin(strstrip(name), "=", value, NULL);
/* Waits for process pid to exit using waitid(P_PID, ..., WEXITED); the
 * result is stored in *status. Error handling and retry behaviour are
 * not visible in this excerpt. */
3793 int wait_for_terminate(pid_t pid, siginfo_t *status) {
3804 if (waitid(P_PID, pid, status, WEXITED) < 0) {
3818 * < 0 : wait_for_terminate() failed to get the state of the
3819 * process, the process was terminated by a signal, or
3820 * failed for an unknown reason.
3821 * >=0 : The process terminated normally, and its exit code is
3824 * That is, success is indicated by a return value of zero, and an
3825 * error is indicated by a non-zero value.
3827 * A warning is emitted if the process terminates abnormally,
3828 * and also if it returns non-zero, provided check_exit_code is true.
/* name is only used to label the log messages. */
3830 int wait_for_terminate_and_warn(const char *name, pid_t pid, bool check_exit_code) {
3837 r = wait_for_terminate(pid, &status);
3839 return log_warning_errno(r, "Failed to wait for %s: %m", name);
3841 if (status.si_code == CLD_EXITED) {
3842 if (status.si_status != 0)
/* Non-zero exit status: logged at warning level if check_exit_code is
 * set, at debug level otherwise. */
3843 log_full(check_exit_code ? LOG_WARNING : LOG_DEBUG,
3844 "%s failed with error code %i.", name, status.si_status);
3846 log_debug("%s succeeded.", name);
/* Normal exit: the exit status itself is the return value. */
3848 return status.si_status;
3849 } else if (status.si_code == CLD_KILLED ||
3850 status.si_code == CLD_DUMPED) {
3852 log_warning("%s terminated by signal %s.", name, signal_to_string(status.si_status));
3856 log_warning("%s failed due to unknown reason.", name);
/* Declared noreturn. Closes all file descriptors first; the remainder
 * of the body is not visible in this excerpt. */
3860 noreturn void freeze(void) {
3862 /* Make sure nobody waits for us on a socket anymore */
3863 close_all_fds(NULL, 0);
/* Classifies *st with two checks: a regular file whose size is <= 0,
 * and a character or block device node. The value returned for each
 * check is not visible in this excerpt. */
3871 bool null_or_empty(struct stat *st) {
3874 if (S_ISREG(st->st_mode) && st->st_size <= 0)
3877 if (S_ISCHR(st->st_mode) || S_ISBLK(st->st_mode))
/* stat()s fn (following symlinks) and returns the null_or_empty()
 * verdict. The error return for a failed stat() is not visible in this
 * excerpt. */
3883 int null_or_empty_path(const char *fn) {
3888 if (stat(fn, &st) < 0)
3891 return null_or_empty(&st);
/* fstat()s fd and returns the null_or_empty() verdict. The error
 * return for a failed fstat() is not visible in this excerpt. */
3894 int null_or_empty_fd(int fd) {
3899 if (fstat(fd, &st) < 0)
3902 return null_or_empty(&st);
/* Opens name relative to the directory descriptor fd as a directory.
 * flags is OR-ed onto O_RDONLY|O_NONBLOCK|O_DIRECTORY|O_CLOEXEC and
 * must not contain O_CREAT (asserted). The conversion of nfd into the
 * returned DIR is not visible in this excerpt. */
3905 DIR *xopendirat(int fd, const char *name, int flags) {
3909 assert(!(flags & O_CREAT));
3911 nfd = openat(fd, name, O_RDONLY|O_NONBLOCK|O_DIRECTORY|O_CLOEXEC|flags, 0);
/* Parses a signal name with signal_from_string(). For input starting
 * with "SIG" there is a second attempt with that prefix removed. */
3924 int signal_from_string_try_harder(const char *s) {
3928 signo = signal_from_string(s);
3930 if (startswith(s, "SIG"))
3931 return signal_from_string(s+3);
/* Builds the path "/dev/disk/by-<by>/<encoded tag>" as a new string.
 * tagvalue is first stripped of surrounding double or single quotes,
 * then encoded with encode_devnode_name() into a buffer sized at four
 * bytes per input byte plus the terminating NUL. */
3936 static char *tag_to_udev_node(const char *tagvalue, const char *by) {
3937 _cleanup_free_ char *t = NULL, *u = NULL;
3940 u = unquote(tagvalue, "\"\'");
3944 enc_len = strlen(u) * 4 + 1;
3945 t = new(char, enc_len);
3949 if (encode_devnode_name(u, t, enc_len) < 0)
3952 return strjoin("/dev/disk/by-", by, "/", t, NULL);
/* Translates tag-style device specifications into /dev/disk/by-...
 * paths via tag_to_udev_node(): LABEL= maps to "label", UUID= to
 * "uuid", PARTUUID= to "partuuid" and PARTLABEL= to "partlabel". The
 * offsets added to p are the lengths of the respective prefixes.
 * Handling of input without such a prefix is not visible in this
 * excerpt. */
3955 char *fstab_node_to_udev_node(const char *p) {
3958 if (startswith(p, "LABEL="))
3959 return tag_to_udev_node(p+6, "label");
3961 if (startswith(p, "UUID="))
3962 return tag_to_udev_node(p+5, "uuid");
3964 if (startswith(p, "PARTUUID="))
3965 return tag_to_udev_node(p+9, "partuuid");
3967 if (startswith(p, "PARTLABEL="))
3968 return tag_to_udev_node(p+10, "partlabel");
/* True if vtnr_from_tty() can extract a (non-negative) VT number from
 * tty. */
3973 bool tty_is_vc(const char *tty) {
3976 return vtnr_from_tty(tty) >= 0;
/* True if tty names "console". A "/dev/" prefix is recognized first
 * (presumably skipped; the statement is not visible in this excerpt). */
3979 bool tty_is_console(const char *tty) {
3982 if (startswith(tty, "/dev/"))
3985 return streq(tty, "console");
/* Extracts the virtual terminal number from a name of the form "ttyN"
 * (a "/dev/" prefix is recognized). The character right after "tty"
 * must be a digit; the number is parsed with safe_atoi() and checked
 * against the range 0..63. The return values of the individual
 * branches are not visible in this excerpt. */
3988 int vtnr_from_tty(const char *tty) {
3993 if (startswith(tty, "/dev/"))
3996 if (!startswith(tty, "tty") )
3999 if (tty[3] < '0' || tty[3] > '9')
4002 r = safe_atoi(tty+3, &i);
4006 if (i < 0 || i > 63)
/* Determines which tty /dev/console refers to, using sysfs. The line
 * from /sys/class/tty/console/active is read into *active and the
 * entry after the last space is used. If that entry is "tty0", the
 * active VC is read from /sys/class/tty/tty0/active and replaces
 * *active. The returned pointer refers into the buffer stored in
 * *active, so that buffer must outlive any use of the result. */
4012 char *resolve_dev_console(char **active) {
4015 /* Resolve where /dev/console is pointing to, if /sys is actually ours
4016 * (i.e. not read-only-mounted which is a sign for container setups) */
4018 if (path_is_read_only_fs("/sys") > 0)
4021 if (read_one_line_file("/sys/class/tty/console/active", active) < 0)
4024 /* If multiple log outputs are configured the last one is what
4025 * /dev/console points to */
4026 tty = strrchr(*active, ' ');
4032 if (streq(tty, "tty0")) {
4035 /* Get the active VC (e.g. tty1) */
4036 if (read_one_line_file("/sys/class/tty/tty0/active", &tmp) >= 0) {
4038 tty = *active = tmp;
/* Like tty_is_vc(), but "console" is first resolved to the underlying
 * tty with resolve_dev_console(). active owns the buffer the resolved
 * name points into and is freed automatically on return. */
4045 bool tty_is_vc_resolve(const char *tty) {
4046 _cleanup_free_ char *active = NULL;
4050 if (startswith(tty, "/dev/"))
4053 if (streq(tty, "console")) {
4054 tty = resolve_dev_console(&active);
4059 return tty_is_vc(tty);
/* Returns a constant "TERM=..." assignment for tty: "TERM=linux" if
 * tty_is_vc_resolve() considers it a virtual console, "TERM=vt220"
 * otherwise. */
4062 const char *default_term_for_tty(const char *tty) {
4065 return tty_is_vc_resolve(tty) ? "TERM=linux" : "TERM=vt220";
/* Filter for directory entries: checks hidden_file() on the name and
 * whether d_type is one of DT_REG, DT_LNK or DT_UNKNOWN. The values
 * returned by each check are not visible in this excerpt. */
4068 bool dirent_is_file(const struct dirent *de) {
4071 if (hidden_file(de->d_name))
4074 if (de->d_type != DT_REG &&
4075 de->d_type != DT_LNK &&
4076 de->d_type != DT_UNKNOWN)
/* Filter for directory entries with a given name suffix: checks d_type
 * (DT_REG, DT_LNK or DT_UNKNOWN), hidden_file_allow_backup() on the
 * name, and finally whether the name ends with suffix. */
4082 bool dirent_is_file_with_suffix(const struct dirent *de, const char *suffix) {
4085 if (de->d_type != DT_REG &&
4086 de->d_type != DT_LNK &&
4087 de->d_type != DT_UNKNOWN)
4090 if (hidden_file_allow_backup(de->d_name))
4093 return endswith(de->d_name, suffix);
/* Runs the files found in directories and waits for them.
 *
 * Signal handlers and the signal mask are reset and SIGTERM is
 * requested as parent-death signal. Each directory is scanned in order;
 * a missing directory (ENOENT) is handled separately from other
 * opendir() failures. A file name already recorded in seen is skipped,
 * and a path for which null_or_empty_path() is true is treated as a
 * mask. Spawned children are tracked in pids (pid -> path) and then
 * reaped one by one with wait_for_terminate_and_warn().
 *
 * timeout: unless USEC_INFINITY, rounded up to whole seconds and armed
 *          with alarm().
 * argv:    presumably the argument vector for the executed files (its
 *          use is not visible in this excerpt). */
4096 static int do_execute(char **directories, usec_t timeout, char *argv[]) {
4097 _cleanup_hashmap_free_free_ Hashmap *pids = NULL;
4098 _cleanup_set_free_free_ Set *seen = NULL;
4101 /* We fork this all off from a child process so that we can
4102 * somewhat cleanly make use of SIGALRM to set a time limit */
4104 reset_all_signal_handlers();
4105 reset_signal_mask();
4107 assert_se(prctl(PR_SET_PDEATHSIG, SIGTERM) == 0);
4109 pids = hashmap_new(NULL);
4113 seen = set_new(&string_hash_ops);
4117 STRV_FOREACH(directory, directories) {
4118 _cleanup_closedir_ DIR *d;
4121 d = opendir(*directory);
4123 if (errno == ENOENT)
4126 return log_error_errno(errno, "Failed to open directory %s: %m", *directory);
4129 FOREACH_DIRENT(de, d, break) {
4130 _cleanup_free_ char *path = NULL;
4134 if (!dirent_is_file(de))
4137 if (set_contains(seen, de->d_name)) {
4138 log_debug("%1$s/%2$s skipped (%2$s was already seen).", *directory, de->d_name);
4142 r = set_put_strdup(seen, de->d_name);
4146 path = strjoin(*directory, "/", de->d_name, NULL);
4150 if (null_or_empty_path(path)) {
4151 log_debug("%s is empty (a mask).", path);
4157 log_error_errno(errno, "Failed to fork: %m");
4159 } else if (pid == 0) {
4162 assert_se(prctl(PR_SET_PDEATHSIG, SIGTERM) == 0);
4172 return log_error_errno(errno, "Failed to execute %s: %m", path);
4175 log_debug("Spawned %s as " PID_FMT ".", path, pid);
4177 r = hashmap_put(pids, UINT_TO_PTR(pid), path);
4184 /* Abort execution of this process after the timeout. We simply
4185 * rely on SIGALRM as default action terminating the process,
4186 * and turn on alarm(). */
4188 if (timeout != USEC_INFINITY)
4189 alarm((timeout + USEC_PER_SEC - 1) / USEC_PER_SEC);
4191 while (!hashmap_isempty(pids)) {
4192 _cleanup_free_ char *path = NULL;
4195 pid = PTR_TO_UINT(hashmap_first_key(pids));
4198 path = hashmap_remove(pids, UINT_TO_PTR(pid));
4201 wait_for_terminate_and_warn(path, pid, true);
/* Forks an executor process that runs do_execute() over directories
 * and exits with EXIT_FAILURE if it returned a negative value,
 * EXIT_SUCCESS otherwise. The parent waits for the executor with
 * wait_for_terminate_and_warn(), labelling log messages with the
 * basename of the first directory. directories must be non-empty
 * (asserted). */
4207 void execute_directories(const char* const* directories, usec_t timeout, char *argv[]) {
4211 char **dirs = (char**) directories;
4213 assert(!strv_isempty(dirs));
4215 name = basename(dirs[0]);
4216 assert(!isempty(name));
4218 /* Executes all binaries in the directories in parallel and waits
4219 * for them to finish. Optionally a timeout is applied. If a file
4220 * with the same name exists in more than one directory, the
4221 * earliest one wins. */
4223 executor_pid = fork();
4224 if (executor_pid < 0) {
4225 log_error_errno(errno, "Failed to fork: %m");
4228 } else if (executor_pid == 0) {
4229 r = do_execute(dirs, timeout, argv);
4230 _exit(r < 0 ? EXIT_FAILURE : EXIT_SUCCESS);
4233 wait_for_terminate_and_warn(name, executor_pid, true);
/* Sends sig to pid; r holds 0 on success or the negative errno of
 * kill(). The follow-up step suggested by the function name is not
 * visible in this excerpt. */
4236 int kill_and_sigcont(pid_t pid, int sig) {
4239 r = kill(pid, sig) < 0 ? -errno : 0;
/* Iterates over the entries of nulstr with NULSTR_FOREACH and compares
 * each one to needle with streq(). */
4247 bool nulstr_contains(const char*nulstr, const char *needle) {
4253 NULSTR_FOREACH(i, nulstr)
4254 if (streq(i, needle))
/* True if the file /run/plymouth/pid exists (access() with F_OK). */
4260 bool plymouth_running(void) {
4261 return access("/run/plymouth/pid", F_OK) >= 0;
4264 char* strshorten(char *s, size_t l) {
/* Character class used by the hostname checks: ASCII letters and
 * digits are accepted here; further alternatives of the expression are
 * not visible in this excerpt. */
4273 static bool hostname_valid_char(char c) {
4275 (c >= 'a' && c <= 'z') ||
4276 (c >= 'A' && c <= 'Z') ||
4277 (c >= '0' && c <= '9') ||
/* Validates s as a hostname by walking it once: dot tracks whether the
 * previous position was a dot (it starts out true), every other
 * character must satisfy hostname_valid_char(), and the total length
 * is checked against HOST_NAME_MAX. */
4283 bool hostname_is_valid(const char *s) {
4290 /* Doesn't accept empty hostnames, hostnames with trailing or
4291 * leading dots, and hostnames with multiple dots in a
4292 * sequence. Also ensures that the length stays below
4295 for (p = s, dot = true; *p; p++) {
4302 if (!hostname_valid_char(*p))
4312 if (p-s > HOST_NAME_MAX)
/* Rewrites s in place into a cleaned-up hostname: p reads and d
 * writes within the same buffer. Characters accepted by
 * hostname_valid_char() are copied, lower-cased with tolower() when
 * lowercase is set. The result is cut to HOST_NAME_MAX with
 * strshorten(). */
4318 char* hostname_cleanup(char *s, bool lowercase) {
4322 for (p = s, d = s, dot = true; *p; p++) {
4329 } else if (hostname_valid_char(*p)) {
4330 *(d++) = lowercase ? tolower(*p) : *p;
4341 strshorten(s, HOST_NAME_MAX);
/* A machine name must first pass hostname_is_valid(); an additional,
 * stricter length limit follows (not visible in this excerpt). */
4346 bool machine_name_is_valid(const char *s) {
4348 if (!hostname_is_valid(s))
4351 /* Machine names should be useful hostnames, but also be
4352 * useful in unit names, hence we enforce a stricter length
/* Non-blocking check (poll() with timeout 0) for a hang-up on fd: the
 * result is the POLLHUP bit of the returned events, i.e. non-zero if
 * set. Handling of poll() errors is not visible in this excerpt. */
4361 int pipe_eof(int fd) {
4362 struct pollfd pollfd = {
4364 .events = POLLIN|POLLHUP,
4369 r = poll(&pollfd, 1, 0);
4376 return pollfd.revents & POLLHUP;
/* Waits with ppoll() on a single descriptor. t is the timeout;
 * USEC_INFINITY means wait without limit (NULL timespec). On the
 * visible success path the returned events mask (revents) is the
 * result. */
4379 int fd_wait_for_event(int fd, int event, usec_t t) {
4381 struct pollfd pollfd = {
4389 r = ppoll(&pollfd, 1, t == USEC_INFINITY ? NULL : timespec_store(&ts, t), NULL);
4396 return pollfd.revents;
/* Creates a temporary file next to path: a name is derived with
 * tempfn_xxxxxx(), the file is created with mkostemp_safe() (write
 * only, close-on-exec) and wrapped into a stdio stream opened in mode
 * "we". The stream and the temporary path are presumably returned
 * through _f and _temp_path (the assignments are not visible in this
 * excerpt). */
4399 int fopen_temporary(const char *path, FILE **_f, char **_temp_path) {
4408 r = tempfn_xxxxxx(path, &t);
4412 fd = mkostemp_safe(t, O_WRONLY|O_CLOEXEC);
4418 f = fdopen(fd, "we");
/* Issues the TIOCVHANGUP ioctl on fd. The return values are not
 * visible in this excerpt. */
4431 int terminal_vhangup_fd(int fd) {
4434 if (ioctl(fd, TIOCVHANGUP) < 0)
/* Opens the terminal name with open_terminal() and performs
 * terminal_vhangup_fd() on it; fd is closed automatically on return.
 * NOTE(review): fd has a cleanup attribute but no initializer here;
 * it is assigned by the next visible statement. */
4440 int terminal_vhangup(const char *name) {
4441 _cleanup_close_ int fd;
4443 fd = open_terminal(name, O_RDWR|O_NOCTTY|O_CLOEXEC);
4447 return terminal_vhangup_fd(fd);
/* name must start with "/dev/". Two cases are visible:
 *  - not a VC according to tty_is_vc(): the terminal is opened and a
 *    reset/home/clear-screen escape sequence is written to it;
 *  - a VC ("/dev/ttyN"): N is parsed with safe_atou() and
 *    VT_DISALLOCATE is issued through /dev/tty0; if that is not
 *    possible, the VT itself is opened and cleared including its
 *    scrollback ("\033[3J"). */
4450 int vt_disallocate(const char *name) {
4454 /* Deallocate the VT if possible. If not possible
4455 * (i.e. because it is the active one), at least clear it
4456 * entirely (including the scrollback buffer) */
4458 if (!startswith(name, "/dev/"))
4461 if (!tty_is_vc(name)) {
4462 /* So this is not a VT. I guess we cannot deallocate
4463 * it then. But let's at least clear the screen */
4465 fd = open_terminal(name, O_RDWR|O_NOCTTY|O_CLOEXEC);
4470 "\033[r" /* clear scrolling region */
4471 "\033[H" /* move home */
4472 "\033[2J", /* clear screen */
4479 if (!startswith(name, "/dev/tty"))
4482 r = safe_atou(name+8, &u);
4489 /* Try to deallocate */
4490 fd = open_terminal("/dev/tty0", O_RDWR|O_NOCTTY|O_CLOEXEC);
4494 r = ioctl(fd, VT_DISALLOCATE, u);
4503 /* Couldn't deallocate, so let's clear it fully with
4505 fd = open_terminal(name, O_RDWR|O_NOCTTY|O_CLOEXEC);
4510 "\033[r" /* clear scrolling region */
4511 "\033[H" /* move home */
4512 "\033[3J", /* clear screen including scrollback, requires Linux 2.6.40 */
/* Creates the symlink to -> from by first creating it under a
 * temporary name derived from to (tempfn_random()) and then rename()ing
 * it over to. Cleanup after a failed rename() is not visible in this
 * excerpt. */
4519 int symlink_atomic(const char *from, const char *to) {
4520 _cleanup_free_ char *t = NULL;
4526 r = tempfn_random(to, &t);
4530 if (symlink(from, t) < 0)
4533 if (rename(t, to) < 0) {
/* Creates a device node at path by first creating it under a temporary
 * name derived from path (tempfn_random()) and then rename()ing it
 * into place. Cleanup after a failed rename() is not visible in this
 * excerpt. */
4541 int mknod_atomic(const char *path, mode_t mode, dev_t dev) {
4542 _cleanup_free_ char *t = NULL;
4547 r = tempfn_random(path, &t);
4551 if (mknod(t, mode, dev) < 0)
4554 if (rename(t, path) < 0) {
/* Creates a FIFO at path by first creating it under a temporary name
 * derived from path (tempfn_random()) and then rename()ing it into
 * place. Cleanup after a failed rename() is not visible in this
 * excerpt. */
4562 int mkfifo_atomic(const char *path, mode_t mode) {
4563 _cleanup_free_ char *t = NULL;
4568 r = tempfn_random(path, &t);
4572 if (mkfifo(t, mode) < 0)
4575 if (rename(t, path) < 0) {
/* Checks whether display has the form ":N...": first character ':' and
 * second character a digit (the upper bound of the digit test is not
 * visible in this excerpt). */
4583 bool display_is_local(const char *display) {
4587 display[0] == ':' &&
4588 display[1] >= '0' &&
/* For a local display string (see display_is_local()) builds
 * "/tmp/.X11-unix/X" followed by the run of decimal digits found after
 * the leading ':'. The buffer is sized for the prefix, those k digits
 * and the terminating NUL. The string is presumably returned through
 * *path (the assignment is not visible in this excerpt). */
4592 int socket_from_display(const char *display, char **path) {
4599 if (!display_is_local(display))
4602 k = strspn(display+1, "0123456789");
4604 f = new(char, strlen("/tmp/.X11-unix/X") + k + 1);
4608 c = stpcpy(f, "/tmp/.X11-unix/X");
4609 memcpy(c, display+1, k);
4618 const char **username,
4619 uid_t *uid, gid_t *gid,
4621 const char **shell) {
4629 /* We enforce some special rules for uid=0: in order to avoid
4630 * NSS lookups for root we hardcode its data. */
4632 if (streq(*username, "root") || streq(*username, "0")) {
4650 if (parse_uid(*username, &u) >= 0) {
4654 /* If there are multiple users with the same id, make
4655 * sure to leave $USER to the configured value instead
4656 * of the first occurrence in the database. However if
4657 * the uid was configured by a numeric uid, then let's
4658 * pick the real username from /etc/passwd. */
4660 *username = p->pw_name;
4663 p = getpwnam(*username);
4667 return errno > 0 ? -errno : -ESRCH;
4679 *shell = p->pw_shell;
/* Returns a newly allocated name for uid. Visible paths: a hard-coded
 * "root" (condition not visible in this excerpt; presumably uid 0),
 * the pw_name of a passwd entry, and as last resort the uid formatted
 * with UID_FMT. */
4684 char* uid_to_name(uid_t uid) {
4689 return strdup("root");
4693 return strdup(p->pw_name);
4695 if (asprintf(&r, UID_FMT, uid) < 0)
/* Returns a newly allocated name for gid. Visible paths: a hard-coded
 * "root" (condition not visible in this excerpt; presumably gid 0),
 * the gr_name of a group entry, and as last resort the gid formatted
 * with GID_FMT. */
4701 char* gid_to_name(gid_t gid) {
4706 return strdup("root");
4710 return strdup(p->gr_name);
4712 if (asprintf(&r, GID_FMT, gid) < 0)
/* Resolves *groupname, which may be a name or a numeric gid string.
 * "root" and "0" are answered without a lookup and *groupname is set
 * to "root". A string that parse_gid() accepts is treated as a numeric
 * id and *groupname is replaced by the gr_name of the entry found.
 * Anything else is looked up with getgrnam(). A failed lookup yields
 * -errno if errno is set, else -ESRCH. */
4718 int get_group_creds(const char **groupname, gid_t *gid) {
4724 /* We enforce some special rules for gid=0: in order to avoid
4725 * NSS lookups for root we hardcode its data. */
4727 if (streq(*groupname, "root") || streq(*groupname, "0")) {
4728 *groupname = "root";
4736 if (parse_gid(*groupname, &id) >= 0) {
4741 *groupname = g->gr_name;
4744 g = getgrnam(*groupname);
4748 return errno > 0 ? -errno : -ESRCH;
/* Checks whether the calling process belongs to gid: compares against
 * the real and effective gid first, then walks the supplementary
 * groups from getgroups(). The group array is stack-allocated
 * (alloca()) with room for sysconf(_SC_NGROUPS_MAX) entries. */
4756 int in_gid(gid_t gid) {
4758 int ngroups_max, r, i;
4760 if (getgid() == gid)
4763 if (getegid() == gid)
4766 ngroups_max = sysconf(_SC_NGROUPS_MAX);
4767 assert(ngroups_max > 0);
4769 gids = alloca(sizeof(gid_t) * ngroups_max);
4771 r = getgroups(ngroups_max, gids);
4775 for (i = 0; i < r; i++)
/* Resolves the group name to a gid with get_group_creds(); the
 * membership test that presumably follows is not visible in this
 * excerpt. */
4782 int in_group(const char *name) {
4786 r = get_group_creds(&name, &gid);
/* Expands path with glob() (GLOB_NOSORT|GLOB_BRACE) and reports
 * whether anything matched: the visible success path returns non-zero
 * if the result vector is non-empty. GLOB_NOMATCH and GLOB_NOSPACE are
 * handled as separate cases; remaining failures yield -errno, or -EIO
 * if errno is unset. g is released automatically on return. */
4793 int glob_exists(const char *path) {
4794 _cleanup_globfree_ glob_t g = {};
4800 k = glob(path, GLOB_NOSORT|GLOB_BRACE, NULL, &g);
4802 if (k == GLOB_NOMATCH)
4804 else if (k == GLOB_NOSPACE)
4807 return !strv_isempty(g.gl_pathv);
4809 return errno ? -errno : -EIO;
/* Expands path with glob() (GLOB_NOSORT|GLOB_BRACE) and appends every
 * match to *strv with strv_extend(). GLOB_NOMATCH and GLOB_NOSPACE are
 * handled as separate cases; any other failure or an empty result
 * yields -errno, or -EIO if errno is unset. */
4812 int glob_extend(char ***strv, const char *path) {
4813 _cleanup_globfree_ glob_t g = {};
4818 k = glob(path, GLOB_NOSORT|GLOB_BRACE, NULL, &g);
4820 if (k == GLOB_NOMATCH)
4822 else if (k == GLOB_NOSPACE)
4824 else if (k != 0 || strv_isempty(g.gl_pathv))
4825 return errno ? -errno : -EIO;
4827 STRV_FOREACH(p, g.gl_pathv) {
4828 k = strv_extend(strv, *p);
/* Resolves an unknown entry type: nothing is looked up when d_type is
 * already known. Otherwise the entry is stat'ed relative to the
 * directory stream (without following symlinks) and the file mode is
 * mapped to the matching DT_* constant. */
4836 int dirent_ensure_type(DIR *d, struct dirent *de) {
4842 if (de->d_type != DT_UNKNOWN)
4845 if (fstatat(dirfd(d), de->d_name, &st, AT_SYMLINK_NOFOLLOW) < 0)
4849 S_ISREG(st.st_mode) ? DT_REG :
4850 S_ISDIR(st.st_mode) ? DT_DIR :
4851 S_ISLNK(st.st_mode) ? DT_LNK :
4852 S_ISFIFO(st.st_mode) ? DT_FIFO :
4853 S_ISSOCK(st.st_mode) ? DT_SOCK :
4854 S_ISCHR(st.st_mode) ? DT_CHR :
4855 S_ISBLK(st.st_mode) ? DT_BLK :
/* Collects the names of the entries in path that pass dirent_is_file()
 * (after dirent_ensure_type() has resolved unknown types). Names are
 * strdup()ed into the vector l, which grows via GREEDY_REALLOC. On the
 * success path l is set to NULL after hand-over so that the automatic
 * cleanup does not free the returned vector. */
4861 int get_files_in_directory(const char *path, char ***list) {
4862 _cleanup_closedir_ DIR *d = NULL;
4863 size_t bufsize = 0, n = 0;
4864 _cleanup_strv_free_ char **l = NULL;
4868 /* Returns all files in a directory in *list, and the number
4869 * of files as return value. If list is NULL returns only the
4881 if (!de && errno != 0)
4886 dirent_ensure_type(d, de);
4888 if (!dirent_is_file(de))
4892 /* one extra slot is needed for the terminating NULL */
4893 if (!GREEDY_REALLOC(l, bufsize, n + 2))
4896 l[n] = strdup(de->d_name);
4907 l = NULL; /* avoid freeing */
/* Concatenates x and the following variadic const char* arguments. The
 * argument list is walked twice (va_arg appears in two separate
 * passes), and the first pass guards the running length against size_t
 * overflow. Callers in this file terminate the list with NULL. */
4913 char *strjoin(const char *x, ...) {
4927 t = va_arg(ap, const char *);
4932 if (n > ((size_t) -1) - l) {
4956 t = va_arg(ap, const char *);
/* Determines whether the calling thread is the main thread by
 * comparing getpid() with gettid(). The answer is cached per thread:
 * 0 = not determined yet, 1 = main thread, -1 = other thread. */
4970 bool is_main_thread(void) {
4971 static thread_local int cached = 0;
4973 if (_unlikely_(cached == 0))
4974 cached = getpid() == gettid() ? 1 : -1;
/* Finds the whole-disk device for block device d by probing sysfs:
 *  1. /sys/dev/block/MAJ:MIN/queue exists: d is itself good enough;
 *  2. otherwise /sys/dev/block/MAJ:MIN/partition is checked;
 *  3. the parent device number is read from
 *     /sys/dev/block/MAJ:MIN/../dev and parsed as "major:minor";
 *  4. the parent is accepted only if it has a queue directory as well.
 * On the visible success path the parent is stored in *ret. */
4979 int block_get_whole_disk(dev_t d, dev_t *ret) {
4986 /* If it has a queue this is good enough for us */
4987 if (asprintf(&p, "/sys/dev/block/%u:%u/queue", major(d), minor(d)) < 0)
4990 r = access(p, F_OK);
4998 /* If it is a partition find the originating device */
4999 if (asprintf(&p, "/sys/dev/block/%u:%u/partition", major(d), minor(d)) < 0)
5002 r = access(p, F_OK);
5008 /* Get parent dev_t */
5009 if (asprintf(&p, "/sys/dev/block/%u:%u/../dev", major(d), minor(d)) < 0)
5012 r = read_one_line_file(p, &s);
5018 r = sscanf(s, "%u:%u", &m, &n);
5024 /* Only return this if it is really good enough for us. */
5025 if (asprintf(&p, "/sys/dev/block/%u:%u/queue", m, n) < 0)
5028 r = access(p, F_OK);
5032 *ret = makedev(m, n);
5039 static const char *const ioprio_class_table[] = {
5040 [IOPRIO_CLASS_NONE] = "none",
5041 [IOPRIO_CLASS_RT] = "realtime",
5042 [IOPRIO_CLASS_BE] = "best-effort",
5043 [IOPRIO_CLASS_IDLE] = "idle"
5046 DEFINE_STRING_TABLE_LOOKUP_WITH_FALLBACK(ioprio_class, int, INT_MAX);
5048 static const char *const sigchld_code_table[] = {
5049 [CLD_EXITED] = "exited",
5050 [CLD_KILLED] = "killed",
5051 [CLD_DUMPED] = "dumped",
5052 [CLD_TRAPPED] = "trapped",
5053 [CLD_STOPPED] = "stopped",
5054 [CLD_CONTINUED] = "continued",
5057 DEFINE_STRING_TABLE_LOOKUP(sigchld_code, int);
5059 static const char *const log_facility_unshifted_table[LOG_NFACILITIES] = {
5060 [LOG_FAC(LOG_KERN)] = "kern",
5061 [LOG_FAC(LOG_USER)] = "user",
5062 [LOG_FAC(LOG_MAIL)] = "mail",
5063 [LOG_FAC(LOG_DAEMON)] = "daemon",
5064 [LOG_FAC(LOG_AUTH)] = "auth",
5065 [LOG_FAC(LOG_SYSLOG)] = "syslog",
5066 [LOG_FAC(LOG_LPR)] = "lpr",
5067 [LOG_FAC(LOG_NEWS)] = "news",
5068 [LOG_FAC(LOG_UUCP)] = "uucp",
5069 [LOG_FAC(LOG_CRON)] = "cron",
5070 [LOG_FAC(LOG_AUTHPRIV)] = "authpriv",
5071 [LOG_FAC(LOG_FTP)] = "ftp",
5072 [LOG_FAC(LOG_LOCAL0)] = "local0",
5073 [LOG_FAC(LOG_LOCAL1)] = "local1",
5074 [LOG_FAC(LOG_LOCAL2)] = "local2",
5075 [LOG_FAC(LOG_LOCAL3)] = "local3",
5076 [LOG_FAC(LOG_LOCAL4)] = "local4",
5077 [LOG_FAC(LOG_LOCAL5)] = "local5",
5078 [LOG_FAC(LOG_LOCAL6)] = "local6",
5079 [LOG_FAC(LOG_LOCAL7)] = "local7"
5082 DEFINE_STRING_TABLE_LOOKUP_WITH_FALLBACK(log_facility_unshifted, int, LOG_FAC(~0));
5084 static const char *const log_level_table[] = {
5085 [LOG_EMERG] = "emerg",
5086 [LOG_ALERT] = "alert",
5087 [LOG_CRIT] = "crit",
5089 [LOG_WARNING] = "warning",
5090 [LOG_NOTICE] = "notice",
5091 [LOG_INFO] = "info",
5092 [LOG_DEBUG] = "debug"
5095 DEFINE_STRING_TABLE_LOOKUP_WITH_FALLBACK(log_level, int, LOG_DEBUG);
5097 static const char* const sched_policy_table[] = {
5098 [SCHED_OTHER] = "other",
5099 [SCHED_BATCH] = "batch",
5100 [SCHED_IDLE] = "idle",
5101 [SCHED_FIFO] = "fifo",
5105 DEFINE_STRING_TABLE_LOOKUP_WITH_FALLBACK(sched_policy, int, INT_MAX);
5107 static const char* const rlimit_table[_RLIMIT_MAX] = {
5108 [RLIMIT_CPU] = "LimitCPU",
5109 [RLIMIT_FSIZE] = "LimitFSIZE",
5110 [RLIMIT_DATA] = "LimitDATA",
5111 [RLIMIT_STACK] = "LimitSTACK",
5112 [RLIMIT_CORE] = "LimitCORE",
5113 [RLIMIT_RSS] = "LimitRSS",
5114 [RLIMIT_NOFILE] = "LimitNOFILE",
5115 [RLIMIT_AS] = "LimitAS",
5116 [RLIMIT_NPROC] = "LimitNPROC",
5117 [RLIMIT_MEMLOCK] = "LimitMEMLOCK",
5118 [RLIMIT_LOCKS] = "LimitLOCKS",
5119 [RLIMIT_SIGPENDING] = "LimitSIGPENDING",
5120 [RLIMIT_MSGQUEUE] = "LimitMSGQUEUE",
5121 [RLIMIT_NICE] = "LimitNICE",
5122 [RLIMIT_RTPRIO] = "LimitRTPRIO",
5123 [RLIMIT_RTTIME] = "LimitRTTIME"
5126 DEFINE_STRING_TABLE_LOOKUP(rlimit, int);
5128 static const char* const ip_tos_table[] = {
5129 [IPTOS_LOWDELAY] = "low-delay",
5130 [IPTOS_THROUGHPUT] = "throughput",
5131 [IPTOS_RELIABILITY] = "reliability",
5132 [IPTOS_LOWCOST] = "low-cost",
5135 DEFINE_STRING_TABLE_LOOKUP_WITH_FALLBACK(ip_tos, int, 0xff);
5137 static const char *const __signal_table[] = {
5154 [SIGSTKFLT] = "STKFLT", /* Linux on SPARC doesn't know SIGSTKFLT */
5165 [SIGVTALRM] = "VTALRM",
5167 [SIGWINCH] = "WINCH",
5173 DEFINE_PRIVATE_STRING_TABLE_LOOKUP(__signal, int);
/* Converts a signal number into a string. The name is first looked up
 * with __signal_to_string(). As a fallback, numbers in the range
 * SIGRTMIN..SIGRTMAX are formatted as "RTMIN+<offset>" and everything
 * else as a plain decimal number, both into a thread-local buffer sized
 * for the longest possible result.
 * NOTE(review): in the fallback cases the returned pointer presumably
 * refers to that buffer and is overwritten by the next call from the
 * same thread — confirm. */
5175 const char *signal_to_string(int signo) {
5176 static thread_local char buf[sizeof("RTMIN+")-1 + DECIMAL_STR_MAX(int) + 1];
5179 name = __signal_to_string(signo);
5183 if (signo >= SIGRTMIN && signo <= SIGRTMAX)
5184 snprintf(buf, sizeof(buf), "RTMIN+%d", signo - SIGRTMIN);
5186 snprintf(buf, sizeof(buf), "%d", signo);
5191 int signal_from_string(const char *s) {
5196 signo = __signal_from_string(s);
5200 if (startswith(s, "RTMIN+")) {
5204 if (safe_atou(s, &u) >= 0) {
5205 signo = (int) u + offset;
5206 if (signo > 0 && signo < _NSIG)
5212 bool kexec_loaded(void) {
5213 bool loaded = false;
5216 if (read_one_line_file("/sys/kernel/kexec_loaded", &s) >= 0) {
5224 int prot_from_flags(int flags) {
5226 switch (flags & O_ACCMODE) {
5235 return PROT_READ|PROT_WRITE;
5242 char *format_bytes(char *buf, size_t l, off_t t) {
5245 static const struct {
5249 { "E", 1024ULL*1024ULL*1024ULL*1024ULL*1024ULL*1024ULL },
5250 { "P", 1024ULL*1024ULL*1024ULL*1024ULL*1024ULL },
5251 { "T", 1024ULL*1024ULL*1024ULL*1024ULL },
5252 { "G", 1024ULL*1024ULL*1024ULL },
5253 { "M", 1024ULL*1024ULL },
5257 if (t == (off_t) -1)
5260 for (i = 0; i < ELEMENTSOF(table); i++) {
5262 if (t >= table[i].factor) {
5265 (unsigned long long) (t / table[i].factor),
5266 (unsigned long long) (((t*10ULL) / table[i].factor) % 10ULL),
5273 snprintf(buf, l, "%lluB", (unsigned long long) t);
5281 void* memdup(const void *p, size_t l) {
5294 int fd_inc_sndbuf(int fd, size_t n) {
5296 socklen_t l = sizeof(value);
5298 r = getsockopt(fd, SOL_SOCKET, SO_SNDBUF, &value, &l);
5299 if (r >= 0 && l == sizeof(value) && (size_t) value >= n*2)
5302 /* If we have the privileges we will ignore the kernel limit. */
5305 if (setsockopt(fd, SOL_SOCKET, SO_SNDBUFFORCE, &value, sizeof(value)) < 0)
5306 if (setsockopt(fd, SOL_SOCKET, SO_SNDBUF, &value, sizeof(value)) < 0)
5312 int fd_inc_rcvbuf(int fd, size_t n) {
5314 socklen_t l = sizeof(value);
5316 r = getsockopt(fd, SOL_SOCKET, SO_RCVBUF, &value, &l);
5317 if (r >= 0 && l == sizeof(value) && (size_t) value >= n*2)
5320 /* If we have the privileges we will ignore the kernel limit. */
5323 if (setsockopt(fd, SOL_SOCKET, SO_RCVBUFFORCE, &value, sizeof(value)) < 0)
5324 if (setsockopt(fd, SOL_SOCKET, SO_RCVBUF, &value, sizeof(value)) < 0)
/* Spawns an agent process whose argument vector is built from the
 * NULL-terminated variadic argument list. All signals are blocked around
 * the fork so that the child starts with them blocked; the parent
 * restores its previous mask afterwards. The child asks to receive
 * SIGTERM when its parent dies, resets signal handlers and signal mask,
 * exits if the parent is already gone, closes every fd not listed in
 * except[], and, when stdout or stderr is not a TTY, reopens /dev/tty
 * for them. */
5329 int fork_agent(pid_t *pid, const int except[], unsigned n_except, const char *path, ...) {
5330 bool stdout_is_tty, stderr_is_tty;
5331 pid_t parent_pid, agent_pid;
5332 sigset_t ss, saved_ss;
5340 /* Spawns a temporary TTY agent, making sure it goes away when
5343 parent_pid = getpid();
5345 /* First we temporarily block all signals, so that the new
5346 * child has them blocked initially. This way, we can be sure
5347 * that SIGTERMs are not lost we might send to the agent. */
5348 assert_se(sigfillset(&ss) >= 0);
5349 assert_se(sigprocmask(SIG_SETMASK, &ss, &saved_ss) >= 0);
5352 if (agent_pid < 0) {
5353 assert_se(sigprocmask(SIG_SETMASK, &saved_ss, NULL) >= 0);
5357 if (agent_pid != 0) {
5358 assert_se(sigprocmask(SIG_SETMASK, &saved_ss, NULL) >= 0);
5365 * Make sure the agent goes away when the parent dies */
5366 if (prctl(PR_SET_PDEATHSIG, SIGTERM) < 0)
5367 _exit(EXIT_FAILURE);
5369 /* Make sure we actually can kill the agent, if we need to, in
5370 * case somebody invoked us from a shell script that trapped
5371 * SIGTERM or so... */
5372 reset_all_signal_handlers();
5373 reset_signal_mask();
5375 /* Check whether our parent died before we were able
5376 * to set the death signal and unblock the signals */
5377 if (getppid() != parent_pid)
5378 _exit(EXIT_SUCCESS);
5380 /* Don't leak fds to the agent */
5381 close_all_fds(except, n_except);
5383 stdout_is_tty = isatty(STDOUT_FILENO);
5384 stderr_is_tty = isatty(STDERR_FILENO);
5386 if (!stdout_is_tty || !stderr_is_tty) {
5389 /* Detach from stdout/stderr and reopen
5390 * /dev/tty for them. This is important to
5391 * ensure that when systemctl is started via
5392 * popen() or a similar call that expects to
5393 * read EOF we actually do generate EOF and
5394 * not delay this indefinitely because we
5395 * keep an unused copy of stdin around. */
5396 fd = open("/dev/tty", O_WRONLY);
5398 log_error_errno(errno, "Failed to open /dev/tty: %m");
5399 _exit(EXIT_FAILURE);
5403 dup2(fd, STDOUT_FILENO);
5406 dup2(fd, STDERR_FILENO);
5412 /* Count arguments */
5414 for (n = 0; va_arg(ap, char*); n++)
5419 l = alloca(sizeof(char *) * (n + 1));
5421 /* Fill in arguments */
5423 for (i = 0; i <= n; i++)
5424 l[i] = va_arg(ap, char*);
5428 _exit(EXIT_FAILURE);
/* Tries to apply the limit rlim to resource. If the requested values
 * cannot be set, a second attempt is made with both the soft and the
 * hard value clamped to the current hard limit of the process, i.e. the
 * closest values that are still permitted. */
5431 int setrlimit_closest(int resource, const struct rlimit *rlim) {
5432 struct rlimit highest, fixed;
5436 if (setrlimit(resource, rlim) >= 0)
5442 /* So we failed to set the desired limit, then let's try
5443 * to get as close as we can */
5444 assert_se(getrlimit(resource, &highest) == 0);
5446 fixed.rlim_cur = MIN(rlim->rlim_cur, highest.rlim_max);
5447 fixed.rlim_max = MIN(rlim->rlim_max, highest.rlim_max);
5449 if (setrlimit(resource, &fixed) < 0)
5455 int getenv_for_pid(pid_t pid, const char *field, char **_value) {
5456 _cleanup_fclose_ FILE *f = NULL;
5467 path = procfs_file_alloca(pid, "environ");
5469 f = fopen(path, "re");
5477 char line[LINE_MAX];
5480 for (i = 0; i < sizeof(line)-1; i++) {
5484 if (_unlikely_(c == EOF)) {
5494 if (memcmp(line, field, l) == 0 && line[l] == '=') {
5495 value = strdup(line + l + 1);
5509 bool http_etag_is_valid(const char *etag) {
5513 if (!endswith(etag, "\""))
5516 if (!startswith(etag, "\"") && !startswith(etag, "W/\""))
5522 bool http_url_is_valid(const char *url) {
5528 p = startswith(url, "http://");
5530 p = startswith(url, "https://");
5537 return ascii_is_valid(p);
5540 bool documentation_url_is_valid(const char *url) {
5546 if (http_url_is_valid(url))
5549 p = startswith(url, "file:/");
5551 p = startswith(url, "info:");
5553 p = startswith(url, "man:");
5558 return ascii_is_valid(p);
/* Detects whether we are running inside an initrd. The static variable
 * saved starts out as -1 and receives the outcome of the detection, so
 * the checks below do not have to be repeated on every call. */
5561 bool in_initrd(void) {
5562 static int saved = -1;
5568 /* We make two checks here:
5570 * 1. the flag file /etc/initrd-release must exist
5571 * 2. the root file system must be a memory file system
5573 * The second check is extra paranoia, since misdetecting an
5574 * initrd can have bad consequences due to the initrd
5575 * emptying when transitioning to the main systemd.
5578 saved = access("/etc/initrd-release", F_OK) >= 0 &&
5579 statfs("/", &s) >= 0 &&
5580 is_temporary_fs(&s);
5585 void warn_melody(void) {
5586 _cleanup_close_ int fd = -1;
5588 fd = open("/dev/console", O_WRONLY|O_CLOEXEC|O_NOCTTY);
5592 /* Yeah, this is synchronous. Kinda sucks. But well... */
5594 ioctl(fd, KIOCSOUND, (int)(1193180/440));
5595 usleep(125*USEC_PER_MSEC);
5597 ioctl(fd, KIOCSOUND, (int)(1193180/220));
5598 usleep(125*USEC_PER_MSEC);
5600 ioctl(fd, KIOCSOUND, (int)(1193180/220));
5601 usleep(125*USEC_PER_MSEC);
5603 ioctl(fd, KIOCSOUND, 0);
5606 int make_console_stdio(void) {
5609 /* Make /dev/console the controlling terminal and stdin/stdout/stderr */
5611 fd = acquire_terminal("/dev/console", false, true, true, USEC_INFINITY);
5613 return log_error_errno(fd, "Failed to acquire terminal: %m");
5617 return log_error_errno(r, "Failed to duplicate terminal fd: %m");
5622 int get_home_dir(char **_h) {
5630 /* Take the user specified one */
5631 e = secure_getenv("HOME");
5632 if (e && path_is_absolute(e)) {
5641 /* Hardcode home directory for root to avoid NSS */
5644 h = strdup("/root");
5652 /* Check the database... */
5656 return errno > 0 ? -errno : -ESRCH;
5658 if (!path_is_absolute(p->pw_dir))
5661 h = strdup(p->pw_dir);
/* Determines the login shell of the current user and hands it out via
 * *_s. The sources consulted, in order, are the $SHELL environment
 * variable, a hardcoded /bin/sh, and the pw_shell field of the user
 * database entry, which must be an absolute path. */
5669 int get_shell(char **_s) {
5677 /* Take the user specified one */
5678 e = getenv("SHELL");
5688 /* Hardcode the shell for root to avoid NSS */
5691 s = strdup("/bin/sh");
5699 /* Check the database... */
5703 return errno > 0 ? -errno : -ESRCH;
5705 if (!path_is_absolute(p->pw_shell))
5708 s = strdup(p->pw_shell);
5716 bool filename_is_valid(const char *p) {
5730 if (strlen(p) > FILENAME_MAX)
/* Checks whether a string is free of characters that are unsafe to pass
 * on unquoted.
 *
 * Returns false if p is NULL or if it contains an ASCII control
 * character (0x01..0x1f), a backslash, a double quote, a single quote or
 * DEL (0x7f). Returns true otherwise, including for the empty string. */
bool string_is_safe(const char *p) {
        const char *t;

        if (!p)
                return false;

        for (t = p; *t; t++) {
                if (*t > 0 && *t < ' ')
                        return false;

                /* The escape must be spelled "\x7f". The previous
                 * spelling "\0x7f" is a NUL byte followed by the text
                 * "x7f", which terminated the set early and therefore
                 * never matched DEL. */
                if (strchr("\\\"\'\x7f", *t))
                        return false;
        }

        return true;
}
5754 * Check if a string contains control characters. If 'ok' is non-NULL
5755 * it may be a string containing additional CCs to be considered OK.
5757 bool string_has_cc(const char *p, const char *ok) {
5762 for (t = p; *t; t++) {
5763 if (ok && strchr(ok, *t))
5766 if (*t > 0 && *t < ' ')
/* Screens a path for elements that are dangerous or confusing. The
 * checks look for ".." as a path component (alone, leading, trailing or
 * embedded), a length above PATH_MAX, "." as a path component in the
 * same four positions, and doubled slashes.
 * NOTE(review): each matching check presumably makes the function
 * return false — confirm. */
5776 bool path_is_safe(const char *p) {
5781 if (streq(p, "..") || startswith(p, "../") || endswith(p, "/..") || strstr(p, "/../"))
5784 if (strlen(p) > PATH_MAX)
5787 /* The following two checks are not really dangerous, but hey, they still are confusing */
5788 if (streq(p, ".") || startswith(p, "./") || endswith(p, "/.") || strstr(p, "/./"))
5791 if (strstr(p, "//"))
5797 /* hey glibc, APIs with callbacks without a user pointer are so useless */
5798 void *xbsearch_r(const void *key, const void *base, size_t nmemb, size_t size,
5799 int (*compar) (const void *, const void *, void *), void *arg) {
5808 p = (void *)(((const char *) base) + (idx * size));
5809 comparison = compar(key, p, arg);
5812 else if (comparison > 0)
5820 void init_gettext(void) {
5821 setlocale(LC_ALL, "");
5822 textdomain(GETTEXT_PACKAGE);
/* Tells whether the current locale uses UTF-8. The answer is computed
 * once and kept in cached_answer (-1 = not determined yet). Failure to
 * set the locale and a codeset of "UTF-8" both result in true. */
5825 bool is_locale_utf8(void) {
5827 static int cached_answer = -1;
5829 if (cached_answer >= 0)
5832 if (!setlocale(LC_ALL, "")) {
5833 cached_answer = true;
5837 set = nl_langinfo(CODESET);
5839 cached_answer = true;
5843 if (streq(set, "UTF-8")) {
5844 cached_answer = true;
5848 /* For LC_CTYPE=="C" return true, because CTYPE is effectively
5849 * unset and everything can do UTF-8 nowadays. */
5850 set = setlocale(LC_CTYPE, NULL);
5852 cached_answer = true;
5856 /* Check result, but ignore the result if C was set
5860 !getenv("LC_ALL") &&
5861 !getenv("LC_CTYPE") &&
5865 return (bool) cached_answer;
5868 const char *draw_special_char(DrawSpecialChar ch) {
5869 static const char *draw_table[2][_DRAW_SPECIAL_CHAR_MAX] = {
5872 [DRAW_TREE_VERTICAL] = "\342\224\202 ", /* │ */
5873 [DRAW_TREE_BRANCH] = "\342\224\234\342\224\200", /* ├─ */
5874 [DRAW_TREE_RIGHT] = "\342\224\224\342\224\200", /* └─ */
5875 [DRAW_TREE_SPACE] = " ", /* */
5876 [DRAW_TRIANGULAR_BULLET] = "\342\200\243", /* ‣ */
5877 [DRAW_BLACK_CIRCLE] = "\342\227\217", /* ● */
5878 [DRAW_ARROW] = "\342\206\222", /* → */
5879 [DRAW_DASH] = "\342\200\223", /* – */
5882 /* ASCII fallback */ {
5883 [DRAW_TREE_VERTICAL] = "| ",
5884 [DRAW_TREE_BRANCH] = "|-",
5885 [DRAW_TREE_RIGHT] = "`-",
5886 [DRAW_TREE_SPACE] = " ",
5887 [DRAW_TRIANGULAR_BULLET] = ">",
5888 [DRAW_BLACK_CIRCLE] = "*",
5889 [DRAW_ARROW] = "->",
5894 return draw_table[!is_locale_utf8()][ch];
5897 char *strreplace(const char *text, const char *old_string, const char *new_string) {
5900 size_t l, old_len, new_len;
5906 old_len = strlen(old_string);
5907 new_len = strlen(new_string);
5920 if (!startswith(f, old_string)) {
5926 nl = l - old_len + new_len;
5927 a = realloc(r, nl + 1);
5935 t = stpcpy(t, new_string);
5947 char *strip_tab_ansi(char **ibuf, size_t *_isz) {
5948 const char *i, *begin = NULL;
5953 } state = STATE_OTHER;
5955 size_t osz = 0, isz;
5961 /* Strips ANSI color and replaces TABs by 8 spaces */
5963 isz = _isz ? *_isz : strlen(*ibuf);
5965 f = open_memstream(&obuf, &osz);
5969 for (i = *ibuf; i < *ibuf + isz + 1; i++) {
5974 if (i >= *ibuf + isz) /* EOT */
5976 else if (*i == '\x1B')
5977 state = STATE_ESCAPE;
5978 else if (*i == '\t')
5985 if (i >= *ibuf + isz) { /* EOT */
5988 } else if (*i == '[') {
5989 state = STATE_BRACKET;
5994 state = STATE_OTHER;
6001 if (i >= *ibuf + isz || /* EOT */
6002 (!(*i >= '0' && *i <= '9') && *i != ';' && *i != 'm')) {
6005 state = STATE_OTHER;
6007 } else if (*i == 'm')
6008 state = STATE_OTHER;
6030 int on_ac_power(void) {
6031 bool found_offline = false, found_online = false;
6032 _cleanup_closedir_ DIR *d = NULL;
6034 d = opendir("/sys/class/power_supply");
6036 return errno == ENOENT ? true : -errno;
6040 _cleanup_close_ int fd = -1, device = -1;
6046 if (!de && errno != 0)
6052 if (hidden_file(de->d_name))
6055 device = openat(dirfd(d), de->d_name, O_DIRECTORY|O_RDONLY|O_CLOEXEC|O_NOCTTY);
6057 if (errno == ENOENT || errno == ENOTDIR)
6063 fd = openat(device, "type", O_RDONLY|O_CLOEXEC|O_NOCTTY);
6065 if (errno == ENOENT)
6071 n = read(fd, contents, sizeof(contents));
6075 if (n != 6 || memcmp(contents, "Mains\n", 6))
6079 fd = openat(device, "online", O_RDONLY|O_CLOEXEC|O_NOCTTY);
6081 if (errno == ENOENT)
6087 n = read(fd, contents, sizeof(contents));
6091 if (n != 2 || contents[1] != '\n')
6094 if (contents[0] == '1') {
6095 found_online = true;
6097 } else if (contents[0] == '0')
6098 found_offline = true;
6103 return found_online || !found_offline;
6106 static int search_and_fopen_internal(const char *path, const char *mode, const char *root, char **search, FILE **_f) {
6113 if (!path_strv_resolve_uniq(search, root))
6116 STRV_FOREACH(i, search) {
6117 _cleanup_free_ char *p = NULL;
6121 p = strjoin(root, *i, "/", path, NULL);
6123 p = strjoin(*i, "/", path, NULL);
6133 if (errno != ENOENT)
6140 int search_and_fopen(const char *path, const char *mode, const char *root, const char **search, FILE **_f) {
6141 _cleanup_strv_free_ char **copy = NULL;
6147 if (path_is_absolute(path)) {
6150 f = fopen(path, mode);
6159 copy = strv_copy((char**) search);
6163 return search_and_fopen_internal(path, mode, root, copy, _f);
6166 int search_and_fopen_nulstr(const char *path, const char *mode, const char *root, const char *search, FILE **_f) {
6167 _cleanup_strv_free_ char **s = NULL;
6169 if (path_is_absolute(path)) {
6172 f = fopen(path, mode);
6181 s = strv_split_nulstr(search);
6185 return search_and_fopen_internal(path, mode, root, s, _f);
6188 char *strextend(char **x, ...) {
6195 l = f = *x ? strlen(*x) : 0;
6202 t = va_arg(ap, const char *);
6207 if (n > ((size_t) -1) - l) {
6216 r = realloc(*x, l+1);
6226 t = va_arg(ap, const char *);
6240 char *strrep(const char *s, unsigned n) {
6248 p = r = malloc(l * n + 1);
6252 for (i = 0; i < n; i++)
/* Makes sure the array at *p has room for at least need elements of
 * size bytes each. Nothing has to be done when *allocated already covers
 * need. Otherwise the new capacity is the larger of need * 2 and
 * 64 / size elements, so repeated appends do not reallocate every time,
 * and *allocated is updated to that element count. */
6259 void* greedy_realloc(void **p, size_t *allocated, size_t need, size_t size) {
6266 if (*allocated >= need)
6269 newalloc = MAX(need * 2, 64u / size);
6270 a = newalloc * size;
6272 /* check for overflows: a wrapped product is smaller than size * need.
 * NOTE(review): size * need can itself wrap, and need * 2 above can
 * wrap as well; this comparison does not catch every such case. */
6273 if (a < size * need)
6281 *allocated = newalloc;
6285 void* greedy_realloc0(void **p, size_t *allocated, size_t need, size_t size) {
6294 q = greedy_realloc(p, allocated, need, size);
6298 if (*allocated > prev)
6299 memzero(q + prev * size, (*allocated - prev) * size);
/* Returns true if c is a hexadecimal digit (0-9, a-f, A-F). */
static bool id128_char_is_hex(char c) {
        return (c >= '0' && c <= '9') ||
               (c >= 'a' && c <= 'f') ||
               (c >= 'A' && c <= 'F');
}

/* Validates the textual form of a 128bit ID.
 *
 * Two spellings are accepted: 32 hexadecimal digits, or the 36 character
 * UUID form with '-' at offsets 8, 13, 18 and 23 and hexadecimal digits
 * everywhere else. Any other length or character yields false.
 *
 * The digit check used to accept the full ranges a-z and A-Z, which let
 * strings through that are not hexadecimal at all; it is now limited to
 * a-f and A-F. */
bool id128_is_valid(const char *s) {
        size_t i, l;

        l = strlen(s);

        if (l == 32) {

                /* Simple formatted 128bit hex string */

                for (i = 0; i < l; i++)
                        if (!id128_char_is_hex(s[i]))
                                return false;

        } else if (l == 36) {

                /* Formatted UUID */

                for (i = 0; i < l; i++) {
                        char c = s[i];

                        if (i == 8 || i == 13 || i == 18 || i == 23) {
                                if (c != '-')
                                        return false;
                        } else if (!id128_char_is_hex(c))
                                return false;
                }

        } else
                return false;

        return true;
}
6345 int split_pair(const char *s, const char *sep, char **l, char **r) {
6360 a = strndup(s, x - s);
6364 b = strdup(x + strlen(sep));
6376 int shall_restore_state(void) {
6377 _cleanup_free_ char *value = NULL;
6380 r = get_proc_cmdline_key("systemd.restore_state=", &value);
6386 return parse_boolean(value) != 0;
6389 int proc_cmdline(char **ret) {
6392 if (detect_container(NULL) > 0)
6393 return get_process_cmdline(1, 0, false, ret);
6395 return read_one_line_file("/proc/cmdline", ret);
6398 int parse_proc_cmdline(int (*parse_item)(const char *key, const char *value)) {
6399 _cleanup_free_ char *line = NULL;
6405 r = proc_cmdline(&line);
6411 _cleanup_free_ char *word = NULL;
6414 r = unquote_first_word(&p, &word, true);
6420 /* Filter out arguments that are intended only for the
6422 if (!in_initrd() && startswith(word, "rd."))
6425 value = strchr(word, '=');
6429 r = parse_item(word, value);
6437 int get_proc_cmdline_key(const char *key, char **value) {
6438 _cleanup_free_ char *line = NULL, *ret = NULL;
6445 r = proc_cmdline(&line);
6451 _cleanup_free_ char *word = NULL;
6454 r = unquote_first_word(&p, &word, true);
6460 /* Filter out arguments that are intended only for the
6462 if (!in_initrd() && startswith(word, "rd."))
6466 e = startswith(word, key);
6470 r = free_and_strdup(&ret, e);
6476 if (streq(word, key))
6490 int container_get_leader(const char *machine, pid_t *pid) {
6491 _cleanup_free_ char *s = NULL, *class = NULL;
6499 p = strjoina("/run/systemd/machines/", machine);
6500 r = parse_env_file(p, NEWLINE, "LEADER", &s, "CLASS", &class, NULL);
6508 if (!streq_ptr(class, "container"))
6511 r = parse_pid(s, &leader);
6521 int namespace_open(pid_t pid, int *pidns_fd, int *mntns_fd, int *netns_fd, int *root_fd) {
6522 _cleanup_close_ int pidnsfd = -1, mntnsfd = -1, netnsfd = -1;
6530 mntns = procfs_file_alloca(pid, "ns/mnt");
6531 mntnsfd = open(mntns, O_RDONLY|O_NOCTTY|O_CLOEXEC);
6539 pidns = procfs_file_alloca(pid, "ns/pid");
6540 pidnsfd = open(pidns, O_RDONLY|O_NOCTTY|O_CLOEXEC);
6548 netns = procfs_file_alloca(pid, "ns/net");
6549 netnsfd = open(netns, O_RDONLY|O_NOCTTY|O_CLOEXEC);
6557 root = procfs_file_alloca(pid, "root");
6558 rfd = open(root, O_RDONLY|O_NOCTTY|O_CLOEXEC|O_DIRECTORY);
6564 *pidns_fd = pidnsfd;
6567 *mntns_fd = mntnsfd;
6570 *netns_fd = netnsfd;
6575 pidnsfd = mntnsfd = netnsfd = -1;
/* Moves the calling process into a set of namespaces. setns() is called
 * for the PID, mount and network namespace, in that order. Then the
 * process changes directory to root_fd and chroot()s into it. Finally
 * the credentials are reset to root with setresgid(0, 0, 0), an empty
 * supplementary group list, and setresuid(0, 0, 0).
 * NOTE(review): each step is presumably skipped when the corresponding
 * fd is not valid — confirm. */
6580 int namespace_enter(int pidns_fd, int mntns_fd, int netns_fd, int root_fd) {
6583 if (setns(pidns_fd, CLONE_NEWPID) < 0)
6587 if (setns(mntns_fd, CLONE_NEWNS) < 0)
6591 if (setns(netns_fd, CLONE_NEWNET) < 0)
6595 if (fchdir(root_fd) < 0)
6598 if (chroot(".") < 0)
6602 if (setresgid(0, 0, 0) < 0)
6605 if (setgroups(0, NULL) < 0)
6608 if (setresuid(0, 0, 0) < 0)
6614 bool pid_is_unwaited(pid_t pid) {
6615 /* Checks whether a PID is still valid at all, including a zombie */
/* Signal 0 delivers nothing; kill() then only reports whether the
 * process could be signalled. */
6620 if (kill(pid, 0) >= 0)
/* Any failure other than ESRCH (for example EPERM) still means that a
 * process with this PID exists. */
6623 return errno != ESRCH;
6626 bool pid_is_alive(pid_t pid) {
6629 /* Checks whether a PID is still valid and not a zombie */
6634 r = get_process_state(pid);
6635 if (r == -ENOENT || r == 'Z')
6641 int getpeercred(int fd, struct ucred *ucred) {
6642 socklen_t n = sizeof(struct ucred);
6649 r = getsockopt(fd, SOL_SOCKET, SO_PEERCRED, &u, &n);
6653 if (n != sizeof(struct ucred))
6656 /* Check if the data is actually useful and not suppressed due
6657 * to namespacing issues */
6660 if (u.uid == UID_INVALID)
6662 if (u.gid == GID_INVALID)
6669 int getpeersec(int fd, char **ret) {
6681 r = getsockopt(fd, SOL_SOCKET, SO_PEERSEC, s, &n);
6685 if (errno != ERANGE)
6692 r = getsockopt(fd, SOL_SOCKET, SO_PEERSEC, s, &n);
6708 /* This is much like mkostemp() but is subject to umask(). */
6709 int mkostemp_safe(char *pattern, int flags) {
/* The _cleanup_umask_ attribute is expected to restore the saved umask
 * when u goes out of scope — NOTE(review): confirm against the macro
 * definition. */
6710 _cleanup_umask_ mode_t u;
6717 fd = mkostemp(pattern, flags);
6724 int open_tmpfile(const char *path, int flags) {
6731 /* Try O_TMPFILE first, if it is supported */
6732 fd = open(path, flags|O_TMPFILE, S_IRUSR|S_IWUSR);
6737 /* Fall back to unguessable name + unlinking */
6738 p = strjoina(path, "/systemd-tmp-XXXXXX");
6740 fd = mkostemp_safe(p, flags);
/* Inspects the mode of the file behind fd and logs a warning for each
 * questionable setting found: any execute bit (0111), the world-writable
 * bit (0002), and, only when running as PID 1, missing read permission
 * for group or others (0044). path is used for the log messages only;
 * the file itself is accessed through fd. */
6748 int fd_warn_permissions(const char *path, int fd) {
6751 if (fstat(fd, &st) < 0)
6754 if (st.st_mode & 0111)
6755 log_warning("Configuration file %s is marked executable. Please remove executable permission bits. Proceeding anyway.", path);
6757 if (st.st_mode & 0002)
6758 log_warning("Configuration file %s is marked world-writable. Please remove world writability permission bits. Proceeding anyway.", path);
6760 if (getpid() == 1 && (st.st_mode & 0044) != 0044)
6761 log_warning("Configuration file %s is marked world-inaccessible. This has no effect as configuration data is accessible via APIs without restrictions. Proceeding anyway.", path);
6766 unsigned long personality_from_string(const char *p) {
6768 /* Parse a personality specifier. We introduce our own
6769 * identifiers that indicate specific ABIs, rather than just
6770 * hints regarding the register size, since we want to keep
6771 * things open for multiple locally supported ABIs for the
6772 * same register size. We try to reuse the ABI identifiers
6773 * used by libseccomp. */
6775 #if defined(__x86_64__)
6777 if (streq(p, "x86"))
6780 if (streq(p, "x86-64"))
6783 #elif defined(__i386__)
6785 if (streq(p, "x86"))
6789 /* personality(7) documents that 0xffffffffUL is used for
6790 * querying the current personality, hence let's use that here
6791 * as error indicator. */
6792 return 0xffffffffUL;
6795 const char* personality_to_string(unsigned long p) {
6797 #if defined(__x86_64__)
6799 if (p == PER_LINUX32)
6805 #elif defined(__i386__)
/* Returns the amount of physical memory in bytes, computed as the
 * number of physical pages reported by sysconf(_SC_PHYS_PAGES) times
 * page_size(). */
6814 uint64_t physical_memory(void) {
6817 /* We return this as uint64_t in case we are running as 32bit
6818 * process on a 64bit kernel with huge amounts of memory */
6820 mem = sysconf(_SC_PHYS_PAGES);
6823 return (uint64_t) mem * (uint64_t) page_size();
6826 void hexdump(FILE *f, const void *p, size_t s) {
6827 const uint8_t *b = p;
6830 assert(s == 0 || b);
6835 fprintf(f, "%04x ", n);
6837 for (i = 0; i < 16; i++) {
6842 fprintf(f, "%02x ", b[i]);
6850 for (i = 0; i < 16; i++) {
6855 fputc(isprint(b[i]) ? (char) b[i] : '.', f);
6869 int update_reboot_param_file(const char *param) {
6874 r = write_string_file(REBOOT_PARAM_FILE, param);
6876 log_error("Failed to write reboot param to "
6877 REBOOT_PARAM_FILE": %s", strerror(-r));
6879 unlink(REBOOT_PARAM_FILE);
6884 int umount_recursive(const char *prefix, int flags) {
6888 /* Try to umount everything recursively below a
6889 * directory. Also, take care of stacked mounts, and keep
6890 * unmounting them until they are gone. */
6893 _cleanup_fclose_ FILE *proc_self_mountinfo = NULL;
6898 proc_self_mountinfo = fopen("/proc/self/mountinfo", "re");
6899 if (!proc_self_mountinfo)
6903 _cleanup_free_ char *path = NULL, *p = NULL;
6906 k = fscanf(proc_self_mountinfo,
6907 "%*s " /* (1) mount id */
6908 "%*s " /* (2) parent id */
6909 "%*s " /* (3) major:minor */
6910 "%*s " /* (4) root */
6911 "%ms " /* (5) mount point */
6912 "%*s" /* (6) mount options */
6913 "%*[^-]" /* (7) optional fields */
6914 "- " /* (8) separator */
6915 "%*s " /* (9) file system type */
6916 "%*s" /* (10) mount source */
6917 "%*s" /* (11) mount options 2 */
6918 "%*[^\n]", /* some rubbish at the end */
6927 p = cunescape(path);
6931 if (!path_startswith(p, prefix))
6934 if (umount2(p, flags) < 0) {
6950 static int get_mount_flags(const char *path, unsigned long *flags) {
6953 if (statvfs(path, &buf) < 0)
6955 *flags = buf.f_flag;
6959 int bind_remount_recursive(const char *prefix, bool ro) {
6960 _cleanup_set_free_free_ Set *done = NULL;
6961 _cleanup_free_ char *cleaned = NULL;
6964 /* Recursively remount a directory (and all its submounts)
6965 * read-only or read-write. If the directory is already
6966 * mounted, we reuse the mount and simply mark it
6967 * MS_BIND|MS_RDONLY (or remove the MS_RDONLY for read-write
6968 * operation). If it isn't we first make it one. Afterwards we
6969 * apply MS_BIND|MS_RDONLY (or remove MS_RDONLY) to all
6970 * submounts we can access, too. When mounts are stacked on
6971 * the same mount point we only care for each individual
6972 * "top-level" mount on each point, as we cannot
6973 * influence/access the underlying mounts anyway. We do not
6974 * have any effect on future submounts that might get
6975 * propagated, they might be writable. This includes future
6976 * submounts that have been triggered via autofs. */
6978 cleaned = strdup(prefix);
6982 path_kill_slashes(cleaned);
6984 done = set_new(&string_hash_ops);
6989 _cleanup_fclose_ FILE *proc_self_mountinfo = NULL;
6990 _cleanup_set_free_free_ Set *todo = NULL;
6991 bool top_autofs = false;
6993 unsigned long orig_flags;
6995 todo = set_new(&string_hash_ops);
6999 proc_self_mountinfo = fopen("/proc/self/mountinfo", "re");
7000 if (!proc_self_mountinfo)
7004 _cleanup_free_ char *path = NULL, *p = NULL, *type = NULL;
7007 k = fscanf(proc_self_mountinfo,
7008 "%*s " /* (1) mount id */
7009 "%*s " /* (2) parent id */
7010 "%*s " /* (3) major:minor */
7011 "%*s " /* (4) root */
7012 "%ms " /* (5) mount point */
7013 "%*s" /* (6) mount options (superblock) */
7014 "%*[^-]" /* (7) optional fields */
7015 "- " /* (8) separator */
7016 "%ms " /* (9) file system type */
7017 "%*s" /* (10) mount source */
7018 "%*s" /* (11) mount options (bind mount) */
7019 "%*[^\n]", /* some rubbish at the end */
7029 p = cunescape(path);
7033 /* Let's ignore autofs mounts. If they aren't
7034 * triggered yet, we want to avoid triggering
7035 * them, as we don't make any guarantees for
7036 * future submounts anyway. If they are
7037 * already triggered, then we will find
7038 * another entry for this. */
7039 if (streq(type, "autofs")) {
7040 top_autofs = top_autofs || path_equal(cleaned, p);
7044 if (path_startswith(p, cleaned) &&
7045 !set_contains(done, p)) {
7047 r = set_consume(todo, p);
7057 /* If we have no submounts to process anymore and if
7058 * the root is either already done, or an autofs, we
7060 if (set_isempty(todo) &&
7061 (top_autofs || set_contains(done, cleaned)))
7064 if (!set_contains(done, cleaned) &&
7065 !set_contains(todo, cleaned)) {
7066 /* The prefix directory itself is not yet a
7067 * mount, make it one. */
7068 if (mount(cleaned, cleaned, NULL, MS_BIND|MS_REC, NULL) < 0)
/* NOTE(review): orig_flags is declared without an initializer and the
 * result of get_mount_flags() is ignored here. If get_mount_flags()
 * fails before storing a value, the flags used below are
 * indeterminate. */
7072 (void) get_mount_flags(cleaned, &orig_flags);
7073 orig_flags &= ~MS_RDONLY;
/* NOTE(review): this remount is addressed via prefix, while the
 * surrounding calls use the slash-normalized copy in cleaned — confirm
 * that this is intended. */
7075 if (mount(NULL, prefix, NULL, orig_flags|MS_BIND|MS_REMOUNT|(ro ? MS_RDONLY : 0), NULL) < 0)
7078 x = strdup(cleaned);
7082 r = set_consume(done, x);
7087 while ((x = set_steal_first(todo))) {
7089 r = set_consume(done, x);
7095 /* Try to reuse the original flag set, but
7096 * don't care for errors, in case of
7097 * obstructed mounts */
7099 (void) get_mount_flags(x, &orig_flags);
7100 orig_flags &= ~MS_RDONLY;
7102 if (mount(NULL, x, NULL, orig_flags|MS_BIND|MS_REMOUNT|(ro ? MS_RDONLY : 0), NULL) < 0) {
7104 /* Deal with mount points that are
7105 * obstructed by a later mount */
7107 if (errno != ENOENT)
7115 int fflush_and_check(FILE *f) {
7122 return errno ? -errno : -EIO;
7127 int tempfn_xxxxxx(const char *p, char **ret) {
7139 * /foo/bar/.#waldoXXXXXX
7143 if (!filename_is_valid(fn))
7146 t = new(char, strlen(p) + 2 + 6 + 1);
7150 strcpy(stpcpy(stpcpy(mempcpy(t, p, fn - p), ".#"), fn), "XXXXXX");
7152 *ret = path_kill_slashes(t);
7156 int tempfn_random(const char *p, char **ret) {
7170 * /foo/bar/.#waldobaa2a261115984a9
7174 if (!filename_is_valid(fn))
7177 t = new(char, strlen(p) + 2 + 16 + 1);
7181 x = stpcpy(stpcpy(mempcpy(t, p, fn - p), ".#"), fn);
7184 for (i = 0; i < 16; i++) {
7185 *(x++) = hexchar(u & 0xF);
7191 *ret = path_kill_slashes(t);
7195 int tempfn_random_child(const char *p, char **ret) {
7206 * /foo/bar/waldo/.#3c2b6219aa75d7d0
7209 t = new(char, strlen(p) + 3 + 16 + 1);
7213 x = stpcpy(stpcpy(t, p), "/.#");
7216 for (i = 0; i < 16; i++) {
7217 *(x++) = hexchar(u & 0xF);
7223 *ret = path_kill_slashes(t);
7227 /* Returns true if the hostname is one of the names that refer to the local host */
7228 bool is_localhost(const char *hostname) {
7231 /* This tries to identify local host and domain names
7232 * described in RFC6761 plus the redhatism of .localdomain */
7234 return streq(hostname, "localhost") ||
7235 streq(hostname, "localhost.") ||
7236 streq(hostname, "localdomain.") ||
7237 streq(hostname, "localdomain") ||
7238 endswith(hostname, ".localhost") ||
7239 endswith(hostname, ".localhost.") ||
7240 endswith(hostname, ".localdomain") ||
7241 endswith(hostname, ".localdomain.");
/* Takes the lock on the user database by opening (and creating if
 * necessary, mode 0600) the file /etc/.pwd.lock, optionally below root,
 * and waiting for an fcntl() record lock on it with F_SETLKW. */
7244 int take_password_lock(const char *root) {
7246 struct flock flock = {
7248 .l_whence = SEEK_SET,
7256 /* This is roughly the same as lckpwdf(), but not as awful. We
7257 * don't want to use alarm() and signals, hence we implement
7258 * our own trivial version of this.
7260 * Note that shadow-utils also takes per-database locks in
7261 * addition to lckpwdf(). However, we don't, given that they
7262 * are redundant as they invoke lckpwdf() first and keep
7263 * it during everything they do. The per-database locks are
7264 * awfully racy, and thus we just won't do them. */
7267 path = strjoina(root, "/etc/.pwd.lock");
7269 path = "/etc/.pwd.lock";
7271 fd = open(path, O_WRONLY|O_CREAT|O_CLOEXEC|O_NOCTTY|O_NOFOLLOW, 0600);
7275 r = fcntl(fd, F_SETLKW, &flock);
/* Checks whether path is a symbolic link. lstat() is used so that the
 * link itself is examined rather than its target. On success the result
 * is 1 for a symlink and 0 for anything else; the !! normalizes the
 * value of S_ISLNK().
 * NOTE(review): a failing lstat() presumably yields a negative
 * errno-style value — confirm. */
7284 int is_symlink(const char *path) {
7287 if (lstat(path, &info) < 0)
7290 return !!S_ISLNK(info.st_mode);
/* Checks whether path is a directory. On success the result is 1 for a
 * directory and 0 for anything else; the !! normalizes the value of
 * S_ISDIR().
 * NOTE(review): follow presumably selects stat() (symlinks are
 * resolved) over lstat() (the link itself is examined) — confirm. */
7293 int is_dir(const char* path, bool follow) {
7298 r = stat(path, &st);
7300 r = lstat(path, &st);
7304 return !!S_ISDIR(st.st_mode);
/* State-machine parser that extracts the first, possibly quoted, word from
 * the string at *p and hands it back through *ret.
 *
 * p:     in/out cursor into the input string
 * ret:   receives the parsed word
 * relax: NOTE(review): effect not derivable from this view -- confirm */
7307 int unquote_first_word(const char **p, char **ret, bool relax) {
/* s is the output buffer, grown on demand with GREEDY_REALLOC(); sz is its
 * used length and allocated its capacity. It is freed automatically via
 * _cleanup_free_ unless ownership is handed over. */
7308 _cleanup_free_ char *s = NULL;
7309 size_t allocated = 0, sz = 0;
7316 SINGLE_QUOTE_ESCAPE,
7318 DOUBLE_QUOTE_ESCAPE,
7326 /* Parses the first word of a string, and returns it in
7327 * *ret. Removes all quotes in the process. When parsing fails
7328 * (because of an uneven number of quotes or similar), leaves
7329 * the pointer *p at the first invalid character. */
7339 else if (strchr(WHITESPACE, c))
7349 state = SINGLE_QUOTE;
7351 state = VALUE_ESCAPE;
7353 state = DOUBLE_QUOTE;
7354 else if (strchr(WHITESPACE, c))
/* Every append reserves sz+2 bytes: presumably the new character plus a
 * trailing NUL -- TODO confirm. */
7357 if (!GREEDY_REALLOC(s, allocated, sz+2))
7372 if (!GREEDY_REALLOC(s, allocated, sz+2))
7385 } else if (c == '\'')
7388 state = SINGLE_QUOTE_ESCAPE;
7390 if (!GREEDY_REALLOC(s, allocated, sz+2))
7398 case SINGLE_QUOTE_ESCAPE:
7405 if (!GREEDY_REALLOC(s, allocated, sz+2))
/* After the escaped character, continue inside the single-quoted section. */
7409 state = SINGLE_QUOTE;
7418 state = DOUBLE_QUOTE_ESCAPE;
7420 if (!GREEDY_REALLOC(s, allocated, sz+2))
7428 case DOUBLE_QUOTE_ESCAPE:
7435 if (!GREEDY_REALLOC(s, allocated, sz+2))
/* After the escaped character, continue inside the double-quoted section. */
7439 state = DOUBLE_QUOTE;
7445 if (!strchr(WHITESPACE, c))
/* Variadic front-end to unquote_first_word(). The arguments after p are
 * char ** output slots; while counting them a NULL slot is looked for
 * (presumably the list terminator -- TODO confirm). Each word is parsed
 * with relax=false into the temporary array l before anything is stored
 * into the caller's slots. */
7467 int unquote_many_words(const char **p, ...) {
7472 /* Parses a number of words from a string, stripping any
7473 * quotes if necessary. */
7477 /* Count how many words are expected */
7480 if (!va_arg(ap, char **))
7489 /* Read all words into a temporary array */
7490 l = newa0(char*, n);
7491 for (c = 0; c < n; c++) {
7493 r = unquote_first_word(p, &l[c], false);
7497 for (j = 0; j < c; j++)
7507 /* If we managed to parse all words, return them in the passed
7510 for (i = 0; i < n; i++) {
7513 v = va_arg(ap, char **);
/* p: address of the string pointer to replace
 * s: string to duplicate
 * NOTE(review): return value convention is not visible here -- confirm. */
7523 int free_and_strdup(char **p, const char *s) {
7528 /* Replaces a string pointer with an strdup()ed new string,
7529 * possibly freeing the old one. */
/* Sets the system hostname to s via sethostname(). The current name is
 * read first with gethostname(); presumably the set call is skipped when
 * the name already matches (as the function name suggests) -- TODO
 * confirm. */
7544 int sethostname_idempotent(const char *s) {
/* Zero-initialized and one byte larger than HOST_NAME_MAX, so the buffer
 * stays NUL-terminated even for a maximum-length name. */
7546 char buf[HOST_NAME_MAX + 1] = {};
7550 r = gethostname(buf, sizeof(buf));
/* sethostname() takes an explicit length, without the trailing NUL. */
7557 r = sethostname(s, strlen(s));
/* Retrieves the slave pty name for master fd using ptsname_r() into a
 * buffer c of size l. ERANGE is treated differently from other errors;
 * presumably the buffer is enlarged and the call retried in that case, and
 * the result is returned in *ret -- TODO confirm. */
7564 int ptsname_malloc(int fd, char **ret) {
7577 if (ptsname_r(fd, c, l) == 0) {
7581 if (errno != ERANGE) {
/* Opens a pty master with posix_openpt(flags) after entering namespaces of
 * process pid, and transfers the resulting fd over an AF_UNIX datagram
 * socket pair as an SCM_RIGHTS control message.
 *
 * The _exit() calls and the wait_for_terminate(child, ...) below indicate
 * the namespace-entering side runs in a separate child process -- the
 * fork itself is not visible in this view. */
7591 int openpt_in_namespace(pid_t pid, int flags) {
7592 _cleanup_close_ int pidnsfd = -1, mntnsfd = -1, rootfd = -1;
7593 _cleanup_close_pair_ int pair[2] = { -1, -1 };
/* Control buffer sized for exactly one file descriptor. */
7595 struct cmsghdr cmsghdr;
7596 uint8_t buf[CMSG_SPACE(sizeof(int))];
7598 struct msghdr mh = {
7599 .msg_control = &control,
7600 .msg_controllen = sizeof(control),
7602 struct cmsghdr *cmsg;
/* Acquire fds for the PID namespace, mount namespace and root directory
 * of the target process. */
7609 r = namespace_open(pid, &pidnsfd, &mntnsfd, NULL, &rootfd);
7613 if (socketpair(AF_UNIX, SOCK_DGRAM, 0, pair) < 0)
/* Sending side: keeps pair[1] only. */
7623 pair[0] = safe_close(pair[0]);
7625 r = namespace_enter(pidnsfd, mntnsfd, -1, rootfd);
7627 _exit(EXIT_FAILURE);
7629 master = posix_openpt(flags);
7631 _exit(EXIT_FAILURE);
/* Pack the master fd into a single SCM_RIGHTS control message. */
7633 cmsg = CMSG_FIRSTHDR(&mh);
7634 cmsg->cmsg_level = SOL_SOCKET;
7635 cmsg->cmsg_type = SCM_RIGHTS;
7636 cmsg->cmsg_len = CMSG_LEN(sizeof(int));
7637 memcpy(CMSG_DATA(cmsg), &master, sizeof(int));
/* Shrink the control length to what was actually filled in. */
7639 mh.msg_controllen = cmsg->cmsg_len;
7641 if (sendmsg(pair[1], &mh, MSG_NOSIGNAL) < 0)
7642 _exit(EXIT_FAILURE);
7644 _exit(EXIT_SUCCESS);
/* Receiving side: keeps pair[0] only. */
7647 pair[1] = safe_close(pair[1]);
7649 r = wait_for_terminate(child, &si);
/* Anything but a clean exit with EXIT_SUCCESS is singled out here
 * (presumably reported as an error -- TODO confirm). */
7652 if (si.si_code != CLD_EXITED || si.si_status != EXIT_SUCCESS)
/* MSG_CMSG_CLOEXEC: received fds get the close-on-exec flag set. */
7655 if (recvmsg(pair[0], &mh, MSG_NOSIGNAL|MSG_CMSG_CLOEXEC) < 0)
7658 for (cmsg = CMSG_FIRSTHDR(&mh); cmsg; cmsg = CMSG_NXTHDR(&mh, cmsg))
7659 if (cmsg->cmsg_level == SOL_SOCKET && cmsg->cmsg_type == SCM_RIGHTS) {
/* Number of fds carried = payload bytes / sizeof(int). */
7663 fds = (int*) CMSG_DATA(cmsg);
7664 n_fds = (cmsg->cmsg_len - CMSG_LEN(0)) / sizeof(int);
/* NOTE(review): presumably only reached when an unexpected number of fds
 * arrived -- the guarding condition is not visible; confirm. */
7667 close_many(fds, n_fds);
/* Reads extended attribute `attribute` of `filename` (resolved relative to
 * dirfd) into value/size, by opening the file and calling fgetxattr() on
 * the fd. If AT_SYMLINK_NOFOLLOW is set in flags the open uses O_NOFOLLOW.
 * The fd is closed automatically on return (_cleanup_close_). */
7677 ssize_t fgetxattrat_fake(int dirfd, const char *filename, const char *attribute, void *value, size_t size, int flags) {
7678 _cleanup_close_ int fd = -1;
7681 /* The kernel doesn't have a fgetxattrat() command, hence let's emulate one */
7683 fd = openat(dirfd, filename, O_RDONLY|O_CLOEXEC|O_NOCTTY|O_NOATIME|(flags & AT_SYMLINK_NOFOLLOW ? O_NOFOLLOW : 0));
7687 l = fgetxattr(fd, attribute, value, size);
/* Converts a little-endian 64-bit creation time as stored on disk into
 * *usec. The values 0 and UINT64_MAX are singled out (presumably rejected
 * as invalid -- TODO confirm). */
7694 static int parse_crtime(le64_t le, usec_t *usec) {
7700 if (u == 0 || u == (uint64_t) -1)
/* Reads the emulated creation time of the file behind fd from the
 * "user.crtime_usec" extended attribute and passes it to parse_crtime(). */
7707 int fd_getcrtime(int fd, usec_t *usec) {
7714 /* Until Linux gets a real concept of birthtime/creation time,
7715 * let's fake one with xattrs */
7717 n = fgetxattr(fd, "user.crtime_usec", &le, sizeof(le));
/* The attribute must be exactly one 64-bit value. */
7720 if (n != sizeof(le))
7723 return parse_crtime(le, usec);
/* Like fd_getcrtime(), but for the file `name` relative to dirfd; the
 * attribute is read through fgetxattrat_fake() with the given flags. */
7726 int fd_getcrtime_at(int dirfd, const char *name, usec_t *usec, int flags) {
7730 n = fgetxattrat_fake(dirfd, name, "user.crtime_usec", &le, sizeof(le), flags);
/* The attribute must be exactly one 64-bit value. */
7733 if (n != sizeof(le))
7736 return parse_crtime(le, usec);
/* Reads the emulated creation time of path p from the "user.crtime_usec"
 * extended attribute (via getxattr()) and passes it to parse_crtime(). */
7739 int path_getcrtime(const char *p, usec_t *usec) {
7746 n = getxattr(p, "user.crtime_usec", &le, sizeof(le));
/* The attribute must be exactly one 64-bit value. */
7749 if (n != sizeof(le))
7752 return parse_crtime(le, usec);
/* Stores usec as a little-endian 64-bit value in the "user.crtime_usec"
 * extended attribute of fd. usec may be replaced by the current
 * CLOCK_REALTIME time first (presumably when the caller passed no usable
 * value -- the condition is not visible; TODO confirm). */
7755 int fd_setcrtime(int fd, usec_t usec) {
7761 usec = now(CLOCK_REALTIME);
/* Fixed little-endian on-disk representation, independent of host order. */
7763 le = htole64((uint64_t) usec);
7764 if (fsetxattr(fd, "user.crtime_usec", &le, sizeof(le), 0) < 0)
/* Tells whether fds a and b refer to the same file. kcmp(KCMP_FILE) is
 * tried first; if it fails with ENOSYS the function falls back to comparing
 * fstat() data (file type, st_dev/st_ino) and the F_GETFL flags. */
7770 int same_fd(int a, int b) {
7771 struct stat sta, stb;
7778 /* Compares two file descriptors. Note that semantics are
7779 * quite different depending on whether we have kcmp() or we
7780 * don't. If we have kcmp() this will only return true for
7781 * dup()ed file descriptors, but not otherwise. If we don't
7782 * have kcmp() this will also return true for two fds of the same
7783 * file, created by separate open() calls. Since we use this
7784 * call mostly for filtering out duplicates in the fd store
7785 * this difference hopefully doesn't matter too much. */
7790 /* Try to use kcmp() if we have it. */
7792 r = kcmp(pid, pid, KCMP_FILE, a, b);
/* Only ENOSYS (no kcmp() available) leads to the fstat() fallback. */
7797 if (errno != ENOSYS)
7800 /* We don't have kcmp(), use fstat() instead. */
7801 if (fstat(a, &sta) < 0)
7804 if (fstat(b, &stb) < 0)
/* Different file types can never be the same file. */
7807 if ((sta.st_mode & S_IFMT) != (stb.st_mode & S_IFMT))
7810 /* We consider all device fds different, since two device fds
7811 * might refer to quite different device contexts even though
7812 * they share the same inode and backing dev_t. */
7814 if (S_ISCHR(sta.st_mode) || S_ISBLK(sta.st_mode))
7817 if (sta.st_dev != stb.st_dev || sta.st_ino != stb.st_ino)
7820 /* The fds refer to the same inode on disk, let's also check
7821 * if they have the same fd flags. This is useful to
7822 * distinguish the read and write side of a pipe created with
7824 fa = fcntl(a, F_GETFL);
7828 fb = fcntl(b, F_GETFL);
/* Sets or clears the inode flag bits given in mask on fd, using the
 * FS_IOC_GETFLAGS / FS_IOC_SETFLAGS ioctls. Presumably b selects between
 * setting (old | mask) and clearing (old & ~mask) -- TODO confirm. */
7835 int chattr_fd(int fd, bool b, unsigned mask) {
7836 unsigned old_attr, new_attr;
7843 if (ioctl(fd, FS_IOC_GETFLAGS, &old_attr) < 0)
7847 new_attr = old_attr | mask;
7849 new_attr = old_attr & ~mask;
/* Nothing would change: presumably the SETFLAGS ioctl is skipped here. */
7851 if (new_attr == old_attr)
7854 if (ioctl(fd, FS_IOC_SETFLAGS, &new_attr) < 0)
/* Path-based wrapper around chattr_fd(): opens p read-only (refusing a
 * symlink as the final component, O_NOFOLLOW) and applies b/mask to the
 * resulting fd, which is closed automatically on return. */
7860 int chattr_path(const char *p, bool b, unsigned mask) {
7861 _cleanup_close_ int fd = -1;
7868 fd = open(p, O_RDONLY|O_CLOEXEC|O_NOCTTY|O_NOFOLLOW);
7872 return chattr_fd(fd, b, mask);
/* Updates the inode flags of fd so that the bits selected by mask take the
 * corresponding bits of value; bits outside mask keep their current
 * state. */
7875 int change_attr_fd(int fd, unsigned value, unsigned mask) {
7876 unsigned old_attr, new_attr;
7883 if (ioctl(fd, FS_IOC_GETFLAGS, &old_attr) < 0)
/* Keep the unmasked bits, replace the masked ones by those from value. */
7886 new_attr = (old_attr & ~mask) |(value & mask);
/* Nothing would change: presumably the SETFLAGS ioctl is skipped here. */
7888 if (new_attr == old_attr)
7891 if (ioctl(fd, FS_IOC_SETFLAGS, &new_attr) < 0)
/* Reads the inode flags of fd into *ret using the FS_IOC_GETFLAGS ioctl. */
7897 int read_attr_fd(int fd, unsigned *ret) {
7900 if (ioctl(fd, FS_IOC_GETFLAGS, ret) < 0)
/* Path-based wrapper around read_attr_fd(): opens p read-only (refusing a
 * symlink as the final component, O_NOFOLLOW) and reads the inode flags of
 * the resulting fd, which is closed automatically on return. */
7906 int read_attr_path(const char *p, unsigned *ret) {
7907 _cleanup_close_ int fd = -1;
7912 fd = open(p, O_RDONLY|O_CLOEXEC|O_NOCTTY|O_NOFOLLOW);
7916 return read_attr_fd(fd, ret);
/* Creates (if needed) and locks the lock file p.
 *
 * p:         path of the lock file, opened with O_CREAT and mode 0600
 * operation: flock()-style operation (LOCK_EX or LOCK_SH, optionally
 *            ORed with LOCK_NB for a non-blocking attempt)
 * ret:       receives the lock state; its operation field is set here
 *
 * Open file description locks (F_OFD_SETLK/F_OFD_SETLKW) are tried first,
 * with a flock() fallback when fcntl() reports EINVAL. */
7919 int make_lock_file(const char *p, int operation, LockFile *ret) {
7920 _cleanup_close_ int fd = -1;
7921 _cleanup_free_ char *t = NULL;
7925 * We use UNPOSIX locks if they are available. They have nice
7926 * semantics, and are mostly compatible with NFS. However,
7927 * they are only available on new kernels. When we detect we
7928 * are running on an older kernel, then we fall back to good
7929 * old BSD locks. They also have nice semantics, but are
7930 * slightly problematic on NFS, where they are upgraded to
7931 * POSIX locks, even though locally they are orthogonal to
/* Map the flock()-style request onto an fcntl() lock type: exclusive
 * becomes a write lock, everything else a read lock. */
7941 .l_type = (operation & ~LOCK_NB) == LOCK_EX ? F_WRLCK : F_RDLCK,
7942 .l_whence = SEEK_SET,
7946 fd = open(p, O_CREAT|O_RDWR|O_NOFOLLOW|O_CLOEXEC|O_NOCTTY, 0600);
/* LOCK_NB selects the non-blocking variant of the OFD lock request. */
7950 r = fcntl(fd, (operation & LOCK_NB) ? F_OFD_SETLK : F_OFD_SETLKW, &fl);
7953 /* If the kernel is too old, use good old BSD locks */
7954 if (errno == EINVAL)
7955 r = flock(fd, operation);
/* A lock held by someone else (EAGAIN) is reported as -EBUSY. */
7958 return errno == EAGAIN ? -EBUSY : -errno;
7961 /* If we acquired the lock, let's check if the file
7962 * still exists in the file system. If not, then the
7963 * previous exclusive owner removed it and then closed
7964 * it. In such a case our acquired lock is worthless,
7965 * hence try again. */
7970 if (st.st_nlink > 0)
7973 fd = safe_close(fd);
7978 ret->operation = operation;
/* Takes a lock file associated with path p by deriving the lock file name
 * and delegating to make_lock_file(). The derived name is: the part of p
 * before fn, then ".#", then fn, then ".lck" (fn is presumably the last
 * component of p -- its computation is not visible; TODO confirm). */
7986 int make_lock_file_for(const char *p, int operation, LockFile *ret) {
7994 if (!filename_is_valid(fn))
/* strlen(p) + 2 for ".#" + 4 for ".lck" + 1 for the trailing NUL. */
7997 t = newa(char, strlen(p) + 2 + 4 + 1);
7998 stpcpy(stpcpy(stpcpy(mempcpy(t, p, fn - p), ".#"), fn), ".lck");
8000 return make_lock_file(t, operation, ret);
/* Releases a lock taken with make_lock_file(): if the lock is (or can be
 * upgraded to) exclusive, the lock file at f->path is unlinked; finally
 * f->fd is closed. */
8003 void release_lock_file(LockFile *f) {
8011 /* If we are the exclusive owner we can safely delete
8012 * the lock file itself. If we are not the exclusive
8013 * owner, we can try becoming it. */
8016 (f->operation & ~LOCK_NB) == LOCK_SH) {
8017 static const struct flock fl = {
8019 .l_whence = SEEK_SET,
/* Non-blocking upgrade attempt, with the same EINVAL fallback to flock()
 * that is used when taking the lock. */
8022 r = fcntl(f->fd, F_OFD_SETLK, &fl);
8023 if (r < 0 && errno == EINVAL)
8024 r = flock(f->fd, LOCK_EX|LOCK_NB);
8027 f->operation = LOCK_EX|LOCK_NB;
8030 if ((f->operation & ~LOCK_NB) == LOCK_EX)
8031 unlink_noerrno(f->path);
8037 f->fd = safe_close(f->fd);
/* Helper for sparse_write(). Presumably returns the number of leading NUL
 * bytes in the sz-byte buffer at p -- body not visible; TODO confirm. */
8041 static size_t nul_length(const uint8_t *p, size_t sz) {
/* Writes the sz-byte buffer p to fd, replacing runs of NUL bytes by
 * lseek(SEEK_CUR) so that holes can be left in the file instead of
 * written zeroes.
 *
 * run_length: NUL runs longer than this are skipped by seeking; NUL runs
 *             at the very start or end of the buffer are skipped
 *             regardless of their length.
 *
 * Returns the number of bytes of p consumed (q - p). */
8056 ssize_t sparse_write(int fd, const void *p, size_t sz, size_t run_length) {
/* q: scan cursor; w: start of data not yet written; e: presumably the end
 * of the buffer (initialization not visible). */
8057 const uint8_t *q, *w, *e;
8065 n = nul_length(q, e - q);
8067 /* If there are more than the specified run length of
8068 * NUL bytes, or if this is the beginning or the end
8069 * of the buffer, then seek instead of write */
8070 if ((n > run_length) ||
8071 (n > 0 && q == p) ||
8072 (n > 0 && q + n >= e)) {
/* Flush the pending non-NUL data [w, q) before skipping the run. */
8074 l = write(fd, w, q - w);
8081 if (lseek(fd, n, SEEK_CUR) == (off_t) -1)
/* Flush whatever data is still pending. */
8093 l = write(fd, w, q - w);
8100 return q - (const uint8_t*) p;
8103 void sigkill_wait(pid_t *pid) {
8109 if (kill(*pid, SIGKILL) > 0)
8110 (void) wait_for_terminate(*pid, NULL);
/* Parses a syslog priority prefix of the form "<N>", "<NN>" or "<NNN>" at
 * *p.
 *
 * p:             in/out cursor into the message
 * priority:      in/out; with_facility=true stores the full decimal value,
 *                otherwise only the level bits are replaced and the
 *                facility bits already in *priority are kept
 * with_facility: whether values above 7 (i.e. including a facility) are
 *                accepted
 *
 * NOTE(review): the '>' position is probed at fixed offsets 2, 3 and 4
 * after only checking that a '>' exists somewhere in the string. For a
 * very short input such as "<>" the probes at offsets 3 and 4 would read
 * past the terminating NUL unless lines not visible here guard against
 * it -- confirm. */
8113 int syslog_parse_priority(const char **p, int *priority, bool with_facility) {
/* a, b, c: hundreds, tens and ones digit of the priority value. */
8114 int a = 0, b = 0, c = 0;
8124 if (!strchr(*p, '>'))
8127 if ((*p)[2] == '>') {
8128 c = undecchar((*p)[1]);
8130 } else if ((*p)[3] == '>') {
8131 b = undecchar((*p)[1]);
8132 c = undecchar((*p)[2]);
8134 } else if ((*p)[4] == '>') {
8135 a = undecchar((*p)[1]);
8136 b = undecchar((*p)[2]);
8137 c = undecchar((*p)[3]);
/* Negative digits are checked for (presumably undecchar() signals a
 * non-digit that way); without facility only a single digit 0..7 is
 * allowed. */
8142 if (a < 0 || b < 0 || c < 0 ||
8143 (!with_facility && (a || b || c > 7)))
8147 *priority = a*100 + b*10 + c;
8149 *priority = (*priority & LOG_FACMASK) | c;
/* Linear search for key in the first len entries of table, compared with
 * streq_ptr(). Presumably returns the index of the first match, or a
 * negative value when nothing matches -- the return statements are not
 * visible; TODO confirm. */
8155 ssize_t string_table_lookup(const char * const *table, size_t len, const char *key) {
8161 for (i = 0; i < len; ++i)
8162 if (streq_ptr(table[i], key))
/* Closes every file descriptor carried in SCM_RIGHTS control messages of
 * mh. Control messages of other levels or types are left untouched. */
8168 void cmsg_close_all(struct msghdr *mh) {
8169 struct cmsghdr *cmsg;
8173 for (cmsg = CMSG_FIRSTHDR(mh); cmsg; cmsg = CMSG_NXTHDR(mh, cmsg))
8174 if (cmsg->cmsg_level == SOL_SOCKET && cmsg->cmsg_type == SCM_RIGHTS)
/* Number of fds carried = payload bytes / sizeof(int). */
8175 close_many((int*) CMSG_DATA(cmsg), (cmsg->cmsg_len - CMSG_LEN(0)) / sizeof(int));
8178 int rename_noreplace(int olddirfd, const char *oldpath, int newdirfd, const char *newpath) {
8182 ret = renameat2(olddirfd, oldpath, newdirfd, newpath, RENAME_NOREPLACE);
8186 /* Even though renameat2() exists since Linux 3.15, btrfs added
8187 * support for it later. If it is not implemented, fallback to another
8189 if (errno != EINVAL)
8192 /* The link()/unlink() fallback does not work on directories. But
8193 * renameat() without RENAME_NOREPLACE gives the same semantics on
8194 * directories, except when newpath is an *empty* directory. This is
8196 ret = fstatat(olddirfd, oldpath, &buf, AT_SYMLINK_NOFOLLOW);
8197 if (ret >= 0 && S_ISDIR(buf.st_mode)) {
8198 ret = renameat(olddirfd, oldpath, newdirfd, newpath);
8199 return ret >= 0 ? 0 : -errno;
8202 /* If it is not a directory, use the link()/unlink() fallback. */
8203 ret = linkat(olddirfd, oldpath, newdirfd, newpath, 0);
8207 ret = unlinkat(olddirfd, oldpath, 0);
8209 /* backup errno before the following unlinkat() alters it */
8211 (void) unlinkat(newdirfd, newpath, 0);