1 /*-*- Mode: C; c-basic-offset: 8; indent-tabs-mode: nil -*-*/
4 This file is part of systemd.
6 Copyright 2010 Lennart Poettering
8 systemd is free software; you can redistribute it and/or modify it
9 under the terms of the GNU Lesser General Public License as published by
10 the Free Software Foundation; either version 2.1 of the License, or
11 (at your option) any later version.
13 systemd is distributed in the hope that it will be useful, but
14 WITHOUT ANY WARRANTY; without even the implied warranty of
15 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
16 Lesser General Public License for more details.
18 You should have received a copy of the GNU Lesser General Public License
19 along with systemd; If not, see <http://www.gnu.org/licenses/>.
31 #include <sys/resource.h>
32 #include <linux/sched.h>
33 #include <sys/types.h>
37 #include <sys/ioctl.h>
39 #include <linux/tiocl.h>
44 #include <sys/prctl.h>
45 #include <sys/utsname.h>
47 #include <netinet/ip.h>
56 #include <sys/mount.h>
57 #include <linux/magic.h>
61 #include <sys/personality.h>
62 #include <sys/xattr.h>
63 #include <sys/statvfs.h>
67 /* When we include libgen.h because we need dirname() we immediately
68 * undefine basename() since libgen.h defines it as a macro to the XDG
69 * version which is really broken. */
73 #ifdef HAVE_SYS_AUXV_H
85 #include "path-util.h"
86 #include "exit-status.h"
90 #include "device-nodes.h"
95 #include "sparse-endian.h"
98 char **saved_argv = NULL;
100 static volatile unsigned cached_columns = 0;
101 static volatile unsigned cached_lines = 0;
103 size_t page_size(void) {
104 static thread_local size_t pgsz = 0;
107 if (_likely_(pgsz > 0))
110 r = sysconf(_SC_PAGESIZE);
117 bool streq_ptr(const char *a, const char *b) {
119 /* Like streq(), but tries to make sense of NULL pointers */
130 char* endswith(const char *s, const char *postfix) {
137 pl = strlen(postfix);
140 return (char*) s + sl;
145 if (memcmp(s + sl - pl, postfix, pl) != 0)
148 return (char*) s + sl - pl;
151 char* first_word(const char *s, const char *word) {
158 /* Checks if the string starts with the specified word, either
159 * followed by NUL or by whitespace. Returns a pointer to the
160 * NUL or the first character after the whitespace. */
171 if (memcmp(s, word, wl) != 0)
178 if (!strchr(WHITESPACE, *p))
181 p += strspn(p, WHITESPACE);
185 static size_t cescape_char(char c, char *buf) {
186 char * buf_old = buf;
232 /* For special chars we prefer octal over
233 * hexadecimal encoding, simply because glib's
234 * g_strescape() does the same */
235 if ((c < ' ') || (c >= 127)) {
237 *(buf++) = octchar((unsigned char) c >> 6);
238 *(buf++) = octchar((unsigned char) c >> 3);
239 *(buf++) = octchar((unsigned char) c);
245 return buf - buf_old;
248 int close_nointr(int fd) {
255 * Just ignore EINTR; a retry loop is the wrong thing to do on
258 * http://lkml.indiana.edu/hypermail/linux/kernel/0509.1/0877.html
259 * https://bugzilla.gnome.org/show_bug.cgi?id=682819
260 * http://utcc.utoronto.ca/~cks/space/blog/unix/CloseEINTR
261 * https://sites.google.com/site/michaelsafyan/software-engineering/checkforeintrwheninvokingclosethinkagain
269 int safe_close(int fd) {
272 * Like close_nointr() but cannot fail. Guarantees errno is
273 * unchanged. Is a NOP with negative fds passed, and returns
274 * -1, so that it can be used in this syntax:
276 * fd = safe_close(fd);
282 /* The kernel might return pretty much any error code
283 * via close(), but the fd will be closed anyway. The
284 * only condition we want to check for here is whether
285 * the fd was invalid at all... */
287 assert_se(close_nointr(fd) != -EBADF);
293 void close_many(const int fds[], unsigned n_fd) {
296 assert(fds || n_fd <= 0);
298 for (i = 0; i < n_fd; i++)
302 int unlink_noerrno(const char *path) {
313 int parse_boolean(const char *v) {
316 if (streq(v, "1") || strcaseeq(v, "yes") || strcaseeq(v, "y") || strcaseeq(v, "true") || strcaseeq(v, "t") || strcaseeq(v, "on"))
318 else if (streq(v, "0") || strcaseeq(v, "no") || strcaseeq(v, "n") || strcaseeq(v, "false") || strcaseeq(v, "f") || strcaseeq(v, "off"))
324 int parse_pid(const char *s, pid_t* ret_pid) {
325 unsigned long ul = 0;
332 r = safe_atolu(s, &ul);
338 if ((unsigned long) pid != ul)
348 int parse_uid(const char *s, uid_t* ret_uid) {
349 unsigned long ul = 0;
356 r = safe_atolu(s, &ul);
362 if ((unsigned long) uid != ul)
365 /* Some libc APIs use UID_INVALID as special placeholder */
366 if (uid == (uid_t) 0xFFFFFFFF)
369 /* A long time ago UIDs where 16bit, hence explicitly avoid the 16bit -1 too */
370 if (uid == (uid_t) 0xFFFF)
377 int safe_atou(const char *s, unsigned *ret_u) {
385 l = strtoul(s, &x, 0);
387 if (!x || x == s || *x || errno)
388 return errno > 0 ? -errno : -EINVAL;
390 if ((unsigned long) (unsigned) l != l)
393 *ret_u = (unsigned) l;
397 int safe_atoi(const char *s, int *ret_i) {
405 l = strtol(s, &x, 0);
407 if (!x || x == s || *x || errno)
408 return errno > 0 ? -errno : -EINVAL;
410 if ((long) (int) l != l)
417 int safe_atou8(const char *s, uint8_t *ret) {
425 l = strtoul(s, &x, 0);
427 if (!x || x == s || *x || errno)
428 return errno > 0 ? -errno : -EINVAL;
430 if ((unsigned long) (uint8_t) l != l)
437 int safe_atou16(const char *s, uint16_t *ret) {
445 l = strtoul(s, &x, 0);
447 if (!x || x == s || *x || errno)
448 return errno > 0 ? -errno : -EINVAL;
450 if ((unsigned long) (uint16_t) l != l)
457 int safe_atoi16(const char *s, int16_t *ret) {
465 l = strtol(s, &x, 0);
467 if (!x || x == s || *x || errno)
468 return errno > 0 ? -errno : -EINVAL;
470 if ((long) (int16_t) l != l)
477 int safe_atollu(const char *s, long long unsigned *ret_llu) {
479 unsigned long long l;
485 l = strtoull(s, &x, 0);
487 if (!x || x == s || *x || errno)
488 return errno ? -errno : -EINVAL;
494 int safe_atolli(const char *s, long long int *ret_lli) {
502 l = strtoll(s, &x, 0);
504 if (!x || x == s || *x || errno)
505 return errno ? -errno : -EINVAL;
511 int safe_atod(const char *s, double *ret_d) {
519 loc = newlocale(LC_NUMERIC_MASK, "C", (locale_t) 0);
520 if (loc == (locale_t) 0)
524 d = strtod_l(s, &x, loc);
526 if (!x || x == s || *x || errno) {
528 return errno ? -errno : -EINVAL;
536 static size_t strcspn_escaped(const char *s, const char *reject) {
537 bool escaped = false;
540 for (n=0; s[n]; n++) {
543 else if (s[n] == '\\')
545 else if (strchr(reject, s[n]))
549 /* if s ends in \, return index of previous char */
553 /* Split a string into words. */
554 const char* split(const char **state, size_t *l, const char *separator, bool quoted) {
560 assert(**state == '\0');
564 current += strspn(current, separator);
570 if (quoted && strchr("\'\"", *current)) {
571 char quotechars[2] = {*current, '\0'};
573 *l = strcspn_escaped(current + 1, quotechars);
574 if (current[*l + 1] == '\0' ||
575 (current[*l + 2] && !strchr(separator, current[*l + 2]))) {
576 /* right quote missing or garbage at the end */
580 assert(current[*l + 1] == quotechars[0]);
581 *state = current++ + *l + 2;
583 *l = strcspn_escaped(current, separator);
584 if (current[*l] && !strchr(separator, current[*l])) {
585 /* unfinished escape */
589 *state = current + *l;
591 *l = strcspn(current, separator);
592 *state = current + *l;
598 int get_parent_of_pid(pid_t pid, pid_t *_ppid) {
600 _cleanup_free_ char *line = NULL;
612 p = procfs_file_alloca(pid, "stat");
613 r = read_one_line_file(p, &line);
617 /* Let's skip the pid and comm fields. The latter is enclosed
618 * in () but does not escape any () in its value, so let's
619 * skip over it manually */
621 p = strrchr(line, ')');
633 if ((long unsigned) (pid_t) ppid != ppid)
636 *_ppid = (pid_t) ppid;
641 int fchmod_umask(int fd, mode_t m) {
646 r = fchmod(fd, m & (~u)) < 0 ? -errno : 0;
652 char *truncate_nl(char *s) {
655 s[strcspn(s, NEWLINE)] = 0;
659 int get_process_state(pid_t pid) {
663 _cleanup_free_ char *line = NULL;
667 p = procfs_file_alloca(pid, "stat");
668 r = read_one_line_file(p, &line);
672 p = strrchr(line, ')');
678 if (sscanf(p, " %c", &state) != 1)
681 return (unsigned char) state;
684 int get_process_comm(pid_t pid, char **name) {
691 p = procfs_file_alloca(pid, "comm");
693 r = read_one_line_file(p, name);
700 int get_process_cmdline(pid_t pid, size_t max_length, bool comm_fallback, char **line) {
701 _cleanup_fclose_ FILE *f = NULL;
709 p = procfs_file_alloca(pid, "cmdline");
715 if (max_length == 0) {
716 size_t len = 0, allocated = 0;
718 while ((c = getc(f)) != EOF) {
720 if (!GREEDY_REALLOC(r, allocated, len+2)) {
725 r[len++] = isprint(c) ? c : ' ';
735 r = new(char, max_length);
741 while ((c = getc(f)) != EOF) {
763 size_t n = MIN(left-1, 3U);
770 /* Kernel threads have no argv[] */
772 _cleanup_free_ char *t = NULL;
780 h = get_process_comm(pid, &t);
784 r = strjoin("[", t, "]", NULL);
793 int is_kernel_thread(pid_t pid) {
805 p = procfs_file_alloca(pid, "cmdline");
810 count = fread(&c, 1, 1, f);
814 /* Kernel threads have an empty cmdline */
817 return eof ? 1 : -errno;
822 int get_process_capeff(pid_t pid, char **capeff) {
828 p = procfs_file_alloca(pid, "status");
830 return get_status_field(p, "\nCapEff:", capeff);
833 static int get_process_link_contents(const char *proc_file, char **name) {
839 r = readlink_malloc(proc_file, name);
841 return r == -ENOENT ? -ESRCH : r;
846 int get_process_exe(pid_t pid, char **name) {
853 p = procfs_file_alloca(pid, "exe");
854 r = get_process_link_contents(p, name);
858 d = endswith(*name, " (deleted)");
865 static int get_process_id(pid_t pid, const char *field, uid_t *uid) {
866 _cleanup_fclose_ FILE *f = NULL;
876 p = procfs_file_alloca(pid, "status");
881 FOREACH_LINE(line, f, return -errno) {
886 if (startswith(l, field)) {
888 l += strspn(l, WHITESPACE);
890 l[strcspn(l, WHITESPACE)] = 0;
892 return parse_uid(l, uid);
899 int get_process_uid(pid_t pid, uid_t *uid) {
900 return get_process_id(pid, "Uid:", uid);
903 int get_process_gid(pid_t pid, gid_t *gid) {
904 assert_cc(sizeof(uid_t) == sizeof(gid_t));
905 return get_process_id(pid, "Gid:", gid);
908 int get_process_cwd(pid_t pid, char **cwd) {
913 p = procfs_file_alloca(pid, "cwd");
915 return get_process_link_contents(p, cwd);
918 int get_process_root(pid_t pid, char **root) {
923 p = procfs_file_alloca(pid, "root");
925 return get_process_link_contents(p, root);
928 int get_process_environ(pid_t pid, char **env) {
929 _cleanup_fclose_ FILE *f = NULL;
930 _cleanup_free_ char *outcome = NULL;
933 size_t allocated = 0, sz = 0;
938 p = procfs_file_alloca(pid, "environ");
944 while ((c = fgetc(f)) != EOF) {
945 if (!GREEDY_REALLOC(outcome, allocated, sz + 5))
949 outcome[sz++] = '\n';
951 sz += cescape_char(c, outcome + sz);
961 char *strnappend(const char *s, const char *suffix, size_t b) {
969 return strndup(suffix, b);
978 if (b > ((size_t) -1) - a)
981 r = new(char, a+b+1);
986 memcpy(r+a, suffix, b);
992 char *strappend(const char *s, const char *suffix) {
993 return strnappend(s, suffix, suffix ? strlen(suffix) : 0);
996 int readlinkat_malloc(int fd, const char *p, char **ret) {
1011 n = readlinkat(fd, p, c, l-1);
1018 if ((size_t) n < l-1) {
1029 int readlink_malloc(const char *p, char **ret) {
1030 return readlinkat_malloc(AT_FDCWD, p, ret);
1033 int readlink_value(const char *p, char **ret) {
1034 _cleanup_free_ char *link = NULL;
1038 r = readlink_malloc(p, &link);
1042 value = basename(link);
1046 value = strdup(value);
1055 int readlink_and_make_absolute(const char *p, char **r) {
1056 _cleanup_free_ char *target = NULL;
1063 j = readlink_malloc(p, &target);
1067 k = file_in_same_dir(p, target);
1075 int readlink_and_canonicalize(const char *p, char **r) {
1082 j = readlink_and_make_absolute(p, &t);
1086 s = canonicalize_file_name(t);
1093 path_kill_slashes(*r);
1098 int reset_all_signal_handlers(void) {
1101 for (sig = 1; sig < _NSIG; sig++) {
1102 struct sigaction sa = {
1103 .sa_handler = SIG_DFL,
1104 .sa_flags = SA_RESTART,
1107 /* These two cannot be caught... */
1108 if (sig == SIGKILL || sig == SIGSTOP)
1111 /* On Linux the first two RT signals are reserved by
1112 * glibc, and sigaction() will return EINVAL for them. */
1113 if ((sigaction(sig, &sa, NULL) < 0))
1114 if (errno != EINVAL && r == 0)
1121 int reset_signal_mask(void) {
1124 if (sigemptyset(&ss) < 0)
1127 if (sigprocmask(SIG_SETMASK, &ss, NULL) < 0)
1133 char *strstrip(char *s) {
1136 /* Drops trailing whitespace. Modifies the string in
1137 * place. Returns pointer to first non-space character */
1139 s += strspn(s, WHITESPACE);
1141 for (e = strchr(s, 0); e > s; e --)
1142 if (!strchr(WHITESPACE, e[-1]))
1150 char *delete_chars(char *s, const char *bad) {
1153 /* Drops all whitespace, regardless where in the string */
1155 for (f = s, t = s; *f; f++) {
1156 if (strchr(bad, *f))
1167 char *file_in_same_dir(const char *path, const char *filename) {
1174 /* This removes the last component of path and appends
1175 * filename, unless the latter is absolute anyway or the
1178 if (path_is_absolute(filename))
1179 return strdup(filename);
1181 e = strrchr(path, '/');
1183 return strdup(filename);
1185 k = strlen(filename);
1186 ret = new(char, (e + 1 - path) + k + 1);
1190 memcpy(mempcpy(ret, path, e + 1 - path), filename, k + 1);
1194 int rmdir_parents(const char *path, const char *stop) {
1203 /* Skip trailing slashes */
1204 while (l > 0 && path[l-1] == '/')
1210 /* Skip last component */
1211 while (l > 0 && path[l-1] != '/')
1214 /* Skip trailing slashes */
1215 while (l > 0 && path[l-1] == '/')
1221 if (!(t = strndup(path, l)))
1224 if (path_startswith(stop, t)) {
1233 if (errno != ENOENT)
1240 char hexchar(int x) {
1241 static const char table[16] = "0123456789abcdef";
1243 return table[x & 15];
1246 int unhexchar(char c) {
1248 if (c >= '0' && c <= '9')
1251 if (c >= 'a' && c <= 'f')
1252 return c - 'a' + 10;
1254 if (c >= 'A' && c <= 'F')
1255 return c - 'A' + 10;
1260 char *hexmem(const void *p, size_t l) {
1264 z = r = malloc(l * 2 + 1);
1268 for (x = p; x < (const uint8_t*) p + l; x++) {
1269 *(z++) = hexchar(*x >> 4);
1270 *(z++) = hexchar(*x & 15);
1277 void *unhexmem(const char *p, size_t l) {
1283 z = r = malloc((l + 1) / 2 + 1);
1287 for (x = p; x < p + l; x += 2) {
1290 a = unhexchar(x[0]);
1292 b = unhexchar(x[1]);
1296 *(z++) = (uint8_t) a << 4 | (uint8_t) b;
1303 char octchar(int x) {
1304 return '0' + (x & 7);
1307 int unoctchar(char c) {
1309 if (c >= '0' && c <= '7')
1315 char decchar(int x) {
1316 return '0' + (x % 10);
1319 int undecchar(char c) {
1321 if (c >= '0' && c <= '9')
1327 char *cescape(const char *s) {
1333 /* Does C style string escaping. */
1335 r = new(char, strlen(s)*4 + 1);
1339 for (f = s, t = r; *f; f++)
1340 t += cescape_char(*f, t);
1347 char *cunescape_length_with_prefix(const char *s, size_t length, const char *prefix) {
1354 /* Undoes C style string escaping, and optionally prefixes it. */
1356 pl = prefix ? strlen(prefix) : 0;
1358 r = new(char, pl+length+1);
1363 memcpy(r, prefix, pl);
1365 for (f = s, t = r + pl; f < s + length; f++) {
1366 size_t remaining = s + length - f;
1367 assert(remaining > 0);
1369 if (*f != '\\') { /* a literal literal */
1374 if (--remaining == 0) { /* copy trailing backslash verbatim */
1415 /* This is an extension of the XDG syntax files */
1420 /* hexadecimal encoding */
1423 if (remaining >= 2) {
1424 a = unhexchar(f[1]);
1425 b = unhexchar(f[2]);
1428 if (a < 0 || b < 0 || (a == 0 && b == 0)) {
1429 /* Invalid escape code, let's take it literal then */
1433 *(t++) = (char) ((a << 4) | b);
1448 /* octal encoding */
1449 int a = -1, b = -1, c = -1;
1451 if (remaining >= 3) {
1452 a = unoctchar(f[0]);
1453 b = unoctchar(f[1]);
1454 c = unoctchar(f[2]);
1457 if (a < 0 || b < 0 || c < 0 || (a == 0 && b == 0 && c == 0)) {
1458 /* Invalid escape code, let's take it literal then */
1462 *(t++) = (char) ((a << 6) | (b << 3) | c);
1470 /* Invalid escape code, let's take it literal then */
1481 char *cunescape_length(const char *s, size_t length) {
1482 return cunescape_length_with_prefix(s, length, NULL);
1485 char *cunescape(const char *s) {
1488 return cunescape_length(s, strlen(s));
1491 char *xescape(const char *s, const char *bad) {
1495 /* Escapes all chars in bad, in addition to \ and all special
1496 * chars, in \xFF style escaping. May be reversed with
1499 r = new(char, strlen(s) * 4 + 1);
1503 for (f = s, t = r; *f; f++) {
1505 if ((*f < ' ') || (*f >= 127) ||
1506 (*f == '\\') || strchr(bad, *f)) {
1509 *(t++) = hexchar(*f >> 4);
1510 *(t++) = hexchar(*f);
1520 char *ascii_strlower(char *t) {
1525 for (p = t; *p; p++)
1526 if (*p >= 'A' && *p <= 'Z')
1527 *p = *p - 'A' + 'a';
1532 _pure_ static bool hidden_file_allow_backup(const char *filename) {
1536 filename[0] == '.' ||
1537 streq(filename, "lost+found") ||
1538 streq(filename, "aquota.user") ||
1539 streq(filename, "aquota.group") ||
1540 endswith(filename, ".rpmnew") ||
1541 endswith(filename, ".rpmsave") ||
1542 endswith(filename, ".rpmorig") ||
1543 endswith(filename, ".dpkg-old") ||
1544 endswith(filename, ".dpkg-new") ||
1545 endswith(filename, ".dpkg-tmp") ||
1546 endswith(filename, ".dpkg-dist") ||
1547 endswith(filename, ".dpkg-bak") ||
1548 endswith(filename, ".dpkg-backup") ||
1549 endswith(filename, ".dpkg-remove") ||
1550 endswith(filename, ".swp");
1553 bool hidden_file(const char *filename) {
1556 if (endswith(filename, "~"))
1559 return hidden_file_allow_backup(filename);
1562 int fd_nonblock(int fd, bool nonblock) {
1567 flags = fcntl(fd, F_GETFL, 0);
1572 nflags = flags | O_NONBLOCK;
1574 nflags = flags & ~O_NONBLOCK;
1576 if (nflags == flags)
1579 if (fcntl(fd, F_SETFL, nflags) < 0)
1585 int fd_cloexec(int fd, bool cloexec) {
1590 flags = fcntl(fd, F_GETFD, 0);
1595 nflags = flags | FD_CLOEXEC;
1597 nflags = flags & ~FD_CLOEXEC;
1599 if (nflags == flags)
1602 if (fcntl(fd, F_SETFD, nflags) < 0)
1608 _pure_ static bool fd_in_set(int fd, const int fdset[], unsigned n_fdset) {
1611 assert(n_fdset == 0 || fdset);
1613 for (i = 0; i < n_fdset; i++)
1620 int close_all_fds(const int except[], unsigned n_except) {
1621 _cleanup_closedir_ DIR *d = NULL;
1625 assert(n_except == 0 || except);
1627 d = opendir("/proc/self/fd");
1632 /* When /proc isn't available (for example in chroots)
1633 * the fallback is brute forcing through the fd
1636 assert_se(getrlimit(RLIMIT_NOFILE, &rl) >= 0);
1637 for (fd = 3; fd < (int) rl.rlim_max; fd ++) {
1639 if (fd_in_set(fd, except, n_except))
1642 if (close_nointr(fd) < 0)
1643 if (errno != EBADF && r == 0)
1650 while ((de = readdir(d))) {
1653 if (hidden_file(de->d_name))
1656 if (safe_atoi(de->d_name, &fd) < 0)
1657 /* Let's better ignore this, just in case */
1666 if (fd_in_set(fd, except, n_except))
1669 if (close_nointr(fd) < 0) {
1670 /* Valgrind has its own FD and doesn't want to have it closed */
1671 if (errno != EBADF && r == 0)
1679 bool chars_intersect(const char *a, const char *b) {
1682 /* Returns true if any of the chars in a are in b. */
1683 for (p = a; *p; p++)
1690 bool fstype_is_network(const char *fstype) {
1691 static const char table[] =
1705 x = startswith(fstype, "fuse.");
1709 return nulstr_contains(table, fstype);
1713 _cleanup_close_ int fd;
1715 fd = open_terminal("/dev/tty0", O_RDWR|O_NOCTTY|O_CLOEXEC);
1721 TIOCL_GETKMSGREDIRECT,
1725 if (ioctl(fd, TIOCLINUX, tiocl) < 0)
1728 vt = tiocl[0] <= 0 ? 1 : tiocl[0];
1731 if (ioctl(fd, VT_ACTIVATE, vt) < 0)
1737 int read_one_char(FILE *f, char *ret, usec_t t, bool *need_nl) {
1738 struct termios old_termios, new_termios;
1739 char c, line[LINE_MAX];
1744 if (tcgetattr(fileno(f), &old_termios) >= 0) {
1745 new_termios = old_termios;
1747 new_termios.c_lflag &= ~ICANON;
1748 new_termios.c_cc[VMIN] = 1;
1749 new_termios.c_cc[VTIME] = 0;
1751 if (tcsetattr(fileno(f), TCSADRAIN, &new_termios) >= 0) {
1754 if (t != USEC_INFINITY) {
1755 if (fd_wait_for_event(fileno(f), POLLIN, t) <= 0) {
1756 tcsetattr(fileno(f), TCSADRAIN, &old_termios);
1761 k = fread(&c, 1, 1, f);
1763 tcsetattr(fileno(f), TCSADRAIN, &old_termios);
1769 *need_nl = c != '\n';
1776 if (t != USEC_INFINITY) {
1777 if (fd_wait_for_event(fileno(f), POLLIN, t) <= 0)
1782 if (!fgets(line, sizeof(line), f))
1783 return errno ? -errno : -EIO;
1787 if (strlen(line) != 1)
1797 int ask_char(char *ret, const char *replies, const char *text, ...) {
1807 bool need_nl = true;
1810 fputs(ANSI_HIGHLIGHT_ON, stdout);
1817 fputs(ANSI_HIGHLIGHT_OFF, stdout);
1821 r = read_one_char(stdin, &c, USEC_INFINITY, &need_nl);
1824 if (r == -EBADMSG) {
1825 puts("Bad input, please try again.");
1836 if (strchr(replies, c)) {
1841 puts("Read unexpected character, please try again.");
1845 int ask_string(char **ret, const char *text, ...) {
1850 char line[LINE_MAX];
1854 fputs(ANSI_HIGHLIGHT_ON, stdout);
1861 fputs(ANSI_HIGHLIGHT_OFF, stdout);
1866 if (!fgets(line, sizeof(line), stdin))
1867 return errno ? -errno : -EIO;
1869 if (!endswith(line, "\n"))
1888 int reset_terminal_fd(int fd, bool switch_to_text) {
1889 struct termios termios;
1892 /* Set terminal to some sane defaults */
1896 /* We leave locked terminal attributes untouched, so that
1897 * Plymouth may set whatever it wants to set, and we don't
1898 * interfere with that. */
1900 /* Disable exclusive mode, just in case */
1901 ioctl(fd, TIOCNXCL);
1903 /* Switch to text mode */
1905 ioctl(fd, KDSETMODE, KD_TEXT);
1907 /* Enable console unicode mode */
1908 ioctl(fd, KDSKBMODE, K_UNICODE);
1910 if (tcgetattr(fd, &termios) < 0) {
1915 /* We only reset the stuff that matters to the software. How
1916 * hardware is set up we don't touch assuming that somebody
1917 * else will do that for us */
1919 termios.c_iflag &= ~(IGNBRK | BRKINT | ISTRIP | INLCR | IGNCR | IUCLC);
1920 termios.c_iflag |= ICRNL | IMAXBEL | IUTF8;
1921 termios.c_oflag |= ONLCR;
1922 termios.c_cflag |= CREAD;
1923 termios.c_lflag = ISIG | ICANON | IEXTEN | ECHO | ECHOE | ECHOK | ECHOCTL | ECHOPRT | ECHOKE;
1925 termios.c_cc[VINTR] = 03; /* ^C */
1926 termios.c_cc[VQUIT] = 034; /* ^\ */
1927 termios.c_cc[VERASE] = 0177;
1928 termios.c_cc[VKILL] = 025; /* ^X */
1929 termios.c_cc[VEOF] = 04; /* ^D */
1930 termios.c_cc[VSTART] = 021; /* ^Q */
1931 termios.c_cc[VSTOP] = 023; /* ^S */
1932 termios.c_cc[VSUSP] = 032; /* ^Z */
1933 termios.c_cc[VLNEXT] = 026; /* ^V */
1934 termios.c_cc[VWERASE] = 027; /* ^W */
1935 termios.c_cc[VREPRINT] = 022; /* ^R */
1936 termios.c_cc[VEOL] = 0;
1937 termios.c_cc[VEOL2] = 0;
1939 termios.c_cc[VTIME] = 0;
1940 termios.c_cc[VMIN] = 1;
1942 if (tcsetattr(fd, TCSANOW, &termios) < 0)
1946 /* Just in case, flush all crap out */
1947 tcflush(fd, TCIOFLUSH);
1952 int reset_terminal(const char *name) {
1953 _cleanup_close_ int fd = -1;
1955 fd = open_terminal(name, O_RDWR|O_NOCTTY|O_CLOEXEC);
1959 return reset_terminal_fd(fd, true);
1962 int open_terminal(const char *name, int mode) {
1967 * If a TTY is in the process of being closed opening it might
1968 * cause EIO. This is horribly awful, but unlikely to be
1969 * changed in the kernel. Hence we work around this problem by
1970 * retrying a couple of times.
1972 * https://bugs.launchpad.net/ubuntu/+source/linux/+bug/554172/comments/245
1975 assert(!(mode & O_CREAT));
1978 fd = open(name, mode, 0);
1985 /* Max 1s in total */
1989 usleep(50 * USEC_PER_MSEC);
2007 int flush_fd(int fd) {
2008 struct pollfd pollfd = {
2018 r = poll(&pollfd, 1, 0);
2028 l = read(fd, buf, sizeof(buf));
2034 if (errno == EAGAIN)
2043 int acquire_terminal(
2047 bool ignore_tiocstty_eperm,
2050 int fd = -1, notify = -1, r = 0, wd = -1;
2055 /* We use inotify to be notified when the tty is closed. We
2056 * create the watch before checking if we can actually acquire
2057 * it, so that we don't lose any event.
2059 * Note: strictly speaking this actually watches for the
2060 * device being closed, it does *not* really watch whether a
2061 * tty loses its controlling process. However, unless some
2062 * rogue process uses TIOCNOTTY on /dev/tty *after* closing
2063 * its tty otherwise this will not become a problem. As long
2064 * as the administrator makes sure not configure any service
2065 * on the same tty as an untrusted user this should not be a
2066 * problem. (Which he probably should not do anyway.) */
2068 if (timeout != USEC_INFINITY)
2069 ts = now(CLOCK_MONOTONIC);
2071 if (!fail && !force) {
2072 notify = inotify_init1(IN_CLOEXEC | (timeout != USEC_INFINITY ? IN_NONBLOCK : 0));
2078 wd = inotify_add_watch(notify, name, IN_CLOSE);
2086 struct sigaction sa_old, sa_new = {
2087 .sa_handler = SIG_IGN,
2088 .sa_flags = SA_RESTART,
2092 r = flush_fd(notify);
2097 /* We pass here O_NOCTTY only so that we can check the return
2098 * value TIOCSCTTY and have a reliable way to figure out if we
2099 * successfully became the controlling process of the tty */
2100 fd = open_terminal(name, O_RDWR|O_NOCTTY|O_CLOEXEC);
2104 /* Temporarily ignore SIGHUP, so that we don't get SIGHUP'ed
2105 * if we already own the tty. */
2106 assert_se(sigaction(SIGHUP, &sa_new, &sa_old) == 0);
2108 /* First, try to get the tty */
2109 if (ioctl(fd, TIOCSCTTY, force) < 0)
2112 assert_se(sigaction(SIGHUP, &sa_old, NULL) == 0);
2114 /* Sometimes it makes sense to ignore TIOCSCTTY
2115 * returning EPERM, i.e. when very likely we already
2116 * are have this controlling terminal. */
2117 if (r < 0 && r == -EPERM && ignore_tiocstty_eperm)
2120 if (r < 0 && (force || fail || r != -EPERM)) {
2129 assert(notify >= 0);
2132 union inotify_event_buffer buffer;
2133 struct inotify_event *e;
2136 if (timeout != USEC_INFINITY) {
2139 n = now(CLOCK_MONOTONIC);
2140 if (ts + timeout < n) {
2145 r = fd_wait_for_event(fd, POLLIN, ts + timeout - n);
2155 l = read(notify, &buffer, sizeof(buffer));
2157 if (errno == EINTR || errno == EAGAIN)
2164 FOREACH_INOTIFY_EVENT(e, buffer, l) {
2165 if (e->wd != wd || !(e->mask & IN_CLOSE)) {
2174 /* We close the tty fd here since if the old session
2175 * ended our handle will be dead. It's important that
2176 * we do this after sleeping, so that we don't enter
2177 * an endless loop. */
2178 fd = safe_close(fd);
2183 r = reset_terminal_fd(fd, true);
2185 log_warning_errno(r, "Failed to reset terminal: %m");
2196 int release_terminal(void) {
2197 static const struct sigaction sa_new = {
2198 .sa_handler = SIG_IGN,
2199 .sa_flags = SA_RESTART,
2202 _cleanup_close_ int fd = -1;
2203 struct sigaction sa_old;
2206 fd = open("/dev/tty", O_RDWR|O_NOCTTY|O_NDELAY|O_CLOEXEC);
2210 /* Temporarily ignore SIGHUP, so that we don't get SIGHUP'ed
2211 * by our own TIOCNOTTY */
2212 assert_se(sigaction(SIGHUP, &sa_new, &sa_old) == 0);
2214 if (ioctl(fd, TIOCNOTTY) < 0)
2217 assert_se(sigaction(SIGHUP, &sa_old, NULL) == 0);
2222 int sigaction_many(const struct sigaction *sa, ...) {
2227 while ((sig = va_arg(ap, int)) > 0)
2228 if (sigaction(sig, sa, NULL) < 0)
2235 int ignore_signals(int sig, ...) {
2236 struct sigaction sa = {
2237 .sa_handler = SIG_IGN,
2238 .sa_flags = SA_RESTART,
2243 if (sigaction(sig, &sa, NULL) < 0)
2247 while ((sig = va_arg(ap, int)) > 0)
2248 if (sigaction(sig, &sa, NULL) < 0)
2255 int default_signals(int sig, ...) {
2256 struct sigaction sa = {
2257 .sa_handler = SIG_DFL,
2258 .sa_flags = SA_RESTART,
2263 if (sigaction(sig, &sa, NULL) < 0)
2267 while ((sig = va_arg(ap, int)) > 0)
2268 if (sigaction(sig, &sa, NULL) < 0)
2275 void safe_close_pair(int p[]) {
2279 /* Special case pairs which use the same fd in both
2281 p[0] = p[1] = safe_close(p[0]);
2285 p[0] = safe_close(p[0]);
2286 p[1] = safe_close(p[1]);
2289 ssize_t loop_read(int fd, void *buf, size_t nbytes, bool do_poll) {
2296 while (nbytes > 0) {
2299 k = read(fd, p, nbytes);
2304 if (errno == EAGAIN && do_poll) {
2306 /* We knowingly ignore any return value here,
2307 * and expect that any error/EOF is reported
2310 fd_wait_for_event(fd, POLLIN, USEC_INFINITY);
2314 return n > 0 ? n : -errno;
2328 int loop_write(int fd, const void *buf, size_t nbytes, bool do_poll) {
2329 const uint8_t *p = buf;
2336 while (nbytes > 0) {
2339 k = write(fd, p, nbytes);
2344 if (errno == EAGAIN && do_poll) {
2345 /* We knowingly ignore any return value here,
2346 * and expect that any error/EOF is reported
2349 fd_wait_for_event(fd, POLLOUT, USEC_INFINITY);
2356 if (k == 0) /* Can't really happen */
2366 int parse_size(const char *t, off_t base, off_t *size) {
2368 /* Soo, sometimes we want to parse IEC binary suffxies, and
2369 * sometimes SI decimal suffixes. This function can parse
2370 * both. Which one is the right way depends on the
2371 * context. Wikipedia suggests that SI is customary for
2372 * hardrware metrics and network speeds, while IEC is
2373 * customary for most data sizes used by software and volatile
2374 * (RAM) memory. Hence be careful which one you pick!
2376 * In either case we use just K, M, G as suffix, and not Ki,
2377 * Mi, Gi or so (as IEC would suggest). That's because that's
2378 * frickin' ugly. But this means you really need to make sure
2379 * to document which base you are parsing when you use this
2384 unsigned long long factor;
2387 static const struct table iec[] = {
2388 { "E", 1024ULL*1024ULL*1024ULL*1024ULL*1024ULL*1024ULL },
2389 { "P", 1024ULL*1024ULL*1024ULL*1024ULL*1024ULL },
2390 { "T", 1024ULL*1024ULL*1024ULL*1024ULL },
2391 { "G", 1024ULL*1024ULL*1024ULL },
2392 { "M", 1024ULL*1024ULL },
2398 static const struct table si[] = {
2399 { "E", 1000ULL*1000ULL*1000ULL*1000ULL*1000ULL*1000ULL },
2400 { "P", 1000ULL*1000ULL*1000ULL*1000ULL*1000ULL },
2401 { "T", 1000ULL*1000ULL*1000ULL*1000ULL },
2402 { "G", 1000ULL*1000ULL*1000ULL },
2403 { "M", 1000ULL*1000ULL },
2409 const struct table *table;
2411 unsigned long long r = 0;
2412 unsigned n_entries, start_pos = 0;
2415 assert(base == 1000 || base == 1024);
2420 n_entries = ELEMENTSOF(si);
2423 n_entries = ELEMENTSOF(iec);
2429 unsigned long long l2;
2435 l = strtoll(p, &e, 10);
2448 if (*e >= '0' && *e <= '9') {
2451 /* strotoull itself would accept space/+/- */
2452 l2 = strtoull(e, &e2, 10);
2454 if (errno == ERANGE)
2457 /* Ignore failure. E.g. 10.M is valid */
2464 e += strspn(e, WHITESPACE);
2466 for (i = start_pos; i < n_entries; i++)
2467 if (startswith(e, table[i].suffix)) {
2468 unsigned long long tmp;
2469 if ((unsigned long long) l + (frac > 0) > ULLONG_MAX / table[i].factor)
2471 tmp = l * table[i].factor + (unsigned long long) (frac * table[i].factor);
2472 if (tmp > ULLONG_MAX - r)
2476 if ((unsigned long long) (off_t) r != r)
2479 p = e + strlen(table[i].suffix);
2495 int make_stdio(int fd) {
2500 r = dup2(fd, STDIN_FILENO);
2501 s = dup2(fd, STDOUT_FILENO);
2502 t = dup2(fd, STDERR_FILENO);
2507 if (r < 0 || s < 0 || t < 0)
2510 /* Explicitly unset O_CLOEXEC, since if fd was < 3, then
2511 * dup2() was a NOP and the bit hence possibly set. */
2512 fd_cloexec(STDIN_FILENO, false);
2513 fd_cloexec(STDOUT_FILENO, false);
2514 fd_cloexec(STDERR_FILENO, false);
2519 int make_null_stdio(void) {
2522 null_fd = open("/dev/null", O_RDWR|O_NOCTTY);
2526 return make_stdio(null_fd);
2529 bool is_device_path(const char *path) {
2531 /* Returns true on paths that refer to a device, either in
2532 * sysfs or in /dev */
2535 path_startswith(path, "/dev/") ||
2536 path_startswith(path, "/sys/");
2539 int dir_is_empty(const char *path) {
2540 _cleanup_closedir_ DIR *d;
2551 if (!de && errno != 0)
2557 if (!hidden_file(de->d_name))
2562 char* dirname_malloc(const char *path) {
2563 char *d, *dir, *dir2;
2580 int dev_urandom(void *p, size_t n) {
2581 static int have_syscall = -1;
2585 /* Gathers some randomness from the kernel. This call will
2586 * never block, and will always return some data from the
2587 * kernel, regardless if the random pool is fully initialized
2588 * or not. It thus makes no guarantee for the quality of the
2589 * returned entropy, but is good enough for or usual usecases
2590 * of seeding the hash functions for hashtable */
2592 /* Use the getrandom() syscall unless we know we don't have
2593 * it, or when the requested size is too large for it. */
2594 if (have_syscall != 0 || (size_t) (int) n != n) {
2595 r = getrandom(p, n, GRND_NONBLOCK);
2597 have_syscall = true;
2602 if (errno == ENOSYS)
2603 /* we lack the syscall, continue with
2604 * reading from /dev/urandom */
2605 have_syscall = false;
2606 else if (errno == EAGAIN)
2607 /* not enough entropy for now. Let's
2608 * remember to use the syscall the
2609 * next time, again, but also read
2610 * from /dev/urandom for now, which
2611 * doesn't care about the current
2612 * amount of entropy. */
2613 have_syscall = true;
2617 /* too short read? */
2621 fd = open("/dev/urandom", O_RDONLY|O_CLOEXEC|O_NOCTTY);
2623 return errno == ENOENT ? -ENOSYS : -errno;
2625 k = loop_read(fd, p, n, true);
2630 if ((size_t) k != n)
2636 void initialize_srand(void) {
2637 static bool srand_called = false;
2639 #ifdef HAVE_SYS_AUXV_H
2648 #ifdef HAVE_SYS_AUXV_H
2649 /* The kernel provides us with a bit of entropy in auxv, so
2650 * let's try to make use of that to seed the pseudo-random
2651 * generator. It's better than nothing... */
2653 auxv = (void*) getauxval(AT_RANDOM);
2655 x ^= *(unsigned*) auxv;
2658 x ^= (unsigned) now(CLOCK_REALTIME);
2659 x ^= (unsigned) gettid();
2662 srand_called = true;
2665 void random_bytes(void *p, size_t n) {
2669 r = dev_urandom(p, n);
2673 /* If some idiot made /dev/urandom unavailable to us, he'll
2674 * get a PRNG instead. */
2678 for (q = p; q < (uint8_t*) p + n; q ++)
2682 void rename_process(const char name[8]) {
2685 /* This is a like a poor man's setproctitle(). It changes the
2686 * comm field, argv[0], and also the glibc's internally used
2687 * name of the process. For the first one a limit of 16 chars
2688 * applies, to the second one usually one of 10 (i.e. length
2689 * of "/sbin/init"), to the third one one of 7 (i.e. length of
2690 * "systemd"). If you pass a longer string it will be
2693 prctl(PR_SET_NAME, name);
2695 if (program_invocation_name)
2696 strncpy(program_invocation_name, name, strlen(program_invocation_name));
2698 if (saved_argc > 0) {
2702 strncpy(saved_argv[0], name, strlen(saved_argv[0]));
2704 for (i = 1; i < saved_argc; i++) {
2708 memzero(saved_argv[i], strlen(saved_argv[i]));
2713 void sigset_add_many(sigset_t *ss, ...) {
2720 while ((sig = va_arg(ap, int)) > 0)
2721 assert_se(sigaddset(ss, sig) == 0);
2725 int sigprocmask_many(int how, ...) {
2730 assert_se(sigemptyset(&ss) == 0);
2733 while ((sig = va_arg(ap, int)) > 0)
2734 assert_se(sigaddset(&ss, sig) == 0);
2737 if (sigprocmask(how, &ss, NULL) < 0)
2743 char* gethostname_malloc(void) {
2746 assert_se(uname(&u) >= 0);
2748 if (!isempty(u.nodename) && !streq(u.nodename, "(none)"))
2749 return strdup(u.nodename);
2751 return strdup(u.sysname);
2754 bool hostname_is_set(void) {
2757 assert_se(uname(&u) >= 0);
2759 return !isempty(u.nodename) && !streq(u.nodename, "(none)");
2762 char *lookup_uid(uid_t uid) {
2765 _cleanup_free_ char *buf = NULL;
2766 struct passwd pwbuf, *pw = NULL;
2768 /* Shortcut things to avoid NSS lookups */
2770 return strdup("root");
2772 bufsize = sysconf(_SC_GETPW_R_SIZE_MAX);
2776 buf = malloc(bufsize);
2780 if (getpwuid_r(uid, &pwbuf, buf, bufsize, &pw) == 0 && pw)
2781 return strdup(pw->pw_name);
2783 if (asprintf(&name, UID_FMT, uid) < 0)
2789 char* getlogname_malloc(void) {
2793 if (isatty(STDIN_FILENO) && fstat(STDIN_FILENO, &st) >= 0)
2798 return lookup_uid(uid);
2801 char *getusername_malloc(void) {
2808 return lookup_uid(getuid());
2811 int getttyname_malloc(int fd, char **ret) {
2821 r = ttyname_r(fd, path, sizeof(path));
2826 p = startswith(path, "/dev/");
2827 c = strdup(p ?: path);
2844 int getttyname_harder(int fd, char **r) {
2848 k = getttyname_malloc(fd, &s);
2852 if (streq(s, "tty")) {
2854 return get_ctty(0, NULL, r);
2861 int get_ctty_devnr(pid_t pid, dev_t *d) {
2863 _cleanup_free_ char *line = NULL;
2865 unsigned long ttynr;
2869 p = procfs_file_alloca(pid, "stat");
2870 r = read_one_line_file(p, &line);
2874 p = strrchr(line, ')');
2884 "%*d " /* session */
2889 if (major(ttynr) == 0 && minor(ttynr) == 0)
2898 int get_ctty(pid_t pid, dev_t *_devnr, char **r) {
2899 char fn[sizeof("/dev/char/")-1 + 2*DECIMAL_STR_MAX(unsigned) + 1 + 1], *b = NULL;
2900 _cleanup_free_ char *s = NULL;
2907 k = get_ctty_devnr(pid, &devnr);
2911 sprintf(fn, "/dev/char/%u:%u", major(devnr), minor(devnr));
2913 k = readlink_malloc(fn, &s);
2919 /* This is an ugly hack */
2920 if (major(devnr) == 136) {
2921 asprintf(&b, "pts/%u", minor(devnr));
2925 /* Probably something like the ptys which have no
2926 * symlink in /dev/char. Let's return something
2927 * vaguely useful. */
2933 if (startswith(s, "/dev/"))
2935 else if (startswith(s, "../"))
2953 int rm_rf_children_dangerous(int fd, bool only_dirs, bool honour_sticky, struct stat *root_dev) {
2954 _cleanup_closedir_ DIR *d = NULL;
2959 /* This returns the first error we run into, but nevertheless
2960 * tries to go on. This closes the passed fd. */
2966 return errno == ENOENT ? 0 : -errno;
2971 bool is_dir, keep_around;
2978 if (errno != 0 && ret == 0)
2983 if (streq(de->d_name, ".") || streq(de->d_name, ".."))
2986 if (de->d_type == DT_UNKNOWN ||
2988 (de->d_type == DT_DIR && root_dev)) {
2989 if (fstatat(fd, de->d_name, &st, AT_SYMLINK_NOFOLLOW) < 0) {
2990 if (ret == 0 && errno != ENOENT)
2995 is_dir = S_ISDIR(st.st_mode);
2998 (st.st_uid == 0 || st.st_uid == getuid()) &&
2999 (st.st_mode & S_ISVTX);
3001 is_dir = de->d_type == DT_DIR;
3002 keep_around = false;
3008 /* if root_dev is set, remove subdirectories only, if device is same as dir */
3009 if (root_dev && st.st_dev != root_dev->st_dev)
3012 subdir_fd = openat(fd, de->d_name,
3013 O_RDONLY|O_NONBLOCK|O_DIRECTORY|O_CLOEXEC|O_NOFOLLOW|O_NOATIME);
3014 if (subdir_fd < 0) {
3015 if (ret == 0 && errno != ENOENT)
3020 r = rm_rf_children_dangerous(subdir_fd, only_dirs, honour_sticky, root_dev);
3021 if (r < 0 && ret == 0)
3025 if (unlinkat(fd, de->d_name, AT_REMOVEDIR) < 0) {
3026 if (ret == 0 && errno != ENOENT)
3030 } else if (!only_dirs && !keep_around) {
3032 if (unlinkat(fd, de->d_name, 0) < 0) {
3033 if (ret == 0 && errno != ENOENT)
3040 _pure_ static int is_temporary_fs(struct statfs *s) {
3043 return F_TYPE_EQUAL(s->f_type, TMPFS_MAGIC) ||
3044 F_TYPE_EQUAL(s->f_type, RAMFS_MAGIC);
3047 int is_fd_on_temporary_fs(int fd) {
3050 if (fstatfs(fd, &s) < 0)
3053 return is_temporary_fs(&s);
3056 int rm_rf_children(int fd, bool only_dirs, bool honour_sticky, struct stat *root_dev) {
3061 if (fstatfs(fd, &s) < 0) {
3066 /* We refuse to clean disk file systems with this call. This
3067 * is extra paranoia just to be sure we never ever remove
3069 if (!is_temporary_fs(&s)) {
3070 log_error("Attempted to remove disk file system, and we can't allow that.");
3075 return rm_rf_children_dangerous(fd, only_dirs, honour_sticky, root_dev);
3078 static int file_is_priv_sticky(const char *p) {
3083 if (lstat(p, &st) < 0)
3087 (st.st_uid == 0 || st.st_uid == getuid()) &&
3088 (st.st_mode & S_ISVTX);
3091 static int rm_rf_internal(const char *path, bool only_dirs, bool delete_root, bool honour_sticky, bool dangerous) {
3097 /* We refuse to clean the root file system with this
3098 * call. This is extra paranoia to never cause a really
3099 * seriously broken system. */
3100 if (path_equal(path, "/")) {
3101 log_error("Attempted to remove entire root file system, and we can't allow that.");
3105 fd = open(path, O_RDONLY|O_NONBLOCK|O_DIRECTORY|O_CLOEXEC|O_NOFOLLOW|O_NOATIME);
3108 if (errno != ENOTDIR && errno != ELOOP)
3112 if (statfs(path, &s) < 0)
3115 if (!is_temporary_fs(&s)) {
3116 log_error("Attempted to remove disk file system, and we can't allow that.");
3121 if (delete_root && !only_dirs)
3122 if (unlink(path) < 0 && errno != ENOENT)
3129 if (fstatfs(fd, &s) < 0) {
3134 if (!is_temporary_fs(&s)) {
3135 log_error("Attempted to remove disk file system, and we can't allow that.");
3141 r = rm_rf_children_dangerous(fd, only_dirs, honour_sticky, NULL);
3144 if (honour_sticky && file_is_priv_sticky(path) > 0)
3147 if (rmdir(path) < 0 && errno != ENOENT) {
3156 int rm_rf(const char *path, bool only_dirs, bool delete_root, bool honour_sticky) {
3157 return rm_rf_internal(path, only_dirs, delete_root, honour_sticky, false);
3160 int rm_rf_dangerous(const char *path, bool only_dirs, bool delete_root, bool honour_sticky) {
3161 return rm_rf_internal(path, only_dirs, delete_root, honour_sticky, true);
3164 int chmod_and_chown(const char *path, mode_t mode, uid_t uid, gid_t gid) {
3167 /* Under the assumption that we are running privileged we
3168 * first change the access mode and only then hand out
3169 * ownership to avoid a window where access is too open. */
3171 if (mode != MODE_INVALID)
3172 if (chmod(path, mode) < 0)
3175 if (uid != UID_INVALID || gid != GID_INVALID)
3176 if (chown(path, uid, gid) < 0)
3182 int fchmod_and_fchown(int fd, mode_t mode, uid_t uid, gid_t gid) {
3185 /* Under the assumption that we are running privileged we
3186 * first change the access mode and only then hand out
3187 * ownership to avoid a window where access is too open. */
3189 if (mode != MODE_INVALID)
3190 if (fchmod(fd, mode) < 0)
3193 if (uid != UID_INVALID || gid != GID_INVALID)
3194 if (fchown(fd, uid, gid) < 0)
3200 cpu_set_t* cpu_set_malloc(unsigned *ncpus) {
3204 /* Allocates the cpuset in the right size */
3207 if (!(r = CPU_ALLOC(n)))
3210 if (sched_getaffinity(0, CPU_ALLOC_SIZE(n), r) >= 0) {
3211 CPU_ZERO_S(CPU_ALLOC_SIZE(n), r);
3221 if (errno != EINVAL)
3228 int status_vprintf(const char *status, bool ellipse, bool ephemeral, const char *format, va_list ap) {
3229 static const char status_indent[] = " "; /* "[" STATUS "] " */
3230 _cleanup_free_ char *s = NULL;
3231 _cleanup_close_ int fd = -1;
3232 struct iovec iovec[6] = {};
3234 static bool prev_ephemeral;
3238 /* This is independent of logging, as status messages are
3239 * optional and go exclusively to the console. */
3241 if (vasprintf(&s, format, ap) < 0)
3244 fd = open_terminal("/dev/console", O_WRONLY|O_NOCTTY|O_CLOEXEC);
3257 sl = status ? sizeof(status_indent)-1 : 0;
3263 e = ellipsize(s, emax, 50);
3271 IOVEC_SET_STRING(iovec[n++], "\r" ANSI_ERASE_TO_END_OF_LINE);
3272 prev_ephemeral = ephemeral;
3275 if (!isempty(status)) {
3276 IOVEC_SET_STRING(iovec[n++], "[");
3277 IOVEC_SET_STRING(iovec[n++], status);
3278 IOVEC_SET_STRING(iovec[n++], "] ");
3280 IOVEC_SET_STRING(iovec[n++], status_indent);
3283 IOVEC_SET_STRING(iovec[n++], s);
3285 IOVEC_SET_STRING(iovec[n++], "\n");
3287 if (writev(fd, iovec, n) < 0)
3293 int status_printf(const char *status, bool ellipse, bool ephemeral, const char *format, ...) {
3299 va_start(ap, format);
3300 r = status_vprintf(status, ellipse, ephemeral, format, ap);
3306 char *replace_env(const char *format, char **env) {
3313 const char *e, *word = format;
3318 for (e = format; *e; e ++) {
3329 k = strnappend(r, word, e-word-1);
3339 } else if (*e == '$') {
3340 k = strnappend(r, word, e-word);
3357 t = strempty(strv_env_get_n(env, word+2, e-word-2));
3359 k = strappend(r, t);
3373 k = strnappend(r, word, e-word);
3385 char **replace_env_argv(char **argv, char **env) {
3387 unsigned k = 0, l = 0;
3389 l = strv_length(argv);
3391 ret = new(char*, l+1);
3395 STRV_FOREACH(i, argv) {
3397 /* If $FOO appears as single word, replace it by the split up variable */
3398 if ((*i)[0] == '$' && (*i)[1] != '{') {
3403 e = strv_env_get(env, *i+1);
3407 r = strv_split_quoted(&m, e, true);
3419 w = realloc(ret, sizeof(char*) * (l+1));
3429 memcpy(ret + k, m, q * sizeof(char*));
3437 /* If ${FOO} appears as part of a word, replace it by the variable as-is */
3438 ret[k] = replace_env(*i, env);
3450 int fd_columns(int fd) {
3451 struct winsize ws = {};
3453 if (ioctl(fd, TIOCGWINSZ, &ws) < 0)
3462 unsigned columns(void) {
3466 if (_likely_(cached_columns > 0))
3467 return cached_columns;
3470 e = getenv("COLUMNS");
3472 (void) safe_atoi(e, &c);
3475 c = fd_columns(STDOUT_FILENO);
3481 return cached_columns;
3484 int fd_lines(int fd) {
3485 struct winsize ws = {};
3487 if (ioctl(fd, TIOCGWINSZ, &ws) < 0)
3496 unsigned lines(void) {
3500 if (_likely_(cached_lines > 0))
3501 return cached_lines;
3504 e = getenv("LINES");
3506 (void) safe_atoi(e, &l);
3509 l = fd_lines(STDOUT_FILENO);
3515 return cached_lines;
3518 /* intended to be used as a SIGWINCH sighandler */
3519 void columns_lines_cache_reset(int signum) {
3525 static int cached_on_tty = -1;
3527 if (_unlikely_(cached_on_tty < 0))
3528 cached_on_tty = isatty(STDOUT_FILENO) > 0;
3530 return cached_on_tty;
3533 int files_same(const char *filea, const char *fileb) {
3536 if (stat(filea, &a) < 0)
3539 if (stat(fileb, &b) < 0)
3542 return a.st_dev == b.st_dev &&
3543 a.st_ino == b.st_ino;
3546 int running_in_chroot(void) {
3549 ret = files_same("/proc/1/root", "/");
3556 static char *ascii_ellipsize_mem(const char *s, size_t old_length, size_t new_length, unsigned percent) {
3561 assert(percent <= 100);
3562 assert(new_length >= 3);
3564 if (old_length <= 3 || old_length <= new_length)
3565 return strndup(s, old_length);
3567 r = new0(char, new_length+1);
3571 x = (new_length * percent) / 100;
3573 if (x > new_length - 3)
3581 s + old_length - (new_length - x - 3),
3582 new_length - x - 3);
3587 char *ellipsize_mem(const char *s, size_t old_length, size_t new_length, unsigned percent) {
3591 unsigned k, len, len2;
3594 assert(percent <= 100);
3595 assert(new_length >= 3);
3597 /* if no multibyte characters use ascii_ellipsize_mem for speed */
3598 if (ascii_is_valid(s))
3599 return ascii_ellipsize_mem(s, old_length, new_length, percent);
3601 if (old_length <= 3 || old_length <= new_length)
3602 return strndup(s, old_length);
3604 x = (new_length * percent) / 100;
3606 if (x > new_length - 3)
3610 for (i = s; k < x && i < s + old_length; i = utf8_next_char(i)) {
3613 c = utf8_encoded_to_unichar(i);
3616 k += unichar_iswide(c) ? 2 : 1;
3619 if (k > x) /* last character was wide and went over quota */
3622 for (j = s + old_length; k < new_length && j > i; ) {
3625 j = utf8_prev_char(j);
3626 c = utf8_encoded_to_unichar(j);
3629 k += unichar_iswide(c) ? 2 : 1;
3633 /* we don't actually need to ellipsize */
3635 return memdup(s, old_length + 1);
3637 /* make space for ellipsis */
3638 j = utf8_next_char(j);
3641 len2 = s + old_length - j;
3642 e = new(char, len + 3 + len2 + 1);
3647 printf("old_length=%zu new_length=%zu x=%zu len=%u len2=%u k=%u\n",
3648 old_length, new_length, x, len, len2, k);
3652 e[len] = 0xe2; /* tri-dot ellipsis: … */
3656 memcpy(e + len + 3, j, len2 + 1);
3661 char *ellipsize(const char *s, size_t length, unsigned percent) {
3662 return ellipsize_mem(s, strlen(s), length, percent);
3665 int touch_file(const char *path, bool parents, usec_t stamp, uid_t uid, gid_t gid, mode_t mode) {
3666 _cleanup_close_ int fd;
3672 mkdir_parents(path, 0755);
3674 fd = open(path, O_WRONLY|O_CREAT|O_CLOEXEC|O_NOCTTY, mode > 0 ? mode : 0644);
3679 r = fchmod(fd, mode);
3684 if (uid != UID_INVALID || gid != GID_INVALID) {
3685 r = fchown(fd, uid, gid);
3690 if (stamp != USEC_INFINITY) {
3691 struct timespec ts[2];
3693 timespec_store(&ts[0], stamp);
3695 r = futimens(fd, ts);
3697 r = futimens(fd, NULL);
3704 int touch(const char *path) {
3705 return touch_file(path, false, USEC_INFINITY, UID_INVALID, GID_INVALID, 0);
3708 char *unquote(const char *s, const char* quotes) {
3712 /* This is rather stupid, simply removes the heading and
3713 * trailing quotes if there is one. Doesn't care about
3714 * escaping or anything. We should make this smarter one
3721 if (strchr(quotes, s[0]) && s[l-1] == s[0])
3722 return strndup(s+1, l-2);
3727 char *normalize_env_assignment(const char *s) {
3728 _cleanup_free_ char *value = NULL;
3732 eq = strchr(s, '=');
3742 memmove(r, t, strlen(t) + 1);
3747 name = strndupa(s, eq - s);
3748 p = strdupa(eq + 1);
3750 value = unquote(strstrip(p), QUOTES);
3754 return strjoin(strstrip(name), "=", value, NULL);
3757 int wait_for_terminate(pid_t pid, siginfo_t *status) {
3768 if (waitid(P_PID, pid, status, WEXITED) < 0) {
3782 * < 0 : wait_for_terminate() failed to get the state of the
3783 * process, the process was terminated by a signal, or
3784 * failed for an unknown reason.
3785 * >=0 : The process terminated normally, and its exit code is
3788 * That is, success is indicated by a return value of zero, and an
3789 * error is indicated by a non-zero value.
3791 * A warning is emitted if the process terminates abnormally,
3792 * and also if it returns non-zero unless check_exit_code is true.
3794 int wait_for_terminate_and_warn(const char *name, pid_t pid, bool check_exit_code) {
3801 r = wait_for_terminate(pid, &status);
3803 return log_warning_errno(r, "Failed to wait for %s: %m", name);
3805 if (status.si_code == CLD_EXITED) {
3806 if (status.si_status != 0)
3807 log_full(check_exit_code ? LOG_WARNING : LOG_DEBUG,
3808 "%s failed with error code %i.", name, status.si_status);
3810 log_debug("%s succeeded.", name);
3812 return status.si_status;
3813 } else if (status.si_code == CLD_KILLED ||
3814 status.si_code == CLD_DUMPED) {
3816 log_warning("%s terminated by signal %s.", name, signal_to_string(status.si_status));
3820 log_warning("%s failed due to unknown reason.", name);
3824 noreturn void freeze(void) {
3826 /* Make sure nobody waits for us on a socket anymore */
3827 close_all_fds(NULL, 0);
3835 bool null_or_empty(struct stat *st) {
3838 if (S_ISREG(st->st_mode) && st->st_size <= 0)
3841 if (S_ISCHR(st->st_mode) || S_ISBLK(st->st_mode))
3847 int null_or_empty_path(const char *fn) {
3852 if (stat(fn, &st) < 0)
3855 return null_or_empty(&st);
3858 int null_or_empty_fd(int fd) {
3863 if (fstat(fd, &st) < 0)
3866 return null_or_empty(&st);
3869 DIR *xopendirat(int fd, const char *name, int flags) {
3873 assert(!(flags & O_CREAT));
3875 nfd = openat(fd, name, O_RDONLY|O_NONBLOCK|O_DIRECTORY|O_CLOEXEC|flags, 0);
3888 int signal_from_string_try_harder(const char *s) {
3892 signo = signal_from_string(s);
3894 if (startswith(s, "SIG"))
3895 return signal_from_string(s+3);
3900 static char *tag_to_udev_node(const char *tagvalue, const char *by) {
3901 _cleanup_free_ char *t = NULL, *u = NULL;
3904 u = unquote(tagvalue, "\"\'");
3908 enc_len = strlen(u) * 4 + 1;
3909 t = new(char, enc_len);
3913 if (encode_devnode_name(u, t, enc_len) < 0)
3916 return strjoin("/dev/disk/by-", by, "/", t, NULL);
3919 char *fstab_node_to_udev_node(const char *p) {
3922 if (startswith(p, "LABEL="))
3923 return tag_to_udev_node(p+6, "label");
3925 if (startswith(p, "UUID="))
3926 return tag_to_udev_node(p+5, "uuid");
3928 if (startswith(p, "PARTUUID="))
3929 return tag_to_udev_node(p+9, "partuuid");
3931 if (startswith(p, "PARTLABEL="))
3932 return tag_to_udev_node(p+10, "partlabel");
3937 bool tty_is_vc(const char *tty) {
3940 return vtnr_from_tty(tty) >= 0;
3943 bool tty_is_console(const char *tty) {
3946 if (startswith(tty, "/dev/"))
3949 return streq(tty, "console");
3952 int vtnr_from_tty(const char *tty) {
3957 if (startswith(tty, "/dev/"))
3960 if (!startswith(tty, "tty") )
3963 if (tty[3] < '0' || tty[3] > '9')
3966 r = safe_atoi(tty+3, &i);
3970 if (i < 0 || i > 63)
3976 char *resolve_dev_console(char **active) {
3979 /* Resolve where /dev/console is pointing to, if /sys is actually ours
3980 * (i.e. not read-only-mounted which is a sign for container setups) */
3982 if (path_is_read_only_fs("/sys") > 0)
3985 if (read_one_line_file("/sys/class/tty/console/active", active) < 0)
3988 /* If multiple log outputs are configured the last one is what
3989 * /dev/console points to */
3990 tty = strrchr(*active, ' ');
3996 if (streq(tty, "tty0")) {
3999 /* Get the active VC (e.g. tty1) */
4000 if (read_one_line_file("/sys/class/tty/tty0/active", &tmp) >= 0) {
4002 tty = *active = tmp;
4009 bool tty_is_vc_resolve(const char *tty) {
4010 _cleanup_free_ char *active = NULL;
4014 if (startswith(tty, "/dev/"))
4017 if (streq(tty, "console")) {
4018 tty = resolve_dev_console(&active);
4023 return tty_is_vc(tty);
4026 const char *default_term_for_tty(const char *tty) {
4029 return tty_is_vc_resolve(tty) ? "TERM=linux" : "TERM=vt220";
4032 bool dirent_is_file(const struct dirent *de) {
4035 if (hidden_file(de->d_name))
4038 if (de->d_type != DT_REG &&
4039 de->d_type != DT_LNK &&
4040 de->d_type != DT_UNKNOWN)
4046 bool dirent_is_file_with_suffix(const struct dirent *de, const char *suffix) {
4049 if (de->d_type != DT_REG &&
4050 de->d_type != DT_LNK &&
4051 de->d_type != DT_UNKNOWN)
4054 if (hidden_file_allow_backup(de->d_name))
4057 return endswith(de->d_name, suffix);
4060 static int do_execute(char **directories, usec_t timeout, char *argv[]) {
4061 _cleanup_hashmap_free_free_ Hashmap *pids = NULL;
4062 _cleanup_set_free_free_ Set *seen = NULL;
4065 /* We fork this all off from a child process so that we can
4066 * somewhat cleanly make use of SIGALRM to set a time limit */
4068 reset_all_signal_handlers();
4069 reset_signal_mask();
4071 assert_se(prctl(PR_SET_PDEATHSIG, SIGTERM) == 0);
4073 pids = hashmap_new(NULL);
4077 seen = set_new(&string_hash_ops);
4081 STRV_FOREACH(directory, directories) {
4082 _cleanup_closedir_ DIR *d;
4085 d = opendir(*directory);
4087 if (errno == ENOENT)
4090 return log_error_errno(errno, "Failed to open directory %s: %m", *directory);
4093 FOREACH_DIRENT(de, d, break) {
4094 _cleanup_free_ char *path = NULL;
4098 if (!dirent_is_file(de))
4101 if (set_contains(seen, de->d_name)) {
4102 log_debug("%1$s/%2$s skipped (%2$s was already seen).", *directory, de->d_name);
4106 r = set_put_strdup(seen, de->d_name);
4110 path = strjoin(*directory, "/", de->d_name, NULL);
4114 if (null_or_empty_path(path)) {
4115 log_debug("%s is empty (a mask).", path);
4118 log_debug("%s will be executed.", path);
4122 log_error_errno(errno, "Failed to fork: %m");
4124 } else if (pid == 0) {
4127 assert_se(prctl(PR_SET_PDEATHSIG, SIGTERM) == 0);
4137 return log_error_errno(errno, "Failed to execute %s: %m", path);
4140 log_debug("Spawned %s as " PID_FMT ".", path, pid);
4142 r = hashmap_put(pids, UINT_TO_PTR(pid), path);
4149 /* Abort execution of this process after the timout. We simply
4150 * rely on SIGALRM as default action terminating the process,
4151 * and turn on alarm(). */
4153 if (timeout != USEC_INFINITY)
4154 alarm((timeout + USEC_PER_SEC - 1) / USEC_PER_SEC);
4156 while (!hashmap_isempty(pids)) {
4157 _cleanup_free_ char *path = NULL;
4160 pid = PTR_TO_UINT(hashmap_first_key(pids));
4163 path = hashmap_remove(pids, UINT_TO_PTR(pid));
4166 wait_for_terminate_and_warn(path, pid, true);
4172 void execute_directories(const char* const* directories, usec_t timeout, char *argv[]) {
4176 char **dirs = (char**) directories;
4178 assert(!strv_isempty(dirs));
4180 name = basename(dirs[0]);
4181 assert(!isempty(name));
4183 /* Executes all binaries in the directories in parallel and waits
4184 * for them to finish. Optionally a timeout is applied. If a file
4185 * with the same name exists in more than one directory, the
4186 * earliest one wins. */
4188 executor_pid = fork();
4189 if (executor_pid < 0) {
4190 log_error_errno(errno, "Failed to fork: %m");
4193 } else if (executor_pid == 0) {
4194 r = do_execute(dirs, timeout, argv);
4195 _exit(r < 0 ? EXIT_FAILURE : EXIT_SUCCESS);
4198 wait_for_terminate_and_warn(name, executor_pid, true);
4201 int kill_and_sigcont(pid_t pid, int sig) {
4204 r = kill(pid, sig) < 0 ? -errno : 0;
4212 bool nulstr_contains(const char*nulstr, const char *needle) {
4218 NULSTR_FOREACH(i, nulstr)
4219 if (streq(i, needle))
4225 bool plymouth_running(void) {
4226 return access("/run/plymouth/pid", F_OK) >= 0;
4229 char* strshorten(char *s, size_t l) {
4238 static bool hostname_valid_char(char c) {
4240 (c >= 'a' && c <= 'z') ||
4241 (c >= 'A' && c <= 'Z') ||
4242 (c >= '0' && c <= '9') ||
4248 bool hostname_is_valid(const char *s) {
4255 /* Doesn't accept empty hostnames, hostnames with trailing or
4256 * leading dots, and hostnames with multiple dots in a
4257 * sequence. Also ensures that the length stays below
4260 for (p = s, dot = true; *p; p++) {
4267 if (!hostname_valid_char(*p))
4277 if (p-s > HOST_NAME_MAX)
4283 char* hostname_cleanup(char *s, bool lowercase) {
4287 for (p = s, d = s, dot = true; *p; p++) {
4294 } else if (hostname_valid_char(*p)) {
4295 *(d++) = lowercase ? tolower(*p) : *p;
4306 strshorten(s, HOST_NAME_MAX);
4311 bool machine_name_is_valid(const char *s) {
4313 if (!hostname_is_valid(s))
4316 /* Machine names should be useful hostnames, but also be
4317 * useful in unit names, hence we enforce a stricter length
4326 int pipe_eof(int fd) {
4327 struct pollfd pollfd = {
4329 .events = POLLIN|POLLHUP,
4334 r = poll(&pollfd, 1, 0);
4341 return pollfd.revents & POLLHUP;
4344 int fd_wait_for_event(int fd, int event, usec_t t) {
4346 struct pollfd pollfd = {
4354 r = ppoll(&pollfd, 1, t == USEC_INFINITY ? NULL : timespec_store(&ts, t), NULL);
4361 return pollfd.revents;
4364 int fopen_temporary(const char *path, FILE **_f, char **_temp_path) {
4373 r = tempfn_xxxxxx(path, &t);
4377 fd = mkostemp_safe(t, O_WRONLY|O_CLOEXEC);
4383 f = fdopen(fd, "we");
4396 int terminal_vhangup_fd(int fd) {
4399 if (ioctl(fd, TIOCVHANGUP) < 0)
4405 int terminal_vhangup(const char *name) {
4406 _cleanup_close_ int fd;
4408 fd = open_terminal(name, O_RDWR|O_NOCTTY|O_CLOEXEC);
4412 return terminal_vhangup_fd(fd);
4415 int vt_disallocate(const char *name) {
4419 /* Deallocate the VT if possible. If not possible
4420 * (i.e. because it is the active one), at least clear it
4421 * entirely (including the scrollback buffer) */
4423 if (!startswith(name, "/dev/"))
4426 if (!tty_is_vc(name)) {
4427 /* So this is not a VT. I guess we cannot deallocate
4428 * it then. But let's at least clear the screen */
4430 fd = open_terminal(name, O_RDWR|O_NOCTTY|O_CLOEXEC);
4435 "\033[r" /* clear scrolling region */
4436 "\033[H" /* move home */
4437 "\033[2J", /* clear screen */
4444 if (!startswith(name, "/dev/tty"))
4447 r = safe_atou(name+8, &u);
4454 /* Try to deallocate */
4455 fd = open_terminal("/dev/tty0", O_RDWR|O_NOCTTY|O_CLOEXEC);
4459 r = ioctl(fd, VT_DISALLOCATE, u);
4468 /* Couldn't deallocate, so let's clear it fully with
4470 fd = open_terminal(name, O_RDWR|O_NOCTTY|O_CLOEXEC);
4475 "\033[r" /* clear scrolling region */
4476 "\033[H" /* move home */
4477 "\033[3J", /* clear screen including scrollback, requires Linux 2.6.40 */
4484 int symlink_atomic(const char *from, const char *to) {
4485 _cleanup_free_ char *t = NULL;
4491 r = tempfn_random(to, &t);
4495 if (symlink(from, t) < 0)
4498 if (rename(t, to) < 0) {
4506 int mknod_atomic(const char *path, mode_t mode, dev_t dev) {
4507 _cleanup_free_ char *t = NULL;
4512 r = tempfn_random(path, &t);
4516 if (mknod(t, mode, dev) < 0)
4519 if (rename(t, path) < 0) {
4527 int mkfifo_atomic(const char *path, mode_t mode) {
4528 _cleanup_free_ char *t = NULL;
4533 r = tempfn_random(path, &t);
4537 if (mkfifo(t, mode) < 0)
4540 if (rename(t, path) < 0) {
4548 bool display_is_local(const char *display) {
4552 display[0] == ':' &&
4553 display[1] >= '0' &&
4557 int socket_from_display(const char *display, char **path) {
4564 if (!display_is_local(display))
4567 k = strspn(display+1, "0123456789");
4569 f = new(char, strlen("/tmp/.X11-unix/X") + k + 1);
4573 c = stpcpy(f, "/tmp/.X11-unix/X");
4574 memcpy(c, display+1, k);
4583 const char **username,
4584 uid_t *uid, gid_t *gid,
4586 const char **shell) {
4594 /* We enforce some special rules for uid=0: in order to avoid
4595 * NSS lookups for root we hardcode its data. */
4597 if (streq(*username, "root") || streq(*username, "0")) {
4615 if (parse_uid(*username, &u) >= 0) {
4619 /* If there are multiple users with the same id, make
4620 * sure to leave $USER to the configured value instead
4621 * of the first occurrence in the database. However if
4622 * the uid was configured by a numeric uid, then let's
4623 * pick the real username from /etc/passwd. */
4625 *username = p->pw_name;
4628 p = getpwnam(*username);
4632 return errno > 0 ? -errno : -ESRCH;
4644 *shell = p->pw_shell;
4649 char* uid_to_name(uid_t uid) {
4654 return strdup("root");
4658 return strdup(p->pw_name);
4660 if (asprintf(&r, UID_FMT, uid) < 0)
4666 char* gid_to_name(gid_t gid) {
4671 return strdup("root");
4675 return strdup(p->gr_name);
4677 if (asprintf(&r, GID_FMT, gid) < 0)
4683 int get_group_creds(const char **groupname, gid_t *gid) {
4689 /* We enforce some special rules for gid=0: in order to avoid
4690 * NSS lookups for root we hardcode its data. */
4692 if (streq(*groupname, "root") || streq(*groupname, "0")) {
4693 *groupname = "root";
4701 if (parse_gid(*groupname, &id) >= 0) {
4706 *groupname = g->gr_name;
4709 g = getgrnam(*groupname);
4713 return errno > 0 ? -errno : -ESRCH;
4721 int in_gid(gid_t gid) {
4723 int ngroups_max, r, i;
4725 if (getgid() == gid)
4728 if (getegid() == gid)
4731 ngroups_max = sysconf(_SC_NGROUPS_MAX);
4732 assert(ngroups_max > 0);
4734 gids = alloca(sizeof(gid_t) * ngroups_max);
4736 r = getgroups(ngroups_max, gids);
4740 for (i = 0; i < r; i++)
4747 int in_group(const char *name) {
4751 r = get_group_creds(&name, &gid);
4758 int glob_exists(const char *path) {
4759 _cleanup_globfree_ glob_t g = {};
4765 k = glob(path, GLOB_NOSORT|GLOB_BRACE, NULL, &g);
4767 if (k == GLOB_NOMATCH)
4769 else if (k == GLOB_NOSPACE)
4772 return !strv_isempty(g.gl_pathv);
4774 return errno ? -errno : -EIO;
4777 int glob_extend(char ***strv, const char *path) {
4778 _cleanup_globfree_ glob_t g = {};
4783 k = glob(path, GLOB_NOSORT|GLOB_BRACE, NULL, &g);
4785 if (k == GLOB_NOMATCH)
4787 else if (k == GLOB_NOSPACE)
4789 else if (k != 0 || strv_isempty(g.gl_pathv))
4790 return errno ? -errno : -EIO;
4792 STRV_FOREACH(p, g.gl_pathv) {
4793 k = strv_extend(strv, *p);
4801 int dirent_ensure_type(DIR *d, struct dirent *de) {
4807 if (de->d_type != DT_UNKNOWN)
4810 if (fstatat(dirfd(d), de->d_name, &st, AT_SYMLINK_NOFOLLOW) < 0)
4814 S_ISREG(st.st_mode) ? DT_REG :
4815 S_ISDIR(st.st_mode) ? DT_DIR :
4816 S_ISLNK(st.st_mode) ? DT_LNK :
4817 S_ISFIFO(st.st_mode) ? DT_FIFO :
4818 S_ISSOCK(st.st_mode) ? DT_SOCK :
4819 S_ISCHR(st.st_mode) ? DT_CHR :
4820 S_ISBLK(st.st_mode) ? DT_BLK :
4826 int get_files_in_directory(const char *path, char ***list) {
4827 _cleanup_closedir_ DIR *d = NULL;
4828 size_t bufsize = 0, n = 0;
4829 _cleanup_strv_free_ char **l = NULL;
4833 /* Returns all files in a directory in *list, and the number
4834 * of files as return value. If list is NULL returns only the
4846 if (!de && errno != 0)
4851 dirent_ensure_type(d, de);
4853 if (!dirent_is_file(de))
4857 /* one extra slot is needed for the terminating NULL */
4858 if (!GREEDY_REALLOC(l, bufsize, n + 2))
4861 l[n] = strdup(de->d_name);
4872 l = NULL; /* avoid freeing */
4878 char *strjoin(const char *x, ...) {
4892 t = va_arg(ap, const char *);
4897 if (n > ((size_t) -1) - l) {
4921 t = va_arg(ap, const char *);
4935 bool is_main_thread(void) {
4936 static thread_local int cached = 0;
4938 if (_unlikely_(cached == 0))
4939 cached = getpid() == gettid() ? 1 : -1;
4944 int block_get_whole_disk(dev_t d, dev_t *ret) {
4951 /* If it has a queue this is good enough for us */
4952 if (asprintf(&p, "/sys/dev/block/%u:%u/queue", major(d), minor(d)) < 0)
4955 r = access(p, F_OK);
4963 /* If it is a partition find the originating device */
4964 if (asprintf(&p, "/sys/dev/block/%u:%u/partition", major(d), minor(d)) < 0)
4967 r = access(p, F_OK);
4973 /* Get parent dev_t */
4974 if (asprintf(&p, "/sys/dev/block/%u:%u/../dev", major(d), minor(d)) < 0)
4977 r = read_one_line_file(p, &s);
4983 r = sscanf(s, "%u:%u", &m, &n);
4989 /* Only return this if it is really good enough for us. */
4990 if (asprintf(&p, "/sys/dev/block/%u:%u/queue", m, n) < 0)
4993 r = access(p, F_OK);
4997 *ret = makedev(m, n);
5004 static const char *const ioprio_class_table[] = {
5005 [IOPRIO_CLASS_NONE] = "none",
5006 [IOPRIO_CLASS_RT] = "realtime",
5007 [IOPRIO_CLASS_BE] = "best-effort",
5008 [IOPRIO_CLASS_IDLE] = "idle"
5011 DEFINE_STRING_TABLE_LOOKUP_WITH_FALLBACK(ioprio_class, int, INT_MAX);
5013 static const char *const sigchld_code_table[] = {
5014 [CLD_EXITED] = "exited",
5015 [CLD_KILLED] = "killed",
5016 [CLD_DUMPED] = "dumped",
5017 [CLD_TRAPPED] = "trapped",
5018 [CLD_STOPPED] = "stopped",
5019 [CLD_CONTINUED] = "continued",
5022 DEFINE_STRING_TABLE_LOOKUP(sigchld_code, int);
5024 static const char *const log_facility_unshifted_table[LOG_NFACILITIES] = {
5025 [LOG_FAC(LOG_KERN)] = "kern",
5026 [LOG_FAC(LOG_USER)] = "user",
5027 [LOG_FAC(LOG_MAIL)] = "mail",
5028 [LOG_FAC(LOG_DAEMON)] = "daemon",
5029 [LOG_FAC(LOG_AUTH)] = "auth",
5030 [LOG_FAC(LOG_SYSLOG)] = "syslog",
5031 [LOG_FAC(LOG_LPR)] = "lpr",
5032 [LOG_FAC(LOG_NEWS)] = "news",
5033 [LOG_FAC(LOG_UUCP)] = "uucp",
5034 [LOG_FAC(LOG_CRON)] = "cron",
5035 [LOG_FAC(LOG_AUTHPRIV)] = "authpriv",
5036 [LOG_FAC(LOG_FTP)] = "ftp",
5037 [LOG_FAC(LOG_LOCAL0)] = "local0",
5038 [LOG_FAC(LOG_LOCAL1)] = "local1",
5039 [LOG_FAC(LOG_LOCAL2)] = "local2",
5040 [LOG_FAC(LOG_LOCAL3)] = "local3",
5041 [LOG_FAC(LOG_LOCAL4)] = "local4",
5042 [LOG_FAC(LOG_LOCAL5)] = "local5",
5043 [LOG_FAC(LOG_LOCAL6)] = "local6",
5044 [LOG_FAC(LOG_LOCAL7)] = "local7"
5047 DEFINE_STRING_TABLE_LOOKUP_WITH_FALLBACK(log_facility_unshifted, int, LOG_FAC(~0));
5049 static const char *const log_level_table[] = {
5050 [LOG_EMERG] = "emerg",
5051 [LOG_ALERT] = "alert",
5052 [LOG_CRIT] = "crit",
5054 [LOG_WARNING] = "warning",
5055 [LOG_NOTICE] = "notice",
5056 [LOG_INFO] = "info",
5057 [LOG_DEBUG] = "debug"
5060 DEFINE_STRING_TABLE_LOOKUP_WITH_FALLBACK(log_level, int, LOG_DEBUG);
5062 static const char* const sched_policy_table[] = {
5063 [SCHED_OTHER] = "other",
5064 [SCHED_BATCH] = "batch",
5065 [SCHED_IDLE] = "idle",
5066 [SCHED_FIFO] = "fifo",
5070 DEFINE_STRING_TABLE_LOOKUP_WITH_FALLBACK(sched_policy, int, INT_MAX);
5072 static const char* const rlimit_table[_RLIMIT_MAX] = {
5073 [RLIMIT_CPU] = "LimitCPU",
5074 [RLIMIT_FSIZE] = "LimitFSIZE",
5075 [RLIMIT_DATA] = "LimitDATA",
5076 [RLIMIT_STACK] = "LimitSTACK",
5077 [RLIMIT_CORE] = "LimitCORE",
5078 [RLIMIT_RSS] = "LimitRSS",
5079 [RLIMIT_NOFILE] = "LimitNOFILE",
5080 [RLIMIT_AS] = "LimitAS",
5081 [RLIMIT_NPROC] = "LimitNPROC",
5082 [RLIMIT_MEMLOCK] = "LimitMEMLOCK",
5083 [RLIMIT_LOCKS] = "LimitLOCKS",
5084 [RLIMIT_SIGPENDING] = "LimitSIGPENDING",
5085 [RLIMIT_MSGQUEUE] = "LimitMSGQUEUE",
5086 [RLIMIT_NICE] = "LimitNICE",
5087 [RLIMIT_RTPRIO] = "LimitRTPRIO",
5088 [RLIMIT_RTTIME] = "LimitRTTIME"
5091 DEFINE_STRING_TABLE_LOOKUP(rlimit, int);
5093 static const char* const ip_tos_table[] = {
5094 [IPTOS_LOWDELAY] = "low-delay",
5095 [IPTOS_THROUGHPUT] = "throughput",
5096 [IPTOS_RELIABILITY] = "reliability",
5097 [IPTOS_LOWCOST] = "low-cost",
5100 DEFINE_STRING_TABLE_LOOKUP_WITH_FALLBACK(ip_tos, int, 0xff);
5102 static const char *const __signal_table[] = {
5119 [SIGSTKFLT] = "STKFLT", /* Linux on SPARC doesn't know SIGSTKFLT */
5130 [SIGVTALRM] = "VTALRM",
5132 [SIGWINCH] = "WINCH",
5138 DEFINE_PRIVATE_STRING_TABLE_LOOKUP(__signal, int);
5140 const char *signal_to_string(int signo) {
5141 static thread_local char buf[sizeof("RTMIN+")-1 + DECIMAL_STR_MAX(int) + 1];
5144 name = __signal_to_string(signo);
5148 if (signo >= SIGRTMIN && signo <= SIGRTMAX)
5149 snprintf(buf, sizeof(buf), "RTMIN+%d", signo - SIGRTMIN);
5151 snprintf(buf, sizeof(buf), "%d", signo);
5156 int signal_from_string(const char *s) {
5161 signo = __signal_from_string(s);
5165 if (startswith(s, "RTMIN+")) {
5169 if (safe_atou(s, &u) >= 0) {
5170 signo = (int) u + offset;
5171 if (signo > 0 && signo < _NSIG)
5177 bool kexec_loaded(void) {
5178 bool loaded = false;
5181 if (read_one_line_file("/sys/kernel/kexec_loaded", &s) >= 0) {
5189 int prot_from_flags(int flags) {
5191 switch (flags & O_ACCMODE) {
5200 return PROT_READ|PROT_WRITE;
5207 char *format_bytes(char *buf, size_t l, off_t t) {
5210 static const struct {
5214 { "E", 1024ULL*1024ULL*1024ULL*1024ULL*1024ULL*1024ULL },
5215 { "P", 1024ULL*1024ULL*1024ULL*1024ULL*1024ULL },
5216 { "T", 1024ULL*1024ULL*1024ULL*1024ULL },
5217 { "G", 1024ULL*1024ULL*1024ULL },
5218 { "M", 1024ULL*1024ULL },
5222 if (t == (off_t) -1)
5225 for (i = 0; i < ELEMENTSOF(table); i++) {
5227 if (t >= table[i].factor) {
5230 (unsigned long long) (t / table[i].factor),
5231 (unsigned long long) (((t*10ULL) / table[i].factor) % 10ULL),
5238 snprintf(buf, l, "%lluB", (unsigned long long) t);
5246 void* memdup(const void *p, size_t l) {
5259 int fd_inc_sndbuf(int fd, size_t n) {
5261 socklen_t l = sizeof(value);
5263 r = getsockopt(fd, SOL_SOCKET, SO_SNDBUF, &value, &l);
5264 if (r >= 0 && l == sizeof(value) && (size_t) value >= n*2)
5267 /* If we have the privileges we will ignore the kernel limit. */
5270 if (setsockopt(fd, SOL_SOCKET, SO_SNDBUFFORCE, &value, sizeof(value)) < 0)
5271 if (setsockopt(fd, SOL_SOCKET, SO_SNDBUF, &value, sizeof(value)) < 0)
5277 int fd_inc_rcvbuf(int fd, size_t n) {
5279 socklen_t l = sizeof(value);
5281 r = getsockopt(fd, SOL_SOCKET, SO_RCVBUF, &value, &l);
5282 if (r >= 0 && l == sizeof(value) && (size_t) value >= n*2)
5285 /* If we have the privileges we will ignore the kernel limit. */
5288 if (setsockopt(fd, SOL_SOCKET, SO_RCVBUFFORCE, &value, sizeof(value)) < 0)
5289 if (setsockopt(fd, SOL_SOCKET, SO_RCVBUF, &value, sizeof(value)) < 0)
5294 int fork_agent(pid_t *pid, const int except[], unsigned n_except, const char *path, ...) {
5295 bool stdout_is_tty, stderr_is_tty;
5296 pid_t parent_pid, agent_pid;
5297 sigset_t ss, saved_ss;
5305 /* Spawns a temporary TTY agent, making sure it goes away when
5308 parent_pid = getpid();
5310 /* First we temporarily block all signals, so that the new
5311 * child has them blocked initially. This way, we can be sure
5312 * that SIGTERMs are not lost we might send to the agent. */
5313 assert_se(sigfillset(&ss) >= 0);
5314 assert_se(sigprocmask(SIG_SETMASK, &ss, &saved_ss) >= 0);
5317 if (agent_pid < 0) {
5318 assert_se(sigprocmask(SIG_SETMASK, &saved_ss, NULL) >= 0);
5322 if (agent_pid != 0) {
5323 assert_se(sigprocmask(SIG_SETMASK, &saved_ss, NULL) >= 0);
5330 * Make sure the agent goes away when the parent dies */
5331 if (prctl(PR_SET_PDEATHSIG, SIGTERM) < 0)
5332 _exit(EXIT_FAILURE);
5334 /* Make sure we actually can kill the agent, if we need to, in
5335 * case somebody invoked us from a shell script that trapped
5336 * SIGTERM or so... */
5337 reset_all_signal_handlers();
5338 reset_signal_mask();
5340 /* Check whether our parent died before we were able
5341 * to set the death signal and unblock the signals */
5342 if (getppid() != parent_pid)
5343 _exit(EXIT_SUCCESS);
5345 /* Don't leak fds to the agent */
5346 close_all_fds(except, n_except);
5348 stdout_is_tty = isatty(STDOUT_FILENO);
5349 stderr_is_tty = isatty(STDERR_FILENO);
5351 if (!stdout_is_tty || !stderr_is_tty) {
5354 /* Detach from stdout/stderr. and reopen
5355 * /dev/tty for them. This is important to
5356 * ensure that when systemctl is started via
5357 * popen() or a similar call that expects to
5358 * read EOF we actually do generate EOF and
5359 * not delay this indefinitely by because we
5360 * keep an unused copy of stdin around. */
5361 fd = open("/dev/tty", O_WRONLY);
5363 log_error_errno(errno, "Failed to open /dev/tty: %m");
5364 _exit(EXIT_FAILURE);
5368 dup2(fd, STDOUT_FILENO);
5371 dup2(fd, STDERR_FILENO);
5377 /* Count arguments */
5379 for (n = 0; va_arg(ap, char*); n++)
5384 l = alloca(sizeof(char *) * (n + 1));
5386 /* Fill in arguments */
5388 for (i = 0; i <= n; i++)
5389 l[i] = va_arg(ap, char*);
5393 _exit(EXIT_FAILURE);
5396 int setrlimit_closest(int resource, const struct rlimit *rlim) {
5397 struct rlimit highest, fixed;
5401 if (setrlimit(resource, rlim) >= 0)
5407 /* So we failed to set the desired setrlimit, then let's try
5408 * to get as close as we can */
5409 assert_se(getrlimit(resource, &highest) == 0);
5411 fixed.rlim_cur = MIN(rlim->rlim_cur, highest.rlim_max);
5412 fixed.rlim_max = MIN(rlim->rlim_max, highest.rlim_max);
5414 if (setrlimit(resource, &fixed) < 0)
5420 int getenv_for_pid(pid_t pid, const char *field, char **_value) {
5421 _cleanup_fclose_ FILE *f = NULL;
5432 path = procfs_file_alloca(pid, "environ");
5434 f = fopen(path, "re");
5442 char line[LINE_MAX];
5445 for (i = 0; i < sizeof(line)-1; i++) {
5449 if (_unlikely_(c == EOF)) {
5459 if (memcmp(line, field, l) == 0 && line[l] == '=') {
5460 value = strdup(line + l + 1);
5474 bool http_etag_is_valid(const char *etag) {
5478 if (!endswith(etag, "\""))
5481 if (!startswith(etag, "\"") && !startswith(etag, "W/\""))
5487 bool http_url_is_valid(const char *url) {
5493 p = startswith(url, "http://");
5495 p = startswith(url, "https://");
5502 return ascii_is_valid(p);
5505 bool documentation_url_is_valid(const char *url) {
5511 if (http_url_is_valid(url))
5514 p = startswith(url, "file:/");
5516 p = startswith(url, "info:");
5518 p = startswith(url, "man:");
5523 return ascii_is_valid(p);
5526 bool in_initrd(void) {
5527 static int saved = -1;
5533 /* We make two checks here:
5535 * 1. the flag file /etc/initrd-release must exist
5536 * 2. the root file system must be a memory file system
5538 * The second check is extra paranoia, since misdetecting an
5539 * initrd can have bad bad consequences due the initrd
5540 * emptying when transititioning to the main systemd.
5543 saved = access("/etc/initrd-release", F_OK) >= 0 &&
5544 statfs("/", &s) >= 0 &&
5545 is_temporary_fs(&s);
5550 void warn_melody(void) {
5551 _cleanup_close_ int fd = -1;
5553 fd = open("/dev/console", O_WRONLY|O_CLOEXEC|O_NOCTTY);
5557 /* Yeah, this is synchronous. Kinda sucks. But well... */
5559 ioctl(fd, KIOCSOUND, (int)(1193180/440));
5560 usleep(125*USEC_PER_MSEC);
5562 ioctl(fd, KIOCSOUND, (int)(1193180/220));
5563 usleep(125*USEC_PER_MSEC);
5565 ioctl(fd, KIOCSOUND, (int)(1193180/220));
5566 usleep(125*USEC_PER_MSEC);
5568 ioctl(fd, KIOCSOUND, 0);
5571 int make_console_stdio(void) {
5574 /* Make /dev/console the controlling terminal and stdin/stdout/stderr */
5576 fd = acquire_terminal("/dev/console", false, true, true, USEC_INFINITY);
5578 return log_error_errno(fd, "Failed to acquire terminal: %m");
5582 return log_error_errno(r, "Failed to duplicate terminal fd: %m");
5587 int get_home_dir(char **_h) {
5595 /* Take the user specified one */
5596 e = secure_getenv("HOME");
5597 if (e && path_is_absolute(e)) {
5606 /* Hardcode home directory for root to avoid NSS */
5609 h = strdup("/root");
5617 /* Check the database... */
5621 return errno > 0 ? -errno : -ESRCH;
5623 if (!path_is_absolute(p->pw_dir))
5626 h = strdup(p->pw_dir);
5634 int get_shell(char **_s) {
5642 /* Take the user specified one */
5643 e = getenv("SHELL");
5653 /* Hardcode home directory for root to avoid NSS */
5656 s = strdup("/bin/sh");
5664 /* Check the database... */
5668 return errno > 0 ? -errno : -ESRCH;
5670 if (!path_is_absolute(p->pw_shell))
5673 s = strdup(p->pw_shell);
5681 bool filename_is_valid(const char *p) {
5695 if (strlen(p) > FILENAME_MAX)
5701 bool string_is_safe(const char *p) {
5707 for (t = p; *t; t++) {
5708 if (*t > 0 && *t < ' ')
5711 if (strchr("\\\"\'\0x7f", *t))
5719 * Check if a string contains control characters. If 'ok' is non-NULL
5720 * it may be a string containing additional CCs to be considered OK.
5722 bool string_has_cc(const char *p, const char *ok) {
5727 for (t = p; *t; t++) {
5728 if (ok && strchr(ok, *t))
5731 if (*t > 0 && *t < ' ')
5741 bool path_is_safe(const char *p) {
5746 if (streq(p, "..") || startswith(p, "../") || endswith(p, "/..") || strstr(p, "/../"))
5749 if (strlen(p) > PATH_MAX)
5752 /* The following two checks are not really dangerous, but hey, they still are confusing */
5753 if (streq(p, ".") || startswith(p, "./") || endswith(p, "/.") || strstr(p, "/./"))
5756 if (strstr(p, "//"))
5762 /* hey glibc, APIs with callbacks without a user pointer are so useless */
5763 void *xbsearch_r(const void *key, const void *base, size_t nmemb, size_t size,
5764 int (*compar) (const void *, const void *, void *), void *arg) {
5773 p = (void *)(((const char *) base) + (idx * size));
5774 comparison = compar(key, p, arg);
5777 else if (comparison > 0)
5785 bool is_locale_utf8(void) {
5787 static int cached_answer = -1;
5789 if (cached_answer >= 0)
5792 if (!setlocale(LC_ALL, "")) {
5793 cached_answer = true;
5797 set = nl_langinfo(CODESET);
5799 cached_answer = true;
5803 if (streq(set, "UTF-8")) {
5804 cached_answer = true;
5808 /* For LC_CTYPE=="C" return true, because CTYPE is effectly
5809 * unset and everything can do to UTF-8 nowadays. */
5810 set = setlocale(LC_CTYPE, NULL);
5812 cached_answer = true;
5816 /* Check result, but ignore the result if C was set
5820 !getenv("LC_ALL") &&
5821 !getenv("LC_CTYPE") &&
5825 return (bool) cached_answer;
5828 const char *draw_special_char(DrawSpecialChar ch) {
5829 static const char *draw_table[2][_DRAW_SPECIAL_CHAR_MAX] = {
5832 [DRAW_TREE_VERTICAL] = "\342\224\202 ", /* │ */
5833 [DRAW_TREE_BRANCH] = "\342\224\234\342\224\200", /* ├─ */
5834 [DRAW_TREE_RIGHT] = "\342\224\224\342\224\200", /* └─ */
5835 [DRAW_TREE_SPACE] = " ", /* */
5836 [DRAW_TRIANGULAR_BULLET] = "\342\200\243", /* ‣ */
5837 [DRAW_BLACK_CIRCLE] = "\342\227\217", /* ● */
5838 [DRAW_ARROW] = "\342\206\222", /* → */
5839 [DRAW_DASH] = "\342\200\223", /* – */
5842 /* ASCII fallback */ {
5843 [DRAW_TREE_VERTICAL] = "| ",
5844 [DRAW_TREE_BRANCH] = "|-",
5845 [DRAW_TREE_RIGHT] = "`-",
5846 [DRAW_TREE_SPACE] = " ",
5847 [DRAW_TRIANGULAR_BULLET] = ">",
5848 [DRAW_BLACK_CIRCLE] = "*",
5849 [DRAW_ARROW] = "->",
5854 return draw_table[!is_locale_utf8()][ch];
5857 char *strreplace(const char *text, const char *old_string, const char *new_string) {
5860 size_t l, old_len, new_len;
5866 old_len = strlen(old_string);
5867 new_len = strlen(new_string);
5880 if (!startswith(f, old_string)) {
5886 nl = l - old_len + new_len;
5887 a = realloc(r, nl + 1);
5895 t = stpcpy(t, new_string);
5907 char *strip_tab_ansi(char **ibuf, size_t *_isz) {
5908 const char *i, *begin = NULL;
5913 } state = STATE_OTHER;
5915 size_t osz = 0, isz;
5921 /* Strips ANSI color and replaces TABs by 8 spaces */
5923 isz = _isz ? *_isz : strlen(*ibuf);
5925 f = open_memstream(&obuf, &osz);
5929 for (i = *ibuf; i < *ibuf + isz + 1; i++) {
5934 if (i >= *ibuf + isz) /* EOT */
5936 else if (*i == '\x1B')
5937 state = STATE_ESCAPE;
5938 else if (*i == '\t')
5945 if (i >= *ibuf + isz) { /* EOT */
5948 } else if (*i == '[') {
5949 state = STATE_BRACKET;
5954 state = STATE_OTHER;
5961 if (i >= *ibuf + isz || /* EOT */
5962 (!(*i >= '0' && *i <= '9') && *i != ';' && *i != 'm')) {
5965 state = STATE_OTHER;
5967 } else if (*i == 'm')
5968 state = STATE_OTHER;
5990 int on_ac_power(void) {
5991 bool found_offline = false, found_online = false;
5992 _cleanup_closedir_ DIR *d = NULL;
5994 d = opendir("/sys/class/power_supply");
6000 _cleanup_close_ int fd = -1, device = -1;
6006 if (!de && errno != 0)
6012 if (hidden_file(de->d_name))
6015 device = openat(dirfd(d), de->d_name, O_DIRECTORY|O_RDONLY|O_CLOEXEC|O_NOCTTY);
6017 if (errno == ENOENT || errno == ENOTDIR)
6023 fd = openat(device, "type", O_RDONLY|O_CLOEXEC|O_NOCTTY);
6025 if (errno == ENOENT)
6031 n = read(fd, contents, sizeof(contents));
6035 if (n != 6 || memcmp(contents, "Mains\n", 6))
6039 fd = openat(device, "online", O_RDONLY|O_CLOEXEC|O_NOCTTY);
6041 if (errno == ENOENT)
6047 n = read(fd, contents, sizeof(contents));
6051 if (n != 2 || contents[1] != '\n')
6054 if (contents[0] == '1') {
6055 found_online = true;
6057 } else if (contents[0] == '0')
6058 found_offline = true;
6063 return found_online || !found_offline;
6066 static int search_and_fopen_internal(const char *path, const char *mode, const char *root, char **search, FILE **_f) {
6073 if (!path_strv_resolve_uniq(search, root))
6076 STRV_FOREACH(i, search) {
6077 _cleanup_free_ char *p = NULL;
6081 p = strjoin(root, *i, "/", path, NULL);
6083 p = strjoin(*i, "/", path, NULL);
6093 if (errno != ENOENT)
6100 int search_and_fopen(const char *path, const char *mode, const char *root, const char **search, FILE **_f) {
6101 _cleanup_strv_free_ char **copy = NULL;
6107 if (path_is_absolute(path)) {
6110 f = fopen(path, mode);
6119 copy = strv_copy((char**) search);
6123 return search_and_fopen_internal(path, mode, root, copy, _f);
6126 int search_and_fopen_nulstr(const char *path, const char *mode, const char *root, const char *search, FILE **_f) {
6127 _cleanup_strv_free_ char **s = NULL;
6129 if (path_is_absolute(path)) {
6132 f = fopen(path, mode);
6141 s = strv_split_nulstr(search);
6145 return search_and_fopen_internal(path, mode, root, s, _f);
6148 char *strextend(char **x, ...) {
6155 l = f = *x ? strlen(*x) : 0;
6162 t = va_arg(ap, const char *);
6167 if (n > ((size_t) -1) - l) {
6176 r = realloc(*x, l+1);
6186 t = va_arg(ap, const char *);
6200 char *strrep(const char *s, unsigned n) {
6208 p = r = malloc(l * n + 1);
6212 for (i = 0; i < n; i++)
6219 void* greedy_realloc(void **p, size_t *allocated, size_t need, size_t size) {
6226 if (*allocated >= need)
6229 newalloc = MAX(need * 2, 64u / size);
6230 a = newalloc * size;
6232 /* check for overflows */
6233 if (a < size * need)
6241 *allocated = newalloc;
6245 void* greedy_realloc0(void **p, size_t *allocated, size_t need, size_t size) {
6254 q = greedy_realloc(p, allocated, need, size);
6258 if (*allocated > prev)
6259 memzero(q + prev * size, (*allocated - prev) * size);
6264 bool id128_is_valid(const char *s) {
6270 /* Simple formatted 128bit hex string */
6272 for (i = 0; i < l; i++) {
6275 if (!(c >= '0' && c <= '9') &&
6276 !(c >= 'a' && c <= 'z') &&
6277 !(c >= 'A' && c <= 'Z'))
6281 } else if (l == 36) {
6283 /* Formatted UUID */
6285 for (i = 0; i < l; i++) {
6288 if ((i == 8 || i == 13 || i == 18 || i == 23)) {
6292 if (!(c >= '0' && c <= '9') &&
6293 !(c >= 'a' && c <= 'z') &&
6294 !(c >= 'A' && c <= 'Z'))
6305 int split_pair(const char *s, const char *sep, char **l, char **r) {
6320 a = strndup(s, x - s);
6324 b = strdup(x + strlen(sep));
6336 int shall_restore_state(void) {
6337 _cleanup_free_ char *value = NULL;
6340 r = get_proc_cmdline_key("systemd.restore_state=", &value);
6346 return parse_boolean(value) != 0;
6349 int proc_cmdline(char **ret) {
6352 if (detect_container(NULL) > 0)
6353 return get_process_cmdline(1, 0, false, ret);
6355 return read_one_line_file("/proc/cmdline", ret);
6358 int parse_proc_cmdline(int (*parse_item)(const char *key, const char *value)) {
6359 _cleanup_free_ char *line = NULL;
6365 r = proc_cmdline(&line);
6371 _cleanup_free_ char *word = NULL;
6374 r = unquote_first_word(&p, &word, true);
6380 /* Filter out arguments that are intended only for the
6382 if (!in_initrd() && startswith(word, "rd."))
6385 value = strchr(word, '=');
6389 r = parse_item(word, value);
6397 int get_proc_cmdline_key(const char *key, char **value) {
6398 _cleanup_free_ char *line = NULL, *ret = NULL;
6405 r = proc_cmdline(&line);
6411 _cleanup_free_ char *word = NULL;
6414 r = unquote_first_word(&p, &word, true);
6420 /* Filter out arguments that are intended only for the
6422 if (!in_initrd() && startswith(word, "rd."))
6426 e = startswith(word, key);
6430 r = free_and_strdup(&ret, e);
6436 if (streq(word, key))
6450 int container_get_leader(const char *machine, pid_t *pid) {
6451 _cleanup_free_ char *s = NULL, *class = NULL;
6459 p = strjoina("/run/systemd/machines/", machine);
6460 r = parse_env_file(p, NEWLINE, "LEADER", &s, "CLASS", &class, NULL);
6468 if (!streq_ptr(class, "container"))
6471 r = parse_pid(s, &leader);
6481 int namespace_open(pid_t pid, int *pidns_fd, int *mntns_fd, int *netns_fd, int *root_fd) {
6482 _cleanup_close_ int pidnsfd = -1, mntnsfd = -1, netnsfd = -1;
6490 mntns = procfs_file_alloca(pid, "ns/mnt");
6491 mntnsfd = open(mntns, O_RDONLY|O_NOCTTY|O_CLOEXEC);
6499 pidns = procfs_file_alloca(pid, "ns/pid");
6500 pidnsfd = open(pidns, O_RDONLY|O_NOCTTY|O_CLOEXEC);
6508 netns = procfs_file_alloca(pid, "ns/net");
6509 netnsfd = open(netns, O_RDONLY|O_NOCTTY|O_CLOEXEC);
6517 root = procfs_file_alloca(pid, "root");
6518 rfd = open(root, O_RDONLY|O_NOCTTY|O_CLOEXEC|O_DIRECTORY);
6524 *pidns_fd = pidnsfd;
6527 *mntns_fd = mntnsfd;
6530 *netns_fd = netnsfd;
6535 pidnsfd = mntnsfd = netnsfd = -1;
6540 int namespace_enter(int pidns_fd, int mntns_fd, int netns_fd, int root_fd) {
6543 if (setns(pidns_fd, CLONE_NEWPID) < 0)
6547 if (setns(mntns_fd, CLONE_NEWNS) < 0)
6551 if (setns(netns_fd, CLONE_NEWNET) < 0)
6555 if (fchdir(root_fd) < 0)
6558 if (chroot(".") < 0)
6562 if (setresgid(0, 0, 0) < 0)
6565 if (setgroups(0, NULL) < 0)
6568 if (setresuid(0, 0, 0) < 0)
6574 bool pid_is_unwaited(pid_t pid) {
6575 /* Checks whether a PID is still valid at all, including a zombie */
6580 if (kill(pid, 0) >= 0)
6583 return errno != ESRCH;
6586 bool pid_is_alive(pid_t pid) {
6589 /* Checks whether a PID is still valid and not a zombie */
6594 r = get_process_state(pid);
6595 if (r == -ENOENT || r == 'Z')
6601 int getpeercred(int fd, struct ucred *ucred) {
6602 socklen_t n = sizeof(struct ucred);
6609 r = getsockopt(fd, SOL_SOCKET, SO_PEERCRED, &u, &n);
6613 if (n != sizeof(struct ucred))
6616 /* Check if the data is actually useful and not suppressed due
6617 * to namespacing issues */
6620 if (u.uid == UID_INVALID)
6622 if (u.gid == GID_INVALID)
6629 int getpeersec(int fd, char **ret) {
6641 r = getsockopt(fd, SOL_SOCKET, SO_PEERSEC, s, &n);
6645 if (errno != ERANGE)
6652 r = getsockopt(fd, SOL_SOCKET, SO_PEERSEC, s, &n);
6668 /* This is much like like mkostemp() but is subject to umask(). */
6669 int mkostemp_safe(char *pattern, int flags) {
6670 _cleanup_umask_ mode_t u;
6677 fd = mkostemp(pattern, flags);
6684 int open_tmpfile(const char *path, int flags) {
6691 /* Try O_TMPFILE first, if it is supported */
6692 fd = open(path, flags|O_TMPFILE, S_IRUSR|S_IWUSR);
6697 /* Fall back to unguessable name + unlinking */
6698 p = strjoina(path, "/systemd-tmp-XXXXXX");
6700 fd = mkostemp_safe(p, flags);
6708 int fd_warn_permissions(const char *path, int fd) {
6711 if (fstat(fd, &st) < 0)
6714 if (st.st_mode & 0111)
6715 log_warning("Configuration file %s is marked executable. Please remove executable permission bits. Proceeding anyway.", path);
6717 if (st.st_mode & 0002)
6718 log_warning("Configuration file %s is marked world-writable. Please remove world writability permission bits. Proceeding anyway.", path);
6720 if (getpid() == 1 && (st.st_mode & 0044) != 0044)
6721 log_warning("Configuration file %s is marked world-inaccessible. This has no effect as configuration data is accessible via APIs without restrictions. Proceeding anyway.", path);
6726 unsigned long personality_from_string(const char *p) {
6728 /* Parse a personality specifier. We introduce our own
6729 * identifiers that indicate specific ABIs, rather than just
6730 * hints regarding the register size, since we want to keep
6731 * things open for multiple locally supported ABIs for the
6732 * same register size. We try to reuse the ABI identifiers
6733 * used by libseccomp. */
6735 #if defined(__x86_64__)
6737 if (streq(p, "x86"))
6740 if (streq(p, "x86-64"))
6743 #elif defined(__i386__)
6745 if (streq(p, "x86"))
6749 /* personality(7) documents that 0xffffffffUL is used for
6750 * querying the current personality, hence let's use that here
6751 * as error indicator. */
6752 return 0xffffffffUL;
6755 const char* personality_to_string(unsigned long p) {
6757 #if defined(__x86_64__)
6759 if (p == PER_LINUX32)
6765 #elif defined(__i386__)
6774 uint64_t physical_memory(void) {
6777 /* We return this as uint64_t in case we are running as 32bit
6778 * process on a 64bit kernel with huge amounts of memory */
6780 mem = sysconf(_SC_PHYS_PAGES);
6783 return (uint64_t) mem * (uint64_t) page_size();
6786 void hexdump(FILE *f, const void *p, size_t s) {
6787 const uint8_t *b = p;
6790 assert(s == 0 || b);
6795 fprintf(f, "%04x ", n);
6797 for (i = 0; i < 16; i++) {
6802 fprintf(f, "%02x ", b[i]);
6810 for (i = 0; i < 16; i++) {
6815 fputc(isprint(b[i]) ? (char) b[i] : '.', f);
6829 int update_reboot_param_file(const char *param) {
6834 r = write_string_file(REBOOT_PARAM_FILE, param);
6836 log_error("Failed to write reboot param to "
6837 REBOOT_PARAM_FILE": %s", strerror(-r));
6839 unlink(REBOOT_PARAM_FILE);
6844 int umount_recursive(const char *prefix, int flags) {
6848 /* Try to umount everything recursively below a
6849 * directory. Also, take care of stacked mounts, and keep
6850 * unmounting them until they are gone. */
6853 _cleanup_fclose_ FILE *proc_self_mountinfo = NULL;
6858 proc_self_mountinfo = fopen("/proc/self/mountinfo", "re");
6859 if (!proc_self_mountinfo)
6863 _cleanup_free_ char *path = NULL, *p = NULL;
6866 k = fscanf(proc_self_mountinfo,
6867 "%*s " /* (1) mount id */
6868 "%*s " /* (2) parent id */
6869 "%*s " /* (3) major:minor */
6870 "%*s " /* (4) root */
6871 "%ms " /* (5) mount point */
6872 "%*s" /* (6) mount options */
6873 "%*[^-]" /* (7) optional fields */
6874 "- " /* (8) separator */
6875 "%*s " /* (9) file system type */
6876 "%*s" /* (10) mount source */
6877 "%*s" /* (11) mount options 2 */
6878 "%*[^\n]", /* some rubbish at the end */
6887 p = cunescape(path);
6891 if (!path_startswith(p, prefix))
6894 if (umount2(p, flags) < 0) {
6910 static int get_mount_flags(const char *path, unsigned long *flags) {
6913 if (statvfs(path, &buf) < 0)
6915 *flags = buf.f_flag;
6919 int bind_remount_recursive(const char *prefix, bool ro) {
6920 _cleanup_set_free_free_ Set *done = NULL;
6921 _cleanup_free_ char *cleaned = NULL;
6924 /* Recursively remount a directory (and all its submounts)
6925 * read-only or read-write. If the directory is already
6926 * mounted, we reuse the mount and simply mark it
6927 * MS_BIND|MS_RDONLY (or remove the MS_RDONLY for read-write
6928 * operation). If it isn't we first make it one. Afterwards we
6929 * apply MS_BIND|MS_RDONLY (or remove MS_RDONLY) to all
6930 * submounts we can access, too. When mounts are stacked on
6931 * the same mount point we only care for each individual
6932 * "top-level" mount on each point, as we cannot
6933 * influence/access the underlying mounts anyway. We do not
6934 * have any effect on future submounts that might get
6935 * propagated, they migt be writable. This includes future
6936 * submounts that have been triggered via autofs. */
6938 cleaned = strdup(prefix);
6942 path_kill_slashes(cleaned);
6944 done = set_new(&string_hash_ops);
6949 _cleanup_fclose_ FILE *proc_self_mountinfo = NULL;
6950 _cleanup_set_free_free_ Set *todo = NULL;
6951 bool top_autofs = false;
6953 unsigned long orig_flags;
6955 todo = set_new(&string_hash_ops);
6959 proc_self_mountinfo = fopen("/proc/self/mountinfo", "re");
6960 if (!proc_self_mountinfo)
6964 _cleanup_free_ char *path = NULL, *p = NULL, *type = NULL;
6967 k = fscanf(proc_self_mountinfo,
6968 "%*s " /* (1) mount id */
6969 "%*s " /* (2) parent id */
6970 "%*s " /* (3) major:minor */
6971 "%*s " /* (4) root */
6972 "%ms " /* (5) mount point */
6973 "%*s" /* (6) mount options (superblock) */
6974 "%*[^-]" /* (7) optional fields */
6975 "- " /* (8) separator */
6976 "%ms " /* (9) file system type */
6977 "%*s" /* (10) mount source */
6978 "%*s" /* (11) mount options (bind mount) */
6979 "%*[^\n]", /* some rubbish at the end */
6989 p = cunescape(path);
6993 /* Let's ignore autofs mounts. If they aren't
6994 * triggered yet, we want to avoid triggering
6995 * them, as we don't make any guarantees for
6996 * future submounts anyway. If they are
6997 * already triggered, then we will find
6998 * another entry for this. */
6999 if (streq(type, "autofs")) {
7000 top_autofs = top_autofs || path_equal(cleaned, p);
7004 if (path_startswith(p, cleaned) &&
7005 !set_contains(done, p)) {
7007 r = set_consume(todo, p);
7017 /* If we have no submounts to process anymore and if
7018 * the root is either already done, or an autofs, we
7020 if (set_isempty(todo) &&
7021 (top_autofs || set_contains(done, cleaned)))
7024 if (!set_contains(done, cleaned) &&
7025 !set_contains(todo, cleaned)) {
7026 /* The prefix directory itself is not yet a
7027 * mount, make it one. */
7028 if (mount(cleaned, cleaned, NULL, MS_BIND|MS_REC, NULL) < 0)
7032 (void) get_mount_flags(cleaned, &orig_flags);
7033 orig_flags &= ~MS_RDONLY;
7035 if (mount(NULL, prefix, NULL, orig_flags|MS_BIND|MS_REMOUNT|(ro ? MS_RDONLY : 0), NULL) < 0)
7038 x = strdup(cleaned);
7042 r = set_consume(done, x);
7047 while ((x = set_steal_first(todo))) {
7049 r = set_consume(done, x);
7055 /* Try to reuse the original flag set, but
7056 * don't care for errors, in case of
7057 * obstructed mounts */
7059 (void) get_mount_flags(x, &orig_flags);
7060 orig_flags &= ~MS_RDONLY;
7062 if (mount(NULL, x, NULL, orig_flags|MS_BIND|MS_REMOUNT|(ro ? MS_RDONLY : 0), NULL) < 0) {
7064 /* Deal with mount points that are
7065 * obstructed by a later mount */
7067 if (errno != ENOENT)
7075 int fflush_and_check(FILE *f) {
7082 return errno ? -errno : -EIO;
7087 int tempfn_xxxxxx(const char *p, char **ret) {
7099 * /foo/bar/.#waldoXXXXXX
7103 if (!filename_is_valid(fn))
7106 t = new(char, strlen(p) + 2 + 6 + 1);
7110 strcpy(stpcpy(stpcpy(mempcpy(t, p, fn - p), ".#"), fn), "XXXXXX");
7112 *ret = path_kill_slashes(t);
7116 int tempfn_random(const char *p, char **ret) {
7130 * /foo/bar/.#waldobaa2a261115984a9
7134 if (!filename_is_valid(fn))
7137 t = new(char, strlen(p) + 2 + 16 + 1);
7141 x = stpcpy(stpcpy(mempcpy(t, p, fn - p), ".#"), fn);
7144 for (i = 0; i < 16; i++) {
7145 *(x++) = hexchar(u & 0xF);
7151 *ret = path_kill_slashes(t);
7155 int tempfn_random_child(const char *p, char **ret) {
7166 * /foo/bar/waldo/.#3c2b6219aa75d7d0
7169 t = new(char, strlen(p) + 3 + 16 + 1);
7173 x = stpcpy(stpcpy(t, p), "/.#");
7176 for (i = 0; i < 16; i++) {
7177 *(x++) = hexchar(u & 0xF);
7183 *ret = path_kill_slashes(t);
7187 /* make sure the hostname is not "localhost" */
7188 bool is_localhost(const char *hostname) {
7191 /* This tries to identify local host and domain names
7192 * described in RFC6761 plus the redhatism of .localdomain */
7194 return streq(hostname, "localhost") ||
7195 streq(hostname, "localhost.") ||
7196 streq(hostname, "localdomain.") ||
7197 streq(hostname, "localdomain") ||
7198 endswith(hostname, ".localhost") ||
7199 endswith(hostname, ".localhost.") ||
7200 endswith(hostname, ".localdomain") ||
7201 endswith(hostname, ".localdomain.");
7204 int take_password_lock(const char *root) {
7206 struct flock flock = {
7208 .l_whence = SEEK_SET,
7216 /* This is roughly the same as lckpwdf(), but not as awful. We
7217 * don't want to use alarm() and signals, hence we implement
7218 * our own trivial version of this.
7220 * Note that shadow-utils also takes per-database locks in
7221 * addition to lckpwdf(). However, we don't given that they
7222 * are redundant as they they invoke lckpwdf() first and keep
7223 * it during everything they do. The per-database locks are
7224 * awfully racy, and thus we just won't do them. */
7227 path = strjoina(root, "/etc/.pwd.lock");
7229 path = "/etc/.pwd.lock";
7231 fd = open(path, O_WRONLY|O_CREAT|O_CLOEXEC|O_NOCTTY|O_NOFOLLOW, 0600);
7235 r = fcntl(fd, F_SETLKW, &flock);
7244 int is_symlink(const char *path) {
7247 if (lstat(path, &info) < 0)
7250 return !!S_ISLNK(info.st_mode);
7253 int is_dir(const char* path, bool follow) {
7258 r = stat(path, &st);
7260 r = lstat(path, &st);
7264 return !!S_ISDIR(st.st_mode);
7267 int unquote_first_word(const char **p, char **ret, bool relax) {
7268 _cleanup_free_ char *s = NULL;
7269 size_t allocated = 0, sz = 0;
7276 SINGLE_QUOTE_ESCAPE,
7278 DOUBLE_QUOTE_ESCAPE,
7286 /* Parses the first word of a string, and returns it in
7287 * *ret. Removes all quotes in the process. When parsing fails
7288 * (because of an uneven number of quotes or similar), leaves
7289 * the pointer *p at the first invalid character. */
7299 else if (strchr(WHITESPACE, c))
7309 state = SINGLE_QUOTE;
7311 state = VALUE_ESCAPE;
7313 state = DOUBLE_QUOTE;
7314 else if (strchr(WHITESPACE, c))
7317 if (!GREEDY_REALLOC(s, allocated, sz+2))
7332 if (!GREEDY_REALLOC(s, allocated, sz+2))
7345 } else if (c == '\'')
7348 state = SINGLE_QUOTE_ESCAPE;
7350 if (!GREEDY_REALLOC(s, allocated, sz+2))
7358 case SINGLE_QUOTE_ESCAPE:
7365 if (!GREEDY_REALLOC(s, allocated, sz+2))
7369 state = SINGLE_QUOTE;
7378 state = DOUBLE_QUOTE_ESCAPE;
7380 if (!GREEDY_REALLOC(s, allocated, sz+2))
7388 case DOUBLE_QUOTE_ESCAPE:
7395 if (!GREEDY_REALLOC(s, allocated, sz+2))
7399 state = DOUBLE_QUOTE;
7405 if (!strchr(WHITESPACE, c))
7427 int unquote_many_words(const char **p, ...) {
7432 /* Parses a number of words from a string, stripping any
7433 * quotes if necessary. */
7437 /* Count how many words are expected */
7440 if (!va_arg(ap, char **))
7449 /* Read all words into a temporary array */
7450 l = newa0(char*, n);
7451 for (c = 0; c < n; c++) {
7453 r = unquote_first_word(p, &l[c], false);
7457 for (j = 0; j < c; j++)
7467 /* If we managed to parse all words, return them in the passed
7470 for (i = 0; i < n; i++) {
7473 v = va_arg(ap, char **);
7483 int free_and_strdup(char **p, const char *s) {
7488 /* Replaces a string pointer with an strdup()ed new string,
7489 * possibly freeing the old one. */
7504 int sethostname_idempotent(const char *s) {
7506 char buf[HOST_NAME_MAX + 1] = {};
7510 r = gethostname(buf, sizeof(buf));
7517 r = sethostname(s, strlen(s));
7524 int ptsname_malloc(int fd, char **ret) {
7537 if (ptsname_r(fd, c, l) == 0) {
7541 if (errno != ERANGE) {
7551 int openpt_in_namespace(pid_t pid, int flags) {
7552 _cleanup_close_ int pidnsfd = -1, mntnsfd = -1, rootfd = -1;
7553 _cleanup_close_pair_ int pair[2] = { -1, -1 };
7555 struct cmsghdr cmsghdr;
7556 uint8_t buf[CMSG_SPACE(sizeof(int))];
7558 struct msghdr mh = {
7559 .msg_control = &control,
7560 .msg_controllen = sizeof(control),
7562 struct cmsghdr *cmsg;
7569 r = namespace_open(pid, &pidnsfd, &mntnsfd, NULL, &rootfd);
7573 if (socketpair(AF_UNIX, SOCK_DGRAM, 0, pair) < 0)
7583 pair[0] = safe_close(pair[0]);
7585 r = namespace_enter(pidnsfd, mntnsfd, -1, rootfd);
7587 _exit(EXIT_FAILURE);
7589 master = posix_openpt(flags);
7591 _exit(EXIT_FAILURE);
7593 cmsg = CMSG_FIRSTHDR(&mh);
7594 cmsg->cmsg_level = SOL_SOCKET;
7595 cmsg->cmsg_type = SCM_RIGHTS;
7596 cmsg->cmsg_len = CMSG_LEN(sizeof(int));
7597 memcpy(CMSG_DATA(cmsg), &master, sizeof(int));
7599 mh.msg_controllen = cmsg->cmsg_len;
7601 if (sendmsg(pair[1], &mh, MSG_NOSIGNAL) < 0)
7602 _exit(EXIT_FAILURE);
7604 _exit(EXIT_SUCCESS);
7607 pair[1] = safe_close(pair[1]);
7609 r = wait_for_terminate(child, &si);
7612 if (si.si_code != CLD_EXITED || si.si_status != EXIT_SUCCESS)
7615 if (recvmsg(pair[0], &mh, MSG_NOSIGNAL|MSG_CMSG_CLOEXEC) < 0)
7618 for (cmsg = CMSG_FIRSTHDR(&mh); cmsg; cmsg = CMSG_NXTHDR(&mh, cmsg))
7619 if (cmsg->cmsg_level == SOL_SOCKET && cmsg->cmsg_type == SCM_RIGHTS) {
7623 fds = (int*) CMSG_DATA(cmsg);
7624 n_fds = (cmsg->cmsg_len - CMSG_LEN(0)) / sizeof(int);
7627 close_many(fds, n_fds);
7637 ssize_t fgetxattrat_fake(int dirfd, const char *filename, const char *attribute, void *value, size_t size, int flags) {
7638 _cleanup_close_ int fd = -1;
7641 /* The kernel doesn't have a fgetxattrat() command, hence let's emulate one */
7643 fd = openat(dirfd, filename, O_RDONLY|O_CLOEXEC|O_NOCTTY|O_NOATIME|(flags & AT_SYMLINK_NOFOLLOW ? O_NOFOLLOW : 0));
7647 l = fgetxattr(fd, attribute, value, size);
7654 static int parse_crtime(le64_t le, usec_t *usec) {
7660 if (u == 0 || u == (uint64_t) -1)
7667 int fd_getcrtime(int fd, usec_t *usec) {
7674 /* Until Linux gets a real concept of birthtime/creation time,
7675 * let's fake one with xattrs */
7677 n = fgetxattr(fd, "user.crtime_usec", &le, sizeof(le));
7680 if (n != sizeof(le))
7683 return parse_crtime(le, usec);
7686 int fd_getcrtime_at(int dirfd, const char *name, usec_t *usec, int flags) {
7690 n = fgetxattrat_fake(dirfd, name, "user.crtime_usec", &le, sizeof(le), flags);
7693 if (n != sizeof(le))
7696 return parse_crtime(le, usec);
7699 int path_getcrtime(const char *p, usec_t *usec) {
7706 n = getxattr(p, "user.crtime_usec", &le, sizeof(le));
7709 if (n != sizeof(le))
7712 return parse_crtime(le, usec);
7715 int fd_setcrtime(int fd, usec_t usec) {
7721 usec = now(CLOCK_REALTIME);
7723 le = htole64((uint64_t) usec);
7724 if (fsetxattr(fd, "user.crtime_usec", &le, sizeof(le), 0) < 0)
7730 int same_fd(int a, int b) {
7731 struct stat sta, stb;
7738 /* Compares two file descriptors. Note that semantics are
7739 * quite different depending on whether we have kcmp() or we
7740 * don't. If we have kcmp() this will only return true for
7741 * dup()ed file descriptors, but not otherwise. If we don't
7742 * have kcmp() this will also return true for two fds of the same
7743 * file, created by separate open() calls. Since we use this
7744 * call mostly for filtering out duplicates in the fd store
7745 * this difference hopefully doesn't matter too much. */
7750 /* Try to use kcmp() if we have it. */
7752 r = kcmp(pid, pid, KCMP_FILE, a, b);
7757 if (errno != ENOSYS)
7760 /* We don't have kcmp(), use fstat() instead. */
7761 if (fstat(a, &sta) < 0)
7764 if (fstat(b, &stb) < 0)
7767 if ((sta.st_mode & S_IFMT) != (stb.st_mode & S_IFMT))
7770 /* We consider all device fds different, since two device fds
7771 * might refer to quite different device contexts even though
7772 * they share the same inode and backing dev_t. */
7774 if (S_ISCHR(sta.st_mode) || S_ISBLK(sta.st_mode))
7777 if (sta.st_dev != stb.st_dev || sta.st_ino != stb.st_ino)
7780 /* The fds refer to the same inode on disk, let's also check
7781 * if they have the same fd flags. This is useful to
7782 * distuingish the read and write side of a pipe created with
7784 fa = fcntl(a, F_GETFL);
7788 fb = fcntl(b, F_GETFL);
7795 int chattr_fd(int fd, bool b, unsigned mask) {
7796 unsigned old_attr, new_attr;
7803 if (ioctl(fd, FS_IOC_GETFLAGS, &old_attr) < 0)
7807 new_attr = old_attr | mask;
7809 new_attr = old_attr & ~mask;
7811 if (new_attr == old_attr)
7814 if (ioctl(fd, FS_IOC_SETFLAGS, &new_attr) < 0)
7820 int chattr_path(const char *p, bool b, unsigned mask) {
7821 _cleanup_close_ int fd = -1;
7828 fd = open(p, O_RDONLY|O_CLOEXEC|O_NOCTTY|O_NOFOLLOW);
7832 return chattr_fd(fd, b, mask);
7835 int read_attr_fd(int fd, unsigned *ret) {
7838 if (ioctl(fd, FS_IOC_GETFLAGS, ret) < 0)
7844 int read_attr_path(const char *p, unsigned *ret) {
7845 _cleanup_close_ int fd = -1;
7850 fd = open(p, O_RDONLY|O_CLOEXEC|O_NOCTTY|O_NOFOLLOW);
7854 return read_attr_fd(fd, ret);
7857 int make_lock_file(const char *p, int operation, LockFile *ret) {
7858 _cleanup_close_ int fd = -1;
7859 _cleanup_free_ char *t = NULL;
7863 * We use UNPOSIX locks if they are available. They have nice
7864 * semantics, and are mostly compatible with NFS. However,
7865 * they are only available on new kernels. When we detect we
7866 * are running on an older kernel, then we fall back to good
7867 * old BSD locks. They also have nice semantics, but are
7868 * slightly problematic on NFS, where they are upgraded to
7869 * POSIX locks, even though locally they are orthogonal to
7879 .l_type = (operation & ~LOCK_NB) == LOCK_EX ? F_WRLCK : F_RDLCK,
7880 .l_whence = SEEK_SET,
7884 fd = open(p, O_CREAT|O_RDWR|O_NOFOLLOW|O_CLOEXEC|O_NOCTTY, 0600);
7888 r = fcntl(fd, (operation & LOCK_NB) ? F_OFD_SETLK : F_OFD_SETLKW, &fl);
7891 /* If the kernel is too old, use good old BSD locks */
7892 if (errno == EINVAL)
7893 r = flock(fd, operation);
7896 return errno == EAGAIN ? -EBUSY : -errno;
7899 /* If we acquired the lock, let's check if the file
7900 * still exists in the file system. If not, then the
7901 * previous exclusive owner removed it and then closed
7902 * it. In such a case our acquired lock is worthless,
7903 * hence try again. */
7908 if (st.st_nlink > 0)
7911 fd = safe_close(fd);
7916 ret->operation = operation;
7924 int make_lock_file_for(const char *p, int operation, LockFile *ret) {
7932 if (!filename_is_valid(fn))
7935 t = newa(char, strlen(p) + 2 + 4 + 1);
7936 stpcpy(stpcpy(stpcpy(mempcpy(t, p, fn - p), ".#"), fn), ".lck");
7938 return make_lock_file(t, operation, ret);
7941 void release_lock_file(LockFile *f) {
7949 /* If we are the exclusive owner we can safely delete
7950 * the lock file itself. If we are not the exclusive
7951 * owner, we can try becoming it. */
7954 (f->operation & ~LOCK_NB) == LOCK_SH) {
7955 static const struct flock fl = {
7957 .l_whence = SEEK_SET,
7960 r = fcntl(f->fd, F_OFD_SETLK, &fl);
7961 if (r < 0 && errno == EINVAL)
7962 r = flock(f->fd, LOCK_EX|LOCK_NB);
7965 f->operation = LOCK_EX|LOCK_NB;
7968 if ((f->operation & ~LOCK_NB) == LOCK_EX)
7969 unlink_noerrno(f->path);
7975 f->fd = safe_close(f->fd);
7979 static size_t nul_length(const uint8_t *p, size_t sz) {
7994 ssize_t sparse_write(int fd, const void *p, size_t sz, size_t run_length) {
7995 const uint8_t *q, *w, *e;
8003 n = nul_length(q, e - q);
8005 /* If there are more than the specified run length of
8006 * NUL bytes, or if this is the beginning or the end
8007 * of the buffer, then seek instead of write */
8008 if ((n > run_length) ||
8009 (n > 0 && q == p) ||
8010 (n > 0 && q + n >= e)) {
8012 l = write(fd, w, q - w);
8019 if (lseek(fd, n, SEEK_CUR) == (off_t) -1)
8031 l = write(fd, w, q - w);
8038 return q - (const uint8_t*) p;
8041 void sigkill_wait(pid_t *pid) {
8047 if (kill(*pid, SIGKILL) > 0)
8048 (void) wait_for_terminate(*pid, NULL);
8051 int syslog_parse_priority(const char **p, int *priority, bool with_facility) {
8052 int a = 0, b = 0, c = 0;
8062 if (!strchr(*p, '>'))
8065 if ((*p)[2] == '>') {
8066 c = undecchar((*p)[1]);
8068 } else if ((*p)[3] == '>') {
8069 b = undecchar((*p)[1]);
8070 c = undecchar((*p)[2]);
8072 } else if ((*p)[4] == '>') {
8073 a = undecchar((*p)[1]);
8074 b = undecchar((*p)[2]);
8075 c = undecchar((*p)[3]);
8080 if (a < 0 || b < 0 || c < 0 ||
8081 (!with_facility && (a || b || c > 7)))
8085 *priority = a*100 + b*10 + c;
8087 *priority = (*priority & LOG_FACMASK) | c;
8093 ssize_t string_table_lookup(const char * const *table, size_t len, const char *key) {
8099 for (i = 0; i < len; ++i)
8100 if (streq_ptr(table[i], key))