1 /*-*- Mode: C; c-basic-offset: 8; indent-tabs-mode: nil -*-*/
4 This file is part of systemd.
6 Copyright 2010 Lennart Poettering
8 systemd is free software; you can redistribute it and/or modify it
9 under the terms of the GNU Lesser General Public License as published by
10 the Free Software Foundation; either version 2.1 of the License, or
11 (at your option) any later version.
13 systemd is distributed in the hope that it will be useful, but
14 WITHOUT ANY WARRANTY; without even the implied warranty of
15 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
16 Lesser General Public License for more details.
18 You should have received a copy of the GNU Lesser General Public License
19 along with systemd; If not, see <http://www.gnu.org/licenses/>.
31 #include <sys/resource.h>
32 #include <linux/sched.h>
33 #include <sys/types.h>
37 #include <sys/ioctl.h>
39 #include <linux/tiocl.h>
44 #include <sys/prctl.h>
45 #include <sys/utsname.h>
47 #include <netinet/ip.h>
55 #include <sys/mount.h>
56 #include <linux/magic.h>
60 #include <sys/personality.h>
61 #include <sys/xattr.h>
62 #include <sys/statvfs.h>
66 /* When we include libgen.h because we need dirname() we immediately
67 * undefine basename() since libgen.h defines it as a macro to the XDG
68 * version which is really broken. */
72 #ifdef HAVE_SYS_AUXV_H
84 #include "path-util.h"
85 #include "exit-status.h"
89 #include "device-nodes.h"
94 #include "sparse-endian.h"
95 #include "formats-util.h"
97 /* Put this test here for a lack of better place */
98 assert_cc(EAGAIN == EWOULDBLOCK);
101 char **saved_argv = NULL;
103 static volatile unsigned cached_columns = 0;
104 static volatile unsigned cached_lines = 0;
106 size_t page_size(void) {
107 static thread_local size_t pgsz = 0;
110 if (_likely_(pgsz > 0))
113 r = sysconf(_SC_PAGESIZE);
120 bool streq_ptr(const char *a, const char *b) {
122 /* Like streq(), but tries to make sense of NULL pointers */
133 char* endswith(const char *s, const char *postfix) {
140 pl = strlen(postfix);
143 return (char*) s + sl;
148 if (memcmp(s + sl - pl, postfix, pl) != 0)
151 return (char*) s + sl - pl;
154 char* first_word(const char *s, const char *word) {
161 /* Checks if the string starts with the specified word, either
162 * followed by NUL or by whitespace. Returns a pointer to the
163 * NUL or the first character after the whitespace. */
174 if (memcmp(s, word, wl) != 0)
181 if (!strchr(WHITESPACE, *p))
184 p += strspn(p, WHITESPACE);
188 static size_t cescape_char(char c, char *buf) {
189 char * buf_old = buf;
235 /* For special chars we prefer octal over
236 * hexadecimal encoding, simply because glib's
237 * g_strescape() does the same */
238 if ((c < ' ') || (c >= 127)) {
240 *(buf++) = octchar((unsigned char) c >> 6);
241 *(buf++) = octchar((unsigned char) c >> 3);
242 *(buf++) = octchar((unsigned char) c);
248 return buf - buf_old;
251 int close_nointr(int fd) {
258 * Just ignore EINTR; a retry loop is the wrong thing to do on
261 * http://lkml.indiana.edu/hypermail/linux/kernel/0509.1/0877.html
262 * https://bugzilla.gnome.org/show_bug.cgi?id=682819
263 * http://utcc.utoronto.ca/~cks/space/blog/unix/CloseEINTR
264 * https://sites.google.com/site/michaelsafyan/software-engineering/checkforeintrwheninvokingclosethinkagain
272 int safe_close(int fd) {
275 * Like close_nointr() but cannot fail. Guarantees errno is
276 * unchanged. Is a NOP with negative fds passed, and returns
277 * -1, so that it can be used in this syntax:
279 * fd = safe_close(fd);
285 /* The kernel might return pretty much any error code
286 * via close(), but the fd will be closed anyway. The
287 * only condition we want to check for here is whether
288 * the fd was invalid at all... */
290 assert_se(close_nointr(fd) != -EBADF);
296 void close_many(const int fds[], unsigned n_fd) {
299 assert(fds || n_fd <= 0);
301 for (i = 0; i < n_fd; i++)
305 int unlink_noerrno(const char *path) {
316 int parse_boolean(const char *v) {
319 if (streq(v, "1") || strcaseeq(v, "yes") || strcaseeq(v, "y") || strcaseeq(v, "true") || strcaseeq(v, "t") || strcaseeq(v, "on"))
321 else if (streq(v, "0") || strcaseeq(v, "no") || strcaseeq(v, "n") || strcaseeq(v, "false") || strcaseeq(v, "f") || strcaseeq(v, "off"))
327 int parse_pid(const char *s, pid_t* ret_pid) {
328 unsigned long ul = 0;
335 r = safe_atolu(s, &ul);
341 if ((unsigned long) pid != ul)
351 int parse_uid(const char *s, uid_t* ret_uid) {
352 unsigned long ul = 0;
359 r = safe_atolu(s, &ul);
365 if ((unsigned long) uid != ul)
368 /* Some libc APIs use UID_INVALID as special placeholder */
369 if (uid == (uid_t) 0xFFFFFFFF)
372 /* A long time ago UIDs were 16bit, hence explicitly avoid the 16bit -1 too */
373 if (uid == (uid_t) 0xFFFF)
380 int safe_atou(const char *s, unsigned *ret_u) {
388 l = strtoul(s, &x, 0);
390 if (!x || x == s || *x || errno)
391 return errno > 0 ? -errno : -EINVAL;
393 if ((unsigned long) (unsigned) l != l)
396 *ret_u = (unsigned) l;
400 int safe_atoi(const char *s, int *ret_i) {
408 l = strtol(s, &x, 0);
410 if (!x || x == s || *x || errno)
411 return errno > 0 ? -errno : -EINVAL;
413 if ((long) (int) l != l)
420 int safe_atou8(const char *s, uint8_t *ret) {
428 l = strtoul(s, &x, 0);
430 if (!x || x == s || *x || errno)
431 return errno > 0 ? -errno : -EINVAL;
433 if ((unsigned long) (uint8_t) l != l)
440 int safe_atou16(const char *s, uint16_t *ret) {
448 l = strtoul(s, &x, 0);
450 if (!x || x == s || *x || errno)
451 return errno > 0 ? -errno : -EINVAL;
453 if ((unsigned long) (uint16_t) l != l)
460 int safe_atoi16(const char *s, int16_t *ret) {
468 l = strtol(s, &x, 0);
470 if (!x || x == s || *x || errno)
471 return errno > 0 ? -errno : -EINVAL;
473 if ((long) (int16_t) l != l)
480 int safe_atollu(const char *s, long long unsigned *ret_llu) {
482 unsigned long long l;
488 l = strtoull(s, &x, 0);
490 if (!x || x == s || *x || errno)
491 return errno ? -errno : -EINVAL;
497 int safe_atolli(const char *s, long long int *ret_lli) {
505 l = strtoll(s, &x, 0);
507 if (!x || x == s || *x || errno)
508 return errno ? -errno : -EINVAL;
514 int safe_atod(const char *s, double *ret_d) {
522 loc = newlocale(LC_NUMERIC_MASK, "C", (locale_t) 0);
523 if (loc == (locale_t) 0)
527 d = strtod_l(s, &x, loc);
529 if (!x || x == s || *x || errno) {
531 return errno ? -errno : -EINVAL;
539 static size_t strcspn_escaped(const char *s, const char *reject) {
540 bool escaped = false;
543 for (n=0; s[n]; n++) {
546 else if (s[n] == '\\')
548 else if (strchr(reject, s[n]))
552 /* if s ends in \, return index of previous char */
556 /* Split a string into words. */
557 const char* split(const char **state, size_t *l, const char *separator, bool quoted) {
563 assert(**state == '\0');
567 current += strspn(current, separator);
573 if (quoted && strchr("\'\"", *current)) {
574 char quotechars[2] = {*current, '\0'};
576 *l = strcspn_escaped(current + 1, quotechars);
577 if (current[*l + 1] == '\0' ||
578 (current[*l + 2] && !strchr(separator, current[*l + 2]))) {
579 /* right quote missing or garbage at the end */
583 assert(current[*l + 1] == quotechars[0]);
584 *state = current++ + *l + 2;
586 *l = strcspn_escaped(current, separator);
587 if (current[*l] && !strchr(separator, current[*l])) {
588 /* unfinished escape */
592 *state = current + *l;
594 *l = strcspn(current, separator);
595 *state = current + *l;
601 int get_parent_of_pid(pid_t pid, pid_t *_ppid) {
603 _cleanup_free_ char *line = NULL;
615 p = procfs_file_alloca(pid, "stat");
616 r = read_one_line_file(p, &line);
620 /* Let's skip the pid and comm fields. The latter is enclosed
621 * in () but does not escape any () in its value, so let's
622 * skip over it manually */
624 p = strrchr(line, ')');
636 if ((long unsigned) (pid_t) ppid != ppid)
639 *_ppid = (pid_t) ppid;
644 int fchmod_umask(int fd, mode_t m) {
649 r = fchmod(fd, m & (~u)) < 0 ? -errno : 0;
655 char *truncate_nl(char *s) {
658 s[strcspn(s, NEWLINE)] = 0;
662 int get_process_state(pid_t pid) {
666 _cleanup_free_ char *line = NULL;
670 p = procfs_file_alloca(pid, "stat");
671 r = read_one_line_file(p, &line);
675 p = strrchr(line, ')');
681 if (sscanf(p, " %c", &state) != 1)
684 return (unsigned char) state;
687 int get_process_comm(pid_t pid, char **name) {
694 p = procfs_file_alloca(pid, "comm");
696 r = read_one_line_file(p, name);
703 int get_process_cmdline(pid_t pid, size_t max_length, bool comm_fallback, char **line) {
704 _cleanup_fclose_ FILE *f = NULL;
712 p = procfs_file_alloca(pid, "cmdline");
718 if (max_length == 0) {
719 size_t len = 0, allocated = 0;
721 while ((c = getc(f)) != EOF) {
723 if (!GREEDY_REALLOC(r, allocated, len+2)) {
728 r[len++] = isprint(c) ? c : ' ';
738 r = new(char, max_length);
744 while ((c = getc(f)) != EOF) {
766 size_t n = MIN(left-1, 3U);
773 /* Kernel threads have no argv[] */
775 _cleanup_free_ char *t = NULL;
783 h = get_process_comm(pid, &t);
787 r = strjoin("[", t, "]", NULL);
796 int is_kernel_thread(pid_t pid) {
808 p = procfs_file_alloca(pid, "cmdline");
813 count = fread(&c, 1, 1, f);
817 /* Kernel threads have an empty cmdline */
820 return eof ? 1 : -errno;
825 int get_process_capeff(pid_t pid, char **capeff) {
831 p = procfs_file_alloca(pid, "status");
833 return get_status_field(p, "\nCapEff:", capeff);
836 static int get_process_link_contents(const char *proc_file, char **name) {
842 r = readlink_malloc(proc_file, name);
844 return r == -ENOENT ? -ESRCH : r;
849 int get_process_exe(pid_t pid, char **name) {
856 p = procfs_file_alloca(pid, "exe");
857 r = get_process_link_contents(p, name);
861 d = endswith(*name, " (deleted)");
868 static int get_process_id(pid_t pid, const char *field, uid_t *uid) {
869 _cleanup_fclose_ FILE *f = NULL;
879 p = procfs_file_alloca(pid, "status");
884 FOREACH_LINE(line, f, return -errno) {
889 if (startswith(l, field)) {
891 l += strspn(l, WHITESPACE);
893 l[strcspn(l, WHITESPACE)] = 0;
895 return parse_uid(l, uid);
902 int get_process_uid(pid_t pid, uid_t *uid) {
903 return get_process_id(pid, "Uid:", uid);
906 int get_process_gid(pid_t pid, gid_t *gid) {
907 assert_cc(sizeof(uid_t) == sizeof(gid_t));
908 return get_process_id(pid, "Gid:", gid);
911 int get_process_cwd(pid_t pid, char **cwd) {
916 p = procfs_file_alloca(pid, "cwd");
918 return get_process_link_contents(p, cwd);
921 int get_process_root(pid_t pid, char **root) {
926 p = procfs_file_alloca(pid, "root");
928 return get_process_link_contents(p, root);
931 int get_process_environ(pid_t pid, char **env) {
932 _cleanup_fclose_ FILE *f = NULL;
933 _cleanup_free_ char *outcome = NULL;
936 size_t allocated = 0, sz = 0;
941 p = procfs_file_alloca(pid, "environ");
947 while ((c = fgetc(f)) != EOF) {
948 if (!GREEDY_REALLOC(outcome, allocated, sz + 5))
952 outcome[sz++] = '\n';
954 sz += cescape_char(c, outcome + sz);
964 char *strnappend(const char *s, const char *suffix, size_t b) {
972 return strndup(suffix, b);
981 if (b > ((size_t) -1) - a)
984 r = new(char, a+b+1);
989 memcpy(r+a, suffix, b);
995 char *strappend(const char *s, const char *suffix) {
996 return strnappend(s, suffix, suffix ? strlen(suffix) : 0);
999 int readlinkat_malloc(int fd, const char *p, char **ret) {
1014 n = readlinkat(fd, p, c, l-1);
1021 if ((size_t) n < l-1) {
1032 int readlink_malloc(const char *p, char **ret) {
1033 return readlinkat_malloc(AT_FDCWD, p, ret);
1036 int readlink_value(const char *p, char **ret) {
1037 _cleanup_free_ char *link = NULL;
1041 r = readlink_malloc(p, &link);
1045 value = basename(link);
1049 value = strdup(value);
1058 int readlink_and_make_absolute(const char *p, char **r) {
1059 _cleanup_free_ char *target = NULL;
1066 j = readlink_malloc(p, &target);
1070 k = file_in_same_dir(p, target);
1078 int readlink_and_canonicalize(const char *p, char **r) {
1085 j = readlink_and_make_absolute(p, &t);
1089 s = canonicalize_file_name(t);
1096 path_kill_slashes(*r);
1101 int reset_all_signal_handlers(void) {
1104 for (sig = 1; sig < _NSIG; sig++) {
1105 struct sigaction sa = {
1106 .sa_handler = SIG_DFL,
1107 .sa_flags = SA_RESTART,
1110 /* These two cannot be caught... */
1111 if (sig == SIGKILL || sig == SIGSTOP)
1114 /* On Linux the first two RT signals are reserved by
1115 * glibc, and sigaction() will return EINVAL for them. */
1116 if ((sigaction(sig, &sa, NULL) < 0))
1117 if (errno != EINVAL && r == 0)
1124 int reset_signal_mask(void) {
1127 if (sigemptyset(&ss) < 0)
1130 if (sigprocmask(SIG_SETMASK, &ss, NULL) < 0)
1136 char *strstrip(char *s) {
1139 /* Drops leading and trailing whitespace. Modifies the string in
1140 * place. Returns pointer to first non-space character */
1142 s += strspn(s, WHITESPACE);
1144 for (e = strchr(s, 0); e > s; e --)
1145 if (!strchr(WHITESPACE, e[-1]))
1153 char *delete_chars(char *s, const char *bad) {
1156 /* Drops all characters listed in bad, regardless of where in the string */
1158 for (f = s, t = s; *f; f++) {
1159 if (strchr(bad, *f))
1170 char *file_in_same_dir(const char *path, const char *filename) {
1177 /* This removes the last component of path and appends
1178 * filename, unless the latter is absolute anyway or the
1181 if (path_is_absolute(filename))
1182 return strdup(filename);
1184 e = strrchr(path, '/');
1186 return strdup(filename);
1188 k = strlen(filename);
1189 ret = new(char, (e + 1 - path) + k + 1);
1193 memcpy(mempcpy(ret, path, e + 1 - path), filename, k + 1);
1197 int rmdir_parents(const char *path, const char *stop) {
1206 /* Skip trailing slashes */
1207 while (l > 0 && path[l-1] == '/')
1213 /* Skip last component */
1214 while (l > 0 && path[l-1] != '/')
1217 /* Skip trailing slashes */
1218 while (l > 0 && path[l-1] == '/')
1224 if (!(t = strndup(path, l)))
1227 if (path_startswith(stop, t)) {
1236 if (errno != ENOENT)
1243 char hexchar(int x) {
1244 static const char table[16] = "0123456789abcdef";
1246 return table[x & 15];
1249 int unhexchar(char c) {
1251 if (c >= '0' && c <= '9')
1254 if (c >= 'a' && c <= 'f')
1255 return c - 'a' + 10;
1257 if (c >= 'A' && c <= 'F')
1258 return c - 'A' + 10;
1263 char *hexmem(const void *p, size_t l) {
1267 z = r = malloc(l * 2 + 1);
1271 for (x = p; x < (const uint8_t*) p + l; x++) {
1272 *(z++) = hexchar(*x >> 4);
1273 *(z++) = hexchar(*x & 15);
1280 void *unhexmem(const char *p, size_t l) {
1286 z = r = malloc((l + 1) / 2 + 1);
1290 for (x = p; x < p + l; x += 2) {
1293 a = unhexchar(x[0]);
1295 b = unhexchar(x[1]);
1299 *(z++) = (uint8_t) a << 4 | (uint8_t) b;
1306 char octchar(int x) {
1307 return '0' + (x & 7);
1310 int unoctchar(char c) {
1312 if (c >= '0' && c <= '7')
1318 char decchar(int x) {
1319 return '0' + (x % 10);
1322 int undecchar(char c) {
1324 if (c >= '0' && c <= '9')
1330 char *cescape(const char *s) {
1336 /* Does C style string escaping. May be reversed with
1339 r = new(char, strlen(s)*4 + 1);
1343 for (f = s, t = r; *f; f++)
1344 t += cescape_char(*f, t);
1351 static int cunescape_one(const char *p, size_t length, char *ret, uint32_t *ret_unicode) {
1358 /* Unescapes C style. Returns the unescaped character in ret,
1359 * unless we encountered a \u sequence in which case the full
1360 * unicode character is returned in ret_unicode, instead. */
1362 if (length != (size_t) -1 && length < 1)
1399 /* This is an extension of the XDG syntax files */
1404 /* hexadecimal encoding */
1407 if (length != (size_t) -1 && length < 3)
1410 a = unhexchar(p[1]);
1414 b = unhexchar(p[2]);
1418 /* Don't allow NUL bytes */
1419 if (a == 0 && b == 0)
1422 *ret = (char) ((a << 4U) | b);
1428 /* C++11 style 16bit unicode */
1434 if (length != (size_t) -1 && length < 5)
1437 for (i = 0; i < 4; i++) {
1438 a[i] = unhexchar(p[1 + i]);
1443 c = ((uint32_t) a[0] << 12U) | ((uint32_t) a[1] << 8U) | ((uint32_t) a[2] << 4U) | (uint32_t) a[3];
1445 /* Don't allow 0 chars */
1464 /* C++11 style 32bit unicode */
1470 if (length != (size_t) -1 && length < 9)
1473 for (i = 0; i < 8; i++) {
1474 a[i] = unhexchar(p[1 + i]);
1479 c = ((uint32_t) a[0] << 28U) | ((uint32_t) a[1] << 24U) | ((uint32_t) a[2] << 20U) | ((uint32_t) a[3] << 16U) |
1480 ((uint32_t) a[4] << 12U) | ((uint32_t) a[5] << 8U) | ((uint32_t) a[6] << 4U) | (uint32_t) a[7];
1482 /* Don't allow 0 chars */
1486 /* Don't allow invalid code points */
1487 if (!unichar_is_valid(c))
1512 /* octal encoding */
1516 if (length != (size_t) -1 && length < 4)
1519 a = unoctchar(p[0]);
1523 b = unoctchar(p[1]);
1527 c = unoctchar(p[2]);
1531 /* don't allow NUL bytes */
1532 if (a == 0 && b == 0 && c == 0)
1535 /* Don't allow bytes above 255 */
1536 m = ((uint32_t) a << 6U) | ((uint32_t) b << 3U) | (uint32_t) c;
1552 int cunescape_length_with_prefix(const char *s, size_t length, const char *prefix, UnescapeFlags flags, char **ret) {
1560 /* Undoes C style string escaping, and optionally prefixes it. */
1562 pl = prefix ? strlen(prefix) : 0;
1564 r = new(char, pl+length+1);
1569 memcpy(r, prefix, pl);
1571 for (f = s, t = r + pl; f < s + length; f++) {
1577 remaining = s + length - f;
1578 assert(remaining > 0);
1581 /* A literal character, copy verbatim */
1586 if (remaining == 1) {
1587 if (flags & UNESCAPE_RELAX) {
1588 /* A trailing backslash, copy verbatim */
1597 k = cunescape_one(f + 1, remaining - 1, &c, &u);
1599 if (flags & UNESCAPE_RELAX) {
1600 /* Invalid escape code, let's take it literal then */
1610 /* Non-Unicode? Let's encode this directly */
1613 /* Unicode? Then let's encode this in UTF-8 */
1614 t += utf8_encode_unichar(t, u);
1625 int cunescape_length(const char *s, size_t length, UnescapeFlags flags, char **ret) {
1626 return cunescape_length_with_prefix(s, length, NULL, flags, ret);
1629 int cunescape(const char *s, UnescapeFlags flags, char **ret) {
1630 return cunescape_length(s, strlen(s), flags, ret);
1633 char *xescape(const char *s, const char *bad) {
1637 /* Escapes all chars in bad, in addition to \ and all special
1638 * chars, in \xFF style escaping. May be reversed with
1641 r = new(char, strlen(s) * 4 + 1);
1645 for (f = s, t = r; *f; f++) {
1647 if ((*f < ' ') || (*f >= 127) ||
1648 (*f == '\\') || strchr(bad, *f)) {
1651 *(t++) = hexchar(*f >> 4);
1652 *(t++) = hexchar(*f);
1662 char *ascii_strlower(char *t) {
1667 for (p = t; *p; p++)
1668 if (*p >= 'A' && *p <= 'Z')
1669 *p = *p - 'A' + 'a';
1674 _pure_ static bool hidden_file_allow_backup(const char *filename) {
1678 filename[0] == '.' ||
1679 streq(filename, "lost+found") ||
1680 streq(filename, "aquota.user") ||
1681 streq(filename, "aquota.group") ||
1682 endswith(filename, ".rpmnew") ||
1683 endswith(filename, ".rpmsave") ||
1684 endswith(filename, ".rpmorig") ||
1685 endswith(filename, ".dpkg-old") ||
1686 endswith(filename, ".dpkg-new") ||
1687 endswith(filename, ".dpkg-tmp") ||
1688 endswith(filename, ".dpkg-dist") ||
1689 endswith(filename, ".dpkg-bak") ||
1690 endswith(filename, ".dpkg-backup") ||
1691 endswith(filename, ".dpkg-remove") ||
1692 endswith(filename, ".swp");
1695 bool hidden_file(const char *filename) {
1698 if (endswith(filename, "~"))
1701 return hidden_file_allow_backup(filename);
1704 int fd_nonblock(int fd, bool nonblock) {
1709 flags = fcntl(fd, F_GETFL, 0);
1714 nflags = flags | O_NONBLOCK;
1716 nflags = flags & ~O_NONBLOCK;
1718 if (nflags == flags)
1721 if (fcntl(fd, F_SETFL, nflags) < 0)
1727 int fd_cloexec(int fd, bool cloexec) {
1732 flags = fcntl(fd, F_GETFD, 0);
1737 nflags = flags | FD_CLOEXEC;
1739 nflags = flags & ~FD_CLOEXEC;
1741 if (nflags == flags)
1744 if (fcntl(fd, F_SETFD, nflags) < 0)
1750 _pure_ static bool fd_in_set(int fd, const int fdset[], unsigned n_fdset) {
1753 assert(n_fdset == 0 || fdset);
1755 for (i = 0; i < n_fdset; i++)
1762 int close_all_fds(const int except[], unsigned n_except) {
1763 _cleanup_closedir_ DIR *d = NULL;
1767 assert(n_except == 0 || except);
1769 d = opendir("/proc/self/fd");
1774 /* When /proc isn't available (for example in chroots)
1775 * the fallback is brute forcing through the fd
1778 assert_se(getrlimit(RLIMIT_NOFILE, &rl) >= 0);
1779 for (fd = 3; fd < (int) rl.rlim_max; fd ++) {
1781 if (fd_in_set(fd, except, n_except))
1784 if (close_nointr(fd) < 0)
1785 if (errno != EBADF && r == 0)
1792 while ((de = readdir(d))) {
1795 if (hidden_file(de->d_name))
1798 if (safe_atoi(de->d_name, &fd) < 0)
1799 /* Let's better ignore this, just in case */
1808 if (fd_in_set(fd, except, n_except))
1811 if (close_nointr(fd) < 0) {
1812 /* Valgrind has its own FD and doesn't want to have it closed */
1813 if (errno != EBADF && r == 0)
1821 bool chars_intersect(const char *a, const char *b) {
1824 /* Returns true if any of the chars in a are in b. */
1825 for (p = a; *p; p++)
1832 bool fstype_is_network(const char *fstype) {
1833 static const char table[] =
1848 x = startswith(fstype, "fuse.");
1852 return nulstr_contains(table, fstype);
1856 _cleanup_close_ int fd;
1858 fd = open_terminal("/dev/tty0", O_RDWR|O_NOCTTY|O_CLOEXEC);
1864 TIOCL_GETKMSGREDIRECT,
1868 if (ioctl(fd, TIOCLINUX, tiocl) < 0)
1871 vt = tiocl[0] <= 0 ? 1 : tiocl[0];
1874 if (ioctl(fd, VT_ACTIVATE, vt) < 0)
1880 int read_one_char(FILE *f, char *ret, usec_t t, bool *need_nl) {
1881 struct termios old_termios, new_termios;
1882 char c, line[LINE_MAX];
1887 if (tcgetattr(fileno(f), &old_termios) >= 0) {
1888 new_termios = old_termios;
1890 new_termios.c_lflag &= ~ICANON;
1891 new_termios.c_cc[VMIN] = 1;
1892 new_termios.c_cc[VTIME] = 0;
1894 if (tcsetattr(fileno(f), TCSADRAIN, &new_termios) >= 0) {
1897 if (t != USEC_INFINITY) {
1898 if (fd_wait_for_event(fileno(f), POLLIN, t) <= 0) {
1899 tcsetattr(fileno(f), TCSADRAIN, &old_termios);
1904 k = fread(&c, 1, 1, f);
1906 tcsetattr(fileno(f), TCSADRAIN, &old_termios);
1912 *need_nl = c != '\n';
1919 if (t != USEC_INFINITY) {
1920 if (fd_wait_for_event(fileno(f), POLLIN, t) <= 0)
1925 if (!fgets(line, sizeof(line), f))
1926 return errno ? -errno : -EIO;
1930 if (strlen(line) != 1)
1940 int ask_char(char *ret, const char *replies, const char *text, ...) {
1950 bool need_nl = true;
1953 fputs(ANSI_HIGHLIGHT_ON, stdout);
1960 fputs(ANSI_HIGHLIGHT_OFF, stdout);
1964 r = read_one_char(stdin, &c, USEC_INFINITY, &need_nl);
1967 if (r == -EBADMSG) {
1968 puts("Bad input, please try again.");
1979 if (strchr(replies, c)) {
1984 puts("Read unexpected character, please try again.");
1988 int ask_string(char **ret, const char *text, ...) {
1993 char line[LINE_MAX];
1997 fputs(ANSI_HIGHLIGHT_ON, stdout);
2004 fputs(ANSI_HIGHLIGHT_OFF, stdout);
2009 if (!fgets(line, sizeof(line), stdin))
2010 return errno ? -errno : -EIO;
2012 if (!endswith(line, "\n"))
2031 int reset_terminal_fd(int fd, bool switch_to_text) {
2032 struct termios termios;
2035 /* Set terminal to some sane defaults */
2039 /* We leave locked terminal attributes untouched, so that
2040 * Plymouth may set whatever it wants to set, and we don't
2041 * interfere with that. */
2043 /* Disable exclusive mode, just in case */
2044 ioctl(fd, TIOCNXCL);
2046 /* Switch to text mode */
2048 ioctl(fd, KDSETMODE, KD_TEXT);
2050 /* Enable console unicode mode */
2051 ioctl(fd, KDSKBMODE, K_UNICODE);
2053 if (tcgetattr(fd, &termios) < 0) {
2058 /* We only reset the stuff that matters to the software. How
2059 * hardware is set up we don't touch assuming that somebody
2060 * else will do that for us */
2062 termios.c_iflag &= ~(IGNBRK | BRKINT | ISTRIP | INLCR | IGNCR | IUCLC);
2063 termios.c_iflag |= ICRNL | IMAXBEL | IUTF8;
2064 termios.c_oflag |= ONLCR;
2065 termios.c_cflag |= CREAD;
2066 termios.c_lflag = ISIG | ICANON | IEXTEN | ECHO | ECHOE | ECHOK | ECHOCTL | ECHOPRT | ECHOKE;
2068 termios.c_cc[VINTR] = 03; /* ^C */
2069 termios.c_cc[VQUIT] = 034; /* ^\ */
2070 termios.c_cc[VERASE] = 0177;
2071 termios.c_cc[VKILL] = 025; /* ^U */
2072 termios.c_cc[VEOF] = 04; /* ^D */
2073 termios.c_cc[VSTART] = 021; /* ^Q */
2074 termios.c_cc[VSTOP] = 023; /* ^S */
2075 termios.c_cc[VSUSP] = 032; /* ^Z */
2076 termios.c_cc[VLNEXT] = 026; /* ^V */
2077 termios.c_cc[VWERASE] = 027; /* ^W */
2078 termios.c_cc[VREPRINT] = 022; /* ^R */
2079 termios.c_cc[VEOL] = 0;
2080 termios.c_cc[VEOL2] = 0;
2082 termios.c_cc[VTIME] = 0;
2083 termios.c_cc[VMIN] = 1;
2085 if (tcsetattr(fd, TCSANOW, &termios) < 0)
2089 /* Just in case, flush all crap out */
2090 tcflush(fd, TCIOFLUSH);
2095 int reset_terminal(const char *name) {
2096 _cleanup_close_ int fd = -1;
2098 fd = open_terminal(name, O_RDWR|O_NOCTTY|O_CLOEXEC);
2102 return reset_terminal_fd(fd, true);
2105 int open_terminal(const char *name, int mode) {
2110 * If a TTY is in the process of being closed opening it might
2111 * cause EIO. This is horribly awful, but unlikely to be
2112 * changed in the kernel. Hence we work around this problem by
2113 * retrying a couple of times.
2115 * https://bugs.launchpad.net/ubuntu/+source/linux/+bug/554172/comments/245
2118 assert(!(mode & O_CREAT));
2121 fd = open(name, mode, 0);
2128 /* Max 1s in total */
2132 usleep(50 * USEC_PER_MSEC);
2150 int flush_fd(int fd) {
2151 struct pollfd pollfd = {
2161 r = poll(&pollfd, 1, 0);
2171 l = read(fd, buf, sizeof(buf));
2177 if (errno == EAGAIN)
2186 int acquire_terminal(
2190 bool ignore_tiocstty_eperm,
2193 int fd = -1, notify = -1, r = 0, wd = -1;
2198 /* We use inotify to be notified when the tty is closed. We
2199 * create the watch before checking if we can actually acquire
2200 * it, so that we don't lose any event.
2202 * Note: strictly speaking this actually watches for the
2203 * device being closed, it does *not* really watch whether a
2204 * tty loses its controlling process. However, unless some
2205 * rogue process uses TIOCNOTTY on /dev/tty *after* closing
2206 * its tty otherwise this will not become a problem. As long
2207 * as the administrator makes sure not to configure any service
2208 * on the same tty as an untrusted user this should not be a
2209 * problem. (Which he probably should not do anyway.) */
2211 if (timeout != USEC_INFINITY)
2212 ts = now(CLOCK_MONOTONIC);
2214 if (!fail && !force) {
2215 notify = inotify_init1(IN_CLOEXEC | (timeout != USEC_INFINITY ? IN_NONBLOCK : 0));
2221 wd = inotify_add_watch(notify, name, IN_CLOSE);
2229 struct sigaction sa_old, sa_new = {
2230 .sa_handler = SIG_IGN,
2231 .sa_flags = SA_RESTART,
2235 r = flush_fd(notify);
2240 /* We pass here O_NOCTTY only so that we can check the return
2241 * value of TIOCSCTTY and have a reliable way to figure out if we
2242 * successfully became the controlling process of the tty */
2243 fd = open_terminal(name, O_RDWR|O_NOCTTY|O_CLOEXEC);
2247 /* Temporarily ignore SIGHUP, so that we don't get SIGHUP'ed
2248 * if we already own the tty. */
2249 assert_se(sigaction(SIGHUP, &sa_new, &sa_old) == 0);
2251 /* First, try to get the tty */
2252 if (ioctl(fd, TIOCSCTTY, force) < 0)
2255 assert_se(sigaction(SIGHUP, &sa_old, NULL) == 0);
2257 /* Sometimes it makes sense to ignore TIOCSCTTY
2258 * returning EPERM, i.e. when very likely we already
2260 * have this controlling terminal. */
2260 if (r < 0 && r == -EPERM && ignore_tiocstty_eperm)
2263 if (r < 0 && (force || fail || r != -EPERM)) {
2272 assert(notify >= 0);
2275 union inotify_event_buffer buffer;
2276 struct inotify_event *e;
2279 if (timeout != USEC_INFINITY) {
2282 n = now(CLOCK_MONOTONIC);
2283 if (ts + timeout < n) {
2288 r = fd_wait_for_event(fd, POLLIN, ts + timeout - n);
2298 l = read(notify, &buffer, sizeof(buffer));
2300 if (errno == EINTR || errno == EAGAIN)
2307 FOREACH_INOTIFY_EVENT(e, buffer, l) {
2308 if (e->wd != wd || !(e->mask & IN_CLOSE)) {
2317 /* We close the tty fd here since if the old session
2318 * ended our handle will be dead. It's important that
2319 * we do this after sleeping, so that we don't enter
2320 * an endless loop. */
2321 fd = safe_close(fd);
2326 r = reset_terminal_fd(fd, true);
2328 log_warning_errno(r, "Failed to reset terminal: %m");
2339 int release_terminal(void) {
2340 static const struct sigaction sa_new = {
2341 .sa_handler = SIG_IGN,
2342 .sa_flags = SA_RESTART,
2345 _cleanup_close_ int fd = -1;
2346 struct sigaction sa_old;
2349 fd = open("/dev/tty", O_RDWR|O_NOCTTY|O_NDELAY|O_CLOEXEC);
2353 /* Temporarily ignore SIGHUP, so that we don't get SIGHUP'ed
2354 * by our own TIOCNOTTY */
2355 assert_se(sigaction(SIGHUP, &sa_new, &sa_old) == 0);
2357 if (ioctl(fd, TIOCNOTTY) < 0)
2360 assert_se(sigaction(SIGHUP, &sa_old, NULL) == 0);
2365 int sigaction_many(const struct sigaction *sa, ...) {
2370 while ((sig = va_arg(ap, int)) > 0)
2371 if (sigaction(sig, sa, NULL) < 0)
2378 int ignore_signals(int sig, ...) {
2379 struct sigaction sa = {
2380 .sa_handler = SIG_IGN,
2381 .sa_flags = SA_RESTART,
2386 if (sigaction(sig, &sa, NULL) < 0)
2390 while ((sig = va_arg(ap, int)) > 0)
2391 if (sigaction(sig, &sa, NULL) < 0)
2398 int default_signals(int sig, ...) {
2399 struct sigaction sa = {
2400 .sa_handler = SIG_DFL,
2401 .sa_flags = SA_RESTART,
2406 if (sigaction(sig, &sa, NULL) < 0)
2410 while ((sig = va_arg(ap, int)) > 0)
2411 if (sigaction(sig, &sa, NULL) < 0)
2418 void safe_close_pair(int p[]) {
2422 /* Special case pairs which use the same fd in both
2424 p[0] = p[1] = safe_close(p[0]);
2428 p[0] = safe_close(p[0]);
2429 p[1] = safe_close(p[1]);
2432 ssize_t loop_read(int fd, void *buf, size_t nbytes, bool do_poll) {
2439 while (nbytes > 0) {
2442 k = read(fd, p, nbytes);
2447 if (errno == EAGAIN && do_poll) {
2449 /* We knowingly ignore any return value here,
2450 * and expect that any error/EOF is reported
2453 fd_wait_for_event(fd, POLLIN, USEC_INFINITY);
2457 return n > 0 ? n : -errno;
2471 int loop_read_exact(int fd, void *buf, size_t nbytes, bool do_poll) {
2474 n = loop_read(fd, buf, nbytes, do_poll);
2477 if ((size_t) n != nbytes)
2482 int loop_write(int fd, const void *buf, size_t nbytes, bool do_poll) {
2483 const uint8_t *p = buf;
2490 while (nbytes > 0) {
2493 k = write(fd, p, nbytes);
2498 if (errno == EAGAIN && do_poll) {
2499 /* We knowingly ignore any return value here,
2500 * and expect that any error/EOF is reported
2503 fd_wait_for_event(fd, POLLOUT, USEC_INFINITY);
2510 if (k == 0) /* Can't really happen */
2520 int parse_size(const char *t, off_t base, off_t *size) {
2522 /* So, sometimes we want to parse IEC binary suffixes, and
2523 * sometimes SI decimal suffixes. This function can parse
2524 * both. Which one is the right way depends on the
2525 * context. Wikipedia suggests that SI is customary for
2526 * hardware metrics and network speeds, while IEC is
2527 * customary for most data sizes used by software and volatile
2528 * (RAM) memory. Hence be careful which one you pick!
2530 * In either case we use just K, M, G as suffix, and not Ki,
2531 * Mi, Gi or so (as IEC would suggest). That's because that's
2532 * frickin' ugly. But this means you really need to make sure
2533 * to document which base you are parsing when you use this
2538 unsigned long long factor;
2541 static const struct table iec[] = {
2542 { "E", 1024ULL*1024ULL*1024ULL*1024ULL*1024ULL*1024ULL },
2543 { "P", 1024ULL*1024ULL*1024ULL*1024ULL*1024ULL },
2544 { "T", 1024ULL*1024ULL*1024ULL*1024ULL },
2545 { "G", 1024ULL*1024ULL*1024ULL },
2546 { "M", 1024ULL*1024ULL },
2552 static const struct table si[] = {
2553 { "E", 1000ULL*1000ULL*1000ULL*1000ULL*1000ULL*1000ULL },
2554 { "P", 1000ULL*1000ULL*1000ULL*1000ULL*1000ULL },
2555 { "T", 1000ULL*1000ULL*1000ULL*1000ULL },
2556 { "G", 1000ULL*1000ULL*1000ULL },
2557 { "M", 1000ULL*1000ULL },
2563 const struct table *table;
2565 unsigned long long r = 0;
2566 unsigned n_entries, start_pos = 0;
2569 assert(base == 1000 || base == 1024);
2574 n_entries = ELEMENTSOF(si);
2577 n_entries = ELEMENTSOF(iec);
2583 unsigned long long l2;
2589 l = strtoll(p, &e, 10);
2602 if (*e >= '0' && *e <= '9') {
2605 /* strtoull itself would accept space/+/- */
2606 l2 = strtoull(e, &e2, 10);
2608 if (errno == ERANGE)
2611 /* Ignore failure. E.g. 10.M is valid */
2618 e += strspn(e, WHITESPACE);
2620 for (i = start_pos; i < n_entries; i++)
2621 if (startswith(e, table[i].suffix)) {
2622 unsigned long long tmp;
2623 if ((unsigned long long) l + (frac > 0) > ULLONG_MAX / table[i].factor)
2625 tmp = l * table[i].factor + (unsigned long long) (frac * table[i].factor);
2626 if (tmp > ULLONG_MAX - r)
2630 if ((unsigned long long) (off_t) r != r)
2633 p = e + strlen(table[i].suffix);
/* Duplicates fd onto STDIN_FILENO, STDOUT_FILENO and STDERR_FILENO with
 * dup2(). The three results are checked together, and the close-on-exec
 * flag is then cleared on all three standard descriptors. */
2649 int make_stdio(int fd) {
2654 r = dup2(fd, STDIN_FILENO);
2655 s = dup2(fd, STDOUT_FILENO);
2656 t = dup2(fd, STDERR_FILENO);
2661 if (r < 0 || s < 0 || t < 0)
2664 /* Explicitly unset O_CLOEXEC, since if fd was < 3, then
2665 * dup2() was a NOP and the bit hence possibly set. */
2666 fd_cloexec(STDIN_FILENO, false);
2667 fd_cloexec(STDOUT_FILENO, false);
2668 fd_cloexec(STDERR_FILENO, false);
/* Opens /dev/null read-write (O_NOCTTY) and passes the descriptor to
 * make_stdio(), whose result is returned. */
2673 int make_null_stdio(void) {
2676 null_fd = open("/dev/null", O_RDWR|O_NOCTTY);
2680 return make_stdio(null_fd);
/* Path-prefix predicate: the visible test accepts paths below "/dev/" or
 * "/sys/", as judged by path_startswith(). */
2683 bool is_device_path(const char *path) {
2685 /* Returns true on paths that refer to a device, either in
2686 * sysfs or in /dev */
2689 path_startswith(path, "/dev/") ||
2690 path_startswith(path, "/sys/");
/* Scans the entries of the directory at path. A NULL entry with errno set
 * is handled as a read failure, and hidden_file() decides which names are
 * ignored.
 * NOTE(review): presumably returns 0 at the first non-hidden entry and 1
 * when none is found -- the return statements are not visible here. */
2693 int dir_is_empty(const char *path) {
2694 _cleanup_closedir_ DIR *d;
2705 if (!de && errno != 0)
2711 if (!hidden_file(de->d_name))
/* Takes a path and returns a char pointer; three working pointers are
 * declared.
 * NOTE(review): presumably returns a heap-allocated dirname of path -- the
 * body is not visible here, confirm before relying on this. */
2716 char* dirname_malloc(const char *path) {
2717 char *d, *dir, *dir2;
/* Fills p with n bytes of kernel randomness. getrandom(GRND_NONBLOCK) is
 * tried first and its availability is remembered in the function-static
 * have_syscall; otherwise exactly n bytes are read from /dev/urandom.
 * Failure to open /dev/urandom yields -ENOSYS for ENOENT and -errno for
 * anything else; on the fallback path the result of loop_read_exact() is
 * returned.
 * NOTE(review): the condition guarding getrandom() is joined with "||", so
 * as written it is also taken when n does not fit into an int; that looks
 * at odds with the comment right above it -- confirm the intent. */
2734 int dev_urandom(void *p, size_t n) {
2735 static int have_syscall = -1;
2737 _cleanup_close_ int fd = -1;
2740 /* Gathers some randomness from the kernel. This call will
2741 * never block, and will always return some data from the
2742 * kernel, regardless if the random pool is fully initialized
2743 * or not. It thus makes no guarantee for the quality of the
2744 * returned entropy, but is good enough for our usual usecases
2745 * of seeding the hash functions for hashtable */
2747 /* Use the getrandom() syscall unless we know we don't have
2748 * it, or when the requested size is too large for it. */
2749 if (have_syscall != 0 || (size_t) (int) n != n) {
2750 r = getrandom(p, n, GRND_NONBLOCK);
2752 have_syscall = true;
2757 if (errno == ENOSYS)
2758 /* we lack the syscall, continue with
2759 * reading from /dev/urandom */
2760 have_syscall = false;
2761 else if (errno == EAGAIN)
2762 /* not enough entropy for now. Let's
2763 * remember to use the syscall the
2764 * next time, again, but also read
2765 * from /dev/urandom for now, which
2766 * doesn't care about the current
2767 * amount of entropy. */
2768 have_syscall = true;
2772 /* too short read? */
2776 fd = open("/dev/urandom", O_RDONLY|O_CLOEXEC|O_NOCTTY);
2778 return errno == ENOENT ? -ENOSYS : -errno;
2780 return loop_read_exact(fd, p, n, true);
/* Builds a seed value x by XOR-ing together (when HAVE_SYS_AUXV_H is
 * defined) the first unsigned word of the AT_RANDOM auxv data, the
 * CLOCK_REALTIME timestamp and the thread id, then records in the
 * function-static srand_called that seeding has happened.
 * NOTE(review): the early-return guard and the actual srand() call are not
 * visible in this view. */
2783 void initialize_srand(void) {
2784 static bool srand_called = false;
2786 #ifdef HAVE_SYS_AUXV_H
2795 #ifdef HAVE_SYS_AUXV_H
2796 /* The kernel provides us with a bit of entropy in auxv, so
2797 * let's try to make use of that to seed the pseudo-random
2798 * generator. It's better than nothing... */
2800 auxv = (void*) getauxval(AT_RANDOM);
2802 x ^= *(unsigned*) auxv;
2805 x ^= (unsigned) now(CLOCK_REALTIME);
2806 x ^= (unsigned) gettid();
2809 srand_called = true;
/* Fills p with n random bytes. dev_urandom() is tried first; the fallback
 * walks the buffer byte by byte and, per the comment below, draws from a
 * PRNG instead (the loop body itself is not visible here). */
2812 void random_bytes(void *p, size_t n) {
2816 r = dev_urandom(p, n);
2820 /* If some idiot made /dev/urandom unavailable to us, he'll
2821 * get a PRNG instead. */
2825 for (q = p; q < (uint8_t*) p + n; q ++)
/* Renames the running process as far as possible: sets the kernel comm
 * name with prctl(PR_SET_NAME), overwrites program_invocation_name and
 * saved_argv[0] in place (each copy is bounded by the current length of
 * the destination string), and zeroes the remaining saved_argv[] strings. */
2829 void rename_process(const char name[8]) {
2832 /* This is like a poor man's setproctitle(). It changes the
2833 * comm field, argv[0], and also the glibc's internally used
2834 * name of the process. For the first one a limit of 16 chars
2835 * applies, to the second one usually one of 10 (i.e. length
2836 * of "/sbin/init"), to the third one one of 7 (i.e. length of
2837 * "systemd"). If you pass a longer string it will be
2840 prctl(PR_SET_NAME, name);
2842 if (program_invocation_name)
2843 strncpy(program_invocation_name, name, strlen(program_invocation_name));
2845 if (saved_argc > 0) {
2849 strncpy(saved_argv[0], name, strlen(saved_argv[0]));
2851 for (i = 1; i < saved_argc; i++) {
2855 memzero(saved_argv[i], strlen(saved_argv[i]));
/* Adds every signal from the variadic int list to *ss. The list ends at
 * the first value that is <= 0; a failing sigaddset() trips assert_se(). */
2860 void sigset_add_many(sigset_t *ss, ...) {
2867 while ((sig = va_arg(ap, int)) > 0)
2868 assert_se(sigaddset(ss, sig) == 0);
/* Builds a fresh signal set from the variadic int list (terminated by a
 * value <= 0) and applies it with sigprocmask(how, ...). The previous mask
 * is not retrieved (NULL is passed as old set). */
2872 int sigprocmask_many(int how, ...) {
2877 assert_se(sigemptyset(&ss) == 0);
2880 while ((sig = va_arg(ap, int)) > 0)
2881 assert_se(sigaddset(&ss, sig) == 0);
2884 if (sigprocmask(how, &ss, NULL) < 0)
/* Returns a strdup()ed copy of uname()'s nodename, or of sysname when the
 * nodename is empty or the literal "(none)". The result is NULL if
 * strdup() fails. */
2890 char* gethostname_malloc(void) {
2893 assert_se(uname(&u) >= 0);
2895 if (!isempty(u.nodename) && !streq(u.nodename, "(none)"))
2896 return strdup(u.nodename);
2898 return strdup(u.sysname);
/* True when uname()'s nodename is neither empty nor the literal "(none)". */
2901 bool hostname_is_set(void) {
2904 assert_se(uname(&u) >= 0);
2906 return !isempty(u.nodename) && !streq(u.nodename, "(none)");
/* Maps uid to a newly allocated name string. In order: a "root" shortcut
 * that avoids NSS (its condition is not visible here), the pw_name of the
 * passwd entry found by getpwuid_r() using a scratch buffer sized from
 * sysconf(_SC_GETPW_R_SIZE_MAX), and finally the numeric uid formatted
 * with UID_FMT. */
2909 char *lookup_uid(uid_t uid) {
2912 _cleanup_free_ char *buf = NULL;
2913 struct passwd pwbuf, *pw = NULL;
2915 /* Shortcut things to avoid NSS lookups */
2917 return strdup("root");
2919 bufsize = sysconf(_SC_GETPW_R_SIZE_MAX);
2923 buf = malloc(bufsize);
2927 if (getpwuid_r(uid, &pwbuf, buf, bufsize, &pw) == 0 && pw)
2928 return strdup(pw->pw_name);
2930 if (asprintf(&name, UID_FMT, uid) < 0)
/* Resolves a uid to a name through lookup_uid(). The case where stdin is
 * a tty that can be fstat()ed is treated specially.
 * NOTE(review): presumably the tty owner's uid is used in that case and
 * the process uid otherwise -- the assignments are not visible here. */
2936 char* getlogname_malloc(void) {
2940 if (isatty(STDIN_FILENO) && fstat(STDIN_FILENO, &st) >= 0)
2945 return lookup_uid(uid);
/* On the visible path returns lookup_uid(getuid()).
 * NOTE(review): any earlier shortcut in the body is not visible here. */
2948 char *getusername_malloc(void) {
2955 return lookup_uid(getuid());
/* Queries the tty name of fd with ttyname_r() and duplicates it, dropping
 * a leading "/dev/" when present.
 * NOTE(review): the copy is presumably handed back through *ret -- that
 * assignment is not visible here. */
2958 int getttyname_malloc(int fd, char **ret) {
2968 r = ttyname_r(fd, path, sizeof(path));
2973 p = startswith(path, "/dev/");
2974 c = strdup(p ?: path);
/* Calls getttyname_malloc(); if the name comes back as the generic "tty",
 * the controlling terminal is resolved through get_ctty(0, NULL, r)
 * instead. */
2991 int getttyname_harder(int fd, char **r) {
2995 k = getttyname_malloc(fd, &s);
2999 if (streq(s, "tty")) {
3001 return get_ctty(0, NULL, r);
/* Reads the one-line "stat" file of pid (path from procfs_file_alloca()),
 * locates the last ')' in it and parses fields from there on, among them
 * the tty number. A tty number whose major and minor are both 0 is
 * special-cased.
 * NOTE(review): presumably that case means "no controlling tty" and is
 * reported as an error -- the return is not visible here. */
3008 int get_ctty_devnr(pid_t pid, dev_t *d) {
3010 _cleanup_free_ char *line = NULL;
3012 unsigned long ttynr;
3016 p = procfs_file_alloca(pid, "stat");
3017 r = read_one_line_file(p, &line);
3021 p = strrchr(line, ')');
3031 "%*d " /* session */
3036 if (major(ttynr) == 0 && minor(ttynr) == 0)
/* Determines the controlling tty of pid: obtains the device number from
 * get_ctty_devnr(), then reads the symlink /dev/char/<major>:<minor>.
 * Devices with major 136 are named "pts/<minor>". Link targets that start
 * with "/dev/" or "../" are recognised separately.
 * NOTE(review): presumably those prefixes are stripped before the name is
 * returned -- the corresponding statements are not visible here. */
3045 int get_ctty(pid_t pid, dev_t *_devnr, char **r) {
3046 char fn[sizeof("/dev/char/")-1 + 2*DECIMAL_STR_MAX(unsigned) + 1 + 1], *b = NULL;
3047 _cleanup_free_ char *s = NULL;
3054 k = get_ctty_devnr(pid, &devnr);
3058 sprintf(fn, "/dev/char/%u:%u", major(devnr), minor(devnr));
3060 k = readlink_malloc(fn, &s);
3066 /* This is an ugly hack */
3067 if (major(devnr) == 136) {
3068 if (asprintf(&b, "pts/%u", minor(devnr)) < 0)
3071 /* Probably something like the ptys which have no
3072 * symlink in /dev/char. Let's return something
3073 * vaguely useful. */
3080 if (startswith(s, "/dev/"))
3082 else if (startswith(s, "../"))
/* True if the f_type of *s equals TMPFS_MAGIC or RAMFS_MAGIC. */
3099 bool is_temporary_fs(const struct statfs *s) {
3102 return F_TYPE_EQUAL(s->f_type, TMPFS_MAGIC) ||
3103 F_TYPE_EQUAL(s->f_type, RAMFS_MAGIC);
/* fstatfs()es fd and returns is_temporary_fs() for the result; the error
 * return for a failing fstatfs() is not visible here. */
3106 int fd_is_temporary_fs(int fd) {
3109 if (fstatfs(fd, &s) < 0)
3112 return is_temporary_fs(&s);
/* Path-based variant: applies mode with chmod() unless it is MODE_INVALID,
 * then applies ownership with chown() unless both uid and gid are invalid
 * -- in that order. */
3115 int chmod_and_chown(const char *path, mode_t mode, uid_t uid, gid_t gid) {
3118 /* Under the assumption that we are running privileged we
3119 * first change the access mode and only then hand out
3120 * ownership to avoid a window where access is too open. */
3122 if (mode != MODE_INVALID)
3123 if (chmod(path, mode) < 0)
3126 if (uid != UID_INVALID || gid != GID_INVALID)
3127 if (chown(path, uid, gid) < 0)
/* Descriptor-based variant: applies mode with fchmod() unless it is
 * MODE_INVALID, then applies ownership with fchown() unless both uid and
 * gid are invalid -- in that order. */
3133 int fchmod_and_fchown(int fd, mode_t mode, uid_t uid, gid_t gid) {
3136 /* Under the assumption that we are running privileged we
3137 * first change the access mode and only then hand out
3138 * ownership to avoid a window where access is too open. */
3140 if (mode != MODE_INVALID)
3141 if (fchmod(fd, mode) < 0)
3144 if (uid != UID_INVALID || gid != GID_INVALID)
3145 if (fchown(fd, uid, gid) < 0)
/* Allocates a cpu_set_t for n CPUs with CPU_ALLOC() and probes the size
 * with sched_getaffinity(): on success the set is cleared with
 * CPU_ZERO_S(); an errno other than EINVAL is handled separately.
 * NOTE(review): presumably n is grown and the probe retried on EINVAL, and
 * the final n is reported through *ncpus -- not visible here. */
3151 cpu_set_t* cpu_set_malloc(unsigned *ncpus) {
3155 /* Allocates the cpuset in the right size */
3158 if (!(r = CPU_ALLOC(n)))
3161 if (sched_getaffinity(0, CPU_ALLOC_SIZE(n), r) >= 0) {
3162 CPU_ZERO_S(CPU_ALLOC_SIZE(n), r);
3172 if (errno != EINVAL)
/* Formats a status message with vasprintf() and writes it to /dev/console
 * in a single writev(). The iovec (at most 6 entries) is assembled from an
 * optional "\r" + erase-to-end-of-line sequence, either "[" status "] " or
 * the status_indent string, the message itself, and a "\n" entry. The
 * message can be shortened with ellipsize(s, emax, 50). The function-static
 * prev_ephemeral remembers the ephemeral flag across calls.
 * NOTE(review): several guarding conditions are not visible in this view. */
3179 int status_vprintf(const char *status, bool ellipse, bool ephemeral, const char *format, va_list ap) {
3180 static const char status_indent[] = " "; /* "[" STATUS "] " */
3181 _cleanup_free_ char *s = NULL;
3182 _cleanup_close_ int fd = -1;
3183 struct iovec iovec[6] = {};
3185 static bool prev_ephemeral;
3189 /* This is independent of logging, as status messages are
3190 * optional and go exclusively to the console. */
3192 if (vasprintf(&s, format, ap) < 0)
3195 fd = open_terminal("/dev/console", O_WRONLY|O_NOCTTY|O_CLOEXEC);
3208 sl = status ? sizeof(status_indent)-1 : 0;
3214 e = ellipsize(s, emax, 50);
3222 IOVEC_SET_STRING(iovec[n++], "\r" ANSI_ERASE_TO_END_OF_LINE);
3223 prev_ephemeral = ephemeral;
3226 if (!isempty(status)) {
3227 IOVEC_SET_STRING(iovec[n++], "[");
3228 IOVEC_SET_STRING(iovec[n++], status);
3229 IOVEC_SET_STRING(iovec[n++], "] ");
3231 IOVEC_SET_STRING(iovec[n++], status_indent);
3234 IOVEC_SET_STRING(iovec[n++], s);
3236 IOVEC_SET_STRING(iovec[n++], "\n");
3238 if (writev(fd, iovec, n) < 0)
/* Variadic front end: collects the arguments after format into a va_list
 * and forwards everything to status_vprintf(). */
3244 int status_printf(const char *status, bool ellipse, bool ephemeral, const char *format, ...) {
3250 va_start(ap, format);
3251 r = status_vprintf(status, ellipse, ephemeral, format, ap);
/* Scans format one character at a time and builds a new string from
 * literal runs (strnappend) and from variable values looked up in env with
 * strv_env_get_n(); an unset variable contributes the empty string
 * (strempty).
 * NOTE(review): the word+2 / e-word-2 arithmetic suggests a two-character
 * opener before the variable name -- the state handling is not visible
 * here, confirm. */
3257 char *replace_env(const char *format, char **env) {
3264 const char *e, *word = format;
3269 for (e = format; *e; e ++) {
3280 k = strnappend(r, word, e-word-1);
3290 } else if (*e == '$') {
3291 k = strnappend(r, word, e-word);
3308 t = strempty(strv_env_get_n(env, word+2, e-word-2));
3310 k = strappend(r, t);
3324 k = strnappend(r, word, e-word);
/* Builds a new argument vector from argv with environment references
 * expanded. A word that starts with '$' but not with "${" is looked up as
 * a whole variable, its value is split with strv_split_quoted(...,
 * UNQUOTE_RELAX), and the pieces are spliced in (ret is regrown with
 * realloc). Every other word is passed through replace_env(). */
3336 char **replace_env_argv(char **argv, char **env) {
3338 unsigned k = 0, l = 0;
3340 l = strv_length(argv);
3342 ret = new(char*, l+1);
3346 STRV_FOREACH(i, argv) {
3348 /* If $FOO appears as single word, replace it by the split up variable */
3349 if ((*i)[0] == '$' && (*i)[1] != '{') {
3351 char **w, **m = NULL;
3354 e = strv_env_get(env, *i+1);
3358 r = strv_split_quoted(&m, e, UNQUOTE_RELAX);
3370 w = realloc(ret, sizeof(char*) * (l+1));
3380 memcpy(ret + k, m, q * sizeof(char*));
3388 /* If ${FOO} appears as part of a word, replace it by the variable as-is */
3389 ret[k] = replace_env(*i, env);
/* Issues TIOCGWINSZ on fd into a zero-initialised struct winsize.
 * NOTE(review): presumably returns the column count or a negative errno --
 * the return statements are not visible here. */
3401 int fd_columns(int fd) {
3402 struct winsize ws = {};
3404 if (ioctl(fd, TIOCGWINSZ, &ws) < 0)
/* Returns the terminal width, cached in the file-level cached_columns.
 * When nothing is cached yet, the value is taken from $COLUMNS (parsed
 * with safe_atoi(), whose result is deliberately ignored) and from
 * fd_columns(STDOUT_FILENO); the conditions choosing between the two are
 * not visible here. */
3413 unsigned columns(void) {
3417 if (_likely_(cached_columns > 0))
3418 return cached_columns;
3421 e = getenv("COLUMNS");
3423 (void) safe_atoi(e, &c);
3426 c = fd_columns(STDOUT_FILENO);
3432 return cached_columns;
/* Issues TIOCGWINSZ on fd into a zero-initialised struct winsize.
 * NOTE(review): presumably returns the row count or a negative errno --
 * the return statements are not visible here. */
3435 int fd_lines(int fd) {
3436 struct winsize ws = {};
3438 if (ioctl(fd, TIOCGWINSZ, &ws) < 0)
/* Returns the terminal height, cached in the file-level cached_lines.
 * When nothing is cached yet, the value is taken from $LINES (parsed with
 * safe_atoi(), whose result is deliberately ignored) and from
 * fd_lines(STDOUT_FILENO); the conditions choosing between the two are not
 * visible here. */
3447 unsigned lines(void) {
3451 if (_likely_(cached_lines > 0))
3452 return cached_lines;
3455 e = getenv("LINES");
3457 (void) safe_atoi(e, &l);
3460 l = fd_lines(STDOUT_FILENO);
3466 return cached_lines;
/* NOTE(review): only the signature is visible in this view; presumably the
 * body clears the cached column/line counts -- confirm. */
3469 /* intended to be used as a SIGWINCH sighandler */
3470 void columns_lines_cache_reset(int signum) {
/* NOTE(review): the signature line of this function is not visible here.
 * The visible body evaluates isatty(STDOUT_FILENO) > 0 once, stores it in
 * the function-static cached_on_tty (initially -1 = unknown), and returns
 * the cached value on every call. */
3476 static int cached_on_tty = -1;
3478 if (_unlikely_(cached_on_tty < 0))
3479 cached_on_tty = isatty(STDOUT_FILENO) > 0;
3481 return cached_on_tty;
/* stat()s both paths and reports whether st_dev and st_ino both match,
 * i.e. whether the two names resolve to the same inode. The error returns
 * for failing stat() calls are not visible here. */
3484 int files_same(const char *filea, const char *fileb) {
3487 if (stat(filea, &a) < 0)
3490 if (stat(fileb, &b) < 0)
3493 return a.st_dev == b.st_dev &&
3494 a.st_ino == b.st_ino;
/* Compares "/proc/1/root" with "/" using files_same().
 * NOTE(review): presumably reports a chroot when the two differ -- the
 * handling of ret is not visible here. */
3497 int running_in_chroot(void) {
3500 ret = files_same("/proc/1/root", "/");
/* Shortens the first old_length bytes of s to new_length bytes. Inputs of
 * at most 3 bytes, or already within new_length, are simply copied with
 * strndup(). Otherwise a zeroed buffer of new_length+1 bytes is allocated,
 * x = new_length * percent / 100 (limited against new_length - 3) selects
 * the head portion, and the last new_length - x - 3 bytes of the input are
 * copied as tail.
 * NOTE(review): the 3 bytes left between head and tail presumably hold
 * "..." -- that statement is not visible here. */
3507 static char *ascii_ellipsize_mem(const char *s, size_t old_length, size_t new_length, unsigned percent) {
3512 assert(percent <= 100);
3513 assert(new_length >= 3);
3515 if (old_length <= 3 || old_length <= new_length)
3516 return strndup(s, old_length);
3518 r = new0(char, new_length+1);
3522 x = (new_length * percent) / 100;
3524 if (x > new_length - 3)
3532 s + old_length - (new_length - x - 3),
3533 new_length - x - 3);
/* UTF-8 aware ellipsizer. Input accepted by ascii_is_valid() is delegated
 * to ascii_ellipsize_mem(); short input is copied with strndup().
 * Otherwise the string is walked forward from the start, adding up display
 * width (2 for wide characters, else 1) until x is reached, and backward
 * from the end until new_length is reached. The result is head + a 3-byte
 * ellipsis (first byte 0xe2) + tail, allocated as len + 3 + len2 + 1 bytes.
 * NOTE(review): the printf() of old_length/new_length/x/len/len2/k looks
 * like debug output -- confirm whether it is meant to be live. */
3538 char *ellipsize_mem(const char *s, size_t old_length, size_t new_length, unsigned percent) {
3542 unsigned k, len, len2;
3545 assert(percent <= 100);
3546 assert(new_length >= 3);
3548 /* if no multibyte characters use ascii_ellipsize_mem for speed */
3549 if (ascii_is_valid(s))
3550 return ascii_ellipsize_mem(s, old_length, new_length, percent);
3552 if (old_length <= 3 || old_length <= new_length)
3553 return strndup(s, old_length);
3555 x = (new_length * percent) / 100;
3557 if (x > new_length - 3)
3561 for (i = s; k < x && i < s + old_length; i = utf8_next_char(i)) {
3564 c = utf8_encoded_to_unichar(i);
3567 k += unichar_iswide(c) ? 2 : 1;
3570 if (k > x) /* last character was wide and went over quota */
3573 for (j = s + old_length; k < new_length && j > i; ) {
3576 j = utf8_prev_char(j);
3577 c = utf8_encoded_to_unichar(j);
3580 k += unichar_iswide(c) ? 2 : 1;
3584 /* we don't actually need to ellipsize */
3586 return memdup(s, old_length + 1);
3588 /* make space for ellipsis */
3589 j = utf8_next_char(j);
3592 len2 = s + old_length - j;
3593 e = new(char, len + 3 + len2 + 1);
3598 printf("old_length=%zu new_length=%zu x=%zu len=%u len2=%u k=%u\n",
3599 old_length, new_length, x, len, len2, k);
3603 e[len] = 0xe2; /* tri-dot ellipsis: … */
3607 memcpy(e + len + 3, j, len2 + 1);
/* Convenience wrapper: runs ellipsize_mem() over the whole NUL-terminated
 * string s, using strlen(s) as the input length. */
3612 char *ellipsize(const char *s, size_t length, unsigned percent) {
3613 return ellipsize_mem(s, strlen(s), length, percent);
/* Opens path for writing, creating it if needed (creation mode is `mode`,
 * or 0644 when mode is 0), optionally after mkdir_parents(path, 0755).
 * Then applies fchmod(), fchown() (when uid or gid is valid) and sets the
 * timestamps with futimens(): from stamp when it is not USEC_INFINITY,
 * otherwise with a NULL times argument.
 * NOTE(review): some of the guarding conditions are not visible here. */
3616 int touch_file(const char *path, bool parents, usec_t stamp, uid_t uid, gid_t gid, mode_t mode) {
3617 _cleanup_close_ int fd;
3623 mkdir_parents(path, 0755);
3625 fd = open(path, O_WRONLY|O_CREAT|O_CLOEXEC|O_NOCTTY, mode > 0 ? mode : 0644);
3630 r = fchmod(fd, mode);
3635 if (uid != UID_INVALID || gid != GID_INVALID) {
3636 r = fchown(fd, uid, gid);
3641 if (stamp != USEC_INFINITY) {
3642 struct timespec ts[2];
3644 timespec_store(&ts[0], stamp);
3646 r = futimens(fd, ts);
3648 r = futimens(fd, NULL);
/* touch_file() with defaults: no parent creation, no explicit timestamp,
 * no owner change and mode 0. */
3655 int touch(const char *path) {
3656 return touch_file(path, false, USEC_INFINITY, UID_INVALID, GID_INVALID, 0);
/* If the first character of s is one of `quotes` and the last character
 * equals the first, returns a copy without that outer pair
 * (strndup(s+1, l-2)). The remaining paths are not visible here. */
3659 static char *unquote(const char *s, const char* quotes) {
3663 /* This is rather stupid, simply removes the heading and
3664 * trailing quotes if there is one. Doesn't care about
3665 * escaping or anything.
3667 * DON'T USE THIS FOR NEW CODE ANYMORE!*/
3673 if (strchr(quotes, s[0]) && s[l-1] == s[0])
3674 return strndup(s+1, l-2);
/* Waits for child pid to exit using waitid(P_PID, pid, status, WEXITED).
 * NOTE(review): how a failing waitid() is handled (e.g. retry) is not
 * visible here. */
3679 int wait_for_terminate(pid_t pid, siginfo_t *status) {
3690 if (waitid(P_PID, pid, status, WEXITED) < 0) {
/* Waits for pid with wait_for_terminate() and logs the outcome under the
 * label `name`: a wait failure is logged as warning and returned; a normal
 * exit returns si_status, logging non-zero codes at LOG_WARNING when
 * check_exit_code is set and at LOG_DEBUG otherwise; death by signal
 * (CLD_KILLED/CLD_DUMPED) and any other state are logged as warnings. */
3704 * < 0 : wait_for_terminate() failed to get the state of the
3705 * process, the process was terminated by a signal, or
3706 * failed for an unknown reason.
3707 * >=0 : The process terminated normally, and its exit code is
3710 * That is, success is indicated by a return value of zero, and an
3711 * error is indicated by a non-zero value.
3713 * A warning is emitted if the process terminates abnormally,
3714 * and also if it returns non-zero unless check_exit_code is true.
3716 int wait_for_terminate_and_warn(const char *name, pid_t pid, bool check_exit_code) {
3723 r = wait_for_terminate(pid, &status);
3725 return log_warning_errno(r, "Failed to wait for %s: %m", name);
3727 if (status.si_code == CLD_EXITED) {
3728 if (status.si_status != 0)
3729 log_full(check_exit_code ? LOG_WARNING : LOG_DEBUG,
3730 "%s failed with error code %i.", name, status.si_status);
3732 log_debug("%s succeeded.", name);
3734 return status.si_status;
3735 } else if (status.si_code == CLD_KILLED ||
3736 status.si_code == CLD_DUMPED) {
3738 log_warning("%s terminated by signal %s.", name, signal_to_string(status.si_status));
3742 log_warning("%s failed due to unknown reason.", name);
/* Declared noreturn. The visible step closes all file descriptors with
 * close_all_fds(NULL, 0); the rest of the body is not visible here. */
3746 noreturn void freeze(void) {
3748 /* Make sure nobody waits for us on a socket anymore */
3749 close_all_fds(NULL, 0);
/* Classifies a struct stat: regular files of size <= 0 are singled out,
 * and so are character and block devices of any kind.
 * NOTE(review): the return values of the branches are not visible here;
 * presumably both cases yield true. */
3757 bool null_or_empty(struct stat *st) {
3760 if (S_ISREG(st->st_mode) && st->st_size <= 0)
3763 if (S_ISCHR(st->st_mode) || S_ISBLK(st->st_mode))
/* stat()s fn and returns null_or_empty() for the result; the error return
 * for a failing stat() is not visible here. */
3769 int null_or_empty_path(const char *fn) {
3774 if (stat(fn, &st) < 0)
3777 return null_or_empty(&st);
/* fstat()s fd and returns null_or_empty() for the result; the error return
 * for a failing fstat() is not visible here. */
3780 int null_or_empty_fd(int fd) {
3785 if (fstat(fd, &st) < 0)
3788 return null_or_empty(&st);
/* Opens name relative to directory descriptor fd with openat(), always
 * adding O_RDONLY|O_NONBLOCK|O_DIRECTORY|O_CLOEXEC to the caller's flags;
 * O_CREAT in flags is rejected by assert().
 * NOTE(review): the conversion of nfd to a DIR* is not visible here. */
3791 DIR *xopendirat(int fd, const char *name, int flags) {
3795 assert(!(flags & O_CREAT));
3797 nfd = openat(fd, name, O_RDONLY|O_NONBLOCK|O_DIRECTORY|O_CLOEXEC|flags, 0);
/* Tries signal_from_string(s) first; for names carrying a "SIG" prefix the
 * lookup is repeated on the remainder after the prefix. */
3810 int signal_from_string_try_harder(const char *s) {
3814 signo = signal_from_string(s);
3816 if (startswith(s, "SIG"))
3817 return signal_from_string(s+3);
/* Builds "/dev/disk/by-<by>/<encoded>" for a tag value: surrounding quotes
 * are removed with unquote(), the result is encoded by
 * encode_devnode_name() into a buffer of strlen(u) * 4 + 1 bytes, and the
 * pieces are joined with strjoin(). */
3822 static char *tag_to_udev_node(const char *tagvalue, const char *by) {
3823 _cleanup_free_ char *t = NULL, *u = NULL;
3826 u = unquote(tagvalue, QUOTES);
3830 enc_len = strlen(u) * 4 + 1;
3831 t = new(char, enc_len);
3835 if (encode_devnode_name(u, t, enc_len) < 0)
3838 return strjoin("/dev/disk/by-", by, "/", t, NULL);
/* Translates the fstab tags LABEL=, UUID=, PARTUUID= and PARTLABEL= into
 * device node paths via tag_to_udev_node(). The offsets 6, 5, 9 and 10
 * skip the respective tag prefix. Handling of untagged input is not
 * visible here. */
3841 char *fstab_node_to_udev_node(const char *p) {
3844 if (startswith(p, "LABEL="))
3845 return tag_to_udev_node(p+6, "label");
3847 if (startswith(p, "UUID="))
3848 return tag_to_udev_node(p+5, "uuid");
3850 if (startswith(p, "PARTUUID="))
3851 return tag_to_udev_node(p+9, "partuuid");
3853 if (startswith(p, "PARTLABEL="))
3854 return tag_to_udev_node(p+10, "partlabel");
/* True iff vtnr_from_tty() yields a non-negative number for tty. */
3859 bool tty_is_vc(const char *tty) {
3862 return vtnr_from_tty(tty) >= 0;
/* Compares tty with "console". A "/dev/" prefix is detected first
 * (presumably skipped before the comparison -- that statement is not
 * visible here). */
3865 bool tty_is_console(const char *tty) {
3868 if (startswith(tty, "/dev/"))
3871 return streq(tty, "console");
/* Extracts the VT number from a name of the form "ttyN" (a "/dev/" prefix
 * is recognised): the name must start with "tty" followed by a digit, the
 * number is parsed with safe_atoi(), and values outside 0..63 are singled
 * out. The return statements are not visible here. */
3874 int vtnr_from_tty(const char *tty) {
3879 if (startswith(tty, "/dev/"))
3882 if (!startswith(tty, "tty") )
3885 if (tty[3] < '0' || tty[3] > '9')
3888 r = safe_atoi(tty+3, &i);
3892 if (i < 0 || i > 63)
/* Finds the tty behind /dev/console. Unless /sys is a read-only file
 * system, reads /sys/class/tty/console/active into *active and picks the
 * last space-separated entry. If that entry is "tty0", the contents of
 * /sys/class/tty/tty0/active replace *active and become the result. */
3898 char *resolve_dev_console(char **active) {
3901 /* Resolve where /dev/console is pointing to, if /sys is actually ours
3902 * (i.e. not read-only-mounted which is a sign for container setups) */
3904 if (path_is_read_only_fs("/sys") > 0)
3907 if (read_one_line_file("/sys/class/tty/console/active", active) < 0)
3910 /* If multiple log outputs are configured the last one is what
3911 * /dev/console points to */
3912 tty = strrchr(*active, ' ');
3918 if (streq(tty, "tty0")) {
3921 /* Get the active VC (e.g. tty1) */
3922 if (read_one_line_file("/sys/class/tty/tty0/active", &tmp) >= 0) {
3924 tty = *active = tmp;
/* Like tty_is_vc(), except that the name "console" is first resolved to
 * the underlying tty through resolve_dev_console(). A "/dev/" prefix is
 * recognised beforehand. */
3931 bool tty_is_vc_resolve(const char *tty) {
3932 _cleanup_free_ char *active = NULL;
3936 if (startswith(tty, "/dev/"))
3939 if (streq(tty, "console")) {
3940 tty = resolve_dev_console(&active);
3945 return tty_is_vc(tty);
/* Returns the literal "TERM=linux" when tty_is_vc_resolve() accepts tty,
 * and "TERM=vt220" otherwise. */
3948 const char *default_term_for_tty(const char *tty) {
3951 return tty_is_vc_resolve(tty) ? "TERM=linux" : "TERM=vt220";
/* Directory-entry filter: names flagged by hidden_file() are checked
 * first, then d_type has to be DT_REG, DT_LNK or DT_UNKNOWN. The return
 * statements are not visible here. */
3954 bool dirent_is_file(const struct dirent *de) {
3957 if (hidden_file(de->d_name))
3960 if (de->d_type != DT_REG &&
3961 de->d_type != DT_LNK &&
3962 de->d_type != DT_UNKNOWN)
/* Directory-entry filter: d_type has to be DT_REG, DT_LNK or DT_UNKNOWN,
 * names flagged by hidden_file_allow_backup() are checked next, and
 * finally the name must end in suffix (endswith()). */
3968 bool dirent_is_file_with_suffix(const struct dirent *de, const char *suffix) {
3971 if (de->d_type != DT_REG &&
3972 de->d_type != DT_LNK &&
3973 de->d_type != DT_UNKNOWN)
3976 if (hidden_file_allow_backup(de->d_name))
3979 return endswith(de->d_name, suffix);
/* Worker that spawns the files found in `directories`. It resets signal
 * handlers and the signal mask, requests SIGTERM on parent death, and then
 * walks each directory: entries failing dirent_is_file() are skipped, a
 * file name already recorded in `seen` is skipped (so the first directory
 * wins), and empty files count as masks. For each spawned child the pair
 * pid -> path is stored in `pids`. Afterwards an optional alarm() bounds
 * the total runtime (timeout rounded up to whole seconds) and every child
 * is reaped with wait_for_terminate_and_warn(). */
3982 static int do_execute(char **directories, usec_t timeout, char *argv[]) {
3983 _cleanup_hashmap_free_free_ Hashmap *pids = NULL;
3984 _cleanup_set_free_free_ Set *seen = NULL;
3987 /* We fork this all off from a child process so that we can
3988 * somewhat cleanly make use of SIGALRM to set a time limit */
3990 reset_all_signal_handlers();
3991 reset_signal_mask();
3993 assert_se(prctl(PR_SET_PDEATHSIG, SIGTERM) == 0);
3995 pids = hashmap_new(NULL);
3999 seen = set_new(&string_hash_ops);
4003 STRV_FOREACH(directory, directories) {
4004 _cleanup_closedir_ DIR *d;
4007 d = opendir(*directory);
4009 if (errno == ENOENT)
4012 return log_error_errno(errno, "Failed to open directory %s: %m", *directory);
4015 FOREACH_DIRENT(de, d, break) {
4016 _cleanup_free_ char *path = NULL;
4020 if (!dirent_is_file(de))
4023 if (set_contains(seen, de->d_name)) {
4024 log_debug("%1$s/%2$s skipped (%2$s was already seen).", *directory, de->d_name);
4028 r = set_put_strdup(seen, de->d_name);
4032 path = strjoin(*directory, "/", de->d_name, NULL);
4036 if (null_or_empty_path(path)) {
4037 log_debug("%s is empty (a mask).", path);
4043 log_error_errno(errno, "Failed to fork: %m");
4045 } else if (pid == 0) {
4048 assert_se(prctl(PR_SET_PDEATHSIG, SIGTERM) == 0);
4058 return log_error_errno(errno, "Failed to execute %s: %m", path);
4061 log_debug("Spawned %s as " PID_FMT ".", path, pid);
4063 r = hashmap_put(pids, UINT_TO_PTR(pid), path);
4070 /* Abort execution of this process after the timeout. We simply
4071 * rely on SIGALRM as default action terminating the process,
4072 * and turn on alarm(). */
4074 if (timeout != USEC_INFINITY)
4075 alarm((timeout + USEC_PER_SEC - 1) / USEC_PER_SEC);
4077 while (!hashmap_isempty(pids)) {
4078 _cleanup_free_ char *path = NULL;
4081 pid = PTR_TO_UINT(hashmap_first_key(pids));
4084 path = hashmap_remove(pids, UINT_TO_PTR(pid));
4087 wait_for_terminate_and_warn(path, pid, true);
/* Forks an executor child that runs do_execute() over the directories and
 * leaves via _exit() with EXIT_FAILURE or EXIT_SUCCESS; the parent waits
 * for it with wait_for_terminate_and_warn(), labelled with the basename of
 * the first directory. A failing fork() is logged. The directory list must
 * not be empty (assert). */
4093 void execute_directories(const char* const* directories, usec_t timeout, char *argv[]) {
4097 char **dirs = (char**) directories;
4099 assert(!strv_isempty(dirs));
4101 name = basename(dirs[0]);
4102 assert(!isempty(name));
4104 /* Executes all binaries in the directories in parallel and waits
4105 * for them to finish. Optionally a timeout is applied. If a file
4106 * with the same name exists in more than one directory, the
4107 * earliest one wins. */
4109 executor_pid = fork();
4110 if (executor_pid < 0) {
4111 log_error_errno(errno, "Failed to fork: %m");
4114 } else if (executor_pid == 0) {
4115 r = do_execute(dirs, timeout, argv);
4116 _exit(r < 0 ? EXIT_FAILURE : EXIT_SUCCESS);
4119 wait_for_terminate_and_warn(name, executor_pid, true);
/* Sends sig to pid with kill(), turning a failure into -errno.
 * NOTE(review): the follow-up step suggested by the name is not visible
 * here. */
4122 int kill_and_sigcont(pid_t pid, int sig) {
4125 r = kill(pid, sig) < 0 ? -errno : 0;
/* Linear search: iterates nulstr with NULSTR_FOREACH and compares each
 * entry against needle with streq(). */
4133 bool nulstr_contains(const char*nulstr, const char *needle) {
4139 NULSTR_FOREACH(i, nulstr)
4140 if (streq(i, needle))
/* True if /run/plymouth/pid exists, as tested with access(F_OK). */
4146 bool plymouth_running(void) {
4147 return access("/run/plymouth/pid", F_OK) >= 0;
/* NOTE(review): only the signature is visible here; presumably truncates s
 * in place to at most l bytes and returns s -- confirm. */
4150 char* strshorten(char *s, size_t l) {
/* Character-class predicate for host names. The visible terms accept ASCII
 * letters and digits; further alternatives follow the trailing "||" but
 * are not visible here. */
4159 static bool hostname_valid_char(char c) {
4161 (c >= 'a' && c <= 'z') ||
4162 (c >= 'A' && c <= 'Z') ||
4163 (c >= '0' && c <= '9') ||
/* Validates s as a host name: walks the string with a `dot` flag that
 * starts out true, requires hostname_valid_char() for the characters it
 * checks, and compares the total length against HOST_NAME_MAX. */
4169 bool hostname_is_valid(const char *s) {
4176 /* Doesn't accept empty hostnames, hostnames with trailing or
4177 * leading dots, and hostnames with multiple dots in a
4178 * sequence. Also ensures that the length stays below
4181 for (p = s, dot = true; *p; p++) {
4188 if (!hostname_valid_char(*p))
4198 if (p-s > HOST_NAME_MAX)
/* Rewrites s in place: characters accepted by hostname_valid_char() are
 * copied forward (lower-cased when `lowercase` is set), dots are tracked
 * with the `dot` flag, and the result is capped at HOST_NAME_MAX bytes
 * with strshorten(). */
4204 char* hostname_cleanup(char *s, bool lowercase) {
4208 for (p = s, d = s, dot = true; *p; p++) {
4215 } else if (hostname_valid_char(*p)) {
4216 *(d++) = lowercase ? tolower(*p) : *p;
4227 strshorten(s, HOST_NAME_MAX);
/* A machine name must first pass hostname_is_valid(); per the comment a
 * stricter length limit follows, which is not visible here. */
4232 bool machine_name_is_valid(const char *s) {
4234 if (!hostname_is_valid(s))
4237 /* Machine names should be useful hostnames, but also be
4238 * useful in unit names, hence we enforce a stricter length
/* Polls fd without blocking (timeout 0) for POLLIN|POLLHUP and returns the
 * POLLHUP bit of revents, i.e. non-zero when the peer has hung up. */
4247 int pipe_eof(int fd) {
4248 struct pollfd pollfd = {
4250 .events = POLLIN|POLLHUP,
4255 r = poll(&pollfd, 1, 0);
4262 return pollfd.revents & POLLHUP;
/* Waits on a single pollfd with ppoll(): no timeout when t is
 * USEC_INFINITY, otherwise t converted by timespec_store(). Returns the
 * revents mask. The pollfd initialiser is not visible here. */
4265 int fd_wait_for_event(int fd, int event, usec_t t) {
4267 struct pollfd pollfd = {
4275 r = ppoll(&pollfd, 1, t == USEC_INFINITY ? NULL : timespec_store(&ts, t), NULL);
4282 return pollfd.revents;
/* Creates a temporary file derived from path: the name template comes from
 * tempfn_xxxxxx(), the file is created with mkostemp_safe(O_WRONLY|
 * O_CLOEXEC) and wrapped into a stdio stream with fdopen(fd, "we").
 * NOTE(review): how the stream and name reach *_f and *_temp_path is not
 * visible here. */
4285 int fopen_temporary(const char *path, FILE **_f, char **_temp_path) {
4294 r = tempfn_xxxxxx(path, &t);
4298 fd = mkostemp_safe(t, O_WRONLY|O_CLOEXEC);
4304 f = fdopen(fd, "we");
/* Issues the TIOCVHANGUP ioctl on fd. */
4317 int terminal_vhangup_fd(int fd) {
4320 if (ioctl(fd, TIOCVHANGUP) < 0)
/* Opens the terminal `name` with open_terminal() and applies
 * terminal_vhangup_fd() to it; the descriptor is closed automatically on
 * return (_cleanup_close_). */
4326 int terminal_vhangup(const char *name) {
4327 _cleanup_close_ int fd;
4329 fd = open_terminal(name, O_RDWR|O_NOCTTY|O_CLOEXEC);
4333 return terminal_vhangup_fd(fd);
/* Releases the terminal `name`, which must start with "/dev/". Terminals
 * that are not virtual consoles are only cleared with escape sequences.
 * For "/dev/ttyN" the number is parsed with safe_atou(name+8) and
 * VT_DISALLOCATE is issued on /dev/tty0; on the remaining path the
 * terminal itself is opened and cleared including scrollback ("\033[3J"). */
4336 int vt_disallocate(const char *name) {
4340 /* Deallocate the VT if possible. If not possible
4341 * (i.e. because it is the active one), at least clear it
4342 * entirely (including the scrollback buffer) */
4344 if (!startswith(name, "/dev/"))
4347 if (!tty_is_vc(name)) {
4348 /* So this is not a VT. I guess we cannot deallocate
4349 * it then. But let's at least clear the screen */
4351 fd = open_terminal(name, O_RDWR|O_NOCTTY|O_CLOEXEC);
4356 "\033[r" /* clear scrolling region */
4357 "\033[H" /* move home */
4358 "\033[2J", /* clear screen */
4365 if (!startswith(name, "/dev/tty"))
4368 r = safe_atou(name+8, &u);
4375 /* Try to deallocate */
4376 fd = open_terminal("/dev/tty0", O_RDWR|O_NOCTTY|O_CLOEXEC);
4380 r = ioctl(fd, VT_DISALLOCATE, u);
4389 /* Couldn't deallocate, so let's clear it fully with
4391 fd = open_terminal(name, O_RDWR|O_NOCTTY|O_CLOEXEC);
4396 "\033[r" /* clear scrolling region */
4397 "\033[H" /* move home */
4398 "\033[3J", /* clear screen including scrollback, requires Linux 2.6.40 */
/* Creates the symlink under a temporary name obtained from
 * tempfn_random(to) and then rename()s it onto `to`. Cleanup after a
 * failed rename() is not visible here. */
4405 int symlink_atomic(const char *from, const char *to) {
4406 _cleanup_free_ char *t = NULL;
4412 r = tempfn_random(to, &t);
4416 if (symlink(from, t) < 0)
4419 if (rename(t, to) < 0) {
/* Creates the device node under a temporary name obtained from
 * tempfn_random(path) and then rename()s it onto path. Cleanup after a
 * failed rename() is not visible here. */
4427 int mknod_atomic(const char *path, mode_t mode, dev_t dev) {
4428 _cleanup_free_ char *t = NULL;
4433 r = tempfn_random(path, &t);
4437 if (mknod(t, mode, dev) < 0)
4440 if (rename(t, path) < 0) {
/* Creates the FIFO under a temporary name obtained from
 * tempfn_random(path) and then rename()s it onto path. Cleanup after a
 * failed rename() is not visible here. */
4448 int mkfifo_atomic(const char *path, mode_t mode) {
4449 _cleanup_free_ char *t = NULL;
4454 r = tempfn_random(path, &t);
4458 if (mkfifo(t, mode) < 0)
4461 if (rename(t, path) < 0) {
/* Tests whether a display string starts with ':' followed by a character
 * that is at least '0'; the upper bound of that range is not visible
 * here. */
4469 bool display_is_local(const char *display) {
4473 display[0] == ':' &&
4474 display[1] >= '0' &&
/* For a display accepted by display_is_local(), builds the string
 * "/tmp/.X11-unix/X" followed by the run of decimal digits after the
 * leading ':'.
 * NOTE(review): termination of the buffer and the hand-over through *path
 * are not visible here. */
4478 int socket_from_display(const char *display, char **path) {
4485 if (!display_is_local(display))
4488 k = strspn(display+1, "0123456789");
4490 f = new(char, strlen("/tmp/.X11-unix/X") + k + 1);
4494 c = stpcpy(f, "/tmp/.X11-unix/X");
4495 memcpy(c, display+1, k);
/* NOTE(review): the line carrying this function's name is not visible in
 * this view. Visible behaviour: *username is resolved to credentials.
 * "root" and "0" are special-cased so that no NSS lookup is needed. If
 * *username parses as a numeric uid, it is replaced by the pw_name of the
 * passwd entry; otherwise the entry is looked up with getpwnam(). A failed
 * lookup yields -errno, or -ESRCH when errno is not set. *shell receives
 * pw_shell. */
4504 const char **username,
4505 uid_t *uid, gid_t *gid,
4507 const char **shell) {
4515 /* We enforce some special rules for uid=0: in order to avoid
4516 * NSS lookups for root we hardcode its data. */
4518 if (streq(*username, "root") || streq(*username, "0")) {
4536 if (parse_uid(*username, &u) >= 0) {
4540 /* If there are multiple users with the same id, make
4541 * sure to leave $USER to the configured value instead
4542 * of the first occurrence in the database. However if
4543 * the uid was configured by a numeric uid, then let's
4544 * pick the real username from /etc/passwd. */
4546 *username = p->pw_name;
4549 p = getpwnam(*username);
4553 return errno > 0 ? -errno : -ESRCH;
4565 *shell = p->pw_shell;
/* Returns a newly allocated name for uid: a "root" shortcut, the pw_name
 * of a passwd entry, or the number formatted with UID_FMT. The conditions
 * selecting between these are not visible here. */
4570 char* uid_to_name(uid_t uid) {
4575 return strdup("root");
4579 return strdup(p->pw_name);
4581 if (asprintf(&r, UID_FMT, uid) < 0)
/* Returns a newly allocated name for gid: a "root" shortcut, the gr_name
 * of a group entry, or the number formatted with GID_FMT. The conditions
 * selecting between these are not visible here. */
4587 char* gid_to_name(gid_t gid) {
4592 return strdup("root");
4596 return strdup(p->gr_name);
4598 if (asprintf(&r, GID_FMT, gid) < 0)
/* Resolves *groupname to a gid. "root" and "0" are special-cased (the name
 * is normalised to "root") so that no NSS lookup is needed. If *groupname
 * parses as a numeric gid, it is replaced by the gr_name of the group
 * entry; otherwise the entry is looked up with getgrnam(). A failed lookup
 * yields -errno, or -ESRCH when errno is not set. */
4604 int get_group_creds(const char **groupname, gid_t *gid) {
4610 /* We enforce some special rules for gid=0: in order to avoid
4611 * NSS lookups for root we hardcode its data. */
4613 if (streq(*groupname, "root") || streq(*groupname, "0")) {
4614 *groupname = "root";
4622 if (parse_gid(*groupname, &id) >= 0) {
4627 *groupname = g->gr_name;
4630 g = getgrnam(*groupname);
4634 return errno > 0 ? -errno : -ESRCH;
/* Checks whether gid matches the real gid, the effective gid, or one of
 * the supplementary groups returned by getgroups(). The group array is
 * taken from the stack (alloca) and sized by sysconf(_SC_NGROUPS_MAX),
 * which is asserted to be positive. */
4642 int in_gid(gid_t gid) {
4644 int ngroups_max, r, i;
4646 if (getgid() == gid)
4649 if (getegid() == gid)
4652 ngroups_max = sysconf(_SC_NGROUPS_MAX);
4653 assert(ngroups_max > 0);
4655 gids = alloca(sizeof(gid_t) * ngroups_max);
4657 r = getgroups(ngroups_max, gids);
4661 for (i = 0; i < r; i++)
/* Resolves the group name to a gid with get_group_creds().
 * NOTE(review): the membership test on that gid is not visible here. */
4668 int in_group(const char *name) {
4672 r = get_group_creds(&name, &gid);
/* Runs glob(path, GLOB_NOSORT|GLOB_BRACE). GLOB_NOMATCH and GLOB_NOSPACE
 * are distinguished; otherwise the result says whether any path matched,
 * or is -errno (-EIO when errno is 0). The glob_t is released
 * automatically (_cleanup_globfree_). */
4679 int glob_exists(const char *path) {
4680 _cleanup_globfree_ glob_t g = {};
4686 k = glob(path, GLOB_NOSORT|GLOB_BRACE, NULL, &g);
4688 if (k == GLOB_NOMATCH)
4690 else if (k == GLOB_NOSPACE)
4693 return !strv_isempty(g.gl_pathv);
4695 return errno ? -errno : -EIO;
/* Runs glob(path, GLOB_NOSORT|GLOB_BRACE) and appends every match to *strv
 * with strv_extend(). GLOB_NOMATCH and GLOB_NOSPACE are distinguished; any
 * other failure or an empty result yields -errno (-EIO when errno is 0). */
4698 int glob_extend(char ***strv, const char *path) {
4699 _cleanup_globfree_ glob_t g = {};
4704 k = glob(path, GLOB_NOSORT|GLOB_BRACE, NULL, &g);
4706 if (k == GLOB_NOMATCH)
4708 else if (k == GLOB_NOSPACE)
4710 else if (k != 0 || strv_isempty(g.gl_pathv))
4711 return errno ? -errno : -EIO;
4713 STRV_FOREACH(p, g.gl_pathv) {
4714 k = strv_extend(strv, *p);
/* When de->d_type is DT_UNKNOWN, determines the type with fstatat() on the
 * directory's descriptor (AT_SYMLINK_NOFOLLOW, so symlinks are reported as
 * such) and maps the st_mode file type to the matching DT_* constant. */
4722 int dirent_ensure_type(DIR *d, struct dirent *de) {
4728 if (de->d_type != DT_UNKNOWN)
4731 if (fstatat(dirfd(d), de->d_name, &st, AT_SYMLINK_NOFOLLOW) < 0)
4735 S_ISREG(st.st_mode) ? DT_REG :
4736 S_ISDIR(st.st_mode) ? DT_DIR :
4737 S_ISLNK(st.st_mode) ? DT_LNK :
4738 S_ISFIFO(st.st_mode) ? DT_FIFO :
4739 S_ISSOCK(st.st_mode) ? DT_SOCK :
4740 S_ISCHR(st.st_mode) ? DT_CHR :
4741 S_ISBLK(st.st_mode) ? DT_BLK :
/* Enumerates the files in the directory at path. Each entry's type is
 * resolved with dirent_ensure_type() and filtered by dirent_is_file();
 * accepted names are strdup()ed into the growing array l (GREEDY_REALLOC
 * keeps room for a terminating NULL). On hand-over to the caller l is set
 * to NULL so the cleanup handler does not free it. */
4747 int get_files_in_directory(const char *path, char ***list) {
4748 _cleanup_closedir_ DIR *d = NULL;
4749 size_t bufsize = 0, n = 0;
4750 _cleanup_strv_free_ char **l = NULL;
4754 /* Returns all files in a directory in *list, and the number
4755 * of files as return value. If list is NULL returns only the
4767 if (!de && errno != 0)
4772 dirent_ensure_type(d, de);
4774 if (!dirent_is_file(de))
4778 /* one extra slot is needed for the terminating NULL */
4779 if (!GREEDY_REALLOC(l, bufsize, n + 2))
4782 l[n] = strdup(de->d_name);
4793 l = NULL; /* avoid freeing */
/* Variadic string concatenation starting with x. The argument list is
 * read with va_arg() in two places, and the running length n is checked
 * against size_t overflow before l is added.
 * NOTE(review): allocation and copying are not visible here. */
4799 char *strjoin(const char *x, ...) {
4813 t = va_arg(ap, const char *);
4818 if (n > ((size_t) -1) - l) {
4842 t = va_arg(ap, const char *);
/* Caches per thread whether getpid() equals gettid(): 0 means not yet
 * computed, 1 means equal, -1 means different. The return statement is not
 * visible here. */
4856 bool is_main_thread(void) {
4857 static thread_local int cached = 0;
4859 if (_unlikely_(cached == 0))
4860 cached = getpid() == gettid() ? 1 : -1;
/* Finds the whole-disk device for block device d through sysfs. First
 * /sys/dev/block/<maj>:<min>/queue is probed; then .../partition; for a
 * partition the parent's "maj:min" is read from .../../dev and parsed with
 * sscanf(). The parent is only accepted if it has a queue directory too,
 * in which case makedev(m, n) is stored in *ret. */
4865 int block_get_whole_disk(dev_t d, dev_t *ret) {
4872 /* If it has a queue this is good enough for us */
4873 if (asprintf(&p, "/sys/dev/block/%u:%u/queue", major(d), minor(d)) < 0)
4876 r = access(p, F_OK);
4884 /* If it is a partition find the originating device */
4885 if (asprintf(&p, "/sys/dev/block/%u:%u/partition", major(d), minor(d)) < 0)
4888 r = access(p, F_OK);
4894 /* Get parent dev_t */
4895 if (asprintf(&p, "/sys/dev/block/%u:%u/../dev", major(d), minor(d)) < 0)
4898 r = read_one_line_file(p, &s);
4904 r = sscanf(s, "%u:%u", &m, &n);
4910 /* Only return this if it is really good enough for us. */
4911 if (asprintf(&p, "/sys/dev/block/%u:%u/queue", m, n) < 0)
4914 r = access(p, F_OK);
4918 *ret = makedev(m, n);
/* Names of the IOPRIO_CLASS_* constants, indexed by the constant. The
 * macro invocation below generates the lookup helpers for "ioprio_class"
 * (the macro is defined elsewhere). */
4925 static const char *const ioprio_class_table[] = {
4926 [IOPRIO_CLASS_NONE] = "none",
4927 [IOPRIO_CLASS_RT] = "realtime",
4928 [IOPRIO_CLASS_BE] = "best-effort",
4929 [IOPRIO_CLASS_IDLE] = "idle"
4932 DEFINE_STRING_TABLE_LOOKUP_WITH_FALLBACK(ioprio_class, int, INT_MAX);
/* Names of the CLD_* si_code values reported with SIGCHLD, indexed by the
 * constant; lookup helpers are generated by the macro invocation below. */
4934 static const char *const sigchld_code_table[] = {
4935 [CLD_EXITED] = "exited",
4936 [CLD_KILLED] = "killed",
4937 [CLD_DUMPED] = "dumped",
4938 [CLD_TRAPPED] = "trapped",
4939 [CLD_STOPPED] = "stopped",
4940 [CLD_CONTINUED] = "continued",
4943 DEFINE_STRING_TABLE_LOOKUP(sigchld_code, int);
/* Names of the syslog facilities, indexed by the unshifted facility number
 * LOG_FAC(facility); the table has LOG_NFACILITIES slots. Lookup helpers
 * are generated by the macro invocation below. */
4945 static const char *const log_facility_unshifted_table[LOG_NFACILITIES] = {
4946 [LOG_FAC(LOG_KERN)] = "kern",
4947 [LOG_FAC(LOG_USER)] = "user",
4948 [LOG_FAC(LOG_MAIL)] = "mail",
4949 [LOG_FAC(LOG_DAEMON)] = "daemon",
4950 [LOG_FAC(LOG_AUTH)] = "auth",
4951 [LOG_FAC(LOG_SYSLOG)] = "syslog",
4952 [LOG_FAC(LOG_LPR)] = "lpr",
4953 [LOG_FAC(LOG_NEWS)] = "news",
4954 [LOG_FAC(LOG_UUCP)] = "uucp",
4955 [LOG_FAC(LOG_CRON)] = "cron",
4956 [LOG_FAC(LOG_AUTHPRIV)] = "authpriv",
4957 [LOG_FAC(LOG_FTP)] = "ftp",
4958 [LOG_FAC(LOG_LOCAL0)] = "local0",
4959 [LOG_FAC(LOG_LOCAL1)] = "local1",
4960 [LOG_FAC(LOG_LOCAL2)] = "local2",
4961 [LOG_FAC(LOG_LOCAL3)] = "local3",
4962 [LOG_FAC(LOG_LOCAL4)] = "local4",
4963 [LOG_FAC(LOG_LOCAL5)] = "local5",
4964 [LOG_FAC(LOG_LOCAL6)] = "local6",
4965 [LOG_FAC(LOG_LOCAL7)] = "local7"
4968 DEFINE_STRING_TABLE_LOOKUP_WITH_FALLBACK(log_facility_unshifted, int, LOG_FAC(~0));
/* Names of the syslog priority levels, indexed by the LOG_* constant;
 * lookup helpers are generated by the macro invocation below.
 * NOTE(review): no entry between LOG_CRIT and LOG_WARNING is visible in
 * this view -- confirm that none is missing. */
4970 static const char *const log_level_table[] = {
4971 [LOG_EMERG] = "emerg",
4972 [LOG_ALERT] = "alert",
4973 [LOG_CRIT] = "crit",
4975 [LOG_WARNING] = "warning",
4976 [LOG_NOTICE] = "notice",
4977 [LOG_INFO] = "info",
4978 [LOG_DEBUG] = "debug"
4981 DEFINE_STRING_TABLE_LOOKUP_WITH_FALLBACK(log_level, int, LOG_DEBUG);
/* Names of the SCHED_* scheduling policies, indexed by the constant;
 * lookup helpers are generated by the macro invocation below. Further
 * entries may follow "fifo" but are not visible here. */
4983 static const char* const sched_policy_table[] = {
4984 [SCHED_OTHER] = "other",
4985 [SCHED_BATCH] = "batch",
4986 [SCHED_IDLE] = "idle",
4987 [SCHED_FIFO] = "fifo",
4991 DEFINE_STRING_TABLE_LOOKUP_WITH_FALLBACK(sched_policy, int, INT_MAX);
/* Maps each RLIMIT_* resource to a "Limit..." name; the table has
 * _RLIMIT_MAX slots. Lookup helpers are generated by the macro invocation
 * below. */
4993 static const char* const rlimit_table[_RLIMIT_MAX] = {
4994 [RLIMIT_CPU] = "LimitCPU",
4995 [RLIMIT_FSIZE] = "LimitFSIZE",
4996 [RLIMIT_DATA] = "LimitDATA",
4997 [RLIMIT_STACK] = "LimitSTACK",
4998 [RLIMIT_CORE] = "LimitCORE",
4999 [RLIMIT_RSS] = "LimitRSS",
5000 [RLIMIT_NOFILE] = "LimitNOFILE",
5001 [RLIMIT_AS] = "LimitAS",
5002 [RLIMIT_NPROC] = "LimitNPROC",
5003 [RLIMIT_MEMLOCK] = "LimitMEMLOCK",
5004 [RLIMIT_LOCKS] = "LimitLOCKS",
5005 [RLIMIT_SIGPENDING] = "LimitSIGPENDING",
5006 [RLIMIT_MSGQUEUE] = "LimitMSGQUEUE",
5007 [RLIMIT_NICE] = "LimitNICE",
5008 [RLIMIT_RTPRIO] = "LimitRTPRIO",
5009 [RLIMIT_RTTIME] = "LimitRTTIME"
5012 DEFINE_STRING_TABLE_LOOKUP(rlimit, int);
5014 static const char* const ip_tos_table[] = {
5015 [IPTOS_LOWDELAY] = "low-delay",
5016 [IPTOS_THROUGHPUT] = "throughput",
5017 [IPTOS_RELIABILITY] = "reliability",
5018 [IPTOS_LOWCOST] = "low-cost",
5021 DEFINE_STRING_TABLE_LOOKUP_WITH_FALLBACK(ip_tos, int, 0xff);
5023 static const char *const __signal_table[] = {
5040 [SIGSTKFLT] = "STKFLT", /* Linux on SPARC doesn't know SIGSTKFLT */
5051 [SIGVTALRM] = "VTALRM",
5053 [SIGWINCH] = "WINCH",
5059 DEFINE_PRIVATE_STRING_TABLE_LOOKUP(__signal, int);
5061 const char *signal_to_string(int signo) {
5062 static thread_local char buf[sizeof("RTMIN+")-1 + DECIMAL_STR_MAX(int) + 1];
5065 name = __signal_to_string(signo);
5069 if (signo >= SIGRTMIN && signo <= SIGRTMAX)
5070 snprintf(buf, sizeof(buf), "RTMIN+%d", signo - SIGRTMIN);
5072 snprintf(buf, sizeof(buf), "%d", signo);
5077 int signal_from_string(const char *s) {
5082 signo = __signal_from_string(s);
5086 if (startswith(s, "RTMIN+")) {
5090 if (safe_atou(s, &u) >= 0) {
5091 signo = (int) u + offset;
5092 if (signo > 0 && signo < _NSIG)
5098 bool kexec_loaded(void) {
5099 bool loaded = false;
5102 if (read_one_line_file("/sys/kernel/kexec_loaded", &s) >= 0) {
5110 int prot_from_flags(int flags) {
5112 switch (flags & O_ACCMODE) {
5121 return PROT_READ|PROT_WRITE;
/* Formats the byte count t into buf (which is l bytes large) as a
 * human-readable string: values of 1024 and above are shown in the
 * largest fitting binary unit with one fractional digit (e.g. "1.5K"),
 * smaller values as plain bytes with a "B" suffix. Returns buf, or NULL
 * if t is (off_t) -1. */
char *format_bytes(char *buf, size_t l, off_t t) {
        size_t i;

        static const struct {
                const char *suffix;
                off_t factor;
        } table[] = {
                { "E", 1024ULL*1024ULL*1024ULL*1024ULL*1024ULL*1024ULL },
                { "P", 1024ULL*1024ULL*1024ULL*1024ULL*1024ULL },
                { "T", 1024ULL*1024ULL*1024ULL*1024ULL },
                { "G", 1024ULL*1024ULL*1024ULL },
                { "M", 1024ULL*1024ULL },
                { "K", 1024ULL },
        };

        if (t == (off_t) -1)
                return NULL;

        for (i = 0; i < sizeof(table) / sizeof(table[0]); i++) {

                if (t >= table[i].factor) {
                        /* Derive the fractional digit from the
                         * remainder only: multiplying all of t by 10
                         * wraps around for values beyond ~1.6E and
                         * then yields a wrong digit. */
                        snprintf(buf, l,
                                 "%llu.%llu%s",
                                 (unsigned long long) (t / table[i].factor),
                                 (unsigned long long) (t % table[i].factor) * 10ULL / (unsigned long long) table[i].factor,
                                 table[i].suffix);

                        goto finish;
                }
        }

        snprintf(buf, l, "%lluB", (unsigned long long) t);

finish:
        /* Never write in front of a zero-sized buffer */
        if (l > 0)
                buf[l-1] = 0;

        return buf;
}
5167 void* memdup(const void *p, size_t l) {
5180 int fd_inc_sndbuf(int fd, size_t n) {
5182 socklen_t l = sizeof(value);
5184 r = getsockopt(fd, SOL_SOCKET, SO_SNDBUF, &value, &l);
5185 if (r >= 0 && l == sizeof(value) && (size_t) value >= n*2)
5188 /* If we have the privileges we will ignore the kernel limit. */
5191 if (setsockopt(fd, SOL_SOCKET, SO_SNDBUFFORCE, &value, sizeof(value)) < 0)
5192 if (setsockopt(fd, SOL_SOCKET, SO_SNDBUF, &value, sizeof(value)) < 0)
5198 int fd_inc_rcvbuf(int fd, size_t n) {
5200 socklen_t l = sizeof(value);
5202 r = getsockopt(fd, SOL_SOCKET, SO_RCVBUF, &value, &l);
5203 if (r >= 0 && l == sizeof(value) && (size_t) value >= n*2)
5206 /* If we have the privileges we will ignore the kernel limit. */
5209 if (setsockopt(fd, SOL_SOCKET, SO_RCVBUFFORCE, &value, sizeof(value)) < 0)
5210 if (setsockopt(fd, SOL_SOCKET, SO_RCVBUF, &value, sizeof(value)) < 0)
5215 int fork_agent(pid_t *pid, const int except[], unsigned n_except, const char *path, ...) {
5216 bool stdout_is_tty, stderr_is_tty;
5217 pid_t parent_pid, agent_pid;
5218 sigset_t ss, saved_ss;
5226 /* Spawns a temporary TTY agent, making sure it goes away when
5229 parent_pid = getpid();
5231 /* First we temporarily block all signals, so that the new
5232 * child has them blocked initially. This way, we can be sure
5233 * that SIGTERMs we might send to the agent are not lost. */
5234 assert_se(sigfillset(&ss) >= 0);
5235 assert_se(sigprocmask(SIG_SETMASK, &ss, &saved_ss) >= 0);
5238 if (agent_pid < 0) {
5239 assert_se(sigprocmask(SIG_SETMASK, &saved_ss, NULL) >= 0);
5243 if (agent_pid != 0) {
5244 assert_se(sigprocmask(SIG_SETMASK, &saved_ss, NULL) >= 0);
5251 * Make sure the agent goes away when the parent dies */
5252 if (prctl(PR_SET_PDEATHSIG, SIGTERM) < 0)
5253 _exit(EXIT_FAILURE);
5255 /* Make sure we actually can kill the agent, if we need to, in
5256 * case somebody invoked us from a shell script that trapped
5257 * SIGTERM or so... */
5258 reset_all_signal_handlers();
5259 reset_signal_mask();
5261 /* Check whether our parent died before we were able
5262 * to set the death signal and unblock the signals */
5263 if (getppid() != parent_pid)
5264 _exit(EXIT_SUCCESS);
5266 /* Don't leak fds to the agent */
5267 close_all_fds(except, n_except);
5269 stdout_is_tty = isatty(STDOUT_FILENO);
5270 stderr_is_tty = isatty(STDERR_FILENO);
5272 if (!stdout_is_tty || !stderr_is_tty) {
5275 /* Detach from stdout/stderr. and reopen
5276 * /dev/tty for them. This is important to
5277 * ensure that when systemctl is started via
5278 * popen() or a similar call that expects to
5279 * read EOF we actually do generate EOF and
5280 * not delay this indefinitely because we
5281 * keep an unused copy of stdin around. */
5282 fd = open("/dev/tty", O_WRONLY);
5284 log_error_errno(errno, "Failed to open /dev/tty: %m");
5285 _exit(EXIT_FAILURE);
5289 dup2(fd, STDOUT_FILENO);
5292 dup2(fd, STDERR_FILENO);
5298 /* Count arguments */
5300 for (n = 0; va_arg(ap, char*); n++)
5305 l = alloca(sizeof(char *) * (n + 1));
5307 /* Fill in arguments */
5309 for (i = 0; i <= n; i++)
5310 l[i] = va_arg(ap, char*);
5314 _exit(EXIT_FAILURE);
5317 int setrlimit_closest(int resource, const struct rlimit *rlim) {
5318 struct rlimit highest, fixed;
5322 if (setrlimit(resource, rlim) >= 0)
5328 /* So we failed to set the desired setrlimit, then let's try
5329 * to get as close as we can */
5330 assert_se(getrlimit(resource, &highest) == 0);
5332 fixed.rlim_cur = MIN(rlim->rlim_cur, highest.rlim_max);
5333 fixed.rlim_max = MIN(rlim->rlim_max, highest.rlim_max);
5335 if (setrlimit(resource, &fixed) < 0)
5341 int getenv_for_pid(pid_t pid, const char *field, char **_value) {
5342 _cleanup_fclose_ FILE *f = NULL;
5353 path = procfs_file_alloca(pid, "environ");
5355 f = fopen(path, "re");
5363 char line[LINE_MAX];
5366 for (i = 0; i < sizeof(line)-1; i++) {
5370 if (_unlikely_(c == EOF)) {
5380 if (memcmp(line, field, l) == 0 && line[l] == '=') {
5381 value = strdup(line + l + 1);
5395 bool http_etag_is_valid(const char *etag) {
5399 if (!endswith(etag, "\""))
5402 if (!startswith(etag, "\"") && !startswith(etag, "W/\""))
5408 bool http_url_is_valid(const char *url) {
5414 p = startswith(url, "http://");
5416 p = startswith(url, "https://");
5423 return ascii_is_valid(p);
5426 bool documentation_url_is_valid(const char *url) {
5432 if (http_url_is_valid(url))
5435 p = startswith(url, "file:/");
5437 p = startswith(url, "info:");
5439 p = startswith(url, "man:");
5444 return ascii_is_valid(p);
5447 bool in_initrd(void) {
5448 static int saved = -1;
5454 /* We make two checks here:
5456 * 1. the flag file /etc/initrd-release must exist
5457 * 2. the root file system must be a memory file system
5459 * The second check is extra paranoia, since misdetecting an
5460 * initrd can have bad consequences due to the initrd
5461 * being emptied when transitioning to the main systemd.
5464 saved = access("/etc/initrd-release", F_OK) >= 0 &&
5465 statfs("/", &s) >= 0 &&
5466 is_temporary_fs(&s);
5471 void warn_melody(void) {
5472 _cleanup_close_ int fd = -1;
5474 fd = open("/dev/console", O_WRONLY|O_CLOEXEC|O_NOCTTY);
5478 /* Yeah, this is synchronous. Kinda sucks. But well... */
5480 ioctl(fd, KIOCSOUND, (int)(1193180/440));
5481 usleep(125*USEC_PER_MSEC);
5483 ioctl(fd, KIOCSOUND, (int)(1193180/220));
5484 usleep(125*USEC_PER_MSEC);
5486 ioctl(fd, KIOCSOUND, (int)(1193180/220));
5487 usleep(125*USEC_PER_MSEC);
5489 ioctl(fd, KIOCSOUND, 0);
5492 int make_console_stdio(void) {
5495 /* Make /dev/console the controlling terminal and stdin/stdout/stderr */
5497 fd = acquire_terminal("/dev/console", false, true, true, USEC_INFINITY);
5499 return log_error_errno(fd, "Failed to acquire terminal: %m");
5503 return log_error_errno(r, "Failed to duplicate terminal fd: %m");
5508 int get_home_dir(char **_h) {
5516 /* Take the user specified one */
5517 e = secure_getenv("HOME");
5518 if (e && path_is_absolute(e)) {
5527 /* Hardcode home directory for root to avoid NSS */
5530 h = strdup("/root");
5538 /* Check the database... */
5542 return errno > 0 ? -errno : -ESRCH;
5544 if (!path_is_absolute(p->pw_dir))
5547 h = strdup(p->pw_dir);
5555 int get_shell(char **_s) {
5563 /* Take the user specified one */
5564 e = getenv("SHELL");
5574 /* Hardcode shell for root to avoid NSS */
5577 s = strdup("/bin/sh");
5585 /* Check the database... */
5589 return errno > 0 ? -errno : -ESRCH;
5591 if (!path_is_absolute(p->pw_shell))
5594 s = strdup(p->pw_shell);
5602 bool filename_is_valid(const char *p) {
5616 if (strlen(p) > FILENAME_MAX)
/* Returns true if p is non-NULL and contains neither ASCII control
 * characters (anything below space, or DEL) nor a backslash, double
 * quote or single quote. */
bool string_is_safe(const char *p) {
        const char *t;

        if (!p)
                return false;

        for (t = p; *t; t++) {
                if (*t > 0 && *t < ' ')
                        return false;

                /* The last entry must be spelled "\x7f" (DEL). The
                 * earlier spelling "\0x7f" embedded a NUL byte that
                 * ended the set early, so DEL was never rejected. */
                if (strchr("\\\"\'\x7f", *t))
                        return false;
        }

        return true;
}
5640 * Check if a string contains control characters. If 'ok' is non-NULL
5641 * it may be a string containing additional CCs to be considered OK.
5643 bool string_has_cc(const char *p, const char *ok) {
5648 for (t = p; *t; t++) {
5649 if (ok && strchr(ok, *t))
5652 if (*t > 0 && *t < ' ')
5662 bool path_is_safe(const char *p) {
5667 if (streq(p, "..") || startswith(p, "../") || endswith(p, "/..") || strstr(p, "/../"))
5670 if (strlen(p) > PATH_MAX)
5673 /* The following two checks are not really dangerous, but hey, they still are confusing */
5674 if (streq(p, ".") || startswith(p, "./") || endswith(p, "/.") || strstr(p, "/./"))
5677 if (strstr(p, "//"))
5683 /* hey glibc, APIs with callbacks without a user pointer are so useless */
5684 void *xbsearch_r(const void *key, const void *base, size_t nmemb, size_t size,
5685 int (*compar) (const void *, const void *, void *), void *arg) {
5694 p = (void *)(((const char *) base) + (idx * size));
5695 comparison = compar(key, p, arg);
5698 else if (comparison > 0)
5706 void init_gettext(void) {
5707 setlocale(LC_ALL, "");
5708 textdomain(GETTEXT_PACKAGE);
5711 bool is_locale_utf8(void) {
5713 static int cached_answer = -1;
5715 if (cached_answer >= 0)
5718 if (!setlocale(LC_ALL, "")) {
5719 cached_answer = true;
5723 set = nl_langinfo(CODESET);
5725 cached_answer = true;
5729 if (streq(set, "UTF-8")) {
5730 cached_answer = true;
5734 /* For LC_CTYPE=="C" return true, because CTYPE is effectively
5735 * unset and everything can do UTF-8 nowadays. */
5736 set = setlocale(LC_CTYPE, NULL);
5738 cached_answer = true;
5742 /* Check result, but ignore the result if C was set
5746 !getenv("LC_ALL") &&
5747 !getenv("LC_CTYPE") &&
5751 return (bool) cached_answer;
5754 const char *draw_special_char(DrawSpecialChar ch) {
5755 static const char *draw_table[2][_DRAW_SPECIAL_CHAR_MAX] = {
5758 [DRAW_TREE_VERTICAL] = "\342\224\202 ", /* │ */
5759 [DRAW_TREE_BRANCH] = "\342\224\234\342\224\200", /* ├─ */
5760 [DRAW_TREE_RIGHT] = "\342\224\224\342\224\200", /* └─ */
5761 [DRAW_TREE_SPACE] = " ", /* */
5762 [DRAW_TRIANGULAR_BULLET] = "\342\200\243", /* ‣ */
5763 [DRAW_BLACK_CIRCLE] = "\342\227\217", /* ● */
5764 [DRAW_ARROW] = "\342\206\222", /* → */
5765 [DRAW_DASH] = "\342\200\223", /* – */
5768 /* ASCII fallback */ {
5769 [DRAW_TREE_VERTICAL] = "| ",
5770 [DRAW_TREE_BRANCH] = "|-",
5771 [DRAW_TREE_RIGHT] = "`-",
5772 [DRAW_TREE_SPACE] = " ",
5773 [DRAW_TRIANGULAR_BULLET] = ">",
5774 [DRAW_BLACK_CIRCLE] = "*",
5775 [DRAW_ARROW] = "->",
5780 return draw_table[!is_locale_utf8()][ch];
5783 char *strreplace(const char *text, const char *old_string, const char *new_string) {
5786 size_t l, old_len, new_len;
5792 old_len = strlen(old_string);
5793 new_len = strlen(new_string);
5806 if (!startswith(f, old_string)) {
5812 nl = l - old_len + new_len;
5813 a = realloc(r, nl + 1);
5821 t = stpcpy(t, new_string);
5833 char *strip_tab_ansi(char **ibuf, size_t *_isz) {
5834 const char *i, *begin = NULL;
5839 } state = STATE_OTHER;
5841 size_t osz = 0, isz;
5847 /* Strips ANSI color and replaces TABs by 8 spaces */
5849 isz = _isz ? *_isz : strlen(*ibuf);
5851 f = open_memstream(&obuf, &osz);
5855 for (i = *ibuf; i < *ibuf + isz + 1; i++) {
5860 if (i >= *ibuf + isz) /* EOT */
5862 else if (*i == '\x1B')
5863 state = STATE_ESCAPE;
5864 else if (*i == '\t')
5871 if (i >= *ibuf + isz) { /* EOT */
5874 } else if (*i == '[') {
5875 state = STATE_BRACKET;
5880 state = STATE_OTHER;
5887 if (i >= *ibuf + isz || /* EOT */
5888 (!(*i >= '0' && *i <= '9') && *i != ';' && *i != 'm')) {
5891 state = STATE_OTHER;
5893 } else if (*i == 'm')
5894 state = STATE_OTHER;
5916 int on_ac_power(void) {
5917 bool found_offline = false, found_online = false;
5918 _cleanup_closedir_ DIR *d = NULL;
5920 d = opendir("/sys/class/power_supply");
5922 return errno == ENOENT ? true : -errno;
5926 _cleanup_close_ int fd = -1, device = -1;
5932 if (!de && errno != 0)
5938 if (hidden_file(de->d_name))
5941 device = openat(dirfd(d), de->d_name, O_DIRECTORY|O_RDONLY|O_CLOEXEC|O_NOCTTY);
5943 if (errno == ENOENT || errno == ENOTDIR)
5949 fd = openat(device, "type", O_RDONLY|O_CLOEXEC|O_NOCTTY);
5951 if (errno == ENOENT)
5957 n = read(fd, contents, sizeof(contents));
5961 if (n != 6 || memcmp(contents, "Mains\n", 6))
5965 fd = openat(device, "online", O_RDONLY|O_CLOEXEC|O_NOCTTY);
5967 if (errno == ENOENT)
5973 n = read(fd, contents, sizeof(contents));
5977 if (n != 2 || contents[1] != '\n')
5980 if (contents[0] == '1') {
5981 found_online = true;
5983 } else if (contents[0] == '0')
5984 found_offline = true;
5989 return found_online || !found_offline;
5992 static int search_and_fopen_internal(const char *path, const char *mode, const char *root, char **search, FILE **_f) {
5999 if (!path_strv_resolve_uniq(search, root))
6002 STRV_FOREACH(i, search) {
6003 _cleanup_free_ char *p = NULL;
6007 p = strjoin(root, *i, "/", path, NULL);
6009 p = strjoin(*i, "/", path, NULL);
6019 if (errno != ENOENT)
6026 int search_and_fopen(const char *path, const char *mode, const char *root, const char **search, FILE **_f) {
6027 _cleanup_strv_free_ char **copy = NULL;
6033 if (path_is_absolute(path)) {
6036 f = fopen(path, mode);
6045 copy = strv_copy((char**) search);
6049 return search_and_fopen_internal(path, mode, root, copy, _f);
6052 int search_and_fopen_nulstr(const char *path, const char *mode, const char *root, const char *search, FILE **_f) {
6053 _cleanup_strv_free_ char **s = NULL;
6055 if (path_is_absolute(path)) {
6058 f = fopen(path, mode);
6067 s = strv_split_nulstr(search);
6071 return search_and_fopen_internal(path, mode, root, s, _f);
6074 char *strextend(char **x, ...) {
6081 l = f = *x ? strlen(*x) : 0;
6088 t = va_arg(ap, const char *);
6093 if (n > ((size_t) -1) - l) {
6102 r = realloc(*x, l+1);
6112 t = va_arg(ap, const char *);
/* Returns a newly allocated string made of n concatenated copies of s;
 * the caller owns and frees it. Returns NULL if the allocation fails or
 * if the resulting length would not fit into a size_t. */
char *strrep(const char *s, unsigned n) {
        size_t l, i;
        char *r, *p;

        assert(s);

        l = strlen(s);

        /* Refuse early if l * n + 1 would wrap around, instead of
         * allocating a too small buffer and writing past its end */
        if (l > 0 && n > (((size_t) -1) - 1) / l)
                return NULL;

        p = r = malloc(l * n + 1);
        if (!r)
                return NULL;

        for (i = 0; i < n; i++) {
                memcpy(p, s, l);
                p += l;
        }

        *p = 0;
        return r;
}
/* Makes sure the array at *p has room for at least 'need' elements of
 * 'size' bytes each. If *allocated already covers 'need' the array is
 * returned untouched. Otherwise it is reallocated to twice the needed
 * element count (but at least 64 bytes worth of elements), and *p and
 * *allocated are updated. Returns the (possibly moved) array, or NULL
 * on allocation failure or arithmetic overflow, in which case *p and
 * *allocated are left as they were. */
void* greedy_realloc(void **p, size_t *allocated, size_t need, size_t size) {
        size_t newalloc, minalloc;
        void *q;

        assert(p);
        assert(allocated);

        if (*allocated >= need)
                return *p;

        /* Check for overflows before doing any arithmetic: comparing
         * two already wrapped products cannot detect them reliably.
         * A zero element size is refused rather than divided by. */
        if (size == 0 || need > ((size_t) -1) / 2)
                return NULL;

        newalloc = need * 2;

        /* Allocate at least 64 bytes worth of elements */
        minalloc = 64u / size;
        if (newalloc < minalloc)
                newalloc = minalloc;

        if (newalloc > ((size_t) -1) / size)
                return NULL;

        q = realloc(*p, newalloc * size);
        if (!q)
                return NULL;

        *p = q;
        *allocated = newalloc;
        return q;
}
6171 void* greedy_realloc0(void **p, size_t *allocated, size_t need, size_t size) {
6180 q = greedy_realloc(p, allocated, need, size);
6184 if (*allocated > prev)
6185 memzero(q + prev * size, (*allocated - prev) * size);
/* Returns true if c is a hexadecimal digit (0-9, a-f, A-F). */
static bool id128_is_hex_digit(char c) {
        return (c >= '0' && c <= '9') ||
               (c >= 'a' && c <= 'f') ||
               (c >= 'A' && c <= 'F');
}

/* Checks whether s is a validly formatted 128bit ID: either 32
 * hexadecimal digits, or the 36 character UUID layout with dashes at
 * offsets 8, 13, 18 and 23 and hexadecimal digits everywhere else. */
bool id128_is_valid(const char *s) {
        size_t i, l;

        l = strlen(s);
        if (l == 32) {

                /* Simple formatted 128bit hex string */

                for (i = 0; i < l; i++)
                        if (!id128_is_hex_digit(s[i]))
                                return false;

        } else if (l == 36) {

                /* Formatted UUID */

                for (i = 0; i < l; i++) {
                        char c = s[i];

                        if (i == 8 || i == 13 || i == 18 || i == 23) {
                                if (c != '-')
                                        return false;
                        } else if (!id128_is_hex_digit(c))
                                /* Only a-f/A-F are hex digits; the
                                 * rest of the alphabet is rejected */
                                return false;
                }

        } else
                return false;

        return true;
}
6231 int split_pair(const char *s, const char *sep, char **l, char **r) {
6246 a = strndup(s, x - s);
6250 b = strdup(x + strlen(sep));
6262 int shall_restore_state(void) {
6263 _cleanup_free_ char *value = NULL;
6266 r = get_proc_cmdline_key("systemd.restore_state=", &value);
6272 return parse_boolean(value) != 0;
6275 int proc_cmdline(char **ret) {
6278 if (detect_container(NULL) > 0)
6279 return get_process_cmdline(1, 0, false, ret);
6281 return read_one_line_file("/proc/cmdline", ret);
6284 int parse_proc_cmdline(int (*parse_item)(const char *key, const char *value)) {
6285 _cleanup_free_ char *line = NULL;
6291 r = proc_cmdline(&line);
6297 _cleanup_free_ char *word = NULL;
6300 r = unquote_first_word(&p, &word, UNQUOTE_RELAX);
6306 /* Filter out arguments that are intended only for the
6308 if (!in_initrd() && startswith(word, "rd."))
6311 value = strchr(word, '=');
6315 r = parse_item(word, value);
6323 int get_proc_cmdline_key(const char *key, char **value) {
6324 _cleanup_free_ char *line = NULL, *ret = NULL;
6331 r = proc_cmdline(&line);
6337 _cleanup_free_ char *word = NULL;
6340 r = unquote_first_word(&p, &word, UNQUOTE_RELAX);
6346 /* Filter out arguments that are intended only for the
6348 if (!in_initrd() && startswith(word, "rd."))
6352 e = startswith(word, key);
6356 r = free_and_strdup(&ret, e);
6362 if (streq(word, key))
6376 int container_get_leader(const char *machine, pid_t *pid) {
6377 _cleanup_free_ char *s = NULL, *class = NULL;
6385 p = strjoina("/run/systemd/machines/", machine);
6386 r = parse_env_file(p, NEWLINE, "LEADER", &s, "CLASS", &class, NULL);
6394 if (!streq_ptr(class, "container"))
6397 r = parse_pid(s, &leader);
6407 int namespace_open(pid_t pid, int *pidns_fd, int *mntns_fd, int *netns_fd, int *root_fd) {
6408 _cleanup_close_ int pidnsfd = -1, mntnsfd = -1, netnsfd = -1;
6416 mntns = procfs_file_alloca(pid, "ns/mnt");
6417 mntnsfd = open(mntns, O_RDONLY|O_NOCTTY|O_CLOEXEC);
6425 pidns = procfs_file_alloca(pid, "ns/pid");
6426 pidnsfd = open(pidns, O_RDONLY|O_NOCTTY|O_CLOEXEC);
6434 netns = procfs_file_alloca(pid, "ns/net");
6435 netnsfd = open(netns, O_RDONLY|O_NOCTTY|O_CLOEXEC);
6443 root = procfs_file_alloca(pid, "root");
6444 rfd = open(root, O_RDONLY|O_NOCTTY|O_CLOEXEC|O_DIRECTORY);
6450 *pidns_fd = pidnsfd;
6453 *mntns_fd = mntnsfd;
6456 *netns_fd = netnsfd;
6461 pidnsfd = mntnsfd = netnsfd = -1;
6466 int namespace_enter(int pidns_fd, int mntns_fd, int netns_fd, int root_fd) {
6469 if (setns(pidns_fd, CLONE_NEWPID) < 0)
6473 if (setns(mntns_fd, CLONE_NEWNS) < 0)
6477 if (setns(netns_fd, CLONE_NEWNET) < 0)
6481 if (fchdir(root_fd) < 0)
6484 if (chroot(".") < 0)
6488 if (setresgid(0, 0, 0) < 0)
6491 if (setgroups(0, NULL) < 0)
6494 if (setresuid(0, 0, 0) < 0)
6500 bool pid_is_unwaited(pid_t pid) {
6501 /* Checks whether a PID is still valid at all, including a zombie */
6506 if (kill(pid, 0) >= 0)
6509 return errno != ESRCH;
6512 bool pid_is_alive(pid_t pid) {
6515 /* Checks whether a PID is still valid and not a zombie */
6520 r = get_process_state(pid);
6521 if (r == -ENOENT || r == 'Z')
6527 int getpeercred(int fd, struct ucred *ucred) {
6528 socklen_t n = sizeof(struct ucred);
6535 r = getsockopt(fd, SOL_SOCKET, SO_PEERCRED, &u, &n);
6539 if (n != sizeof(struct ucred))
6542 /* Check if the data is actually useful and not suppressed due
6543 * to namespacing issues */
6546 if (u.uid == UID_INVALID)
6548 if (u.gid == GID_INVALID)
6555 int getpeersec(int fd, char **ret) {
6567 r = getsockopt(fd, SOL_SOCKET, SO_PEERSEC, s, &n);
6571 if (errno != ERANGE)
6578 r = getsockopt(fd, SOL_SOCKET, SO_PEERSEC, s, &n);
6594 /* This is much like mkostemp() but is subject to umask(). */
6595 int mkostemp_safe(char *pattern, int flags) {
6596 _cleanup_umask_ mode_t u;
6603 fd = mkostemp(pattern, flags);
6610 int open_tmpfile(const char *path, int flags) {
6617 /* Try O_TMPFILE first, if it is supported */
6618 fd = open(path, flags|O_TMPFILE, S_IRUSR|S_IWUSR);
6623 /* Fall back to unguessable name + unlinking */
6624 p = strjoina(path, "/systemd-tmp-XXXXXX");
6626 fd = mkostemp_safe(p, flags);
6634 int fd_warn_permissions(const char *path, int fd) {
6637 if (fstat(fd, &st) < 0)
6640 if (st.st_mode & 0111)
6641 log_warning("Configuration file %s is marked executable. Please remove executable permission bits. Proceeding anyway.", path);
6643 if (st.st_mode & 0002)
6644 log_warning("Configuration file %s is marked world-writable. Please remove world writability permission bits. Proceeding anyway.", path);
6646 if (getpid() == 1 && (st.st_mode & 0044) != 0044)
6647 log_warning("Configuration file %s is marked world-inaccessible. This has no effect as configuration data is accessible via APIs without restrictions. Proceeding anyway.", path);
6652 unsigned long personality_from_string(const char *p) {
6654 /* Parse a personality specifier. We introduce our own
6655 * identifiers that indicate specific ABIs, rather than just
6656 * hints regarding the register size, since we want to keep
6657 * things open for multiple locally supported ABIs for the
6658 * same register size. We try to reuse the ABI identifiers
6659 * used by libseccomp. */
6661 #if defined(__x86_64__)
6663 if (streq(p, "x86"))
6666 if (streq(p, "x86-64"))
6669 #elif defined(__i386__)
6671 if (streq(p, "x86"))
6675 /* personality(7) documents that 0xffffffffUL is used for
6676 * querying the current personality, hence let's use that here
6677 * as error indicator. */
6678 return 0xffffffffUL;
6681 const char* personality_to_string(unsigned long p) {
6683 #if defined(__x86_64__)
6685 if (p == PER_LINUX32)
6691 #elif defined(__i386__)
6700 uint64_t physical_memory(void) {
6703 /* We return this as uint64_t in case we are running as 32bit
6704 * process on a 64bit kernel with huge amounts of memory */
6706 mem = sysconf(_SC_PHYS_PAGES);
6709 return (uint64_t) mem * (uint64_t) page_size();
6712 void hexdump(FILE *f, const void *p, size_t s) {
6713 const uint8_t *b = p;
6716 assert(s == 0 || b);
6721 fprintf(f, "%04x ", n);
6723 for (i = 0; i < 16; i++) {
6728 fprintf(f, "%02x ", b[i]);
6736 for (i = 0; i < 16; i++) {
6741 fputc(isprint(b[i]) ? (char) b[i] : '.', f);
6755 int update_reboot_param_file(const char *param) {
6760 r = write_string_file(REBOOT_PARAM_FILE, param);
6762 log_error("Failed to write reboot param to "
6763 REBOOT_PARAM_FILE": %s", strerror(-r));
6765 unlink(REBOOT_PARAM_FILE);
6770 int umount_recursive(const char *prefix, int flags) {
6774 /* Try to umount everything recursively below a
6775 * directory. Also, take care of stacked mounts, and keep
6776 * unmounting them until they are gone. */
6779 _cleanup_fclose_ FILE *proc_self_mountinfo = NULL;
6784 proc_self_mountinfo = fopen("/proc/self/mountinfo", "re");
6785 if (!proc_self_mountinfo)
6789 _cleanup_free_ char *path = NULL, *p = NULL;
6792 k = fscanf(proc_self_mountinfo,
6793 "%*s " /* (1) mount id */
6794 "%*s " /* (2) parent id */
6795 "%*s " /* (3) major:minor */
6796 "%*s " /* (4) root */
6797 "%ms " /* (5) mount point */
6798 "%*s" /* (6) mount options */
6799 "%*[^-]" /* (7) optional fields */
6800 "- " /* (8) separator */
6801 "%*s " /* (9) file system type */
6802 "%*s" /* (10) mount source */
6803 "%*s" /* (11) mount options 2 */
6804 "%*[^\n]", /* some rubbish at the end */
6813 r = cunescape(path, UNESCAPE_RELAX, &p);
6817 if (!path_startswith(p, prefix))
6820 if (umount2(p, flags) < 0) {
6836 static int get_mount_flags(const char *path, unsigned long *flags) {
6839 if (statvfs(path, &buf) < 0)
6841 *flags = buf.f_flag;
6845 int bind_remount_recursive(const char *prefix, bool ro) {
6846 _cleanup_set_free_free_ Set *done = NULL;
6847 _cleanup_free_ char *cleaned = NULL;
6850 /* Recursively remount a directory (and all its submounts)
6851 * read-only or read-write. If the directory is already
6852 * mounted, we reuse the mount and simply mark it
6853 * MS_BIND|MS_RDONLY (or remove the MS_RDONLY for read-write
6854 * operation). If it isn't we first make it one. Afterwards we
6855 * apply MS_BIND|MS_RDONLY (or remove MS_RDONLY) to all
6856 * submounts we can access, too. When mounts are stacked on
6857 * the same mount point we only care for each individual
6858 * "top-level" mount on each point, as we cannot
6859 * influence/access the underlying mounts anyway. We do not
6860 * have any effect on future submounts that might get
6861 * propagated, they might be writable. This includes future
6862 * submounts that have been triggered via autofs. */
6864 cleaned = strdup(prefix);
6868 path_kill_slashes(cleaned);
6870 done = set_new(&string_hash_ops);
6875 _cleanup_fclose_ FILE *proc_self_mountinfo = NULL;
6876 _cleanup_set_free_free_ Set *todo = NULL;
6877 bool top_autofs = false;
6879 unsigned long orig_flags;
6881 todo = set_new(&string_hash_ops);
6885 proc_self_mountinfo = fopen("/proc/self/mountinfo", "re");
6886 if (!proc_self_mountinfo)
6890 _cleanup_free_ char *path = NULL, *p = NULL, *type = NULL;
6893 k = fscanf(proc_self_mountinfo,
6894 "%*s " /* (1) mount id */
6895 "%*s " /* (2) parent id */
6896 "%*s " /* (3) major:minor */
6897 "%*s " /* (4) root */
6898 "%ms " /* (5) mount point */
6899 "%*s" /* (6) mount options (superblock) */
6900 "%*[^-]" /* (7) optional fields */
6901 "- " /* (8) separator */
6902 "%ms " /* (9) file system type */
6903 "%*s" /* (10) mount source */
6904 "%*s" /* (11) mount options (bind mount) */
6905 "%*[^\n]", /* some rubbish at the end */
6915 r = cunescape(path, UNESCAPE_RELAX, &p);
6919 /* Let's ignore autofs mounts. If they aren't
6920 * triggered yet, we want to avoid triggering
6921 * them, as we don't make any guarantees for
6922 * future submounts anyway. If they are
6923 * already triggered, then we will find
6924 * another entry for this. */
6925 if (streq(type, "autofs")) {
6926 top_autofs = top_autofs || path_equal(cleaned, p);
6930 if (path_startswith(p, cleaned) &&
6931 !set_contains(done, p)) {
6933 r = set_consume(todo, p);
6943 /* If we have no submounts to process anymore and if
6944 * the root is either already done, or an autofs, we
6946 if (set_isempty(todo) &&
6947 (top_autofs || set_contains(done, cleaned)))
6950 if (!set_contains(done, cleaned) &&
6951 !set_contains(todo, cleaned)) {
6952 /* The prefix directory itself is not yet a
6953 * mount, make it one. */
6954 if (mount(cleaned, cleaned, NULL, MS_BIND|MS_REC, NULL) < 0)
6958 (void) get_mount_flags(cleaned, &orig_flags);
6959 orig_flags &= ~MS_RDONLY;
6961 if (mount(NULL, prefix, NULL, orig_flags|MS_BIND|MS_REMOUNT|(ro ? MS_RDONLY : 0), NULL) < 0)
6964 x = strdup(cleaned);
6968 r = set_consume(done, x);
6973 while ((x = set_steal_first(todo))) {
6975 r = set_consume(done, x);
6981 /* Try to reuse the original flag set, but
6982 * don't care for errors, in case of
6983 * obstructed mounts */
6985 (void) get_mount_flags(x, &orig_flags);
6986 orig_flags &= ~MS_RDONLY;
6988 if (mount(NULL, x, NULL, orig_flags|MS_BIND|MS_REMOUNT|(ro ? MS_RDONLY : 0), NULL) < 0) {
6990 /* Deal with mount points that are
6991 * obstructed by a later mount */
6993 if (errno != ENOENT)
7001 int fflush_and_check(FILE *f) {
7008 return errno ? -errno : -EIO;
7013 int tempfn_xxxxxx(const char *p, char **ret) {
7025 * /foo/bar/.#waldoXXXXXX
7029 if (!filename_is_valid(fn))
7032 t = new(char, strlen(p) + 2 + 6 + 1);
7036 strcpy(stpcpy(stpcpy(mempcpy(t, p, fn - p), ".#"), fn), "XXXXXX");
7038 *ret = path_kill_slashes(t);
7042 int tempfn_random(const char *p, char **ret) {
7056 * /foo/bar/.#waldobaa2a261115984a9
7060 if (!filename_is_valid(fn))
7063 t = new(char, strlen(p) + 2 + 16 + 1);
7067 x = stpcpy(stpcpy(mempcpy(t, p, fn - p), ".#"), fn);
7070 for (i = 0; i < 16; i++) {
7071 *(x++) = hexchar(u & 0xF);
7077 *ret = path_kill_slashes(t);
7081 int tempfn_random_child(const char *p, char **ret) {
7092 * /foo/bar/waldo/.#3c2b6219aa75d7d0
7095 t = new(char, strlen(p) + 3 + 16 + 1);
7099 x = stpcpy(stpcpy(t, p), "/.#");
7102 for (i = 0; i < 16; i++) {
7103 *(x++) = hexchar(u & 0xF);
7109 *ret = path_kill_slashes(t);
7113 /* Checks whether the hostname is "localhost" or one of its variants */
7114 bool is_localhost(const char *hostname) {
7117 /* This tries to identify local host and domain names
7118 * described in RFC6761 plus the redhatism of .localdomain */
7120 return streq(hostname, "localhost") ||
7121 streq(hostname, "localhost.") ||
7122 streq(hostname, "localdomain.") ||
7123 streq(hostname, "localdomain") ||
7124 endswith(hostname, ".localhost") ||
7125 endswith(hostname, ".localhost.") ||
7126 endswith(hostname, ".localdomain") ||
7127 endswith(hostname, ".localdomain.");
7130 int take_password_lock(const char *root) {
7132 struct flock flock = {
7134 .l_whence = SEEK_SET,
7142 /* This is roughly the same as lckpwdf(), but not as awful. We
7143 * don't want to use alarm() and signals, hence we implement
7144 * our own trivial version of this.
7146 * Note that shadow-utils also takes per-database locks in
7147 * addition to lckpwdf(). However, we don't, given that they
7148 * are redundant as they invoke lckpwdf() first and keep
7149 * it during everything they do. The per-database locks are
7150 * awfully racy, and thus we just won't do them. */
7153 path = strjoina(root, "/etc/.pwd.lock");
7155 path = "/etc/.pwd.lock";
7157 fd = open(path, O_WRONLY|O_CREAT|O_CLOEXEC|O_NOCTTY|O_NOFOLLOW, 0600);
7161 r = fcntl(fd, F_SETLKW, &flock);
7170 int is_symlink(const char *path) {
7173 if (lstat(path, &info) < 0)
7176 return !!S_ISLNK(info.st_mode);
7179 int is_dir(const char* path, bool follow) {
7184 r = stat(path, &st);
7186 r = lstat(path, &st);
7190 return !!S_ISDIR(st.st_mode);
7193 int unquote_first_word(const char **p, char **ret, UnquoteFlags flags) {
7194 _cleanup_free_ char *s = NULL;
7195 size_t allocated = 0, sz = 0;
7203 SINGLE_QUOTE_ESCAPE,
7205 DOUBLE_QUOTE_ESCAPE,
7213 /* Parses the first word of a string, and returns it in
7214 * *ret. Removes all quotes in the process. When parsing fails
7215 * (because of an uneven number of quotes or similar), leaves
7216 * the pointer *p at the first invalid character. */
7226 else if (strchr(WHITESPACE, c))
7236 state = SINGLE_QUOTE;
7238 state = VALUE_ESCAPE;
7240 state = DOUBLE_QUOTE;
7241 else if (strchr(WHITESPACE, c))
7244 if (!GREEDY_REALLOC(s, allocated, sz+2))
7254 if (flags & UNQUOTE_RELAX)
7259 if (!GREEDY_REALLOC(s, allocated, sz+7))
7262 if (flags & UNQUOTE_CUNESCAPE) {
7265 r = cunescape_one(*p, (size_t) -1, &c, &u);
7272 s[sz++] = c; /* normal explicit char */
7274 sz += utf8_encode_unichar(s + sz, u); /* unicode chars we'll encode as utf8 */
7283 if (flags & UNQUOTE_RELAX)
7286 } else if (c == '\'')
7289 state = SINGLE_QUOTE_ESCAPE;
7291 if (!GREEDY_REALLOC(s, allocated, sz+2))
7299 case SINGLE_QUOTE_ESCAPE:
7301 if (flags & UNQUOTE_RELAX)
7306 if (!GREEDY_REALLOC(s, allocated, sz+7))
7309 if (flags & UNQUOTE_CUNESCAPE) {
7312 r = cunescape_one(*p, (size_t) -1, &c, &u);
7321 sz += utf8_encode_unichar(s + sz, u);
7325 state = SINGLE_QUOTE;
7334 state = DOUBLE_QUOTE_ESCAPE;
7336 if (!GREEDY_REALLOC(s, allocated, sz+2))
7344 case DOUBLE_QUOTE_ESCAPE:
7346 if (flags & UNQUOTE_RELAX)
7351 if (!GREEDY_REALLOC(s, allocated, sz+7))
7354 if (flags & UNQUOTE_CUNESCAPE) {
7357 r = cunescape_one(*p, (size_t) -1, &c, &u);
7366 sz += utf8_encode_unichar(s + sz, u);
7370 state = DOUBLE_QUOTE;
7376 if (!strchr(WHITESPACE, c))
7398 int unquote_many_words(const char **p, UnquoteFlags flags, ...) {
7403 /* Parses a number of words from a string, stripping any
7404 * quotes if necessary. */
7408 /* Count how many words are expected */
7409 va_start(ap, flags);
7411 if (!va_arg(ap, char **))
7420 /* Read all words into a temporary array */
7421 l = newa0(char*, n);
7422 for (c = 0; c < n; c++) {
7424 r = unquote_first_word(p, &l[c], flags);
7428 for (j = 0; j < c; j++)
7438 /* If we managed to parse all words, return them in the passed
7440 va_start(ap, flags);
7441 for (i = 0; i < n; i++) {
7444 v = va_arg(ap, char **);
7454 int free_and_strdup(char **p, const char *s) {
7459 /* Replaces a string pointer with an strdup()ed new string,
7460 * possibly freeing the old one. */
/* Sets the system hostname to s with sethostname(), after first reading the
 * current hostname with gethostname().
 *
 * NOTE(review): going by the name, the sethostname() call is presumably
 * skipped when the current hostname already equals s - confirm. */
7475 int sethostname_idempotent(const char *s) {
/* Zero-initialized buffer with room for HOST_NAME_MAX bytes plus one */
7477 char buf[HOST_NAME_MAX + 1] = {};
7481 r = gethostname(buf, sizeof(buf));
/* The length passed to sethostname() excludes the trailing NUL */
7488 r = sethostname(s, strlen(s));
/* Queries the name of the slave side of the pty master fd using ptsname_r()
 * with a buffer c of l bytes.
 *
 * NOTE(review): presumably the buffer is heap-allocated, grown and the call
 * retried while the failure is ERANGE, and the final string is handed to the
 * caller through ret - confirm. */
7495 int ptsname_malloc(int fd, char **ret) {
7508 if (ptsname_r(fd, c, l) == 0) {
/* ERANGE is told apart from every other failure here.
 * NOTE(review): ptsname_r() is documented to report the error through its
 * return value; this check relies on errno being set as well - confirm for
 * the C libraries that need to be supported. */
7512 if (errno != ERANGE) {
/* Opens a pty master with posix_openpt(flags) from within the namespaces of
 * process pid and transfers the resulting file descriptor back to the
 * calling process.
 *
 * namespace_open() supplies the fds pidnsfd, mntnsfd and rootfd for pid. A
 * child process enters them with namespace_enter(), opens the master and
 * sends it as SCM_RIGHTS ancillary data over an AF_UNIX datagram socket
 * pair, exiting with EXIT_SUCCESS only if all of that worked. The parent
 * waits for the child and then receives the message.
 *
 * NOTE(review): the return value is not evident from this block; presumably
 * the received fd on success and a negative errno-style value otherwise -
 * confirm. */
7522 int openpt_in_namespace(pid_t pid, int flags) {
7523 _cleanup_close_ int pidnsfd = -1, mntnsfd = -1, rootfd = -1;
7524 _cleanup_close_pair_ int pair[2] = { -1, -1 };
7526 struct cmsghdr cmsghdr;
/* Control buffer sized for a single int payload, i.e. one fd */
7527 uint8_t buf[CMSG_SPACE(sizeof(int))];
7529 struct msghdr mh = {
7530 .msg_control = &control,
7531 .msg_controllen = sizeof(control),
7533 struct cmsghdr *cmsg;
7540 r = namespace_open(pid, &pidnsfd, &mntnsfd, NULL, &rootfd);
7544 if (socketpair(AF_UNIX, SOCK_DGRAM, 0, pair) < 0)
/* Sending side: pair[0] is not needed here, only pair[1] is written to */
7554 pair[0] = safe_close(pair[0]);
7556 r = namespace_enter(pidnsfd, mntnsfd, -1, rootfd);
7558 _exit(EXIT_FAILURE);
7560 master = posix_openpt(flags);
7562 _exit(EXIT_FAILURE);
/* Build one SCM_RIGHTS control message carrying the master fd */
7564 cmsg = CMSG_FIRSTHDR(&mh);
7565 cmsg->cmsg_level = SOL_SOCKET;
7566 cmsg->cmsg_type = SCM_RIGHTS;
7567 cmsg->cmsg_len = CMSG_LEN(sizeof(int));
7568 memcpy(CMSG_DATA(cmsg), &master, sizeof(int));
/* Shrink the control length to the single message that was filled in */
7570 mh.msg_controllen = cmsg->cmsg_len;
7572 if (sendmsg(pair[1], &mh, MSG_NOSIGNAL) < 0)
7573 _exit(EXIT_FAILURE);
7575 _exit(EXIT_SUCCESS);
/* Receiving side: pair[1] is not needed here, only pair[0] is read from */
7578 pair[1] = safe_close(pair[1]);
7580 r = wait_for_terminate(child, &si);
/* Anything but a regular exit with EXIT_SUCCESS is singled out here */
7583 if (si.si_code != CLD_EXITED || si.si_status != EXIT_SUCCESS)
/* MSG_CMSG_CLOEXEC requests close-on-exec for any fd received */
7586 if (recvmsg(pair[0], &mh, MSG_NOSIGNAL|MSG_CMSG_CLOEXEC) < 0)
7589 for (cmsg = CMSG_FIRSTHDR(&mh); cmsg; cmsg = CMSG_NXTHDR(&mh, cmsg))
7590 if (cmsg->cmsg_level == SOL_SOCKET && cmsg->cmsg_type == SCM_RIGHTS) {
7594 fds = (int*) CMSG_DATA(cmsg);
/* Payload size (total length minus header) expressed in ints */
7595 n_fds = (cmsg->cmsg_len - CMSG_LEN(0)) / sizeof(int);
/* NOTE(review): presumably reached only when the message does not carry
 * exactly one fd, so that unexpected fds are not leaked - confirm. */
7598 close_many(fds, n_fds);
/* Reads the extended attribute named attribute from the file filename,
 * resolved relative to dirfd, by opening the file and calling fgetxattr()
 * on the resulting descriptor.
 *
 * value, size: destination buffer and its size, passed on to fgetxattr()
 * flags:       AT_SYMLINK_NOFOLLOW adds O_NOFOLLOW to the open; no other
 *              bit is examined in the lines of this block
 *
 * NOTE(review): the return value is presumably the fgetxattr() result on
 * success and a negative errno-style value on failure - confirm. */
7608 ssize_t fgetxattrat_fake(int dirfd, const char *filename, const char *attribute, void *value, size_t size, int flags) {
7609 _cleanup_close_ int fd = -1;
7612 /* The kernel doesn't have a fgetxattrat() command, hence let's emulate one */
7614 fd = openat(dirfd, filename, O_RDONLY|O_CLOEXEC|O_NOCTTY|O_NOATIME|(flags & AT_SYMLINK_NOFOLLOW ? O_NOFOLLOW : 0));
7618 l = fgetxattr(fd, attribute, value, size);
/* Helper shared by the *_getcrtime() functions: takes the raw little-endian
 * 64 bit value read from the xattr and an output pointer usec.
 *
 * NOTE(review): presumably converts le to host byte order (u) and stores it
 * in *usec - confirm. */
7625 static int parse_crtime(le64_t le, usec_t *usec) {
/* Zero and the all-ones value are singled out.
 * NOTE(review): presumably rejected as invalid timestamps - confirm. */
7631 if (u == 0 || u == (uint64_t) -1)
/* Reads the creation time recorded for fd from the "user.crtime_usec"
 * extended attribute and passes the raw value to parse_crtime(), whose
 * result is returned.
 *
 * NOTE(review): error returns for a failed fgetxattr() or a size mismatch
 * are not evident from this block; presumably negative errno-style values -
 * confirm. */
7638 int fd_getcrtime(int fd, usec_t *usec) {
7645 /* Until Linux gets a real concept of birthtime/creation time,
7646 * let's fake one with xattrs */
7648 n = fgetxattr(fd, "user.crtime_usec", &le, sizeof(le));
/* The attribute must have exactly the size of le to be usable */
7651 if (n != sizeof(le))
7654 return parse_crtime(le, usec);
/* Same as reading "user.crtime_usec" from an fd, but for the file name
 * resolved relative to dirfd; the attribute is fetched via
 * fgetxattrat_fake(), to which flags is passed unchanged. The raw value is
 * then passed to parse_crtime(), whose result is returned.
 *
 * NOTE(review): error returns for a failed read or a size mismatch are not
 * evident from this block - confirm. */
7657 int fd_getcrtime_at(int dirfd, const char *name, usec_t *usec, int flags) {
7661 n = fgetxattrat_fake(dirfd, name, "user.crtime_usec", &le, sizeof(le), flags);
/* The attribute must have exactly the size of le to be usable */
7664 if (n != sizeof(le))
7667 return parse_crtime(le, usec);
/* Reads "user.crtime_usec" for the path p with getxattr() and passes the raw
 * value to parse_crtime(), whose result is returned.
 *
 * NOTE(review): error returns for a failed getxattr() or a size mismatch are
 * not evident from this block - confirm. */
7670 int path_getcrtime(const char *p, usec_t *usec) {
7677 n = getxattr(p, "user.crtime_usec", &le, sizeof(le));
/* The attribute must have exactly the size of le to be usable */
7680 if (n != sizeof(le))
7683 return parse_crtime(le, usec);
/* Records a creation time for fd by storing usec, converted to a
 * little-endian 64 bit value, in the "user.crtime_usec" extended attribute.
 *
 * NOTE(review): the return convention is not evident from this block;
 * presumably 0 on success and a negative errno-style value when fsetxattr()
 * fails - confirm. */
7686 int fd_setcrtime(int fd, usec_t usec) {
/* NOTE(review): the condition guarding this substitution is not evident
 * here; presumably the current wall clock time is used when the caller did
 * not supply a usable timestamp - confirm. */
7692 usec = now(CLOCK_REALTIME);
7694 le = htole64((uint64_t) usec);
7695 if (fsetxattr(fd, "user.crtime_usec", &le, sizeof(le), 0) < 0)
/* Changes the file attribute flags of fd: the current flags are read with
 * FS_IOC_GETFLAGS, the bits selected by mask are replaced by the
 * corresponding bits of value, and the result is written back with
 * FS_IOC_SETFLAGS.
 *
 * value: new state of the flag bits
 * mask:  which flag bits to change; bits outside of mask are preserved
 *
 * NOTE(review): the return convention is not evident from this block;
 * presumably a negative errno-style value when an ioctl fails - confirm. */
7701 int chattr_fd(int fd, unsigned value, unsigned mask) {
7702 unsigned old_attr, new_attr;
7709 if (ioctl(fd, FS_IOC_GETFLAGS, &old_attr) < 0)
7712 new_attr = (old_attr & ~mask) | (value & mask);
/* NOTE(review): presumably returns early here so that no FS_IOC_SETFLAGS
 * is issued when nothing would change - confirm. */
7713 if (new_attr == old_attr)
7716 if (ioctl(fd, FS_IOC_SETFLAGS, &new_attr) < 0)
/* Path based variant of chattr_fd(): opens p read-only and applies
 * value/mask to the resulting descriptor, returning the chattr_fd() result.
 * The open uses O_NOFOLLOW, so it fails if the final component of p is a
 * symbolic link.
 *
 * NOTE(review): the return for a failed open() is not evident from this
 * block; presumably a negative errno-style value - confirm. */
7722 int chattr_path(const char *p, unsigned value, unsigned mask) {
7723 _cleanup_close_ int fd = -1;
7730 fd = open(p, O_RDONLY|O_CLOEXEC|O_NOCTTY|O_NOFOLLOW);
7734 return chattr_fd(fd, value, mask);
/* Reads the file attribute flags of fd into *ret using FS_IOC_GETFLAGS.
 *
 * NOTE(review): the return convention is not evident from this block;
 * presumably 0 on success and a negative errno-style value when the ioctl
 * fails - confirm. */
7737 int read_attr_fd(int fd, unsigned *ret) {
7740 if (ioctl(fd, FS_IOC_GETFLAGS, ret) < 0)
/* Path based variant of read_attr_fd(): opens p read-only and returns the
 * read_attr_fd() result for the resulting descriptor. The open uses
 * O_NOFOLLOW, so it fails if the final component of p is a symbolic link.
 *
 * NOTE(review): the return for a failed open() is not evident from this
 * block; presumably a negative errno-style value - confirm. */
7746 int read_attr_path(const char *p, unsigned *ret) {
7747 _cleanup_close_ int fd = -1;
7752 fd = open(p, O_RDONLY|O_CLOEXEC|O_NOCTTY|O_NOFOLLOW);
7756 return read_attr_fd(fd, ret);
/* Creates the lock file p if necessary (mode 0600) and takes a lock on it,
 * recording the result in *ret.
 *
 * operation: a flock() style operation, i.e. LOCK_EX or LOCK_SH, optionally
 *            combined with LOCK_NB for a non-blocking attempt
 *
 * The lock is first requested through the F_OFD_SETLK/F_OFD_SETLKW fcntl()
 * commands (the UNPOSIX locks of the text below); if that fails with EINVAL
 * the same operation is retried with flock(). A lock attempt that fails with
 * EAGAIN is reported as -EBUSY, any other failure as the negative errno. */
7759 int make_lock_file(const char *p, int operation, LockFile *ret) {
7760 _cleanup_close_ int fd = -1;
7761 _cleanup_free_ char *t = NULL;
7765 * We use UNPOSIX locks if they are available. They have nice
7766 * semantics, and are mostly compatible with NFS. However,
7767 * they are only available on new kernels. When we detect we
7768 * are running on an older kernel, then we fall back to good
7769 * old BSD locks. They also have nice semantics, but are
7770 * slightly problematic on NFS, where they are upgraded to
7771 * POSIX locks, even though locally they are orthogonal to
/* LOCK_EX (ignoring LOCK_NB) maps to a write lock, anything else to a
 * read lock */
7781 .l_type = (operation & ~LOCK_NB) == LOCK_EX ? F_WRLCK : F_RDLCK,
7782 .l_whence = SEEK_SET,
7786 fd = open(p, O_CREAT|O_RDWR|O_NOFOLLOW|O_CLOEXEC|O_NOCTTY, 0600);
/* LOCK_NB selects the non-blocking command, otherwise wait for the lock */
7790 r = fcntl(fd, (operation & LOCK_NB) ? F_OFD_SETLK : F_OFD_SETLKW, &fl);
7793 /* If the kernel is too old, use good old BSD locks */
7794 if (errno == EINVAL)
7795 r = flock(fd, operation);
7798 return errno == EAGAIN ? -EBUSY : -errno;
7801 /* If we acquired the lock, let's check if the file
7802 * still exists in the file system. If not, then the
7803 * previous exclusive owner removed it and then closed
7804 * it. In such a case our acquired lock is worthless,
7805 * hence try again. */
/* NOTE(review): st is presumably filled by an fstat() of fd; a link count
 * above zero then means the locked file is still linked - confirm. */
7810 if (st.st_nlink > 0)
/* Drop the descriptor of the already removed file before trying again */
7813 fd = safe_close(fd);
7818 ret->operation = operation;
/* Takes a lock on behalf of the path p by locking a companion file in the
 * same directory: everything in p up to its last component fn is kept, and
 * fn is replaced by ".#" followed by fn followed by ".lck". The lock itself
 * is taken by make_lock_file(), whose result is returned.
 *
 * NOTE(review): fn is presumably the file name part of p; the return used
 * when filename_is_valid() rejects it is not evident from this block -
 * confirm. */
7826 int make_lock_file_for(const char *p, int operation, LockFile *ret) {
7834 if (!filename_is_valid(fn))
/* Room for p itself, the 2 byte prefix, the 4 byte suffix and the NUL */
7837 t = newa(char, strlen(p) + 2 + 4 + 1);
7838 stpcpy(stpcpy(stpcpy(mempcpy(t, p, fn - p), ".#"), fn), ".lck");
7840 return make_lock_file(t, operation, ret);
/* Releases the lock described by f and closes f->fd.
 *
 * If the lock is held shared, a non-blocking attempt is made to turn it into
 * an exclusive one (F_OFD_SETLK first, flock() if that fails with EINVAL).
 * If the lock is exclusive at that point, the lock file f->path is unlinked
 * with unlink_noerrno(). */
7843 void release_lock_file(LockFile *f) {
7851 /* If we are the exclusive owner we can safely delete
7852 * the lock file itself. If we are not the exclusive
7853 * owner, we can try becoming it. */
7856 (f->operation & ~LOCK_NB) == LOCK_SH) {
7857 static const struct flock fl = {
7859 .l_whence = SEEK_SET,
7862 r = fcntl(f->fd, F_OFD_SETLK, &fl);
/* EINVAL from F_OFD_SETLK: try a non-blocking exclusive flock() instead */
7863 if (r < 0 && errno == EINVAL)
7864 r = flock(f->fd, LOCK_EX|LOCK_NB);
/* NOTE(review): presumably only reached when the upgrade above succeeded -
 * confirm. */
7867 f->operation = LOCK_EX|LOCK_NB;
7870 if ((f->operation & ~LOCK_NB) == LOCK_EX)
7871 unlink_noerrno(f->path);
7877 f->fd = safe_close(f->fd);
/* NOTE(review): going by the name and by how sparse_write() uses the result,
 * this presumably returns the number of consecutive NUL bytes at the start
 * of the sz byte buffer p - confirm. */
7881 static size_t nul_length(const uint8_t *p, size_t sz) {
/* Writes the sz byte buffer p to fd, but advances the file offset with
 * lseek() instead of writing for selected runs of NUL bytes.
 *
 * run_length: runs of NUL bytes longer than this are skipped; runs at the
 *             very start of the buffer or reaching its end are skipped
 *             regardless of their length
 *
 * The final return statement of this block yields the distance between the
 * scan position q and the start of p. NOTE(review): error returns are not
 * evident from this block; presumably negative errno-style values when
 * write() or lseek() fails - confirm. */
7896 ssize_t sparse_write(int fd, const void *p, size_t sz, size_t run_length) {
7897 const uint8_t *q, *w, *e;
7905 n = nul_length(q, e - q);
7907 /* If there are more than the specified run length of
7908 * NUL bytes, or if this is the beginning or the end
7909 * of the buffer, then seek instead of write */
7910 if ((n > run_length) ||
7911 (n > 0 && q == p) ||
7912 (n > 0 && q + n >= e)) {
/* Flush the pending bytes between w and q before skipping the run */
7914 l = write(fd, w, q - w);
7921 if (lseek(fd, n, SEEK_CUR) == (off_t) -1)
/* Write out whatever is still pending between w and q */
7933 l = write(fd, w, q - w);
7940 return q - (const uint8_t*) p;
7943 void sigkill_wait(pid_t *pid) {
7949 if (kill(*pid, SIGKILL) > 0)
7950 (void) wait_for_terminate(*pid, NULL);
/* Parses a syslog priority prefix at *p, i.e. one to three decimal digits
 * terminated by a closing angle bracket at index 2, 3 or 4 of the string.
 *
 * p:             address of the string pointer to parse from
 * priority:      in/out; see the two assignments at the end
 * with_facility: if false, only a single digit in the range 0..7 passes the
 *                validity check
 *
 * a, b and c hold the hundreds, tens and ones digit of the number.
 *
 * NOTE(review): the return convention and whether *p is advanced past the
 * prefix are not evident from this block - confirm. */
7953 int syslog_parse_priority(const char **p, int *priority, bool with_facility) {
7954 int a = 0, b = 0, c = 0;
7964 if (!strchr(*p, '>'))
/* One digit */
7967 if ((*p)[2] == '>') {
7968 c = undecchar((*p)[1]);
/* Two digits */
7970 } else if ((*p)[3] == '>') {
7971 b = undecchar((*p)[1]);
7972 c = undecchar((*p)[2]);
/* Three digits */
7974 } else if ((*p)[4] == '>') {
7975 a = undecchar((*p)[1]);
7976 b = undecchar((*p)[2]);
7977 c = undecchar((*p)[3]);
/* NOTE(review): the < 0 checks assume undecchar() yields a negative value
 * for a character that is not a decimal digit - confirm. */
7982 if (a < 0 || b < 0 || c < 0 ||
7983 (!with_facility && (a || b || c > 7)))
/* Two ways of storing the result: the full parsed number, or the facility
 * bits already present in *priority combined with c.
 * NOTE(review): presumably selected by with_facility - confirm. */
7987 *priority = a*100 + b*10 + c;
7989 *priority = (*priority & LOG_FACMASK) | c;
/* Linear search through the first len entries of table for an entry equal
 * to key, compared with streq_ptr().
 *
 * NOTE(review): the return value is not evident from this block; presumably
 * the index of the first match, or a negative value if there is none -
 * confirm. */
7995 ssize_t string_table_lookup(const char * const *table, size_t len, const char *key) {
8001 for (i = 0; i < len; ++i)
8002 if (streq_ptr(table[i], key))
/* Closes all file descriptors that were passed as SCM_RIGHTS ancillary data
 * in the message mh. Every control message header is visited; for each
 * SOL_SOCKET/SCM_RIGHTS one the payload is treated as an array of ints and
 * handed to close_many(). */
8008 void cmsg_close_all(struct msghdr *mh) {
8009 struct cmsghdr *cmsg;
8013 for (cmsg = CMSG_FIRSTHDR(mh); cmsg; cmsg = CMSG_NXTHDR(mh, cmsg))
8014 if (cmsg->cmsg_level == SOL_SOCKET && cmsg->cmsg_type == SCM_RIGHTS)
/* Element count: payload size (total length minus header) in ints */
8015 close_many((int*) CMSG_DATA(cmsg), (cmsg->cmsg_len - CMSG_LEN(0)) / sizeof(int));
/* Renames oldpath (relative to olddirfd) to newpath (relative to newdirfd)
 * without replacing an already existing newpath.
 *
 * renameat2() with RENAME_NOREPLACE is tried first. Only if it fails with
 * EINVAL is a fallback used: a directory is moved with plain renameat(),
 * returning 0 or the negative errno; anything else is hard-linked to newpath
 * with linkat() and the old name is then removed with unlinkat(). The new
 * link is removed again in the code following that unlinkat() call, with
 * errno being saved beforehand.
 *
 * NOTE(review): the remaining return statements are not evident from this
 * block; presumably 0 on success and the negative errno otherwise -
 * confirm. */
8018 int rename_noreplace(int olddirfd, const char *oldpath, int newdirfd, const char *newpath) {
8022 ret = renameat2(olddirfd, oldpath, newdirfd, newpath, RENAME_NOREPLACE);
8026 /* Even though renameat2() exists since Linux 3.15, btrfs added
8027 * support for it later. If it is not implemented, fallback to another
8029 if (errno != EINVAL)
8032 /* The link()/unlink() fallback does not work on directories. But
8033 * renameat() without RENAME_NOREPLACE gives the same semantics on
8034 * directories, except when newpath is an *empty* directory. This is
8036 ret = fstatat(olddirfd, oldpath, &buf, AT_SYMLINK_NOFOLLOW);
8037 if (ret >= 0 && S_ISDIR(buf.st_mode)) {
8038 ret = renameat(olddirfd, oldpath, newdirfd, newpath);
8039 return ret >= 0 ? 0 : -errno;
8042 /* If it is not a directory, use the link()/unlink() fallback. */
8043 ret = linkat(olddirfd, oldpath, newdirfd, newpath, 0);
8047 ret = unlinkat(olddirfd, oldpath, 0);
8049 /* backup errno before the following unlinkat() alters it */
8051 (void) unlinkat(newdirfd, newpath, 0);
/* Produces a form of s that is safe to use as a shell word. s is scanned
 * for the first character that makes quoting necessary (membership in
 * SHELL_NEED_QUOTES is one of the criteria); the quoted result is built in a
 * buffer allocated with new(), treating characters from SHELL_NEED_ESCAPE
 * specially.
 *
 * NOTE(review): the return values are not evident from this block;
 * presumably a newly allocated string owned by the caller, and NULL if the
 * allocation fails - confirm. */
8059 char *shell_maybe_quote(const char *s) {
8065 /* Encloses a string in double quotes if necessary to make it
8066 * OK as shell string. */
8068 for (p = s; *p; p++)
8071 strchr(SHELL_NEED_QUOTES, *p))
/* Worst case size: opening quote, every character doubled by an escape,
 * closing quote and the trailing NUL */
8077 r = new(char, 1+strlen(s)*2+1+1);
/* Copy the part of s before the scan position p in one go */
8083 t = mempcpy(t, s, p - s);
/* NOTE(review): presumably such characters get a backslash prepended -
 * confirm. */
8087 if (strchr(SHELL_NEED_ESCAPE, *p))
8099 int parse_mode(const char *s, mode_t *ret) {
8107 l = strtol(s, &x, 8);
8111 if (!x || x == s || *x)
8113 if (l < 0 || l > 07777)