1 /*-*- Mode: C; c-basic-offset: 8; indent-tabs-mode: nil -*-*/
4 This file is part of systemd.
6 Copyright 2010 Lennart Poettering
8 systemd is free software; you can redistribute it and/or modify it
9 under the terms of the GNU Lesser General Public License as published by
10 the Free Software Foundation; either version 2.1 of the License, or
11 (at your option) any later version.
13 systemd is distributed in the hope that it will be useful, but
14 WITHOUT ANY WARRANTY; without even the implied warranty of
15 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
16 Lesser General Public License for more details.
18 You should have received a copy of the GNU Lesser General Public License
19 along with systemd; If not, see <http://www.gnu.org/licenses/>.
31 #include <sys/resource.h>
32 #include <linux/sched.h>
33 #include <sys/types.h>
37 #include <sys/ioctl.h>
39 #include <linux/tiocl.h>
44 #include <sys/prctl.h>
45 #include <sys/utsname.h>
47 #include <netinet/ip.h>
55 #include <sys/mount.h>
56 #include <linux/magic.h>
60 #include <sys/personality.h>
61 #include <sys/xattr.h>
62 #include <sys/statvfs.h>
66 /* When we include libgen.h because we need dirname() we immediately
67 * undefine basename() since libgen.h defines it as a macro to the XDG
68 * version which is really broken. */
72 #ifdef HAVE_SYS_AUXV_H
84 #include "path-util.h"
85 #include "exit-status.h"
89 #include "device-nodes.h"
94 #include "sparse-endian.h"
96 /* Put this test here for a lack of better place */
97 assert_cc(EAGAIN == EWOULDBLOCK);
100 char **saved_argv = NULL;
102 static volatile unsigned cached_columns = 0;
103 static volatile unsigned cached_lines = 0;
105 size_t page_size(void) {
106 static thread_local size_t pgsz = 0;
109 if (_likely_(pgsz > 0))
112 r = sysconf(_SC_PAGESIZE);
119 bool streq_ptr(const char *a, const char *b) {
121 /* Like streq(), but tries to make sense of NULL pointers */
/* Tests whether s ends in postfix by comparing the last pl bytes of s
 * against postfix with memcmp(). On a match the result points into s at
 * s + sl - pl, i.e. where the postfix starts. One path returns s + sl
 * (the end of s) — presumably the empty-postfix case, TODO confirm. */
132 char* endswith(const char *s, const char *postfix) {
139 pl = strlen(postfix);
142 return (char*) s + sl;
147 if (memcmp(s + sl - pl, postfix, pl) != 0)
150 return (char*) s + sl - pl;
/* Same as endswith(), but the tail of s is compared against postfix with
 * strcasecmp(), so the match ignores case. On a match the result points
 * into s at s + sl - pl. */
153 char* endswith_no_case(const char *s, const char *postfix) {
160 pl = strlen(postfix);
163 return (char*) s + sl;
168 if (strcasecmp(s + sl - pl, postfix) != 0)
171 return (char*) s + sl - pl;
174 char* first_word(const char *s, const char *word) {
181 /* Checks if the string starts with the specified word, either
182 * followed by NUL or by whitespace. Returns a pointer to the
183 * NUL or the first character after the whitespace. */
194 if (memcmp(s, word, wl) != 0)
201 if (!strchr(WHITESPACE, *p))
204 p += strspn(p, WHITESPACE);
/* Writes the C-style escaped representation of c to buf and returns the
 * number of bytes written (buf - buf_old). Characters below ' ' or at/above
 * 127 are written as three octal digits, most significant first. */
208 static size_t cescape_char(char c, char *buf) {
209 char * buf_old = buf;
255 /* For special chars we prefer octal over
256 * hexadecimal encoding, simply because glib's
257 * g_strescape() does the same */
258 if ((c < ' ') || (c >= 127)) {
260 *(buf++) = octchar((unsigned char) c >> 6);
261 *(buf++) = octchar((unsigned char) c >> 3);
262 *(buf++) = octchar((unsigned char) c);
268 return buf - buf_old;
271 int close_nointr(int fd) {
278 * Just ignore EINTR; a retry loop is the wrong thing to do on
281 * http://lkml.indiana.edu/hypermail/linux/kernel/0509.1/0877.html
282 * https://bugzilla.gnome.org/show_bug.cgi?id=682819
283 * http://utcc.utoronto.ca/~cks/space/blog/unix/CloseEINTR
284 * https://sites.google.com/site/michaelsafyan/software-engineering/checkforeintrwheninvokingclosethinkagain
292 int safe_close(int fd) {
295 * Like close_nointr() but cannot fail. Guarantees errno is
296 * unchanged. Is a NOP with negative fds passed, and returns
297 * -1, so that it can be used in this syntax:
299 * fd = safe_close(fd);
305 /* The kernel might return pretty much any error code
306 * via close(), but the fd will be closed anyway. The
307 * only condition we want to check for here is whether
308 * the fd was invalid at all... */
310 assert_se(close_nointr(fd) != -EBADF);
316 void close_many(const int fds[], unsigned n_fd) {
319 assert(fds || n_fd <= 0);
321 for (i = 0; i < n_fd; i++)
325 int unlink_noerrno(const char *path) {
/* Classifies v as a boolean. "1", "yes", "y", "true", "t" and "on" form one
 * group, "0", "no", "n", "false", "f" and "off" the other. The words are
 * matched with strcaseeq(), the digits with streq().
 * NOTE(review): the values returned for each group and for unrecognized
 * input are not shown here — confirm before relying on them. */
336 int parse_boolean(const char *v) {
339 if (streq(v, "1") || strcaseeq(v, "yes") || strcaseeq(v, "y") || strcaseeq(v, "true") || strcaseeq(v, "t") || strcaseeq(v, "on"))
341 else if (streq(v, "0") || strcaseeq(v, "no") || strcaseeq(v, "n") || strcaseeq(v, "false") || strcaseeq(v, "f") || strcaseeq(v, "off"))
347 int parse_pid(const char *s, pid_t* ret_pid) {
348 unsigned long ul = 0;
355 r = safe_atolu(s, &ul);
361 if ((unsigned long) pid != ul)
/* Parses s with safe_atolu() and validates the result as a uid_t: the value
 * must survive the cast to uid_t unchanged, and the two "-1" placeholder
 * values 0xFFFFFFFF and 0xFFFF are singled out by dedicated checks. */
371 int parse_uid(const char *s, uid_t* ret_uid) {
372 unsigned long ul = 0;
379 r = safe_atolu(s, &ul);
385 if ((unsigned long) uid != ul)
388 /* Some libc APIs use UID_INVALID as special placeholder */
389 if (uid == (uid_t) 0xFFFFFFFF)
392 /* A long time ago UIDs were 16bit, hence explicitly avoid the 16bit -1 too */
393 if (uid == (uid_t) 0xFFFF)
/* Converts s to an unsigned via strtoul() with base 0 and stores it in
 * *ret_u. Fails with -errno (or -EINVAL if errno is not positive) when
 * nothing was consumed, trailing characters remain or errno is set.
 * NOTE(review): strtoul() itself accepts a leading '-' and negates the
 * value; only the round-trip check below can catch that, and only where
 * unsigned long is wider than unsigned — confirm this is acceptable. */
400 int safe_atou(const char *s, unsigned *ret_u) {
408 l = strtoul(s, &x, 0);
410 if (!x || x == s || *x || errno)
411 return errno > 0 ? -errno : -EINVAL;
/* The value must survive truncation to unsigned unchanged */
413 if ((unsigned long) (unsigned) l != l)
416 *ret_u = (unsigned) l;
/* Converts s to an int via strtol() with base 0. Fails with -errno (or
 * -EINVAL if errno is not positive) when nothing was consumed, trailing
 * characters remain or errno is set. A value outside the range of int is
 * detected by casting to int and back. */
420 int safe_atoi(const char *s, int *ret_i) {
428 l = strtol(s, &x, 0);
430 if (!x || x == s || *x || errno)
431 return errno > 0 ? -errno : -EINVAL;
433 if ((long) (int) l != l)
/* Converts s to a uint8_t via strtoul() with base 0. Fails with -errno (or
 * -EINVAL if errno is not positive) on unparsable input or trailing
 * characters. A value that does not fit into uint8_t is detected by the
 * round-trip cast. */
440 int safe_atou8(const char *s, uint8_t *ret) {
448 l = strtoul(s, &x, 0);
450 if (!x || x == s || *x || errno)
451 return errno > 0 ? -errno : -EINVAL;
453 if ((unsigned long) (uint8_t) l != l)
/* Converts s to a uint16_t via strtoul() with base 0. Fails with -errno (or
 * -EINVAL if errno is not positive) on unparsable input or trailing
 * characters. A value that does not fit into uint16_t is detected by the
 * round-trip cast. */
460 int safe_atou16(const char *s, uint16_t *ret) {
468 l = strtoul(s, &x, 0);
470 if (!x || x == s || *x || errno)
471 return errno > 0 ? -errno : -EINVAL;
473 if ((unsigned long) (uint16_t) l != l)
/* Converts s to an int16_t via strtol() with base 0. Fails with -errno (or
 * -EINVAL if errno is not positive) on unparsable input or trailing
 * characters. A value that does not fit into int16_t is detected by the
 * round-trip cast. */
480 int safe_atoi16(const char *s, int16_t *ret) {
488 l = strtol(s, &x, 0);
490 if (!x || x == s || *x || errno)
491 return errno > 0 ? -errno : -EINVAL;
493 if ((long) (int16_t) l != l)
/* Converts s to an unsigned long long via strtoull() with base 0. Fails with
 * -errno (or -EINVAL when errno is 0) when nothing was consumed, trailing
 * characters remain or errno is set. */
500 int safe_atollu(const char *s, long long unsigned *ret_llu) {
502 unsigned long long l;
508 l = strtoull(s, &x, 0);
510 if (!x || x == s || *x || errno)
511 return errno ? -errno : -EINVAL;
/* Converts s to a long long via strtoll() with base 0. Fails with -errno (or
 * -EINVAL when errno is 0) when nothing was consumed, trailing characters
 * remain or errno is set. */
517 int safe_atolli(const char *s, long long int *ret_lli) {
525 l = strtoll(s, &x, 0);
527 if (!x || x == s || *x || errno)
528 return errno ? -errno : -EINVAL;
/* Converts s to a double. Parsing is done by strtod_l() with a freshly
 * created "C" LC_NUMERIC locale object rather than the process locale.
 * Fails with -errno (or -EINVAL when errno is 0) when nothing was consumed,
 * trailing characters remain or errno is set. */
534 int safe_atod(const char *s, double *ret_d) {
542 loc = newlocale(LC_NUMERIC_MASK, "C", (locale_t) 0);
543 if (loc == (locale_t) 0)
547 d = strtod_l(s, &x, loc);
549 if (!x || x == s || *x || errno) {
551 return errno ? -errno : -EINVAL;
559 static size_t strcspn_escaped(const char *s, const char *reject) {
560 bool escaped = false;
563 for (n=0; s[n]; n++) {
566 else if (s[n] == '\\')
568 else if (strchr(reject, s[n]))
572 /* if s ends in \, return index of previous char */
576 /* Split a string into words. */
577 const char* split(const char **state, size_t *l, const char *separator, bool quoted) {
583 assert(**state == '\0');
587 current += strspn(current, separator);
593 if (quoted && strchr("\'\"", *current)) {
594 char quotechars[2] = {*current, '\0'};
596 *l = strcspn_escaped(current + 1, quotechars);
597 if (current[*l + 1] == '\0' ||
598 (current[*l + 2] && !strchr(separator, current[*l + 2]))) {
599 /* right quote missing or garbage at the end */
603 assert(current[*l + 1] == quotechars[0]);
604 *state = current++ + *l + 2;
606 *l = strcspn_escaped(current, separator);
607 if (current[*l] && !strchr(separator, current[*l])) {
608 /* unfinished escape */
612 *state = current + *l;
614 *l = strcspn(current, separator);
615 *state = current + *l;
621 int get_parent_of_pid(pid_t pid, pid_t *_ppid) {
623 _cleanup_free_ char *line = NULL;
635 p = procfs_file_alloca(pid, "stat");
636 r = read_one_line_file(p, &line);
640 /* Let's skip the pid and comm fields. The latter is enclosed
641 * in () but does not escape any () in its value, so let's
642 * skip over it manually */
644 p = strrchr(line, ')');
656 if ((long unsigned) (pid_t) ppid != ppid)
659 *_ppid = (pid_t) ppid;
664 int fchmod_umask(int fd, mode_t m) {
669 r = fchmod(fd, m & (~u)) < 0 ? -errno : 0;
675 char *truncate_nl(char *s) {
678 s[strcspn(s, NEWLINE)] = 0;
682 int get_process_state(pid_t pid) {
686 _cleanup_free_ char *line = NULL;
690 p = procfs_file_alloca(pid, "stat");
691 r = read_one_line_file(p, &line);
695 p = strrchr(line, ')');
701 if (sscanf(p, " %c", &state) != 1)
704 return (unsigned char) state;
707 int get_process_comm(pid_t pid, char **name) {
714 p = procfs_file_alloca(pid, "comm");
716 r = read_one_line_file(p, name);
723 int get_process_cmdline(pid_t pid, size_t max_length, bool comm_fallback, char **line) {
724 _cleanup_fclose_ FILE *f = NULL;
732 p = procfs_file_alloca(pid, "cmdline");
738 if (max_length == 0) {
739 size_t len = 0, allocated = 0;
741 while ((c = getc(f)) != EOF) {
743 if (!GREEDY_REALLOC(r, allocated, len+2)) {
748 r[len++] = isprint(c) ? c : ' ';
758 r = new(char, max_length);
764 while ((c = getc(f)) != EOF) {
786 size_t n = MIN(left-1, 3U);
793 /* Kernel threads have no argv[] */
795 _cleanup_free_ char *t = NULL;
803 h = get_process_comm(pid, &t);
807 r = strjoin("[", t, "]", NULL);
816 int is_kernel_thread(pid_t pid) {
828 p = procfs_file_alloca(pid, "cmdline");
833 count = fread(&c, 1, 1, f);
837 /* Kernel threads have an empty cmdline */
840 return eof ? 1 : -errno;
845 int get_process_capeff(pid_t pid, char **capeff) {
851 p = procfs_file_alloca(pid, "status");
853 return get_status_field(p, "\nCapEff:", capeff);
856 static int get_process_link_contents(const char *proc_file, char **name) {
862 r = readlink_malloc(proc_file, name);
864 return r == -ENOENT ? -ESRCH : r;
869 int get_process_exe(pid_t pid, char **name) {
876 p = procfs_file_alloca(pid, "exe");
877 r = get_process_link_contents(p, name);
881 d = endswith(*name, " (deleted)");
888 static int get_process_id(pid_t pid, const char *field, uid_t *uid) {
889 _cleanup_fclose_ FILE *f = NULL;
899 p = procfs_file_alloca(pid, "status");
904 FOREACH_LINE(line, f, return -errno) {
909 if (startswith(l, field)) {
911 l += strspn(l, WHITESPACE);
913 l[strcspn(l, WHITESPACE)] = 0;
915 return parse_uid(l, uid);
/* Looks up the "Uid:" field of the given process via get_process_id() and
 * stores the parsed value in *uid. */
922 int get_process_uid(pid_t pid, uid_t *uid) {
923 return get_process_id(pid, "Uid:", uid);
/* Looks up the "Gid:" field of the given process via get_process_id().
 * That helper takes a uid_t pointer, so the compile-time assertion makes
 * sure gid_t has the same size before the gid_t pointer is handed to it. */
926 int get_process_gid(pid_t pid, gid_t *gid) {
927 assert_cc(sizeof(uid_t) == sizeof(gid_t));
928 return get_process_id(pid, "Gid:", gid);
931 int get_process_cwd(pid_t pid, char **cwd) {
936 p = procfs_file_alloca(pid, "cwd");
938 return get_process_link_contents(p, cwd);
941 int get_process_root(pid_t pid, char **root) {
946 p = procfs_file_alloca(pid, "root");
948 return get_process_link_contents(p, root);
951 int get_process_environ(pid_t pid, char **env) {
952 _cleanup_fclose_ FILE *f = NULL;
953 _cleanup_free_ char *outcome = NULL;
956 size_t allocated = 0, sz = 0;
961 p = procfs_file_alloca(pid, "environ");
967 while ((c = fgetc(f)) != EOF) {
968 if (!GREEDY_REALLOC(outcome, allocated, sz + 5))
972 outcome[sz++] = '\n';
974 sz += cescape_char(c, outcome + sz);
984 char *strnappend(const char *s, const char *suffix, size_t b) {
992 return strndup(suffix, b);
1001 if (b > ((size_t) -1) - a)
1004 r = new(char, a+b+1);
1009 memcpy(r+a, suffix, b);
1015 char *strappend(const char *s, const char *suffix) {
1016 return strnappend(s, suffix, suffix ? strlen(suffix) : 0);
1019 int readlinkat_malloc(int fd, const char *p, char **ret) {
1034 n = readlinkat(fd, p, c, l-1);
1041 if ((size_t) n < l-1) {
1052 int readlink_malloc(const char *p, char **ret) {
1053 return readlinkat_malloc(AT_FDCWD, p, ret);
1056 int readlink_value(const char *p, char **ret) {
1057 _cleanup_free_ char *link = NULL;
1061 r = readlink_malloc(p, &link);
1065 value = basename(link);
1069 value = strdup(value);
1078 int readlink_and_make_absolute(const char *p, char **r) {
1079 _cleanup_free_ char *target = NULL;
1086 j = readlink_malloc(p, &target);
1090 k = file_in_same_dir(p, target);
1098 int readlink_and_canonicalize(const char *p, char **r) {
1105 j = readlink_and_make_absolute(p, &t);
1109 s = canonicalize_file_name(t);
1116 path_kill_slashes(*r);
/* Installs SIG_DFL (with SA_RESTART) for every signal number from 1 up to
 * _NSIG - 1, with special handling for SIGKILL and SIGSTOP. An EINVAL
 * failure of sigaction() is tolerated; other failures are only considered
 * while r is still 0. */
1121 int reset_all_signal_handlers(void) {
1124 for (sig = 1; sig < _NSIG; sig++) {
1125 struct sigaction sa = {
1126 .sa_handler = SIG_DFL,
1127 .sa_flags = SA_RESTART,
1130 /* These two cannot be caught... */
1131 if (sig == SIGKILL || sig == SIGSTOP)
1134 /* On Linux the first two RT signals are reserved by
1135 * glibc, and sigaction() will return EINVAL for them. */
1136 if ((sigaction(sig, &sa, NULL) < 0))
1137 if (errno != EINVAL && r == 0)
1144 int reset_signal_mask(void) {
1147 if (sigemptyset(&ss) < 0)
1150 if (sigprocmask(SIG_SETMASK, &ss, NULL) < 0)
1156 char *strstrip(char *s) {
1159 /* Drops leading and trailing whitespace. Modifies the string in
1160 * place. Returns pointer to first non-space character */
1162 s += strspn(s, WHITESPACE);
1164 for (e = strchr(s, 0); e > s; e --)
1165 if (!strchr(WHITESPACE, e[-1]))
1173 char *delete_chars(char *s, const char *bad) {
1176 /* Drops all characters listed in bad, regardless where in the string */
1178 for (f = s, t = s; *f; f++) {
1179 if (strchr(bad, *f))
/* Returns a newly allocated path made of the directory part of path (up to
 * and including its last '/') followed by filename. An absolute filename is
 * returned as a plain strdup() copy; a second strdup() path exists after
 * the strrchr() lookup — presumably for a path without any '/', TODO
 * confirm. */
1190 char *file_in_same_dir(const char *path, const char *filename) {
1197 /* This removes the last component of path and appends
1198 * filename, unless the latter is absolute anyway or the
1201 if (path_is_absolute(filename))
1202 return strdup(filename);
1204 e = strrchr(path, '/');
1206 return strdup(filename);
1208 k = strlen(filename);
1209 ret = new(char, (e + 1 - path) + k + 1);
1213 memcpy(mempcpy(ret, path, e + 1 - path), filename, k + 1);
1217 int rmdir_parents(const char *path, const char *stop) {
1226 /* Skip trailing slashes */
1227 while (l > 0 && path[l-1] == '/')
1233 /* Skip last component */
1234 while (l > 0 && path[l-1] != '/')
1237 /* Skip trailing slashes */
1238 while (l > 0 && path[l-1] == '/')
1244 if (!(t = strndup(path, l)))
1247 if (path_startswith(stop, t)) {
1256 if (errno != ENOENT)
/* Returns the lower-case hexadecimal digit for the low four bits of x; all
 * higher bits are masked off. The table holds exactly the 16 digits without
 * a terminating NUL and is only ever indexed, never used as a string. */
1263 char hexchar(int x) {
1264 static const char table[16] = "0123456789abcdef";
1266 return table[x & 15];
/* Maps a hexadecimal digit character to its numeric value. The letters a-f
 * are accepted in both lower and upper case and map to 10..15. */
1269 int unhexchar(char c) {
1271 if (c >= '0' && c <= '9')
1274 if (c >= 'a' && c <= 'f')
1275 return c - 'a' + 10;
1277 if (c >= 'A' && c <= 'F')
1278 return c - 'A' + 10;
/* Formats the l bytes at p as hexadecimal text using hexchar(), two digits
 * per byte with the high nibble first, into a malloc()ed buffer of
 * l * 2 + 1 bytes. */
1283 char *hexmem(const void *p, size_t l) {
1287 z = r = malloc(l * 2 + 1);
1291 for (x = p; x < (const uint8_t*) p + l; x++) {
1292 *(z++) = hexchar(*x >> 4);
1293 *(z++) = hexchar(*x & 15);
/* Decodes l hexadecimal characters at p into bytes, consuming two
 * characters per output byte (first character is the high nibble). The
 * output buffer is malloc()ed with (l + 1) / 2 + 1 bytes.
 * NOTE(review): the loop always reads x[1]; for an odd l the final
 * iteration therefore looks at p[l], one past the counted input — confirm
 * callers always pass a NUL-terminated string or an even length. */
1300 void *unhexmem(const char *p, size_t l) {
1306 z = r = malloc((l + 1) / 2 + 1);
1310 for (x = p; x < p + l; x += 2) {
1313 a = unhexchar(x[0]);
1315 b = unhexchar(x[1]);
1319 *(z++) = (uint8_t) a << 4 | (uint8_t) b;
/* Returns the octal digit character for the low three bits of x; all higher
 * bits are masked off. */
1326 char octchar(int x) {
1327 return '0' + (x & 7);
1330 int unoctchar(char c) {
1332 if (c >= '0' && c <= '7')
/* Returns the decimal digit character for x % 10.
 * NOTE(review): for negative x the remainder is negative in C, which would
 * yield a character below '0' — presumably callers only pass non-negative
 * values; verify. */
1338 char decchar(int x) {
1339 return '0' + (x % 10);
1342 int undecchar(char c) {
1344 if (c >= '0' && c <= '9')
1350 char *cescape(const char *s) {
1356 /* Does C style string escaping. May be reversed with
1359 r = new(char, strlen(s)*4 + 1);
1363 for (f = s, t = r; *f; f++)
1364 t += cescape_char(*f, t);
1371 static int cunescape_one(const char *p, size_t length, char *ret, uint32_t *ret_unicode) {
1378 /* Unescapes C style. Returns the unescaped character in ret,
1379 * unless we encountered a \u sequence in which case the full
1380 * unicode character is returned in ret_unicode, instead. */
1382 if (length != (size_t) -1 && length < 1)
1419 /* This is an extension of the XDG syntax files */
1424 /* hexadecimal encoding */
1427 if (length != (size_t) -1 && length < 3)
1430 a = unhexchar(p[1]);
1434 b = unhexchar(p[2]);
1438 /* Don't allow NUL bytes */
1439 if (a == 0 && b == 0)
1442 *ret = (char) ((a << 4U) | b);
1448 /* C++11 style 16bit unicode */
1454 if (length != (size_t) -1 && length < 5)
1457 for (i = 0; i < 4; i++) {
1458 a[i] = unhexchar(p[1 + i]);
1463 c = ((uint32_t) a[0] << 12U) | ((uint32_t) a[1] << 8U) | ((uint32_t) a[2] << 4U) | (uint32_t) a[3];
1465 /* Don't allow 0 chars */
1484 /* C++11 style 32bit unicode */
1490 if (length != (size_t) -1 && length < 9)
1493 for (i = 0; i < 8; i++) {
1494 a[i] = unhexchar(p[1 + i]);
1499 c = ((uint32_t) a[0] << 28U) | ((uint32_t) a[1] << 24U) | ((uint32_t) a[2] << 20U) | ((uint32_t) a[3] << 16U) |
1500 ((uint32_t) a[4] << 12U) | ((uint32_t) a[5] << 8U) | ((uint32_t) a[6] << 4U) | (uint32_t) a[7];
1502 /* Don't allow 0 chars */
1506 /* Don't allow invalid code points */
1507 if (!unichar_is_valid(c))
1532 /* octal encoding */
1536 if (length != (size_t) -1 && length < 4)
1539 a = unoctchar(p[0]);
1543 b = unoctchar(p[1]);
1547 c = unoctchar(p[2]);
1551 /* don't allow NUL bytes */
1552 if (a == 0 && b == 0 && c == 0)
1555 /* Don't allow bytes above 255 */
1556 m = ((uint32_t) a << 6U) | ((uint32_t) b << 3U) | (uint32_t) c;
/* Unescapes the first length bytes of s into a newly allocated buffer of
 * pl + length + 1 bytes that starts with a copy of prefix (pl is 0 when
 * prefix is NULL). Escape sequences are decoded by cunescape_one(); Unicode
 * results are written as UTF-8. With UNESCAPE_RELAX set in flags a trailing
 * backslash and invalid escape codes are taken literally. */
1572 int cunescape_length_with_prefix(const char *s, size_t length, const char *prefix, UnescapeFlags flags, char **ret) {
1580 /* Undoes C style string escaping, and optionally prefixes it. */
1582 pl = prefix ? strlen(prefix) : 0;
1584 r = new(char, pl+length+1);
1589 memcpy(r, prefix, pl);
1591 for (f = s, t = r + pl; f < s + length; f++) {
1597 remaining = s + length - f;
1598 assert(remaining > 0);
1601 /* A literal character, copy verbatim */
1606 if (remaining == 1) {
1607 if (flags & UNESCAPE_RELAX) {
1608 /* A trailing backslash, copy verbatim */
1617 k = cunescape_one(f + 1, remaining - 1, &c, &u);
1619 if (flags & UNESCAPE_RELAX) {
1620 /* Invalid escape code, let's take it literal then */
1630 /* Non-Unicode? Let's encode this directly */
1633 /* Unicode? Then let's encode this in UTF-8 */
1634 t += utf8_encode_unichar(t, u);
1645 int cunescape_length(const char *s, size_t length, UnescapeFlags flags, char **ret) {
1646 return cunescape_length_with_prefix(s, length, NULL, flags, ret);
1649 int cunescape(const char *s, UnescapeFlags flags, char **ret) {
1650 return cunescape_length(s, strlen(s), flags, ret);
1653 char *xescape(const char *s, const char *bad) {
1657 /* Escapes all chars in bad, in addition to \ and all special
1658 * chars, in \xFF style escaping. May be reversed with
1661 r = new(char, strlen(s) * 4 + 1);
1665 for (f = s, t = r; *f; f++) {
1667 if ((*f < ' ') || (*f >= 127) ||
1668 (*f == '\\') || strchr(bad, *f)) {
1671 *(t++) = hexchar(*f >> 4);
1672 *(t++) = hexchar(*f);
/* Converts the ASCII letters 'A'..'Z' in t to lower case in place. The
 * range is tested explicitly instead of via <ctype.h>, so the result does
 * not depend on the locale and all other bytes are left untouched. */
1682 char *ascii_strlower(char *t) {
1687 for (p = t; *p; p++)
1688 if (*p >= 'A' && *p <= 'Z')
1689 *p = *p - 'A' + 'a';
/* Evaluates to true for file names that are to be treated as hidden: names
 * starting with a dot, "lost+found", the quota files "aquota.user" and
 * "aquota.group", and names carrying one of the listed .rpm*, .dpkg-* or
 * .swp suffixes. A trailing "~" is deliberately not tested here. */
1694 _pure_ static bool hidden_file_allow_backup(const char *filename) {
1698 filename[0] == '.' ||
1699 streq(filename, "lost+found") ||
1700 streq(filename, "aquota.user") ||
1701 streq(filename, "aquota.group") ||
1702 endswith(filename, ".rpmnew") ||
1703 endswith(filename, ".rpmsave") ||
1704 endswith(filename, ".rpmorig") ||
1705 endswith(filename, ".dpkg-old") ||
1706 endswith(filename, ".dpkg-new") ||
1707 endswith(filename, ".dpkg-tmp") ||
1708 endswith(filename, ".dpkg-dist") ||
1709 endswith(filename, ".dpkg-bak") ||
1710 endswith(filename, ".dpkg-backup") ||
1711 endswith(filename, ".dpkg-remove") ||
1712 endswith(filename, ".swp");
/* Like hidden_file_allow_backup(), but names ending in "~" are checked
 * first; everything else is decided by hidden_file_allow_backup(). */
1715 bool hidden_file(const char *filename) {
1718 if (endswith(filename, "~"))
1721 return hidden_file_allow_backup(filename);
/* Turns O_NONBLOCK on fd on or off. The current file status flags are read
 * with F_GETFL, the new flag word is computed with O_NONBLOCK set or
 * cleared, and F_SETFL is only reached if the flag word actually differs
 * from the current one. */
1724 int fd_nonblock(int fd, bool nonblock) {
1729 flags = fcntl(fd, F_GETFL, 0);
1734 nflags = flags | O_NONBLOCK;
1736 nflags = flags & ~O_NONBLOCK;
1738 if (nflags == flags)
1741 if (fcntl(fd, F_SETFL, nflags) < 0)
/* Turns FD_CLOEXEC on fd on or off. The current descriptor flags are read
 * with F_GETFD, the new flag word is computed with FD_CLOEXEC set or
 * cleared, and F_SETFD is only reached if the flag word actually differs
 * from the current one. */
1747 int fd_cloexec(int fd, bool cloexec) {
1752 flags = fcntl(fd, F_GETFD, 0);
1757 nflags = flags | FD_CLOEXEC;
1759 nflags = flags & ~FD_CLOEXEC;
1761 if (nflags == flags)
1764 if (fcntl(fd, F_SETFD, nflags) < 0)
1770 _pure_ static bool fd_in_set(int fd, const int fdset[], unsigned n_fdset) {
1773 assert(n_fdset == 0 || fdset);
1775 for (i = 0; i < n_fdset; i++)
/* Closes open file descriptors, sparing those listed in except[] (n_except
 * entries). The primary path enumerates /proc/self/fd and parses each entry
 * name with safe_atoi(). The fallback path walks every fd number from 3 up
 * to the RLIMIT_NOFILE hard limit. In both paths an EBADF failure of
 * close_nointr() is tolerated and other failures are only considered while
 * r is still 0. */
1782 int close_all_fds(const int except[], unsigned n_except) {
1783 _cleanup_closedir_ DIR *d = NULL;
1787 assert(n_except == 0 || except);
1789 d = opendir("/proc/self/fd");
1794 /* When /proc isn't available (for example in chroots)
1795 * the fallback is brute forcing through the fd
1798 assert_se(getrlimit(RLIMIT_NOFILE, &rl) >= 0);
1799 for (fd = 3; fd < (int) rl.rlim_max; fd ++) {
1801 if (fd_in_set(fd, except, n_except))
1804 if (close_nointr(fd) < 0)
1805 if (errno != EBADF && r == 0)
1812 while ((de = readdir(d))) {
1815 if (hidden_file(de->d_name))
1818 if (safe_atoi(de->d_name, &fd) < 0)
1819 /* Let's better ignore this, just in case */
1828 if (fd_in_set(fd, except, n_except))
1831 if (close_nointr(fd) < 0) {
1832 /* Valgrind has its own FD and doesn't want to have it closed */
1833 if (errno != EBADF && r == 0)
1841 bool chars_intersect(const char *a, const char *b) {
1844 /* Returns true if any of the chars in a are in b. */
1845 for (p = a; *p; p++)
1852 bool fstype_is_network(const char *fstype) {
1853 static const char table[] =
1868 x = startswith(fstype, "fuse.");
1872 return nulstr_contains(table, fstype);
1876 _cleanup_close_ int fd;
1878 fd = open_terminal("/dev/tty0", O_RDWR|O_NOCTTY|O_CLOEXEC);
1884 TIOCL_GETKMSGREDIRECT,
1888 if (ioctl(fd, TIOCLINUX, tiocl) < 0)
1891 vt = tiocl[0] <= 0 ? 1 : tiocl[0];
1894 if (ioctl(fd, VT_ACTIVATE, vt) < 0)
1900 int read_one_char(FILE *f, char *ret, usec_t t, bool *need_nl) {
1901 struct termios old_termios, new_termios;
1902 char c, line[LINE_MAX];
1907 if (tcgetattr(fileno(f), &old_termios) >= 0) {
1908 new_termios = old_termios;
1910 new_termios.c_lflag &= ~ICANON;
1911 new_termios.c_cc[VMIN] = 1;
1912 new_termios.c_cc[VTIME] = 0;
1914 if (tcsetattr(fileno(f), TCSADRAIN, &new_termios) >= 0) {
1917 if (t != USEC_INFINITY) {
1918 if (fd_wait_for_event(fileno(f), POLLIN, t) <= 0) {
1919 tcsetattr(fileno(f), TCSADRAIN, &old_termios);
1924 k = fread(&c, 1, 1, f);
1926 tcsetattr(fileno(f), TCSADRAIN, &old_termios);
1932 *need_nl = c != '\n';
1939 if (t != USEC_INFINITY) {
1940 if (fd_wait_for_event(fileno(f), POLLIN, t) <= 0)
1945 if (!fgets(line, sizeof(line), f))
1946 return errno ? -errno : -EIO;
1950 if (strlen(line) != 1)
1960 int ask_char(char *ret, const char *replies, const char *text, ...) {
1970 bool need_nl = true;
1973 fputs(ANSI_HIGHLIGHT_ON, stdout);
1980 fputs(ANSI_HIGHLIGHT_OFF, stdout);
1984 r = read_one_char(stdin, &c, USEC_INFINITY, &need_nl);
1987 if (r == -EBADMSG) {
1988 puts("Bad input, please try again.");
1999 if (strchr(replies, c)) {
2004 puts("Read unexpected character, please try again.");
2008 int ask_string(char **ret, const char *text, ...) {
2013 char line[LINE_MAX];
2017 fputs(ANSI_HIGHLIGHT_ON, stdout);
2024 fputs(ANSI_HIGHLIGHT_OFF, stdout);
2029 if (!fgets(line, sizeof(line), stdin))
2030 return errno ? -errno : -EIO;
2032 if (!endswith(line, "\n"))
/* Resets the terminal referred to by fd to a known state: leaves exclusive
 * mode, selects text and unicode keyboard mode via ioctl(), rewrites the
 * software-relevant termios flags and control characters, applies them with
 * TCSANOW and finally flushes pending input and output. */
2051 int reset_terminal_fd(int fd, bool switch_to_text) {
2052 struct termios termios;
2055 /* Set terminal to some sane defaults */
2059 /* We leave locked terminal attributes untouched, so that
2060 * Plymouth may set whatever it wants to set, and we don't
2061 * interfere with that. */
2063 /* Disable exclusive mode, just in case */
2064 ioctl(fd, TIOCNXCL);
2066 /* Switch to text mode */
2068 ioctl(fd, KDSETMODE, KD_TEXT);
2070 /* Enable console unicode mode */
2071 ioctl(fd, KDSKBMODE, K_UNICODE);
2073 if (tcgetattr(fd, &termios) < 0) {
2078 /* We only reset the stuff that matters to the software. How
2079 * hardware is set up we don't touch assuming that somebody
2080 * else will do that for us */
2082 termios.c_iflag &= ~(IGNBRK | BRKINT | ISTRIP | INLCR | IGNCR | IUCLC);
2083 termios.c_iflag |= ICRNL | IMAXBEL | IUTF8;
2084 termios.c_oflag |= ONLCR;
2085 termios.c_cflag |= CREAD;
2086 termios.c_lflag = ISIG | ICANON | IEXTEN | ECHO | ECHOE | ECHOK | ECHOCTL | ECHOPRT | ECHOKE;
2088 termios.c_cc[VINTR] = 03; /* ^C */
2089 termios.c_cc[VQUIT] = 034; /* ^\ */
2090 termios.c_cc[VERASE] = 0177; /* DEL */
2091 termios.c_cc[VKILL] = 025; /* ^U */
2092 termios.c_cc[VEOF] = 04; /* ^D */
2093 termios.c_cc[VSTART] = 021; /* ^Q */
2094 termios.c_cc[VSTOP] = 023; /* ^S */
2095 termios.c_cc[VSUSP] = 032; /* ^Z */
2096 termios.c_cc[VLNEXT] = 026; /* ^V */
2097 termios.c_cc[VWERASE] = 027; /* ^W */
2098 termios.c_cc[VREPRINT] = 022; /* ^R */
2099 termios.c_cc[VEOL] = 0;
2100 termios.c_cc[VEOL2] = 0;
2102 termios.c_cc[VTIME] = 0;
2103 termios.c_cc[VMIN] = 1;
2105 if (tcsetattr(fd, TCSANOW, &termios) < 0)
2109 /* Just in case, flush all crap out */
2110 tcflush(fd, TCIOFLUSH);
2115 int reset_terminal(const char *name) {
2116 _cleanup_close_ int fd = -1;
2118 fd = open_terminal(name, O_RDWR|O_NOCTTY|O_CLOEXEC);
2122 return reset_terminal_fd(fd, true);
2125 int open_terminal(const char *name, int mode) {
2130 * If a TTY is in the process of being closed opening it might
2131 * cause EIO. This is horribly awful, but unlikely to be
2132 * changed in the kernel. Hence we work around this problem by
2133 * retrying a couple of times.
2135 * https://bugs.launchpad.net/ubuntu/+source/linux/+bug/554172/comments/245
2138 assert(!(mode & O_CREAT));
2141 fd = open(name, mode, 0);
2148 /* Max 1s in total */
2152 usleep(50 * USEC_PER_MSEC);
2170 int flush_fd(int fd) {
2171 struct pollfd pollfd = {
2181 r = poll(&pollfd, 1, 0);
2191 l = read(fd, buf, sizeof(buf));
2197 if (errno == EAGAIN)
/* Opens the terminal given by name and tries to make it the controlling
 * terminal via TIOCSCTTY. Unless fail or force is set, an inotify watch for
 * IN_CLOSE on the device is set up first and used to wait until the
 * terminal is closed by its current user, bounded by timeout unless that is
 * USEC_INFINITY. On success the terminal is reset with
 * reset_terminal_fd(). */
2206 int acquire_terminal(
2210 bool ignore_tiocstty_eperm,
2213 int fd = -1, notify = -1, r = 0, wd = -1;
2218 /* We use inotify to be notified when the tty is closed. We
2219 * create the watch before checking if we can actually acquire
2220 * it, so that we don't lose any event.
2222 * Note: strictly speaking this actually watches for the
2223 * device being closed, it does *not* really watch whether a
2224 * tty loses its controlling process. However, unless some
2225 * rogue process uses TIOCNOTTY on /dev/tty *after* closing
2226 * its tty otherwise this will not become a problem. As long
2227 * as the administrator makes sure not to configure any service
2228 * on the same tty as an untrusted user this should not be a
2229 * problem. (Which he probably should not do anyway.) */
2231 if (timeout != USEC_INFINITY)
2232 ts = now(CLOCK_MONOTONIC);
2234 if (!fail && !force) {
2235 notify = inotify_init1(IN_CLOEXEC | (timeout != USEC_INFINITY ? IN_NONBLOCK : 0));
2241 wd = inotify_add_watch(notify, name, IN_CLOSE);
2249 struct sigaction sa_old, sa_new = {
2250 .sa_handler = SIG_IGN,
2251 .sa_flags = SA_RESTART,
2255 r = flush_fd(notify);
2260 /* We pass here O_NOCTTY only so that we can check the return
2261 * value TIOCSCTTY and have a reliable way to figure out if we
2262 * successfully became the controlling process of the tty */
2263 fd = open_terminal(name, O_RDWR|O_NOCTTY|O_CLOEXEC);
2267 /* Temporarily ignore SIGHUP, so that we don't get SIGHUP'ed
2268 * if we already own the tty. */
2269 assert_se(sigaction(SIGHUP, &sa_new, &sa_old) == 0);
2271 /* First, try to get the tty */
2272 if (ioctl(fd, TIOCSCTTY, force) < 0)
2275 assert_se(sigaction(SIGHUP, &sa_old, NULL) == 0);
2277 /* Sometimes it makes sense to ignore TIOCSCTTY
2278 * returning EPERM, i.e. when very likely we already
2279 * have this controlling terminal. */
2280 if (r < 0 && r == -EPERM && ignore_tiocstty_eperm)
2283 if (r < 0 && (force || fail || r != -EPERM)) {
2292 assert(notify >= 0);
2295 union inotify_event_buffer buffer;
2296 struct inotify_event *e;
2299 if (timeout != USEC_INFINITY) {
2302 n = now(CLOCK_MONOTONIC);
2303 if (ts + timeout < n) {
/* NOTE(review): this waits for POLLIN on the tty fd, whereas the events
 * are read from the inotify fd (notify) right below — confirm that
 * polling fd rather than notify is intended. */
2308 r = fd_wait_for_event(fd, POLLIN, ts + timeout - n);
2318 l = read(notify, &buffer, sizeof(buffer));
2320 if (errno == EINTR || errno == EAGAIN)
2327 FOREACH_INOTIFY_EVENT(e, buffer, l) {
2328 if (e->wd != wd || !(e->mask & IN_CLOSE)) {
2337 /* We close the tty fd here since if the old session
2338 * ended our handle will be dead. It's important that
2339 * we do this after sleeping, so that we don't enter
2340 * an endless loop. */
2341 fd = safe_close(fd);
2346 r = reset_terminal_fd(fd, true);
2348 log_warning_errno(r, "Failed to reset terminal: %m");
/* Gives up the controlling terminal: opens /dev/tty and issues TIOCNOTTY on
 * it. SIGHUP is set to SIG_IGN around the ioctl() and the previous
 * disposition is restored afterwards. */
2359 int release_terminal(void) {
2360 static const struct sigaction sa_new = {
2361 .sa_handler = SIG_IGN,
2362 .sa_flags = SA_RESTART,
2365 _cleanup_close_ int fd = -1;
2366 struct sigaction sa_old;
2369 fd = open("/dev/tty", O_RDWR|O_NOCTTY|O_NDELAY|O_CLOEXEC);
2373 /* Temporarily ignore SIGHUP, so that we don't get SIGHUP'ed
2374 * by our own TIOCNOTTY */
2375 assert_se(sigaction(SIGHUP, &sa_new, &sa_old) == 0);
2377 if (ioctl(fd, TIOCNOTTY) < 0)
2380 assert_se(sigaction(SIGHUP, &sa_old, NULL) == 0);
2385 int sigaction_many(const struct sigaction *sa, ...) {
2390 while ((sig = va_arg(ap, int)) > 0)
2391 if (sigaction(sig, sa, NULL) < 0)
2398 int ignore_signals(int sig, ...) {
2399 struct sigaction sa = {
2400 .sa_handler = SIG_IGN,
2401 .sa_flags = SA_RESTART,
2406 if (sigaction(sig, &sa, NULL) < 0)
2410 while ((sig = va_arg(ap, int)) > 0)
2411 if (sigaction(sig, &sa, NULL) < 0)
2418 int default_signals(int sig, ...) {
2419 struct sigaction sa = {
2420 .sa_handler = SIG_DFL,
2421 .sa_flags = SA_RESTART,
2426 if (sigaction(sig, &sa, NULL) < 0)
2430 while ((sig = va_arg(ap, int)) > 0)
2431 if (sigaction(sig, &sa, NULL) < 0)
2438 void safe_close_pair(int p[]) {
2442 /* Special case pairs which use the same fd in both
2444 p[0] = p[1] = safe_close(p[0]);
2448 p[0] = safe_close(p[0]);
2449 p[1] = safe_close(p[1]);
2452 ssize_t loop_read(int fd, void *buf, size_t nbytes, bool do_poll) {
2459 while (nbytes > 0) {
2462 k = read(fd, p, nbytes);
2467 if (errno == EAGAIN && do_poll) {
2469 /* We knowingly ignore any return value here,
2470 * and expect that any error/EOF is reported
2473 fd_wait_for_event(fd, POLLIN, USEC_INFINITY);
2477 return n > 0 ? n : -errno;
2491 int loop_read_exact(int fd, void *buf, size_t nbytes, bool do_poll) {
2494 n = loop_read(fd, buf, nbytes, do_poll);
2497 if ((size_t) n != nbytes)
2502 int loop_write(int fd, const void *buf, size_t nbytes, bool do_poll) {
2503 const uint8_t *p = buf;
2510 while (nbytes > 0) {
2513 k = write(fd, p, nbytes);
2518 if (errno == EAGAIN && do_poll) {
2519 /* We knowingly ignore any return value here,
2520 * and expect that any error/EOF is reported
2523 fd_wait_for_event(fd, POLLOUT, USEC_INFINITY);
2530 if (k == 0) /* Can't really happen */
/* Parses a size specification from t. base must be 1000 or 1024 and selects
 * the SI or the IEC suffix table. Each term is read as a base-10 integer
 * with strtoll(), optionally followed by further digits handled as a
 * fraction, optional whitespace and a suffix from the selected table.
 * Overflow is checked against ULLONG_MAX and against the range of off_t. */
2540 int parse_size(const char *t, off_t base, off_t *size) {
2542 /* Soo, sometimes we want to parse IEC binary suffixes, and
2543 * sometimes SI decimal suffixes. This function can parse
2544 * both. Which one is the right way depends on the
2545 * context. Wikipedia suggests that SI is customary for
2546 * hardware metrics and network speeds, while IEC is
2547 * customary for most data sizes used by software and volatile
2548 * (RAM) memory. Hence be careful which one you pick!
2550 * In either case we use just K, M, G as suffix, and not Ki,
2551 * Mi, Gi or so (as IEC would suggest). That's because that's
2552 * frickin' ugly. But this means you really need to make sure
2553 * to document which base you are parsing when you use this
2558 unsigned long long factor;
2561 static const struct table iec[] = {
2562 { "E", 1024ULL*1024ULL*1024ULL*1024ULL*1024ULL*1024ULL },
2563 { "P", 1024ULL*1024ULL*1024ULL*1024ULL*1024ULL },
2564 { "T", 1024ULL*1024ULL*1024ULL*1024ULL },
2565 { "G", 1024ULL*1024ULL*1024ULL },
2566 { "M", 1024ULL*1024ULL },
2572 static const struct table si[] = {
2573 { "E", 1000ULL*1000ULL*1000ULL*1000ULL*1000ULL*1000ULL },
2574 { "P", 1000ULL*1000ULL*1000ULL*1000ULL*1000ULL },
2575 { "T", 1000ULL*1000ULL*1000ULL*1000ULL },
2576 { "G", 1000ULL*1000ULL*1000ULL },
2577 { "M", 1000ULL*1000ULL },
2583 const struct table *table;
2585 unsigned long long r = 0;
2586 unsigned n_entries, start_pos = 0;
2589 assert(base == 1000 || base == 1024);
2594 n_entries = ELEMENTSOF(si);
2597 n_entries = ELEMENTSOF(iec);
2603 unsigned long long l2;
2609 l = strtoll(p, &e, 10);
2622 if (*e >= '0' && *e <= '9') {
2625 /* strtoull itself would accept space/+/- */
2626 l2 = strtoull(e, &e2, 10);
2628 if (errno == ERANGE)
2631 /* Ignore failure. E.g. 10.M is valid */
2638 e += strspn(e, WHITESPACE);
2640 for (i = start_pos; i < n_entries; i++)
2641 if (startswith(e, table[i].suffix)) {
2642 unsigned long long tmp;
2643 if ((unsigned long long) l + (frac > 0) > ULLONG_MAX / table[i].factor)
2645 tmp = l * table[i].factor + (unsigned long long) (frac * table[i].factor);
2646 if (tmp > ULLONG_MAX - r)
2650 if ((unsigned long long) (off_t) r != r)
2653 p = e + strlen(table[i].suffix);
/* Makes fd the process's standard input, output and error by dup2()ing it
 * onto STDIN_FILENO, STDOUT_FILENO and STDERR_FILENO, then clears the
 * close-on-exec flag on all three descriptors with fd_cloexec().
 * NOTE(review): confirm what is returned when a dup2() fails and whether
 * the original fd is closed afterwards. */
2669 int make_stdio(int fd) {
/* All three duplications are attempted before any result is inspected. */
2674 r = dup2(fd, STDIN_FILENO);
2675 s = dup2(fd, STDOUT_FILENO);
2676 t = dup2(fd, STDERR_FILENO);
2681 if (r < 0 || s < 0 || t < 0)
2684 /* Explicitly unset O_CLOEXEC, since if fd was < 3, then
2685 * dup2() was a NOP and the bit hence possibly set. */
2686 fd_cloexec(STDIN_FILENO, false);
2687 fd_cloexec(STDOUT_FILENO, false);
2688 fd_cloexec(STDERR_FILENO, false);
2693 int make_null_stdio(void) {
2696 null_fd = open("/dev/null", O_RDWR|O_NOCTTY);
2700 return make_stdio(null_fd);
/* Prefix test on a path string: the result is the logical OR of two
 * path_startswith() checks, one against "/dev/" and one against "/sys/". */
2703 bool is_device_path(const char *path) {
2705 /* Returns true on paths that refer to a device, either in
2706 * sysfs or in /dev */
2709 path_startswith(path, "/dev/") ||
2710 path_startswith(path, "/sys/");
2713 int dir_is_empty(const char *path) {
2714 _cleanup_closedir_ DIR *d;
2725 if (!de && errno != 0)
2731 if (!hidden_file(de->d_name))
2736 char* dirname_malloc(const char *path) {
2737 char *d, *dir, *dir2;
2754 int dev_urandom(void *p, size_t n) {
2755 static int have_syscall = -1;
2757 _cleanup_close_ int fd = -1;
2760 /* Gathers some randomness from the kernel. This call will
2761 * never block, and will always return some data from the
2762 * kernel, regardless if the random pool is fully initialized
2763 * or not. It thus makes no guarantee for the quality of the
2764 * returned entropy, but is good enough for or usual usecases
2765 * of seeding the hash functions for hashtable */
2767 /* Use the getrandom() syscall unless we know we don't have
2768 * it, or when the requested size is too large for it. */
2769 if (have_syscall != 0 || (size_t) (int) n != n) {
2770 r = getrandom(p, n, GRND_NONBLOCK);
2772 have_syscall = true;
2777 if (errno == ENOSYS)
2778 /* we lack the syscall, continue with
2779 * reading from /dev/urandom */
2780 have_syscall = false;
2781 else if (errno == EAGAIN)
2782 /* not enough entropy for now. Let's
2783 * remember to use the syscall the
2784 * next time, again, but also read
2785 * from /dev/urandom for now, which
2786 * doesn't care about the current
2787 * amount of entropy. */
2788 have_syscall = true;
2792 /* too short read? */
2796 fd = open("/dev/urandom", O_RDONLY|O_CLOEXEC|O_NOCTTY);
2798 return errno == ENOENT ? -ENOSYS : -errno;
2800 return loop_read_exact(fd, p, n, true);
2803 void initialize_srand(void) {
2804 static bool srand_called = false;
2806 #ifdef HAVE_SYS_AUXV_H
2815 #ifdef HAVE_SYS_AUXV_H
2816 /* The kernel provides us with a bit of entropy in auxv, so
2817 * let's try to make use of that to seed the pseudo-random
2818 * generator. It's better than nothing... */
2820 auxv = (void*) getauxval(AT_RANDOM);
2822 x ^= *(unsigned*) auxv;
2825 x ^= (unsigned) now(CLOCK_REALTIME);
2826 x ^= (unsigned) gettid();
2829 srand_called = true;
2832 void random_bytes(void *p, size_t n) {
2836 r = dev_urandom(p, n);
2840 /* If some idiot made /dev/urandom unavailable to us, he'll
2841 * get a PRNG instead. */
2845 for (q = p; q < (uint8_t*) p + n; q ++)
2849 void rename_process(const char name[8]) {
2852 /* This is like a poor man's setproctitle(). It changes the
2853 * comm field, argv[0], and also the glibc's internally used
2854 * name of the process. For the first one a limit of 16 chars
2855 * applies, to the second one usually one of 10 (i.e. length
2856 * of "/sbin/init"), to the third one one of 7 (i.e. length of
2857 * "systemd"). If you pass a longer string it will be
2860 prctl(PR_SET_NAME, name);
2862 if (program_invocation_name)
2863 strncpy(program_invocation_name, name, strlen(program_invocation_name));
2865 if (saved_argc > 0) {
2869 strncpy(saved_argv[0], name, strlen(saved_argv[0]));
2871 for (i = 1; i < saved_argc; i++) {
2875 memzero(saved_argv[i], strlen(saved_argv[i]));
2880 void sigset_add_many(sigset_t *ss, ...) {
2887 while ((sig = va_arg(ap, int)) > 0)
2888 assert_se(sigaddset(ss, sig) == 0);
2892 int sigprocmask_many(int how, ...) {
2897 assert_se(sigemptyset(&ss) == 0);
2900 while ((sig = va_arg(ap, int)) > 0)
2901 assert_se(sigaddset(&ss, sig) == 0);
2904 if (sigprocmask(how, &ss, NULL) < 0)
/* Returns a strdup()ed copy of the node name reported by uname(). If the
 * node name is empty or the literal "(none)", a copy of the system name
 * (u.sysname) is returned instead. The result is heap-allocated and is
 * NULL if strdup() fails. A failing uname() trips assert_se(). */
2910 char* gethostname_malloc(void) {
2913 assert_se(uname(&u) >= 0);
2915 if (!isempty(u.nodename) && !streq(u.nodename, "(none)"))
2916 return strdup(u.nodename);
/* No usable node name: fall back to the system name. */
2918 return strdup(u.sysname);
/* True if uname() reports a node name that is neither empty nor the
 * literal "(none)" -- the same test gethostname_malloc() uses before
 * returning the node name. */
2921 bool hostname_is_set(void) {
2924 assert_se(uname(&u) >= 0);
2926 return !isempty(u.nodename) && !streq(u.nodename, "(none)");
2929 char *lookup_uid(uid_t uid) {
2932 _cleanup_free_ char *buf = NULL;
2933 struct passwd pwbuf, *pw = NULL;
2935 /* Shortcut things to avoid NSS lookups */
2937 return strdup("root");
2939 bufsize = sysconf(_SC_GETPW_R_SIZE_MAX);
2943 buf = malloc(bufsize);
2947 if (getpwuid_r(uid, &pwbuf, buf, bufsize, &pw) == 0 && pw)
2948 return strdup(pw->pw_name);
2950 if (asprintf(&name, UID_FMT, uid) < 0)
2956 char* getlogname_malloc(void) {
2960 if (isatty(STDIN_FILENO) && fstat(STDIN_FILENO, &st) >= 0)
2965 return lookup_uid(uid);
2968 char *getusername_malloc(void) {
2975 return lookup_uid(getuid());
2978 int getttyname_malloc(int fd, char **ret) {
2988 r = ttyname_r(fd, path, sizeof(path));
2993 p = startswith(path, "/dev/");
2994 c = strdup(p ?: path);
3011 int getttyname_harder(int fd, char **r) {
3015 k = getttyname_malloc(fd, &s);
3019 if (streq(s, "tty")) {
3021 return get_ctty(0, NULL, r);
3028 int get_ctty_devnr(pid_t pid, dev_t *d) {
3030 _cleanup_free_ char *line = NULL;
3032 unsigned long ttynr;
3036 p = procfs_file_alloca(pid, "stat");
3037 r = read_one_line_file(p, &line);
3041 p = strrchr(line, ')');
3051 "%*d " /* session */
3056 if (major(ttynr) == 0 && minor(ttynr) == 0)
3065 int get_ctty(pid_t pid, dev_t *_devnr, char **r) {
3066 char fn[sizeof("/dev/char/")-1 + 2*DECIMAL_STR_MAX(unsigned) + 1 + 1], *b = NULL;
3067 _cleanup_free_ char *s = NULL;
3074 k = get_ctty_devnr(pid, &devnr);
3078 sprintf(fn, "/dev/char/%u:%u", major(devnr), minor(devnr));
3080 k = readlink_malloc(fn, &s);
3086 /* This is an ugly hack */
3087 if (major(devnr) == 136) {
3088 if (asprintf(&b, "pts/%u", minor(devnr)) < 0)
3091 /* Probably something like the ptys which have no
3092 * symlink in /dev/char. Let's return something
3093 * vaguely useful. */
3100 if (startswith(s, "/dev/"))
3102 else if (startswith(s, "../"))
/* Tells whether a statfs result belongs to a memory-backed file system:
 * true if s->f_type matches TMPFS_MAGIC or RAMFS_MAGIC (compared with
 * F_TYPE_EQUAL). */
3119 bool is_temporary_fs(const struct statfs *s) {
3122 return F_TYPE_EQUAL(s->f_type, TMPFS_MAGIC) ||
3123 F_TYPE_EQUAL(s->f_type, RAMFS_MAGIC);
/* File-descriptor variant of is_temporary_fs(): queries the file system
 * of fd with fstatfs() and returns is_temporary_fs() of the result.
 * NOTE(review): confirm the value returned when fstatfs() fails
 * (presumably a negative errno). */
3126 int fd_is_temporary_fs(int fd) {
3129 if (fstatfs(fd, &s) < 0)
3132 return is_temporary_fs(&s);
/* Sets access mode and ownership of path, in that order.
 *
 * mode: new mode, or MODE_INVALID to leave the mode alone.
 * uid/gid: new owner and group; chown() is called as soon as either one
 *          differs from UID_INVALID / GID_INVALID, and both values are
 *          handed to chown() as they are.
 * NOTE(review): confirm the values returned on failure and on success. */
3135 int chmod_and_chown(const char *path, mode_t mode, uid_t uid, gid_t gid) {
3138 /* Under the assumption that we are running privileged we
3139 * first change the access mode and only then hand out
3140 * ownership to avoid a window where access is too open. */
3142 if (mode != MODE_INVALID)
3143 if (chmod(path, mode) < 0)
3146 if (uid != UID_INVALID || gid != GID_INVALID)
3147 if (chown(path, uid, gid) < 0)
/* Same as chmod_and_chown(), but operating on an open file descriptor via
 * fchmod() and fchown().
 *
 * mode: new mode, or MODE_INVALID to leave the mode alone.
 * uid/gid: new owner and group; fchown() is called as soon as either one
 *          differs from UID_INVALID / GID_INVALID.
 * NOTE(review): confirm the values returned on failure and on success. */
3153 int fchmod_and_fchown(int fd, mode_t mode, uid_t uid, gid_t gid) {
3156 /* Under the assumption that we are running privileged we
3157 * first change the access mode and only then hand out
3158 * ownership to avoid a window where access is too open. */
3160 if (mode != MODE_INVALID)
3161 if (fchmod(fd, mode) < 0)
3164 if (uid != UID_INVALID || gid != GID_INVALID)
3165 if (fchown(fd, uid, gid) < 0)
3171 cpu_set_t* cpu_set_malloc(unsigned *ncpus) {
3175 /* Allocates the cpuset in the right size */
3178 if (!(r = CPU_ALLOC(n)))
3181 if (sched_getaffinity(0, CPU_ALLOC_SIZE(n), r) >= 0) {
3182 CPU_ZERO_S(CPU_ALLOC_SIZE(n), r);
3192 if (errno != EINVAL)
3199 int status_vprintf(const char *status, bool ellipse, bool ephemeral, const char *format, va_list ap) {
3200 static const char status_indent[] = " "; /* "[" STATUS "] " */
3201 _cleanup_free_ char *s = NULL;
3202 _cleanup_close_ int fd = -1;
3203 struct iovec iovec[6] = {};
3205 static bool prev_ephemeral;
3209 /* This is independent of logging, as status messages are
3210 * optional and go exclusively to the console. */
3212 if (vasprintf(&s, format, ap) < 0)
3215 fd = open_terminal("/dev/console", O_WRONLY|O_NOCTTY|O_CLOEXEC);
3228 sl = status ? sizeof(status_indent)-1 : 0;
3234 e = ellipsize(s, emax, 50);
3242 IOVEC_SET_STRING(iovec[n++], "\r" ANSI_ERASE_TO_END_OF_LINE);
3243 prev_ephemeral = ephemeral;
3246 if (!isempty(status)) {
3247 IOVEC_SET_STRING(iovec[n++], "[");
3248 IOVEC_SET_STRING(iovec[n++], status);
3249 IOVEC_SET_STRING(iovec[n++], "] ");
3251 IOVEC_SET_STRING(iovec[n++], status_indent);
3254 IOVEC_SET_STRING(iovec[n++], s);
3256 IOVEC_SET_STRING(iovec[n++], "\n");
3258 if (writev(fd, iovec, n) < 0)
/* Variadic front-end for status_vprintf(): the arguments following format
 * are collected into a va_list and passed on together with status,
 * ellipse, ephemeral and format, all unchanged. */
3264 int status_printf(const char *status, bool ellipse, bool ephemeral, const char *format, ...) {
3270 va_start(ap, format);
3271 r = status_vprintf(status, ellipse, ephemeral, format, ap);
3277 char *replace_env(const char *format, char **env) {
3284 const char *e, *word = format;
3289 for (e = format; *e; e ++) {
3300 k = strnappend(r, word, e-word-1);
3310 } else if (*e == '$') {
3311 k = strnappend(r, word, e-word);
3328 t = strempty(strv_env_get_n(env, word+2, e-word-2));
3330 k = strappend(r, t);
3344 k = strnappend(r, word, e-word);
3356 char **replace_env_argv(char **argv, char **env) {
3358 unsigned k = 0, l = 0;
3360 l = strv_length(argv);
3362 ret = new(char*, l+1);
3366 STRV_FOREACH(i, argv) {
3368 /* If $FOO appears as single word, replace it by the split up variable */
3369 if ((*i)[0] == '$' && (*i)[1] != '{') {
3371 char **w, **m = NULL;
3374 e = strv_env_get(env, *i+1);
3378 r = strv_split_quoted(&m, e, UNQUOTE_RELAX);
3390 w = realloc(ret, sizeof(char*) * (l+1));
3400 memcpy(ret + k, m, q * sizeof(char*));
3408 /* If ${FOO} appears as part of a word, replace it by the variable as-is */
3409 ret[k] = replace_env(*i, env);
3421 int fd_columns(int fd) {
3422 struct winsize ws = {};
3424 if (ioctl(fd, TIOCGWINSZ, &ws) < 0)
3433 unsigned columns(void) {
3437 if (_likely_(cached_columns > 0))
3438 return cached_columns;
3441 e = getenv("COLUMNS");
3443 (void) safe_atoi(e, &c);
3446 c = fd_columns(STDOUT_FILENO);
3452 return cached_columns;
3455 int fd_lines(int fd) {
3456 struct winsize ws = {};
3458 if (ioctl(fd, TIOCGWINSZ, &ws) < 0)
3467 unsigned lines(void) {
3471 if (_likely_(cached_lines > 0))
3472 return cached_lines;
3475 e = getenv("LINES");
3477 (void) safe_atoi(e, &l);
3480 l = fd_lines(STDOUT_FILENO);
3486 return cached_lines;
3489 /* intended to be used as a SIGWINCH sighandler */
3490 void columns_lines_cache_reset(int signum) {
3496 static int cached_on_tty = -1;
3498 if (_unlikely_(cached_on_tty < 0))
3499 cached_on_tty = isatty(STDOUT_FILENO) > 0;
3501 return cached_on_tty;
/* Checks whether two paths refer to the same file system object.
 *
 * Both paths are resolved with stat(), so symlinks are followed.
 *
 * Returns 1 if both resolve to the same device and inode, 0 if they
 * resolve to different objects, and a negative errno-style value if
 * either stat() call fails (filea is checked first). */
int files_same(const char *filea, const char *fileb) {
        struct stat a, b;

        if (stat(filea, &a) < 0)
                return -errno;

        if (stat(fileb, &b) < 0)
                return -errno;

        /* An inode number is only unique per device, hence compare both */
        return a.st_dev == b.st_dev &&
               a.st_ino == b.st_ino;
}
3517 int running_in_chroot(void) {
3520 ret = files_same("/proc/1/root", "/");
3527 static char *ascii_ellipsize_mem(const char *s, size_t old_length, size_t new_length, unsigned percent) {
3532 assert(percent <= 100);
3533 assert(new_length >= 3);
3535 if (old_length <= 3 || old_length <= new_length)
3536 return strndup(s, old_length);
3538 r = new0(char, new_length+1);
3542 x = (new_length * percent) / 100;
3544 if (x > new_length - 3)
3552 s + old_length - (new_length - x - 3),
3553 new_length - x - 3);
3558 char *ellipsize_mem(const char *s, size_t old_length, size_t new_length, unsigned percent) {
3562 unsigned k, len, len2;
3565 assert(percent <= 100);
3566 assert(new_length >= 3);
3568 /* if no multibyte characters use ascii_ellipsize_mem for speed */
3569 if (ascii_is_valid(s))
3570 return ascii_ellipsize_mem(s, old_length, new_length, percent);
3572 if (old_length <= 3 || old_length <= new_length)
3573 return strndup(s, old_length);
3575 x = (new_length * percent) / 100;
3577 if (x > new_length - 3)
3581 for (i = s; k < x && i < s + old_length; i = utf8_next_char(i)) {
3584 c = utf8_encoded_to_unichar(i);
3587 k += unichar_iswide(c) ? 2 : 1;
3590 if (k > x) /* last character was wide and went over quota */
3593 for (j = s + old_length; k < new_length && j > i; ) {
3596 j = utf8_prev_char(j);
3597 c = utf8_encoded_to_unichar(j);
3600 k += unichar_iswide(c) ? 2 : 1;
3604 /* we don't actually need to ellipsize */
3606 return memdup(s, old_length + 1);
3608 /* make space for ellipsis */
3609 j = utf8_next_char(j);
3612 len2 = s + old_length - j;
3613 e = new(char, len + 3 + len2 + 1);
3618 printf("old_length=%zu new_length=%zu x=%zu len=%u len2=%u k=%u\n",
3619 old_length, new_length, x, len, len2, k);
3623 e[len] = 0xe2; /* tri-dot ellipsis: … */
3627 memcpy(e + len + 3, j, len2 + 1);
/* Convenience wrapper around ellipsize_mem() for NUL-terminated strings:
 * the input length is taken with strlen(s), while length and percent are
 * passed through as new_length and percent. s must not be NULL, since it
 * is handed to strlen(). */
3632 char *ellipsize(const char *s, size_t length, unsigned percent) {
3633 return ellipsize_mem(s, strlen(s), length, percent);
3636 int touch_file(const char *path, bool parents, usec_t stamp, uid_t uid, gid_t gid, mode_t mode) {
3637 _cleanup_close_ int fd;
3643 mkdir_parents(path, 0755);
3645 fd = open(path, O_WRONLY|O_CREAT|O_CLOEXEC|O_NOCTTY, mode > 0 ? mode : 0644);
3650 r = fchmod(fd, mode);
3655 if (uid != UID_INVALID || gid != GID_INVALID) {
3656 r = fchown(fd, uid, gid);
3661 if (stamp != USEC_INFINITY) {
3662 struct timespec ts[2];
3664 timespec_store(&ts[0], stamp);
3666 r = futimens(fd, ts);
3668 r = futimens(fd, NULL);
/* Shorthand for touch_file() with all optional behaviour switched off:
 * parents=false, stamp=USEC_INFINITY (no explicit timestamp),
 * uid/gid=UID_INVALID/GID_INVALID (ownership untouched) and mode=0. */
3675 int touch(const char *path) {
3676 return touch_file(path, false, USEC_INFINITY, UID_INVALID, GID_INVALID, 0);
3679 static char *unquote(const char *s, const char* quotes) {
3683 /* This is rather stupid, simply removes the heading and
3684 * trailing quotes if there is one. Doesn't care about
3685 * escaping or anything.
3687 * DON'T USE THIS FOR NEW CODE ANYMORE!*/
3693 if (strchr(quotes, s[0]) && s[l-1] == s[0])
3694 return strndup(s+1, l-2);
3699 int wait_for_terminate(pid_t pid, siginfo_t *status) {
3710 if (waitid(P_PID, pid, status, WEXITED) < 0) {
3724 * < 0 : wait_for_terminate() failed to get the state of the
3725 * process, the process was terminated by a signal, or
3726 * failed for an unknown reason.
3727 * >=0 : The process terminated normally, and its exit code is
3730 * That is, success is indicated by a return value of zero, and an
3731 * error is indicated by a non-zero value.
3733 * A warning is emitted if the process terminates abnormally, and also
3734 * if it returns non-zero while check_exit_code is true (else debug only).
3736 int wait_for_terminate_and_warn(const char *name, pid_t pid, bool check_exit_code) {
3743 r = wait_for_terminate(pid, &status);
3745 return log_warning_errno(r, "Failed to wait for %s: %m", name);
3747 if (status.si_code == CLD_EXITED) {
3748 if (status.si_status != 0)
3749 log_full(check_exit_code ? LOG_WARNING : LOG_DEBUG,
3750 "%s failed with error code %i.", name, status.si_status);
3752 log_debug("%s succeeded.", name);
3754 return status.si_status;
3755 } else if (status.si_code == CLD_KILLED ||
3756 status.si_code == CLD_DUMPED) {
3758 log_warning("%s terminated by signal %s.", name, signal_to_string(status.si_status));
3762 log_warning("%s failed due to unknown reason.", name);
3766 noreturn void freeze(void) {
3768 /* Make sure nobody waits for us on a socket anymore */
3769 close_all_fds(NULL, 0);
/* Decides from a stat result whether a file counts as "null or empty".
 *
 * Returns true for a regular file whose size is zero (or less), and for
 * every character or block device. Returns false for everything else,
 * including directories and non-empty regular files. st must not be NULL. */
bool null_or_empty(struct stat *st) {
        assert(st);

        if (S_ISREG(st->st_mode) && st->st_size <= 0)
                return true;

        /* Device nodes qualify regardless of which device they are */
        if (S_ISCHR(st->st_mode) || S_ISBLK(st->st_mode))
                return true;

        return false;
}
/* Path variant of null_or_empty(): stat()s fn (following symlinks) and
 * returns null_or_empty() of the result.
 * NOTE(review): confirm the value returned when stat() fails (presumably
 * a negative errno). */
3789 int null_or_empty_path(const char *fn) {
3794 if (stat(fn, &st) < 0)
3797 return null_or_empty(&st);
/* File-descriptor variant of null_or_empty(): fstat()s fd and returns
 * null_or_empty() of the result.
 * NOTE(review): confirm the value returned when fstat() fails (presumably
 * a negative errno). */
3800 int null_or_empty_fd(int fd) {
3805 if (fstat(fd, &st) < 0)
3808 return null_or_empty(&st);
3811 DIR *xopendirat(int fd, const char *name, int flags) {
3815 assert(!(flags & O_CREAT));
3817 nfd = openat(fd, name, O_RDONLY|O_NONBLOCK|O_DIRECTORY|O_CLOEXEC|flags, 0);
/* More lenient version of signal_from_string(): s is looked up as given,
 * and a name carrying a "SIG" prefix (e.g. "SIGTERM") is additionally
 * accepted by looking up the part after the prefix.
 * NOTE(review): presumably the prefixed lookup is only attempted when the
 * plain lookup did not yield a signal -- confirm. */
3830 int signal_from_string_try_harder(const char *s) {
3834 signo = signal_from_string(s);
3836 if (startswith(s, "SIG"))
3837 return signal_from_string(s+3);
3842 static char *tag_to_udev_node(const char *tagvalue, const char *by) {
3843 _cleanup_free_ char *t = NULL, *u = NULL;
3846 u = unquote(tagvalue, QUOTES);
3850 enc_len = strlen(u) * 4 + 1;
3851 t = new(char, enc_len);
3855 if (encode_devnode_name(u, t, enc_len) < 0)
3858 return strjoin("/dev/disk/by-", by, "/", t, NULL);
/* Translates fstab-style tag specifications into a device node path.
 *
 * For the prefixes LABEL=, UUID=, PARTUUID= and PARTLABEL= the text after
 * the '=' is handed to tag_to_udev_node() together with the matching
 * directory suffix ("label", "uuid", "partuuid", "partlabel"); that
 * helper builds a newly allocated "/dev/disk/by-<suffix>/<encoded value>"
 * string. The numeric offsets below are the lengths of the prefixes.
 * NOTE(review): confirm what is returned for input without such a prefix. */
3861 char *fstab_node_to_udev_node(const char *p) {
3864 if (startswith(p, "LABEL="))
3865 return tag_to_udev_node(p+6, "label");
3867 if (startswith(p, "UUID="))
3868 return tag_to_udev_node(p+5, "uuid");
3870 if (startswith(p, "PARTUUID="))
3871 return tag_to_udev_node(p+9, "partuuid");
3873 if (startswith(p, "PARTLABEL="))
3874 return tag_to_udev_node(p+10, "partlabel");
/* True if tty names a virtual console, i.e. if vtnr_from_tty() returns a
 * non-negative value for it. */
3879 bool tty_is_vc(const char *tty) {
3882 return vtnr_from_tty(tty) >= 0;
/* True if tty names the console device: the name is checked for a "/dev/"
 * prefix and then compared against "console".
 * NOTE(review): presumably the prefix is skipped before the comparison, so
 * that both "console" and "/dev/console" match -- confirm. */
3885 bool tty_is_console(const char *tty) {
3888 if (startswith(tty, "/dev/"))
3891 return streq(tty, "console");
/* Extracts the virtual terminal number from a tty name such as "tty7".
 *
 * The name is checked for a "/dev/" prefix, has to start with "tty" and
 * must carry a decimal digit directly after that; the text following
 * "tty" is parsed with safe_atoi() and the result is range-checked
 * against 0..63. tty_is_vc() treats a negative result of this function
 * as "not a virtual console".
 * NOTE(review): confirm the error codes returned when a check fails. */
3894 int vtnr_from_tty(const char *tty) {
3899 if (startswith(tty, "/dev/"))
3902 if (!startswith(tty, "tty") )
/* Require a digit right away, before the number is parsed below */
3905 if (tty[3] < '0' || tty[3] > '9')
3908 r = safe_atoi(tty+3, &i);
3912 if (i < 0 || i > 63)
3918 char *resolve_dev_console(char **active) {
3921 /* Resolve where /dev/console is pointing to, if /sys is actually ours
3922 * (i.e. not read-only-mounted which is a sign for container setups) */
3924 if (path_is_read_only_fs("/sys") > 0)
3927 if (read_one_line_file("/sys/class/tty/console/active", active) < 0)
3930 /* If multiple log outputs are configured the last one is what
3931 * /dev/console points to */
3932 tty = strrchr(*active, ' ');
3938 if (streq(tty, "tty0")) {
3941 /* Get the active VC (e.g. tty1) */
3942 if (read_one_line_file("/sys/class/tty/tty0/active", &tmp) >= 0) {
3944 tty = *active = tmp;
3951 bool tty_is_vc_resolve(const char *tty) {
3952 _cleanup_free_ char *active = NULL;
3956 if (startswith(tty, "/dev/"))
3959 if (streq(tty, "console")) {
3960 tty = resolve_dev_console(&active);
3965 return tty_is_vc(tty);
/* Picks the TERM environment assignment for a tty: "TERM=linux" if
 * tty_is_vc_resolve() reports a virtual console, "TERM=vt220" otherwise.
 * Both results are string literals, so the caller must not free them. */
3968 const char *default_term_for_tty(const char *tty) {
3971 return tty_is_vc_resolve(tty) ? "TERM=linux" : "TERM=vt220";
/* Filter for directory entries that may be plain files. Two things are
 * examined: whether hidden_file() flags the entry name, and whether
 * d_type is something other than DT_REG, DT_LNK or DT_UNKNOWN.
 * NOTE(review): presumably either condition makes the entry fail the
 * filter -- confirm. */
3974 bool dirent_is_file(const struct dirent *de) {
3977 if (hidden_file(de->d_name))
3980 if (de->d_type != DT_REG &&
3981 de->d_type != DT_LNK &&
3982 de->d_type != DT_UNKNOWN)
/* Like dirent_is_file(), but with a suffix requirement: after the d_type
 * check (DT_REG, DT_LNK or DT_UNKNOWN) and a hidden_file_allow_backup()
 * check on the name, the result is whether d_name ends in suffix.
 * NOTE(review): presumably an entry failing either of the first two
 * checks is rejected -- confirm. */
3988 bool dirent_is_file_with_suffix(const struct dirent *de, const char *suffix) {
3991 if (de->d_type != DT_REG &&
3992 de->d_type != DT_LNK &&
3993 de->d_type != DT_UNKNOWN)
3996 if (hidden_file_allow_backup(de->d_name))
3999 return endswith(de->d_name, suffix);
4002 static int do_execute(char **directories, usec_t timeout, char *argv[]) {
4003 _cleanup_hashmap_free_free_ Hashmap *pids = NULL;
4004 _cleanup_set_free_free_ Set *seen = NULL;
4007 /* We fork this all off from a child process so that we can
4008 * somewhat cleanly make use of SIGALRM to set a time limit */
4010 reset_all_signal_handlers();
4011 reset_signal_mask();
4013 assert_se(prctl(PR_SET_PDEATHSIG, SIGTERM) == 0);
4015 pids = hashmap_new(NULL);
4019 seen = set_new(&string_hash_ops);
4023 STRV_FOREACH(directory, directories) {
4024 _cleanup_closedir_ DIR *d;
4027 d = opendir(*directory);
4029 if (errno == ENOENT)
4032 return log_error_errno(errno, "Failed to open directory %s: %m", *directory);
4035 FOREACH_DIRENT(de, d, break) {
4036 _cleanup_free_ char *path = NULL;
4040 if (!dirent_is_file(de))
4043 if (set_contains(seen, de->d_name)) {
4044 log_debug("%1$s/%2$s skipped (%2$s was already seen).", *directory, de->d_name);
4048 r = set_put_strdup(seen, de->d_name);
4052 path = strjoin(*directory, "/", de->d_name, NULL);
4056 if (null_or_empty_path(path)) {
4057 log_debug("%s is empty (a mask).", path);
4063 log_error_errno(errno, "Failed to fork: %m");
4065 } else if (pid == 0) {
4068 assert_se(prctl(PR_SET_PDEATHSIG, SIGTERM) == 0);
4078 return log_error_errno(errno, "Failed to execute %s: %m", path);
4081 log_debug("Spawned %s as " PID_FMT ".", path, pid);
4083 r = hashmap_put(pids, UINT_TO_PTR(pid), path);
4090 /* Abort execution of this process after the timeout. We simply
4091 * rely on SIGALRM as default action terminating the process,
4092 * and turn on alarm(). */
4094 if (timeout != USEC_INFINITY)
4095 alarm((timeout + USEC_PER_SEC - 1) / USEC_PER_SEC);
4097 while (!hashmap_isempty(pids)) {
4098 _cleanup_free_ char *path = NULL;
4101 pid = PTR_TO_UINT(hashmap_first_key(pids));
4104 path = hashmap_remove(pids, UINT_TO_PTR(pid));
4107 wait_for_terminate_and_warn(path, pid, true);
4113 void execute_directories(const char* const* directories, usec_t timeout, char *argv[]) {
4117 char **dirs = (char**) directories;
4119 assert(!strv_isempty(dirs));
4121 name = basename(dirs[0]);
4122 assert(!isempty(name));
4124 /* Executes all binaries in the directories in parallel and waits
4125 * for them to finish. Optionally a timeout is applied. If a file
4126 * with the same name exists in more than one directory, the
4127 * earliest one wins. */
4129 executor_pid = fork();
4130 if (executor_pid < 0) {
4131 log_error_errno(errno, "Failed to fork: %m");
4134 } else if (executor_pid == 0) {
4135 r = do_execute(dirs, timeout, argv);
4136 _exit(r < 0 ? EXIT_FAILURE : EXIT_SUCCESS);
4139 wait_for_terminate_and_warn(name, executor_pid, true);
4142 int kill_and_sigcont(pid_t pid, int sig) {
4145 r = kill(pid, sig) < 0 ? -errno : 0;
4153 bool nulstr_contains(const char*nulstr, const char *needle) {
4159 NULSTR_FOREACH(i, nulstr)
4160 if (streq(i, needle))
/* True if /run/plymouth/pid exists, tested with access(F_OK). Only the
 * presence of the file is checked; its contents are not read. */
4166 bool plymouth_running(void) {
4167 return access("/run/plymouth/pid", F_OK) >= 0;
4170 char* strshorten(char *s, size_t l) {
4179 static bool hostname_valid_char(char c) {
4181 (c >= 'a' && c <= 'z') ||
4182 (c >= 'A' && c <= 'Z') ||
4183 (c >= '0' && c <= '9') ||
4189 bool hostname_is_valid(const char *s) {
4196 /* Doesn't accept empty hostnames, hostnames with trailing or
4197 * leading dots, and hostnames with multiple dots in a
4198 * sequence. Also ensures that the length stays below
4201 for (p = s, dot = true; *p; p++) {
4208 if (!hostname_valid_char(*p))
4218 if (p-s > HOST_NAME_MAX)
4224 char* hostname_cleanup(char *s, bool lowercase) {
4228 for (p = s, d = s, dot = true; *p; p++) {
4235 } else if (hostname_valid_char(*p)) {
4236 *(d++) = lowercase ? tolower(*p) : *p;
4247 strshorten(s, HOST_NAME_MAX);
4252 bool machine_name_is_valid(const char *s) {
4254 if (!hostname_is_valid(s))
4257 /* Machine names should be useful hostnames, but also be
4258 * useful in unit names, hence we enforce a stricter length
4267 int pipe_eof(int fd) {
4268 struct pollfd pollfd = {
4270 .events = POLLIN|POLLHUP,
4275 r = poll(&pollfd, 1, 0);
4282 return pollfd.revents & POLLHUP;
4285 int fd_wait_for_event(int fd, int event, usec_t t) {
4287 struct pollfd pollfd = {
4295 r = ppoll(&pollfd, 1, t == USEC_INFINITY ? NULL : timespec_store(&ts, t), NULL);
4302 return pollfd.revents;
4305 int fopen_temporary(const char *path, FILE **_f, char **_temp_path) {
4314 r = tempfn_xxxxxx(path, &t);
4318 fd = mkostemp_safe(t, O_WRONLY|O_CLOEXEC);
4324 f = fdopen(fd, "we");
/* Issues the TIOCVHANGUP ioctl on the terminal referred to by fd.
 * NOTE(review): confirm the return values (presumably a negative errno
 * when the ioctl fails). */
4337 int terminal_vhangup_fd(int fd) {
4340 if (ioctl(fd, TIOCVHANGUP) < 0)
/* Path variant of terminal_vhangup_fd(): opens the terminal name with
 * open_terminal() (O_RDWR|O_NOCTTY|O_CLOEXEC) and returns the result of
 * terminal_vhangup_fd() on the new descriptor. The descriptor is declared
 * _cleanup_close_, presumably closing it when the function returns.
 * NOTE(review): confirm what is returned when open_terminal() fails. */
4346 int terminal_vhangup(const char *name) {
4347 _cleanup_close_ int fd;
4349 fd = open_terminal(name, O_RDWR|O_NOCTTY|O_CLOEXEC);
4353 return terminal_vhangup_fd(fd);
4356 int vt_disallocate(const char *name) {
4360 /* Deallocate the VT if possible. If not possible
4361 * (i.e. because it is the active one), at least clear it
4362 * entirely (including the scrollback buffer) */
4364 if (!startswith(name, "/dev/"))
4367 if (!tty_is_vc(name)) {
4368 /* So this is not a VT. I guess we cannot deallocate
4369 * it then. But let's at least clear the screen */
4371 fd = open_terminal(name, O_RDWR|O_NOCTTY|O_CLOEXEC);
4376 "\033[r" /* clear scrolling region */
4377 "\033[H" /* move home */
4378 "\033[2J", /* clear screen */
4385 if (!startswith(name, "/dev/tty"))
4388 r = safe_atou(name+8, &u);
4395 /* Try to deallocate */
4396 fd = open_terminal("/dev/tty0", O_RDWR|O_NOCTTY|O_CLOEXEC);
4400 r = ioctl(fd, VT_DISALLOCATE, u);
4409 /* Couldn't deallocate, so let's clear it fully with
4411 fd = open_terminal(name, O_RDWR|O_NOCTTY|O_CLOEXEC);
4416 "\033[r" /* clear scrolling region */
4417 "\033[H" /* move home */
4418 "\033[3J", /* clear screen including scrollback, requires Linux 2.6.40 */
4425 int symlink_atomic(const char *from, const char *to) {
4426 _cleanup_free_ char *t = NULL;
4432 r = tempfn_random(to, &t);
4436 if (symlink(from, t) < 0)
4439 if (rename(t, to) < 0) {
4447 int mknod_atomic(const char *path, mode_t mode, dev_t dev) {
4448 _cleanup_free_ char *t = NULL;
4453 r = tempfn_random(path, &t);
4457 if (mknod(t, mode, dev) < 0)
4460 if (rename(t, path) < 0) {
4468 int mkfifo_atomic(const char *path, mode_t mode) {
4469 _cleanup_free_ char *t = NULL;
4474 r = tempfn_random(path, &t);
4478 if (mkfifo(t, mode) < 0)
4481 if (rename(t, path) < 0) {
/* Tells whether an X11 display string refers to a local display.
 *
 * A display counts as local if it starts with ':' immediately followed by
 * a decimal digit, e.g. ":0" or ":10.0". Anything with a host part
 * ("localhost:0"), a bare ":" or the empty string does not. Only the
 * first two characters are inspected, and display[1] is never read when
 * display[0] is not ':' (short-circuit evaluation), so short strings are
 * safe. display must not be NULL. */
bool display_is_local(const char *display) {
        assert(display);

        return
                display[0] == ':' &&
                display[1] >= '0' &&
                display[1] <= '9';
}
4498 int socket_from_display(const char *display, char **path) {
4505 if (!display_is_local(display))
4508 k = strspn(display+1, "0123456789");
4510 f = new(char, strlen("/tmp/.X11-unix/X") + k + 1);
4514 c = stpcpy(f, "/tmp/.X11-unix/X");
4515 memcpy(c, display+1, k);
4524 const char **username,
4525 uid_t *uid, gid_t *gid,
4527 const char **shell) {
4535 /* We enforce some special rules for uid=0: in order to avoid
4536 * NSS lookups for root we hardcode its data. */
4538 if (streq(*username, "root") || streq(*username, "0")) {
4556 if (parse_uid(*username, &u) >= 0) {
4560 /* If there are multiple users with the same id, make
4561 * sure to leave $USER to the configured value instead
4562 * of the first occurrence in the database. However if
4563 * the uid was configured by a numeric uid, then let's
4564 * pick the real username from /etc/passwd. */
4566 *username = p->pw_name;
4569 p = getpwnam(*username);
4573 return errno > 0 ? -errno : -ESRCH;
4585 *shell = p->pw_shell;
4590 char* uid_to_name(uid_t uid) {
4595 return strdup("root");
4599 return strdup(p->pw_name);
4601 if (asprintf(&r, UID_FMT, uid) < 0)
4607 char* gid_to_name(gid_t gid) {
4612 return strdup("root");
4616 return strdup(p->gr_name);
4618 if (asprintf(&r, GID_FMT, gid) < 0)
4624 int get_group_creds(const char **groupname, gid_t *gid) {
4630 /* We enforce some special rules for gid=0: in order to avoid
4631 * NSS lookups for root we hardcode its data. */
4633 if (streq(*groupname, "root") || streq(*groupname, "0")) {
4634 *groupname = "root";
4642 if (parse_gid(*groupname, &id) >= 0) {
4647 *groupname = g->gr_name;
4650 g = getgrnam(*groupname);
4654 return errno > 0 ? -errno : -ESRCH;
4662 int in_gid(gid_t gid) {
4664 int ngroups_max, r, i;
4666 if (getgid() == gid)
4669 if (getegid() == gid)
4672 ngroups_max = sysconf(_SC_NGROUPS_MAX);
4673 assert(ngroups_max > 0);
4675 gids = alloca(sizeof(gid_t) * ngroups_max);
4677 r = getgroups(ngroups_max, gids);
4681 for (i = 0; i < r; i++)
4688 int in_group(const char *name) {
4692 r = get_group_creds(&name, &gid);
4699 int glob_exists(const char *path) {
4700 _cleanup_globfree_ glob_t g = {};
4706 k = glob(path, GLOB_NOSORT|GLOB_BRACE, NULL, &g);
4708 if (k == GLOB_NOMATCH)
4710 else if (k == GLOB_NOSPACE)
4713 return !strv_isempty(g.gl_pathv);
4715 return errno ? -errno : -EIO;
4718 int glob_extend(char ***strv, const char *path) {
4719 _cleanup_globfree_ glob_t g = {};
4724 k = glob(path, GLOB_NOSORT|GLOB_BRACE, NULL, &g);
4726 if (k == GLOB_NOMATCH)
4728 else if (k == GLOB_NOSPACE)
4730 else if (k != 0 || strv_isempty(g.gl_pathv))
4731 return errno ? -errno : -EIO;
4733 STRV_FOREACH(p, g.gl_pathv) {
4734 k = strv_extend(strv, *p);
4742 int dirent_ensure_type(DIR *d, struct dirent *de) {
4748 if (de->d_type != DT_UNKNOWN)
4751 if (fstatat(dirfd(d), de->d_name, &st, AT_SYMLINK_NOFOLLOW) < 0)
4755 S_ISREG(st.st_mode) ? DT_REG :
4756 S_ISDIR(st.st_mode) ? DT_DIR :
4757 S_ISLNK(st.st_mode) ? DT_LNK :
4758 S_ISFIFO(st.st_mode) ? DT_FIFO :
4759 S_ISSOCK(st.st_mode) ? DT_SOCK :
4760 S_ISCHR(st.st_mode) ? DT_CHR :
4761 S_ISBLK(st.st_mode) ? DT_BLK :
4767 int get_files_in_directory(const char *path, char ***list) {
4768 _cleanup_closedir_ DIR *d = NULL;
4769 size_t bufsize = 0, n = 0;
4770 _cleanup_strv_free_ char **l = NULL;
4774 /* Returns all files in a directory in *list, and the number
4775 * of files as return value. If list is NULL returns only the
4787 if (!de && errno != 0)
4792 dirent_ensure_type(d, de);
4794 if (!dirent_is_file(de))
4798 /* one extra slot is needed for the terminating NULL */
4799 if (!GREEDY_REALLOC(l, bufsize, n + 2))
4802 l[n] = strdup(de->d_name);
4813 l = NULL; /* avoid freeing */
4819 char *strjoin(const char *x, ...) {
4833 t = va_arg(ap, const char *);
4838 if (n > ((size_t) -1) - l) {
4862 t = va_arg(ap, const char *);
/* Determines whether the caller runs in the main thread by comparing
 * getpid() with gettid(). The answer is cached in a thread_local int:
 * 0 means not determined yet, 1 means main thread, -1 means any other
 * thread. */
4876 bool is_main_thread(void) {
4877 static thread_local int cached = 0;
4879 if (_unlikely_(cached == 0))
4880 cached = getpid() == gettid() ? 1 : -1;
4885 int block_get_whole_disk(dev_t d, dev_t *ret) {
4892 /* If it has a queue this is good enough for us */
4893 if (asprintf(&p, "/sys/dev/block/%u:%u/queue", major(d), minor(d)) < 0)
4896 r = access(p, F_OK);
4904 /* If it is a partition find the originating device */
4905 if (asprintf(&p, "/sys/dev/block/%u:%u/partition", major(d), minor(d)) < 0)
4908 r = access(p, F_OK);
4914 /* Get parent dev_t */
4915 if (asprintf(&p, "/sys/dev/block/%u:%u/../dev", major(d), minor(d)) < 0)
4918 r = read_one_line_file(p, &s);
4924 r = sscanf(s, "%u:%u", &m, &n);
4930 /* Only return this if it is really good enough for us. */
4931 if (asprintf(&p, "/sys/dev/block/%u:%u/queue", m, n) < 0)
4934 r = access(p, F_OK);
4938 *ret = makedev(m, n);
4945 static const char *const ioprio_class_table[] = {
4946 [IOPRIO_CLASS_NONE] = "none",
4947 [IOPRIO_CLASS_RT] = "realtime",
4948 [IOPRIO_CLASS_BE] = "best-effort",
4949 [IOPRIO_CLASS_IDLE] = "idle"
4952 DEFINE_STRING_TABLE_LOOKUP_WITH_FALLBACK(ioprio_class, int, INT_MAX);
4954 static const char *const sigchld_code_table[] = {
4955 [CLD_EXITED] = "exited",
4956 [CLD_KILLED] = "killed",
4957 [CLD_DUMPED] = "dumped",
4958 [CLD_TRAPPED] = "trapped",
4959 [CLD_STOPPED] = "stopped",
4960 [CLD_CONTINUED] = "continued",
4963 DEFINE_STRING_TABLE_LOOKUP(sigchld_code, int);
4965 static const char *const log_facility_unshifted_table[LOG_NFACILITIES] = {
4966 [LOG_FAC(LOG_KERN)] = "kern",
4967 [LOG_FAC(LOG_USER)] = "user",
4968 [LOG_FAC(LOG_MAIL)] = "mail",
4969 [LOG_FAC(LOG_DAEMON)] = "daemon",
4970 [LOG_FAC(LOG_AUTH)] = "auth",
4971 [LOG_FAC(LOG_SYSLOG)] = "syslog",
4972 [LOG_FAC(LOG_LPR)] = "lpr",
4973 [LOG_FAC(LOG_NEWS)] = "news",
4974 [LOG_FAC(LOG_UUCP)] = "uucp",
4975 [LOG_FAC(LOG_CRON)] = "cron",
4976 [LOG_FAC(LOG_AUTHPRIV)] = "authpriv",
4977 [LOG_FAC(LOG_FTP)] = "ftp",
4978 [LOG_FAC(LOG_LOCAL0)] = "local0",
4979 [LOG_FAC(LOG_LOCAL1)] = "local1",
4980 [LOG_FAC(LOG_LOCAL2)] = "local2",
4981 [LOG_FAC(LOG_LOCAL3)] = "local3",
4982 [LOG_FAC(LOG_LOCAL4)] = "local4",
4983 [LOG_FAC(LOG_LOCAL5)] = "local5",
4984 [LOG_FAC(LOG_LOCAL6)] = "local6",
4985 [LOG_FAC(LOG_LOCAL7)] = "local7"
4988 DEFINE_STRING_TABLE_LOOKUP_WITH_FALLBACK(log_facility_unshifted, int, LOG_FAC(~0));
4990 static const char *const log_level_table[] = {
4991 [LOG_EMERG] = "emerg",
4992 [LOG_ALERT] = "alert",
4993 [LOG_CRIT] = "crit",
4995 [LOG_WARNING] = "warning",
4996 [LOG_NOTICE] = "notice",
4997 [LOG_INFO] = "info",
4998 [LOG_DEBUG] = "debug"
5001 DEFINE_STRING_TABLE_LOOKUP_WITH_FALLBACK(log_level, int, LOG_DEBUG);
5003 static const char* const sched_policy_table[] = {
5004 [SCHED_OTHER] = "other",
5005 [SCHED_BATCH] = "batch",
5006 [SCHED_IDLE] = "idle",
5007 [SCHED_FIFO] = "fifo",
5011 DEFINE_STRING_TABLE_LOOKUP_WITH_FALLBACK(sched_policy, int, INT_MAX);
5013 static const char* const rlimit_table[_RLIMIT_MAX] = {
5014 [RLIMIT_CPU] = "LimitCPU",
5015 [RLIMIT_FSIZE] = "LimitFSIZE",
5016 [RLIMIT_DATA] = "LimitDATA",
5017 [RLIMIT_STACK] = "LimitSTACK",
5018 [RLIMIT_CORE] = "LimitCORE",
5019 [RLIMIT_RSS] = "LimitRSS",
5020 [RLIMIT_NOFILE] = "LimitNOFILE",
5021 [RLIMIT_AS] = "LimitAS",
5022 [RLIMIT_NPROC] = "LimitNPROC",
5023 [RLIMIT_MEMLOCK] = "LimitMEMLOCK",
5024 [RLIMIT_LOCKS] = "LimitLOCKS",
5025 [RLIMIT_SIGPENDING] = "LimitSIGPENDING",
5026 [RLIMIT_MSGQUEUE] = "LimitMSGQUEUE",
5027 [RLIMIT_NICE] = "LimitNICE",
5028 [RLIMIT_RTPRIO] = "LimitRTPRIO",
5029 [RLIMIT_RTTIME] = "LimitRTTIME"
5032 DEFINE_STRING_TABLE_LOOKUP(rlimit, int);
5034 static const char* const ip_tos_table[] = {
5035 [IPTOS_LOWDELAY] = "low-delay",
5036 [IPTOS_THROUGHPUT] = "throughput",
5037 [IPTOS_RELIABILITY] = "reliability",
5038 [IPTOS_LOWCOST] = "low-cost",
5041 DEFINE_STRING_TABLE_LOOKUP_WITH_FALLBACK(ip_tos, int, 0xff);
5043 static const char *const __signal_table[] = {
5060 [SIGSTKFLT] = "STKFLT", /* Linux on SPARC doesn't know SIGSTKFLT */
5071 [SIGVTALRM] = "VTALRM",
5073 [SIGWINCH] = "WINCH",
5079 DEFINE_PRIVATE_STRING_TABLE_LOOKUP(__signal, int);
5081 const char *signal_to_string(int signo) {
5082 static thread_local char buf[sizeof("RTMIN+")-1 + DECIMAL_STR_MAX(int) + 1];
5085 name = __signal_to_string(signo);
5089 if (signo >= SIGRTMIN && signo <= SIGRTMAX)
5090 snprintf(buf, sizeof(buf), "RTMIN+%d", signo - SIGRTMIN);
5092 snprintf(buf, sizeof(buf), "%d", signo);
5097 int signal_from_string(const char *s) {
5102 signo = __signal_from_string(s);
5106 if (startswith(s, "RTMIN+")) {
5110 if (safe_atou(s, &u) >= 0) {
5111 signo = (int) u + offset;
5112 if (signo > 0 && signo < _NSIG)
5118 bool kexec_loaded(void) {
5119 bool loaded = false;
5122 if (read_one_line_file("/sys/kernel/kexec_loaded", &s) >= 0) {
/* Translates the access mode contained in open(2)-style 'flags' into the
 * matching mmap(2) protection bits. Only the O_ACCMODE part of 'flags' is
 * looked at. Returns -EINVAL if the access mode is none of O_RDONLY,
 * O_WRONLY or O_RDWR. */
int prot_from_flags(int flags) {
        const int access_mode = flags & O_ACCMODE;

        if (access_mode == O_RDONLY)
                return PROT_READ;

        if (access_mode == O_WRONLY)
                return PROT_WRITE;

        if (access_mode == O_RDWR)
                return PROT_READ|PROT_WRITE;

        return -EINVAL;
}
/* Formats the byte count 't' into 'buf' (capacity 'l' bytes) as a short
 * human-readable string: one decimal digit plus a binary unit suffix
 * (K, M, G, T, P, E; powers of 1024), or a plain "<n>B" for values below
 * 1024.
 *
 * Returns 'buf', or NULL if 't' is (off_t) -1, which is treated as "no
 * value". The output is truncated if 'buf' is too small; snprintf()
 * always NUL-terminates it as long as 'l' is non-zero. */
char *format_bytes(char *buf, size_t l, off_t t) {
        unsigned i;

        static const struct {
                const char *suffix;
                off_t factor;
        } table[] = {
                { "E", 1024ULL*1024ULL*1024ULL*1024ULL*1024ULL*1024ULL },
                { "P", 1024ULL*1024ULL*1024ULL*1024ULL*1024ULL },
                { "T", 1024ULL*1024ULL*1024ULL*1024ULL },
                { "G", 1024ULL*1024ULL*1024ULL },
                { "M", 1024ULL*1024ULL },
                { "K", 1024ULL },
        };

        if (t == (off_t) -1)
                return NULL;

        /* The table is sorted from the largest unit down, the first
         * unit that fits wins. */
        for (i = 0; i < sizeof(table) / sizeof(table[0]); i++) {
                unsigned long long whole, tenths;

                if (t < table[i].factor)
                        continue;

                whole = (unsigned long long) (t / table[i].factor);

                /* Take the decimal digit from the remainder. Scaling
                 * 't' itself by 10 would wrap around 64 bits for
                 * values above roughly 1.6E and print a bogus digit.
                 * The remainder is below 2^60, so this cannot wrap. */
                tenths = ((unsigned long long) (t % table[i].factor) * 10ULL) /
                        (unsigned long long) table[i].factor;

                snprintf(buf, l, "%llu.%llu%s", whole, tenths, table[i].suffix);
                return buf;
        }

        snprintf(buf, l, "%lluB", (unsigned long long) t);
        return buf;
}
5187 void* memdup(const void *p, size_t l) {
5200 int fd_inc_sndbuf(int fd, size_t n) {
5202 socklen_t l = sizeof(value);
5204 r = getsockopt(fd, SOL_SOCKET, SO_SNDBUF, &value, &l);
5205 if (r >= 0 && l == sizeof(value) && (size_t) value >= n*2)
5208 /* If we have the privileges we will ignore the kernel limit. */
5211 if (setsockopt(fd, SOL_SOCKET, SO_SNDBUFFORCE, &value, sizeof(value)) < 0)
5212 if (setsockopt(fd, SOL_SOCKET, SO_SNDBUF, &value, sizeof(value)) < 0)
5218 int fd_inc_rcvbuf(int fd, size_t n) {
5220 socklen_t l = sizeof(value);
5222 r = getsockopt(fd, SOL_SOCKET, SO_RCVBUF, &value, &l);
5223 if (r >= 0 && l == sizeof(value) && (size_t) value >= n*2)
5226 /* If we have the privileges we will ignore the kernel limit. */
5229 if (setsockopt(fd, SOL_SOCKET, SO_RCVBUFFORCE, &value, sizeof(value)) < 0)
5230 if (setsockopt(fd, SOL_SOCKET, SO_RCVBUF, &value, sizeof(value)) < 0)
5235 int fork_agent(pid_t *pid, const int except[], unsigned n_except, const char *path, ...) {
5236 bool stdout_is_tty, stderr_is_tty;
5237 pid_t parent_pid, agent_pid;
5238 sigset_t ss, saved_ss;
5246 /* Spawns a temporary TTY agent, making sure it goes away when
5249 parent_pid = getpid();
5251 /* First we temporarily block all signals, so that the new
5252 * child has them blocked initially. This way, we can be sure
5253 * that SIGTERMs are not lost we might send to the agent. */
5254 assert_se(sigfillset(&ss) >= 0);
5255 assert_se(sigprocmask(SIG_SETMASK, &ss, &saved_ss) >= 0);
5258 if (agent_pid < 0) {
5259 assert_se(sigprocmask(SIG_SETMASK, &saved_ss, NULL) >= 0);
5263 if (agent_pid != 0) {
5264 assert_se(sigprocmask(SIG_SETMASK, &saved_ss, NULL) >= 0);
5271 * Make sure the agent goes away when the parent dies */
5272 if (prctl(PR_SET_PDEATHSIG, SIGTERM) < 0)
5273 _exit(EXIT_FAILURE);
5275 /* Make sure we actually can kill the agent, if we need to, in
5276 * case somebody invoked us from a shell script that trapped
5277 * SIGTERM or so... */
5278 reset_all_signal_handlers();
5279 reset_signal_mask();
5281 /* Check whether our parent died before we were able
5282 * to set the death signal and unblock the signals */
5283 if (getppid() != parent_pid)
5284 _exit(EXIT_SUCCESS);
5286 /* Don't leak fds to the agent */
5287 close_all_fds(except, n_except);
5289 stdout_is_tty = isatty(STDOUT_FILENO);
5290 stderr_is_tty = isatty(STDERR_FILENO);
5292 if (!stdout_is_tty || !stderr_is_tty) {
5295 /* Detach from stdout/stderr. and reopen
5296 * /dev/tty for them. This is important to
5297 * ensure that when systemctl is started via
5298 * popen() or a similar call that expects to
5299 * read EOF we actually do generate EOF and
5300 * not delay this indefinitely by because we
5301 * keep an unused copy of stdin around. */
5302 fd = open("/dev/tty", O_WRONLY);
5304 log_error_errno(errno, "Failed to open /dev/tty: %m");
5305 _exit(EXIT_FAILURE);
5309 dup2(fd, STDOUT_FILENO);
5312 dup2(fd, STDERR_FILENO);
5318 /* Count arguments */
5320 for (n = 0; va_arg(ap, char*); n++)
5325 l = alloca(sizeof(char *) * (n + 1));
5327 /* Fill in arguments */
5329 for (i = 0; i <= n; i++)
5330 l[i] = va_arg(ap, char*);
5334 _exit(EXIT_FAILURE);
5337 int setrlimit_closest(int resource, const struct rlimit *rlim) {
5338 struct rlimit highest, fixed;
5342 if (setrlimit(resource, rlim) >= 0)
5348 /* So we failed to set the desired setrlimit, then let's try
5349 * to get as close as we can */
5350 assert_se(getrlimit(resource, &highest) == 0);
5352 fixed.rlim_cur = MIN(rlim->rlim_cur, highest.rlim_max);
5353 fixed.rlim_max = MIN(rlim->rlim_max, highest.rlim_max);
5355 if (setrlimit(resource, &fixed) < 0)
5361 int getenv_for_pid(pid_t pid, const char *field, char **_value) {
5362 _cleanup_fclose_ FILE *f = NULL;
5373 path = procfs_file_alloca(pid, "environ");
5375 f = fopen(path, "re");
5383 char line[LINE_MAX];
5386 for (i = 0; i < sizeof(line)-1; i++) {
5390 if (_unlikely_(c == EOF)) {
5400 if (memcmp(line, field, l) == 0 && line[l] == '=') {
5401 value = strdup(line + l + 1);
5415 bool http_etag_is_valid(const char *etag) {
5419 if (!endswith(etag, "\""))
5422 if (!startswith(etag, "\"") && !startswith(etag, "W/\""))
5428 bool http_url_is_valid(const char *url) {
5434 p = startswith(url, "http://");
5436 p = startswith(url, "https://");
5443 return ascii_is_valid(p);
5446 bool documentation_url_is_valid(const char *url) {
5452 if (http_url_is_valid(url))
5455 p = startswith(url, "file:/");
5457 p = startswith(url, "info:");
5459 p = startswith(url, "man:");
5464 return ascii_is_valid(p);
5467 bool in_initrd(void) {
5468 static int saved = -1;
5474 /* We make two checks here:
5476 * 1. the flag file /etc/initrd-release must exist
5477 * 2. the root file system must be a memory file system
5479 * The second check is extra paranoia, since misdetecting an
5480 * initrd can have bad bad consequences due the initrd
5481 * emptying when transititioning to the main systemd.
5484 saved = access("/etc/initrd-release", F_OK) >= 0 &&
5485 statfs("/", &s) >= 0 &&
5486 is_temporary_fs(&s);
5491 void warn_melody(void) {
5492 _cleanup_close_ int fd = -1;
5494 fd = open("/dev/console", O_WRONLY|O_CLOEXEC|O_NOCTTY);
5498 /* Yeah, this is synchronous. Kinda sucks. But well... */
5500 ioctl(fd, KIOCSOUND, (int)(1193180/440));
5501 usleep(125*USEC_PER_MSEC);
5503 ioctl(fd, KIOCSOUND, (int)(1193180/220));
5504 usleep(125*USEC_PER_MSEC);
5506 ioctl(fd, KIOCSOUND, (int)(1193180/220));
5507 usleep(125*USEC_PER_MSEC);
5509 ioctl(fd, KIOCSOUND, 0);
5512 int make_console_stdio(void) {
5515 /* Make /dev/console the controlling terminal and stdin/stdout/stderr */
5517 fd = acquire_terminal("/dev/console", false, true, true, USEC_INFINITY);
5519 return log_error_errno(fd, "Failed to acquire terminal: %m");
5523 return log_error_errno(r, "Failed to duplicate terminal fd: %m");
5528 int get_home_dir(char **_h) {
5536 /* Take the user specified one */
5537 e = secure_getenv("HOME");
5538 if (e && path_is_absolute(e)) {
5547 /* Hardcode home directory for root to avoid NSS */
5550 h = strdup("/root");
5558 /* Check the database... */
5562 return errno > 0 ? -errno : -ESRCH;
5564 if (!path_is_absolute(p->pw_dir))
5567 h = strdup(p->pw_dir);
5575 int get_shell(char **_s) {
5583 /* Take the user specified one */
5584 e = getenv("SHELL");
5594 /* Hardcode home directory for root to avoid NSS */
5597 s = strdup("/bin/sh");
5605 /* Check the database... */
5609 return errno > 0 ? -errno : -ESRCH;
5611 if (!path_is_absolute(p->pw_shell))
5614 s = strdup(p->pw_shell);
5622 bool filename_is_valid(const char *p) {
5636 if (strlen(p) > FILENAME_MAX)
/* Returns true if 'p' is non-NULL and contains none of: ASCII control
 * characters (1..31), DEL (0x7f), backslash, double quote or single
 * quote. A NULL pointer is reported as unsafe. */
bool string_is_safe(const char *p) {
        const char *t;

        if (!p)
                return false;

        for (t = p; *t; t++) {
                if (*t > 0 && *t < ' ')
                        return false;

                /* Note: DEL must be written as "\x7f". Spelling it
                 * "\0x7f" embeds a NUL that terminates the set early,
                 * so DEL would never be matched. */
                if (strchr("\\\"\'\x7f", *t))
                        return false;
        }

        return true;
}
/**
 * Tells whether a string contains control characters, i.e. bytes in the
 * range 1..31 or DEL (127). 'ok' may be NULL; otherwise it lists
 * characters that are tolerated even though they are control characters.
 */
bool string_has_cc(const char *p, const char *ok) {
        assert(p);

        for (; *p != '\0'; p++) {
                const char c = *p;
                const bool is_cc = (c > 0 && c < ' ') || c == 127;

                if (!is_cc)
                        continue;

                /* Explicitly whitelisted by the caller */
                if (ok && strchr(ok, c))
                        continue;

                return true;
        }

        return false;
}
5682 bool path_is_safe(const char *p) {
5687 if (streq(p, "..") || startswith(p, "../") || endswith(p, "/..") || strstr(p, "/../"))
5690 if (strlen(p) > PATH_MAX)
5693 /* The following two checks are not really dangerous, but hey, they still are confusing */
5694 if (streq(p, ".") || startswith(p, "./") || endswith(p, "/.") || strstr(p, "/./"))
5697 if (strstr(p, "//"))
5703 /* hey glibc, APIs with callbacks without a user pointer are so useless */
5704 void *xbsearch_r(const void *key, const void *base, size_t nmemb, size_t size,
5705 int (*compar) (const void *, const void *, void *), void *arg) {
5714 p = (void *)(((const char *) base) + (idx * size));
5715 comparison = compar(key, p, arg);
5718 else if (comparison > 0)
5726 void init_gettext(void) {
5727 setlocale(LC_ALL, "");
5728 textdomain(GETTEXT_PACKAGE);
5731 bool is_locale_utf8(void) {
5733 static int cached_answer = -1;
5735 if (cached_answer >= 0)
5738 if (!setlocale(LC_ALL, "")) {
5739 cached_answer = true;
5743 set = nl_langinfo(CODESET);
5745 cached_answer = true;
5749 if (streq(set, "UTF-8")) {
5750 cached_answer = true;
5754 /* For LC_CTYPE=="C" return true, because CTYPE is effectly
5755 * unset and everything can do to UTF-8 nowadays. */
5756 set = setlocale(LC_CTYPE, NULL);
5758 cached_answer = true;
5762 /* Check result, but ignore the result if C was set
5766 !getenv("LC_ALL") &&
5767 !getenv("LC_CTYPE") &&
5771 return (bool) cached_answer;
5774 const char *draw_special_char(DrawSpecialChar ch) {
5775 static const char *draw_table[2][_DRAW_SPECIAL_CHAR_MAX] = {
5778 [DRAW_TREE_VERTICAL] = "\342\224\202 ", /* │ */
5779 [DRAW_TREE_BRANCH] = "\342\224\234\342\224\200", /* ├─ */
5780 [DRAW_TREE_RIGHT] = "\342\224\224\342\224\200", /* └─ */
5781 [DRAW_TREE_SPACE] = " ", /* */
5782 [DRAW_TRIANGULAR_BULLET] = "\342\200\243", /* ‣ */
5783 [DRAW_BLACK_CIRCLE] = "\342\227\217", /* ● */
5784 [DRAW_ARROW] = "\342\206\222", /* → */
5785 [DRAW_DASH] = "\342\200\223", /* – */
5788 /* ASCII fallback */ {
5789 [DRAW_TREE_VERTICAL] = "| ",
5790 [DRAW_TREE_BRANCH] = "|-",
5791 [DRAW_TREE_RIGHT] = "`-",
5792 [DRAW_TREE_SPACE] = " ",
5793 [DRAW_TRIANGULAR_BULLET] = ">",
5794 [DRAW_BLACK_CIRCLE] = "*",
5795 [DRAW_ARROW] = "->",
5800 return draw_table[!is_locale_utf8()][ch];
5803 char *strreplace(const char *text, const char *old_string, const char *new_string) {
5806 size_t l, old_len, new_len;
5812 old_len = strlen(old_string);
5813 new_len = strlen(new_string);
5826 if (!startswith(f, old_string)) {
5832 nl = l - old_len + new_len;
5833 a = realloc(r, nl + 1);
5841 t = stpcpy(t, new_string);
5853 char *strip_tab_ansi(char **ibuf, size_t *_isz) {
5854 const char *i, *begin = NULL;
5859 } state = STATE_OTHER;
5861 size_t osz = 0, isz;
5867 /* Strips ANSI color and replaces TABs by 8 spaces */
5869 isz = _isz ? *_isz : strlen(*ibuf);
5871 f = open_memstream(&obuf, &osz);
5875 for (i = *ibuf; i < *ibuf + isz + 1; i++) {
5880 if (i >= *ibuf + isz) /* EOT */
5882 else if (*i == '\x1B')
5883 state = STATE_ESCAPE;
5884 else if (*i == '\t')
5891 if (i >= *ibuf + isz) { /* EOT */
5894 } else if (*i == '[') {
5895 state = STATE_BRACKET;
5900 state = STATE_OTHER;
5907 if (i >= *ibuf + isz || /* EOT */
5908 (!(*i >= '0' && *i <= '9') && *i != ';' && *i != 'm')) {
5911 state = STATE_OTHER;
5913 } else if (*i == 'm')
5914 state = STATE_OTHER;
5936 int on_ac_power(void) {
5937 bool found_offline = false, found_online = false;
5938 _cleanup_closedir_ DIR *d = NULL;
5940 d = opendir("/sys/class/power_supply");
5942 return errno == ENOENT ? true : -errno;
5946 _cleanup_close_ int fd = -1, device = -1;
5952 if (!de && errno != 0)
5958 if (hidden_file(de->d_name))
5961 device = openat(dirfd(d), de->d_name, O_DIRECTORY|O_RDONLY|O_CLOEXEC|O_NOCTTY);
5963 if (errno == ENOENT || errno == ENOTDIR)
5969 fd = openat(device, "type", O_RDONLY|O_CLOEXEC|O_NOCTTY);
5971 if (errno == ENOENT)
5977 n = read(fd, contents, sizeof(contents));
5981 if (n != 6 || memcmp(contents, "Mains\n", 6))
5985 fd = openat(device, "online", O_RDONLY|O_CLOEXEC|O_NOCTTY);
5987 if (errno == ENOENT)
5993 n = read(fd, contents, sizeof(contents));
5997 if (n != 2 || contents[1] != '\n')
6000 if (contents[0] == '1') {
6001 found_online = true;
6003 } else if (contents[0] == '0')
6004 found_offline = true;
6009 return found_online || !found_offline;
6012 static int search_and_fopen_internal(const char *path, const char *mode, const char *root, char **search, FILE **_f) {
6019 if (!path_strv_resolve_uniq(search, root))
6022 STRV_FOREACH(i, search) {
6023 _cleanup_free_ char *p = NULL;
6027 p = strjoin(root, *i, "/", path, NULL);
6029 p = strjoin(*i, "/", path, NULL);
6039 if (errno != ENOENT)
6046 int search_and_fopen(const char *path, const char *mode, const char *root, const char **search, FILE **_f) {
6047 _cleanup_strv_free_ char **copy = NULL;
6053 if (path_is_absolute(path)) {
6056 f = fopen(path, mode);
6065 copy = strv_copy((char**) search);
6069 return search_and_fopen_internal(path, mode, root, copy, _f);
6072 int search_and_fopen_nulstr(const char *path, const char *mode, const char *root, const char *search, FILE **_f) {
6073 _cleanup_strv_free_ char **s = NULL;
6075 if (path_is_absolute(path)) {
6078 f = fopen(path, mode);
6087 s = strv_split_nulstr(search);
6091 return search_and_fopen_internal(path, mode, root, s, _f);
6094 char *strextend(char **x, ...) {
6101 l = f = *x ? strlen(*x) : 0;
6108 t = va_arg(ap, const char *);
6113 if (n > ((size_t) -1) - l) {
6122 r = realloc(*x, l+1);
6132 t = va_arg(ap, const char *);
/* Returns a newly allocated string made of 'n' back-to-back copies of
 * 's' (the empty string if 'n' is 0). Returns NULL if the allocation
 * fails or if the resulting length does not fit into a size_t. The
 * caller owns the result and has to free() it. */
char *strrep(const char *s, unsigned n) {
        size_t l;
        char *r, *p;
        unsigned i;

        assert(s);

        l = strlen(s);

        /* Refuse to continue if l * n + 1 would wrap around, as we
         * would otherwise write past a too small allocation. */
        if (n > 0 && l > (((size_t) -1) - 1) / n)
                return NULL;

        p = r = malloc(l * n + 1);
        if (!r)
                return NULL;

        for (i = 0; i < n; i++) {
                memcpy(p, s, l);
                p += l;
        }

        *p = 0;
        return r;
}
/* Makes sure the array at '*p' has room for at least 'need' elements of
 * 'size' bytes each. '*allocated' is the current capacity in elements.
 *
 * If the capacity already suffices, '*p' is returned unchanged.
 * Otherwise the array is grown to twice the needed element count (and
 * to at least 64 bytes), '*p' and '*allocated' are updated and the new
 * pointer is returned.
 *
 * Returns NULL if memory is exhausted or the requested size cannot be
 * represented in a size_t; '*p' and '*allocated' are left untouched in
 * that case. 'size' must not be 0. */
void* greedy_realloc(void **p, size_t *allocated, size_t need, size_t size) {
        size_t a, newalloc;
        void *q;

        assert(p);
        assert(allocated);
        assert(size > 0);

        if (*allocated >= need)
                return *p;

        /* Doubling the element count must not wrap around */
        if (need > ((size_t) -1) / 2)
                return NULL;

        newalloc = need * 2;
        if (newalloc < 64u / size)
                newalloc = 64u / size;

        /* Check the byte count before multiplying. Comparing the
         * products afterwards is not reliable, since both sides of
         * such a comparison may have wrapped around. */
        if (newalloc > ((size_t) -1) / size)
                return NULL;

        a = newalloc * size;

        q = realloc(*p, a);
        if (!q)
                return NULL;

        *p = q;
        *allocated = newalloc;
        return q;
}
/* Same as greedy_realloc(), but in addition zeroes out the elements
 * between the previous capacity and the new one whenever the array
 * grew. Passes a NULL result of greedy_realloc() on to the caller. */
void* greedy_realloc0(void **p, size_t *allocated, size_t need, size_t size) {
        size_t old_count;
        uint8_t *mem;

        assert(p);
        assert(allocated);

        /* Remember the capacity before the call, it is overwritten on growth */
        old_count = *allocated;

        mem = greedy_realloc(p, allocated, need, size);
        if (mem && *allocated > old_count) {
                size_t added = *allocated - old_count;

                memzero(mem + old_count * size, added * size);
        }

        return mem;
}
/* Returns true if 'c' is an ASCII hexadecimal digit */
static bool id128_char_is_hex(char c) {
        return (c >= '0' && c <= '9') ||
                (c >= 'a' && c <= 'f') ||
                (c >= 'A' && c <= 'F');
}

/* Returns true if 's' is a textual 128bit ID in one of two forms:
 *
 *   - 32 hexadecimal digits, or
 *   - a 36 character UUID: hexadecimal digits with a '-' at offsets
 *     8, 13, 18 and 23.
 *
 * Upper and lower case hex digits are both accepted. */
bool id128_is_valid(const char *s) {
        size_t i, l;

        l = strlen(s);
        if (l == 32) {

                /* Simple formatted 128bit hex string */

                for (i = 0; i < l; i++)
                        if (!id128_char_is_hex(s[i]))
                                return false;

        } else if (l == 36) {

                /* Formatted UUID */

                for (i = 0; i < l; i++) {
                        char c = s[i];

                        if (i == 8 || i == 13 || i == 18 || i == 23) {
                                if (c != '-')
                                        return false;
                        } else if (!id128_char_is_hex(c))
                                return false;
                }

        } else
                return false;

        return true;
}
6251 int split_pair(const char *s, const char *sep, char **l, char **r) {
6266 a = strndup(s, x - s);
6270 b = strdup(x + strlen(sep));
6282 int shall_restore_state(void) {
6283 _cleanup_free_ char *value = NULL;
6286 r = get_proc_cmdline_key("systemd.restore_state=", &value);
6292 return parse_boolean(value) != 0;
6295 int proc_cmdline(char **ret) {
6298 if (detect_container(NULL) > 0)
6299 return get_process_cmdline(1, 0, false, ret);
6301 return read_one_line_file("/proc/cmdline", ret);
6304 int parse_proc_cmdline(int (*parse_item)(const char *key, const char *value)) {
6305 _cleanup_free_ char *line = NULL;
6311 r = proc_cmdline(&line);
6317 _cleanup_free_ char *word = NULL;
6320 r = unquote_first_word(&p, &word, UNQUOTE_RELAX);
6326 /* Filter out arguments that are intended only for the
6328 if (!in_initrd() && startswith(word, "rd."))
6331 value = strchr(word, '=');
6335 r = parse_item(word, value);
6343 int get_proc_cmdline_key(const char *key, char **value) {
6344 _cleanup_free_ char *line = NULL, *ret = NULL;
6351 r = proc_cmdline(&line);
6357 _cleanup_free_ char *word = NULL;
6360 r = unquote_first_word(&p, &word, UNQUOTE_RELAX);
6366 /* Filter out arguments that are intended only for the
6368 if (!in_initrd() && startswith(word, "rd."))
6372 e = startswith(word, key);
6376 r = free_and_strdup(&ret, e);
6382 if (streq(word, key))
6396 int container_get_leader(const char *machine, pid_t *pid) {
6397 _cleanup_free_ char *s = NULL, *class = NULL;
6405 p = strjoina("/run/systemd/machines/", machine);
6406 r = parse_env_file(p, NEWLINE, "LEADER", &s, "CLASS", &class, NULL);
6414 if (!streq_ptr(class, "container"))
6417 r = parse_pid(s, &leader);
6427 int namespace_open(pid_t pid, int *pidns_fd, int *mntns_fd, int *netns_fd, int *root_fd) {
6428 _cleanup_close_ int pidnsfd = -1, mntnsfd = -1, netnsfd = -1;
6436 mntns = procfs_file_alloca(pid, "ns/mnt");
6437 mntnsfd = open(mntns, O_RDONLY|O_NOCTTY|O_CLOEXEC);
6445 pidns = procfs_file_alloca(pid, "ns/pid");
6446 pidnsfd = open(pidns, O_RDONLY|O_NOCTTY|O_CLOEXEC);
6454 netns = procfs_file_alloca(pid, "ns/net");
6455 netnsfd = open(netns, O_RDONLY|O_NOCTTY|O_CLOEXEC);
6463 root = procfs_file_alloca(pid, "root");
6464 rfd = open(root, O_RDONLY|O_NOCTTY|O_CLOEXEC|O_DIRECTORY);
6470 *pidns_fd = pidnsfd;
6473 *mntns_fd = mntnsfd;
6476 *netns_fd = netnsfd;
6481 pidnsfd = mntnsfd = netnsfd = -1;
6486 int namespace_enter(int pidns_fd, int mntns_fd, int netns_fd, int root_fd) {
6489 if (setns(pidns_fd, CLONE_NEWPID) < 0)
6493 if (setns(mntns_fd, CLONE_NEWNS) < 0)
6497 if (setns(netns_fd, CLONE_NEWNET) < 0)
6501 if (fchdir(root_fd) < 0)
6504 if (chroot(".") < 0)
6508 if (setresgid(0, 0, 0) < 0)
6511 if (setgroups(0, NULL) < 0)
6514 if (setresuid(0, 0, 0) < 0)
6520 bool pid_is_unwaited(pid_t pid) {
6521 /* Checks whether a PID is still valid at all, including a zombie */
6526 if (kill(pid, 0) >= 0)
6529 return errno != ESRCH;
6532 bool pid_is_alive(pid_t pid) {
6535 /* Checks whether a PID is still valid and not a zombie */
6540 r = get_process_state(pid);
6541 if (r == -ENOENT || r == 'Z')
6547 int getpeercred(int fd, struct ucred *ucred) {
6548 socklen_t n = sizeof(struct ucred);
6555 r = getsockopt(fd, SOL_SOCKET, SO_PEERCRED, &u, &n);
6559 if (n != sizeof(struct ucred))
6562 /* Check if the data is actually useful and not suppressed due
6563 * to namespacing issues */
6566 if (u.uid == UID_INVALID)
6568 if (u.gid == GID_INVALID)
6575 int getpeersec(int fd, char **ret) {
6587 r = getsockopt(fd, SOL_SOCKET, SO_PEERSEC, s, &n);
6591 if (errno != ERANGE)
6598 r = getsockopt(fd, SOL_SOCKET, SO_PEERSEC, s, &n);
6614 /* This is much like like mkostemp() but is subject to umask(). */
6615 int mkostemp_safe(char *pattern, int flags) {
6616 _cleanup_umask_ mode_t u;
6623 fd = mkostemp(pattern, flags);
6630 int open_tmpfile(const char *path, int flags) {
6637 /* Try O_TMPFILE first, if it is supported */
6638 fd = open(path, flags|O_TMPFILE, S_IRUSR|S_IWUSR);
6643 /* Fall back to unguessable name + unlinking */
6644 p = strjoina(path, "/systemd-tmp-XXXXXX");
6646 fd = mkostemp_safe(p, flags);
6654 int fd_warn_permissions(const char *path, int fd) {
6657 if (fstat(fd, &st) < 0)
6660 if (st.st_mode & 0111)
6661 log_warning("Configuration file %s is marked executable. Please remove executable permission bits. Proceeding anyway.", path);
6663 if (st.st_mode & 0002)
6664 log_warning("Configuration file %s is marked world-writable. Please remove world writability permission bits. Proceeding anyway.", path);
6666 if (getpid() == 1 && (st.st_mode & 0044) != 0044)
6667 log_warning("Configuration file %s is marked world-inaccessible. This has no effect as configuration data is accessible via APIs without restrictions. Proceeding anyway.", path);
6672 unsigned long personality_from_string(const char *p) {
6674 /* Parse a personality specifier. We introduce our own
6675 * identifiers that indicate specific ABIs, rather than just
6676 * hints regarding the register size, since we want to keep
6677 * things open for multiple locally supported ABIs for the
6678 * same register size. We try to reuse the ABI identifiers
6679 * used by libseccomp. */
6681 #if defined(__x86_64__)
6683 if (streq(p, "x86"))
6686 if (streq(p, "x86-64"))
6689 #elif defined(__i386__)
6691 if (streq(p, "x86"))
6695 /* personality(7) documents that 0xffffffffUL is used for
6696 * querying the current personality, hence let's use that here
6697 * as error indicator. */
6698 return 0xffffffffUL;
6701 const char* personality_to_string(unsigned long p) {
6703 #if defined(__x86_64__)
6705 if (p == PER_LINUX32)
6711 #elif defined(__i386__)
6720 uint64_t physical_memory(void) {
6723 /* We return this as uint64_t in case we are running as 32bit
6724 * process on a 64bit kernel with huge amounts of memory */
6726 mem = sysconf(_SC_PHYS_PAGES);
6729 return (uint64_t) mem * (uint64_t) page_size();
6732 void hexdump(FILE *f, const void *p, size_t s) {
6733 const uint8_t *b = p;
6736 assert(s == 0 || b);
6741 fprintf(f, "%04x ", n);
6743 for (i = 0; i < 16; i++) {
6748 fprintf(f, "%02x ", b[i]);
6756 for (i = 0; i < 16; i++) {
6761 fputc(isprint(b[i]) ? (char) b[i] : '.', f);
6775 int update_reboot_param_file(const char *param) {
6780 r = write_string_file(REBOOT_PARAM_FILE, param);
6782 log_error("Failed to write reboot param to "
6783 REBOOT_PARAM_FILE": %s", strerror(-r));
6785 unlink(REBOOT_PARAM_FILE);
6790 int umount_recursive(const char *prefix, int flags) {
6794 /* Try to umount everything recursively below a
6795 * directory. Also, take care of stacked mounts, and keep
6796 * unmounting them until they are gone. */
6799 _cleanup_fclose_ FILE *proc_self_mountinfo = NULL;
6804 proc_self_mountinfo = fopen("/proc/self/mountinfo", "re");
6805 if (!proc_self_mountinfo)
6809 _cleanup_free_ char *path = NULL, *p = NULL;
6812 k = fscanf(proc_self_mountinfo,
6813 "%*s " /* (1) mount id */
6814 "%*s " /* (2) parent id */
6815 "%*s " /* (3) major:minor */
6816 "%*s " /* (4) root */
6817 "%ms " /* (5) mount point */
6818 "%*s" /* (6) mount options */
6819 "%*[^-]" /* (7) optional fields */
6820 "- " /* (8) separator */
6821 "%*s " /* (9) file system type */
6822 "%*s" /* (10) mount source */
6823 "%*s" /* (11) mount options 2 */
6824 "%*[^\n]", /* some rubbish at the end */
6833 r = cunescape(path, UNESCAPE_RELAX, &p);
6837 if (!path_startswith(p, prefix))
6840 if (umount2(p, flags) < 0) {
6856 static int get_mount_flags(const char *path, unsigned long *flags) {
6859 if (statvfs(path, &buf) < 0)
6861 *flags = buf.f_flag;
6865 int bind_remount_recursive(const char *prefix, bool ro) {
6866 _cleanup_set_free_free_ Set *done = NULL;
6867 _cleanup_free_ char *cleaned = NULL;
6870 /* Recursively remount a directory (and all its submounts)
6871 * read-only or read-write. If the directory is already
6872 * mounted, we reuse the mount and simply mark it
6873 * MS_BIND|MS_RDONLY (or remove the MS_RDONLY for read-write
6874 * operation). If it isn't we first make it one. Afterwards we
6875 * apply MS_BIND|MS_RDONLY (or remove MS_RDONLY) to all
6876 * submounts we can access, too. When mounts are stacked on
6877 * the same mount point we only care for each individual
6878 * "top-level" mount on each point, as we cannot
6879 * influence/access the underlying mounts anyway. We do not
6880 * have any effect on future submounts that might get
6881 * propagated, they migt be writable. This includes future
6882 * submounts that have been triggered via autofs. */
6884 cleaned = strdup(prefix);
6888 path_kill_slashes(cleaned);
6890 done = set_new(&string_hash_ops);
6895 _cleanup_fclose_ FILE *proc_self_mountinfo = NULL;
6896 _cleanup_set_free_free_ Set *todo = NULL;
6897 bool top_autofs = false;
6899 unsigned long orig_flags;
6901 todo = set_new(&string_hash_ops);
6905 proc_self_mountinfo = fopen("/proc/self/mountinfo", "re");
6906 if (!proc_self_mountinfo)
6910 _cleanup_free_ char *path = NULL, *p = NULL, *type = NULL;
6913 k = fscanf(proc_self_mountinfo,
6914 "%*s " /* (1) mount id */
6915 "%*s " /* (2) parent id */
6916 "%*s " /* (3) major:minor */
6917 "%*s " /* (4) root */
6918 "%ms " /* (5) mount point */
6919 "%*s" /* (6) mount options (superblock) */
6920 "%*[^-]" /* (7) optional fields */
6921 "- " /* (8) separator */
6922 "%ms " /* (9) file system type */
6923 "%*s" /* (10) mount source */
6924 "%*s" /* (11) mount options (bind mount) */
6925 "%*[^\n]", /* some rubbish at the end */
6935 r = cunescape(path, UNESCAPE_RELAX, &p);
6939 /* Let's ignore autofs mounts. If they aren't
6940 * triggered yet, we want to avoid triggering
6941 * them, as we don't make any guarantees for
6942 * future submounts anyway. If they are
6943 * already triggered, then we will find
6944 * another entry for this. */
6945 if (streq(type, "autofs")) {
6946 top_autofs = top_autofs || path_equal(cleaned, p);
6950 if (path_startswith(p, cleaned) &&
6951 !set_contains(done, p)) {
6953 r = set_consume(todo, p);
6963 /* If we have no submounts to process anymore and if
6964 * the root is either already done, or an autofs, we
6966 if (set_isempty(todo) &&
6967 (top_autofs || set_contains(done, cleaned)))
6970 if (!set_contains(done, cleaned) &&
6971 !set_contains(todo, cleaned)) {
6972 /* The prefix directory itself is not yet a
6973 * mount, make it one. */
6974 if (mount(cleaned, cleaned, NULL, MS_BIND|MS_REC, NULL) < 0)
6978 (void) get_mount_flags(cleaned, &orig_flags);
6979 orig_flags &= ~MS_RDONLY;
6981 if (mount(NULL, prefix, NULL, orig_flags|MS_BIND|MS_REMOUNT|(ro ? MS_RDONLY : 0), NULL) < 0)
6984 x = strdup(cleaned);
6988 r = set_consume(done, x);
6993 while ((x = set_steal_first(todo))) {
6995 r = set_consume(done, x);
7001 /* Try to reuse the original flag set, but
7002 * don't care for errors, in case of
7003 * obstructed mounts */
7005 (void) get_mount_flags(x, &orig_flags);
7006 orig_flags &= ~MS_RDONLY;
7008 if (mount(NULL, x, NULL, orig_flags|MS_BIND|MS_REMOUNT|(ro ? MS_RDONLY : 0), NULL) < 0) {
7010 /* Deal with mount points that are
7011 * obstructed by a later mount */
7013 if (errno != ENOENT)
/* Flushes 'f' and then looks at the stream's error indicator. Returns 0
 * if the indicator is clear. Otherwise returns the negated errno, or
 * -EIO if errno is still 0 after the flush. */
int fflush_and_check(FILE *f) {
        assert(f);

        /* Clear errno first, so that a stale value from an earlier
         * call is never reported as the reason for this failure. */
        errno = 0;
        fflush(f);

        if (!ferror(f))
                return 0;

        if (errno != 0)
                return -errno;

        return -EIO;
}
7033 int tempfn_xxxxxx(const char *p, char **ret) {
7045 * /foo/bar/.#waldoXXXXXX
7049 if (!filename_is_valid(fn))
7052 t = new(char, strlen(p) + 2 + 6 + 1);
7056 strcpy(stpcpy(stpcpy(mempcpy(t, p, fn - p), ".#"), fn), "XXXXXX");
7058 *ret = path_kill_slashes(t);
7062 int tempfn_random(const char *p, char **ret) {
7076 * /foo/bar/.#waldobaa2a261115984a9
7080 if (!filename_is_valid(fn))
7083 t = new(char, strlen(p) + 2 + 16 + 1);
7087 x = stpcpy(stpcpy(mempcpy(t, p, fn - p), ".#"), fn);
7090 for (i = 0; i < 16; i++) {
7091 *(x++) = hexchar(u & 0xF);
7097 *ret = path_kill_slashes(t);
7101 int tempfn_random_child(const char *p, char **ret) {
7112 * /foo/bar/waldo/.#3c2b6219aa75d7d0
7115 t = new(char, strlen(p) + 3 + 16 + 1);
7119 x = stpcpy(stpcpy(t, p), "/.#");
7122 for (i = 0; i < 16; i++) {
7123 *(x++) = hexchar(u & 0xF);
7129 *ret = path_kill_slashes(t);
/* Returns true if 's' ends in 'suffix', ignoring ASCII case. Two strings
 * of equal length that match count as "ends in", too. */
static bool hostname_endswith_no_case(const char *s, const char *suffix) {
        size_t sl, pl, i;

        sl = strlen(s);
        pl = strlen(suffix);

        if (pl > sl)
                return false;

        s += sl - pl;

        for (i = 0; i < pl; i++) {
                char a = s[i], b = suffix[i];

                /* Fold ASCII only, host name matching must not depend on the locale */
                if (a >= 'A' && a <= 'Z')
                        a = (char) (a - 'A' + 'a');
                if (b >= 'A' && b <= 'Z')
                        b = (char) (b - 'A' + 'a');

                if (a != b)
                        return false;
        }

        return true;
}

/* Returns true if 'hostname' refers to the local host: "localhost" or
 * "localdomain", or any name below one of the two, each with or without
 * a trailing dot. The comparison ignores case, as host names are case
 * insensitive. */
bool is_localhost(const char *hostname) {
        static const char *const suffixes[] = {
                ".localhost",
                ".localhost.",
                ".localdomain",
                ".localdomain.",
        };
        size_t i, l;

        assert(hostname);

        /* This tries to identify local host and domain names
         * described in RFC6761 plus the redhatism of .localdomain */

        l = strlen(hostname);

        for (i = 0; i < sizeof(suffixes) / sizeof(suffixes[0]); i++) {

                /* A name below the local domain, e.g. "foo.localhost" */
                if (hostname_endswith_no_case(hostname, suffixes[i]))
                        return true;

                /* The bare name itself: the suffix without its leading dot */
                if (l == strlen(suffixes[i]) - 1 &&
                    hostname_endswith_no_case(hostname, suffixes[i] + 1))
                        return true;
        }

        return false;
}
7150 int take_password_lock(const char *root) {
7152 struct flock flock = {
7154 .l_whence = SEEK_SET,
7162 /* This is roughly the same as lckpwdf(), but not as awful. We
7163 * don't want to use alarm() and signals, hence we implement
7164 * our own trivial version of this.
7166 * Note that shadow-utils also takes per-database locks in
7167 * addition to lckpwdf(). However, we don't given that they
7168 * are redundant as they they invoke lckpwdf() first and keep
7169 * it during everything they do. The per-database locks are
7170 * awfully racy, and thus we just won't do them. */
7173 path = strjoina(root, "/etc/.pwd.lock");
7175 path = "/etc/.pwd.lock";
7177 fd = open(path, O_WRONLY|O_CREAT|O_CLOEXEC|O_NOCTTY|O_NOFOLLOW, 0600);
7181 r = fcntl(fd, F_SETLKW, &flock);
7190 int is_symlink(const char *path) {
7193 if (lstat(path, &info) < 0)
7196 return !!S_ISLNK(info.st_mode);
7199 int is_dir(const char* path, bool follow) {
7204 r = stat(path, &st);
7206 r = lstat(path, &st);
7210 return !!S_ISDIR(st.st_mode);
7213 int unquote_first_word(const char **p, char **ret, UnquoteFlags flags) {
7214 _cleanup_free_ char *s = NULL;
7215 size_t allocated = 0, sz = 0;
7223 SINGLE_QUOTE_ESCAPE,
7225 DOUBLE_QUOTE_ESCAPE,
7233 /* Parses the first word of a string, and returns it in
7234 * *ret. Removes all quotes in the process. When parsing fails
7235 * (because of an uneven number of quotes or similar), leaves
7236 * the pointer *p at the first invalid character. */
7246 else if (strchr(WHITESPACE, c))
7256 state = SINGLE_QUOTE;
7258 state = VALUE_ESCAPE;
7260 state = DOUBLE_QUOTE;
7261 else if (strchr(WHITESPACE, c))
7264 if (!GREEDY_REALLOC(s, allocated, sz+2))
7274 if (flags & UNQUOTE_RELAX)
7279 if (!GREEDY_REALLOC(s, allocated, sz+7))
7282 if (flags & UNQUOTE_CUNESCAPE) {
7285 r = cunescape_one(*p, (size_t) -1, &c, &u);
7292 s[sz++] = c; /* normal explicit char */
7294 sz += utf8_encode_unichar(s + sz, u); /* unicode chars we'll encode as utf8 */
7303 if (flags & UNQUOTE_RELAX)
7306 } else if (c == '\'')
7309 state = SINGLE_QUOTE_ESCAPE;
7311 if (!GREEDY_REALLOC(s, allocated, sz+2))
7319 case SINGLE_QUOTE_ESCAPE:
7321 if (flags & UNQUOTE_RELAX)
7326 if (!GREEDY_REALLOC(s, allocated, sz+7))
7329 if (flags & UNQUOTE_CUNESCAPE) {
7332 r = cunescape_one(*p, (size_t) -1, &c, &u);
7341 sz += utf8_encode_unichar(s + sz, u);
7345 state = SINGLE_QUOTE;
7354 state = DOUBLE_QUOTE_ESCAPE;
7356 if (!GREEDY_REALLOC(s, allocated, sz+2))
7364 case DOUBLE_QUOTE_ESCAPE:
7366 if (flags & UNQUOTE_RELAX)
7371 if (!GREEDY_REALLOC(s, allocated, sz+7))
7374 if (flags & UNQUOTE_CUNESCAPE) {
7377 r = cunescape_one(*p, (size_t) -1, &c, &u);
7386 sz += utf8_encode_unichar(s + sz, u);
7390 state = DOUBLE_QUOTE;
7396 if (!strchr(WHITESPACE, c))
7418 int unquote_many_words(const char **p, UnquoteFlags flags, ...) {
7423 /* Parses a number of words from a string, stripping any
7424 * quotes if necessary. */
7428 /* Count how many words are expected */
7429 va_start(ap, flags);
7431 if (!va_arg(ap, char **))
7440 /* Read all words into a temporary array */
7441 l = newa0(char*, n);
7442 for (c = 0; c < n; c++) {
7444 r = unquote_first_word(p, &l[c], flags);
7448 for (j = 0; j < c; j++)
7458 /* If we managed to parse all words, return them in the passed
7460 va_start(ap, flags);
7461 for (i = 0; i < n; i++) {
7464 v = va_arg(ap, char **);
7474 int free_and_strdup(char **p, const char *s) {
7479 /* Replaces a string pointer with an strdup()ed new string,
7480 * possibly freeing the old one. */
/* Sets the system hostname to 's' via sethostname(), after reading the
 * current hostname with gethostname().
 * NOTE(review): judging by the name, sethostname() is presumably
 * skipped when the current hostname already equals 's' -- confirm. */
7495 int sethostname_idempotent(const char *s) {
/* Zero-initialized buffer that receives the current hostname */
7497 char buf[HOST_NAME_MAX + 1] = {};
7501 r = gethostname(buf, sizeof(buf));
/* The length passed to the kernel excludes the trailing NUL */
7508 r = sethostname(s, strlen(s));
/* Queries the name of the pty slave belonging to master 'fd' with
 * ptsname_r(), using a buffer 'c' of size 'l'.
 * NOTE(review): the result is presumably handed back through 'ret' as
 * a heap string, and ERANGE presumably triggers a retry with a larger
 * buffer while any other errno is returned -- confirm. */
7515 int ptsname_malloc(int fd, char **ret) {
7528 if (ptsname_r(fd, c, l) == 0) {
7532 if (errno != ERANGE) {
/* Opens a pty master with posix_openpt(flags) from inside the
 * namespaces of process 'pid'. The PID namespace, mount namespace and
 * root directory of 'pid' are opened with namespace_open() and entered
 * with namespace_enter(); the resulting fd is sent over an
 * AF_UNIX/SOCK_DGRAM socket pair as SCM_RIGHTS ancillary data. The
 * sending side leaves via _exit(); the receiving side waits for 'child'
 * with wait_for_terminate() and only proceeds to recvmsg() if it exited
 * with EXIT_SUCCESS. */
7542 int openpt_in_namespace(pid_t pid, int flags) {
7543 _cleanup_close_ int pidnsfd = -1, mntnsfd = -1, rootfd = -1;
7544 _cleanup_close_pair_ int pair[2] = { -1, -1 };
7546 struct cmsghdr cmsghdr;
/* Control buffer with room for exactly one int, i.e. one fd */
7547 uint8_t buf[CMSG_SPACE(sizeof(int))];
7549 struct msghdr mh = {
7550 .msg_control = &control,
7551 .msg_controllen = sizeof(control),
7553 struct cmsghdr *cmsg;
7560 r = namespace_open(pid, &pidnsfd, &mntnsfd, NULL, &rootfd);
7564 if (socketpair(AF_UNIX, SOCK_DGRAM, 0, pair) < 0)
/* Sending side: pair[0] is closed here, the fd goes out via pair[1] below */
7574 pair[0] = safe_close(pair[0]);
7576 r = namespace_enter(pidnsfd, mntnsfd, -1, rootfd);
7578 _exit(EXIT_FAILURE);
7580 master = posix_openpt(flags);
7582 _exit(EXIT_FAILURE);
/* Fill in a single SCM_RIGHTS control message carrying 'master' */
7584 cmsg = CMSG_FIRSTHDR(&mh);
7585 cmsg->cmsg_level = SOL_SOCKET;
7586 cmsg->cmsg_type = SCM_RIGHTS;
7587 cmsg->cmsg_len = CMSG_LEN(sizeof(int));
7588 memcpy(CMSG_DATA(cmsg), &master, sizeof(int));
/* Shrink the control length to the one message that was filled in */
7590 mh.msg_controllen = cmsg->cmsg_len;
7592 if (sendmsg(pair[1], &mh, MSG_NOSIGNAL) < 0)
7593 _exit(EXIT_FAILURE);
7595 _exit(EXIT_SUCCESS);
/* Receiving side: pair[1] is closed here, the fd is read from pair[0] below */
7598 pair[1] = safe_close(pair[1]);
7600 r = wait_for_terminate(child, &si);
7603 if (si.si_code != CLD_EXITED || si.si_status != EXIT_SUCCESS)
/* MSG_CMSG_CLOEXEC: received fds get close-on-exec set */
7606 if (recvmsg(pair[0], &mh, MSG_NOSIGNAL|MSG_CMSG_CLOEXEC) < 0)
7609 for (cmsg = CMSG_FIRSTHDR(&mh); cmsg; cmsg = CMSG_NXTHDR(&mh, cmsg))
7610 if (cmsg->cmsg_level == SOL_SOCKET && cmsg->cmsg_type == SCM_RIGHTS) {
7614 fds = (int*) CMSG_DATA(cmsg);
/* Number of fds in this message: payload size divided by sizeof(int) */
7615 n_fds = (cmsg->cmsg_len - CMSG_LEN(0)) / sizeof(int);
/* NOTE(review): presumably reached only when an unexpected number of
 * fds arrived -- confirm the guarding condition */
7618 close_many(fds, n_fds);
/* Reads extended attribute 'attribute' of 'filename' (resolved relative
 * to 'dirfd') into 'value' (at most 'size' bytes). This is done by
 * opening the file read-only with openat() and calling fgetxattr() on
 * the resulting fd. AT_SYMLINK_NOFOLLOW in 'flags' is translated to
 * O_NOFOLLOW for the open. */
7628 ssize_t fgetxattrat_fake(int dirfd, const char *filename, const char *attribute, void *value, size_t size, int flags) {
7629 _cleanup_close_ int fd = -1;
7632 /* The kernel doesn't have a fgetxattrat() command, hence let's emulate one */
7634 fd = openat(dirfd, filename, O_RDONLY|O_CLOEXEC|O_NOCTTY|O_NOATIME|(flags & AT_SYMLINK_NOFOLLOW ? O_NOFOLLOW : 0));
7638 l = fgetxattr(fd, attribute, value, size);
/* Decodes the 64bit value 'le', as read from the "user.crtime_usec"
 * xattr by the *_getcrtime() functions, into *usec.
 * NOTE(review): 0 and UINT64_MAX are singled out below, presumably to
 * reject them as invalid timestamps -- confirm. */
7645 static int parse_crtime(le64_t le, usec_t *usec) {
7651 if (u == 0 || u == (uint64_t) -1)
/* Reads the creation time of the file behind 'fd' from its
 * "user.crtime_usec" extended attribute and decodes it into *usec with
 * parse_crtime().
 * NOTE(review): an attribute whose size is not sizeof(le) is presumably
 * rejected with an error -- confirm. */
7658 int fd_getcrtime(int fd, usec_t *usec) {
7665 /* Until Linux gets a real concept of birthtime/creation time,
7666 * let's fake one with xattrs */
7668 n = fgetxattr(fd, "user.crtime_usec", &le, sizeof(le));
7671 if (n != sizeof(le))
7674 return parse_crtime(le, usec);
/* Like fd_getcrtime(), but for 'name' resolved relative to 'dirfd':
 * reads "user.crtime_usec" through fgetxattrat_fake() (which receives
 * 'flags') and decodes it into *usec with parse_crtime().
 * NOTE(review): a size other than sizeof(le) is presumably an error --
 * confirm. */
7677 int fd_getcrtime_at(int dirfd, const char *name, usec_t *usec, int flags) {
7681 n = fgetxattrat_fake(dirfd, name, "user.crtime_usec", &le, sizeof(le), flags);
7684 if (n != sizeof(le))
7687 return parse_crtime(le, usec);
/* Path-based variant of fd_getcrtime(): reads "user.crtime_usec" of
 * path 'p' with getxattr() and decodes it into *usec with
 * parse_crtime().
 * NOTE(review): a size other than sizeof(le) is presumably an error --
 * confirm. */
7690 int path_getcrtime(const char *p, usec_t *usec) {
7697 n = getxattr(p, "user.crtime_usec", &le, sizeof(le));
7700 if (n != sizeof(le))
7703 return parse_crtime(le, usec);
/* Stores 'usec' in the "user.crtime_usec" extended attribute of 'fd',
 * converted with htole64() so that the on-disk form is little-endian.
 * NOTE(review): 'usec' is replaced by now(CLOCK_REALTIME) in some case,
 * presumably when the caller did not supply a usable timestamp --
 * confirm the condition. */
7706 int fd_setcrtime(int fd, usec_t usec) {
7712 usec = now(CLOCK_REALTIME);
7714 le = htole64((uint64_t) usec);
7715 if (fsetxattr(fd, "user.crtime_usec", &le, sizeof(le), 0) < 0)
/* Changes the file attribute flags of 'fd'. The current flags are read
 * with FS_IOC_GETFLAGS; bits selected by 'mask' are replaced by the
 * corresponding bits of 'value', all other bits are kept; the merged
 * value is written back with FS_IOC_SETFLAGS. */
7721 int chattr_fd(int fd, unsigned value, unsigned mask) {
7722 unsigned old_attr, new_attr;
7729 if (ioctl(fd, FS_IOC_GETFLAGS, &old_attr) < 0)
7732 new_attr = (old_attr & ~mask) | (value & mask);
/* NOTE(review): presumably returns early here, skipping the SETFLAGS
 * ioctl when nothing would change -- confirm */
7733 if (new_attr == old_attr)
7736 if (ioctl(fd, FS_IOC_SETFLAGS, &new_attr) < 0)
/* Path-based wrapper around chattr_fd(): opens 'p' read-only (with
 * O_CLOEXEC, O_NOCTTY and O_NOFOLLOW) and applies 'value'/'mask' to the
 * resulting fd. */
7742 int chattr_path(const char *p, unsigned value, unsigned mask) {
7743 _cleanup_close_ int fd = -1;
7750 fd = open(p, O_RDONLY|O_CLOEXEC|O_NOCTTY|O_NOFOLLOW);
7754 return chattr_fd(fd, value, mask);
/* Reads the file attribute flags of 'fd' into *ret using the
 * FS_IOC_GETFLAGS ioctl. */
7757 int read_attr_fd(int fd, unsigned *ret) {
7760 if (ioctl(fd, FS_IOC_GETFLAGS, ret) < 0)
/* Path-based wrapper around read_attr_fd(): opens 'p' read-only (with
 * O_CLOEXEC, O_NOCTTY and O_NOFOLLOW) and reads the attribute flags of
 * the resulting fd into *ret. */
7766 int read_attr_path(const char *p, unsigned *ret) {
7767 _cleanup_close_ int fd = -1;
7772 fd = open(p, O_RDONLY|O_CLOEXEC|O_NOCTTY|O_NOFOLLOW);
7776 return read_attr_fd(fd, ret);
/* Opens the lock file 'p' (created with mode 0600 if missing, symlinks
 * not followed) and locks it according to 'operation'. LOCK_EX maps to
 * a write lock, anything else to a read lock. With LOCK_NB the
 * non-blocking F_OFD_SETLK is used, otherwise F_OFD_SETLKW. If fcntl()
 * fails with EINVAL, flock(fd, operation) is used instead. A failure
 * with EAGAIN is reported as -EBUSY, other failures as -errno.
 * After the lock is taken the link count is checked; if the file was
 * unlinked meanwhile the fd is closed again.
 * NOTE(review): presumably the open/lock sequence is then retried and
 * the result is stored in *ret (path, fd, operation) -- only the
 * 'operation' assignment is grounded here; confirm. */
7779 int make_lock_file(const char *p, int operation, LockFile *ret) {
7780 _cleanup_close_ int fd = -1;
7781 _cleanup_free_ char *t = NULL;
7785 * We use UNPOSIX locks if they are available. They have nice
7786 * semantics, and are mostly compatible with NFS. However,
7787 * they are only available on new kernels. When we detect we
7788 * are running on an older kernel, then we fall back to good
7789 * old BSD locks. They also have nice semantics, but are
7790 * slightly problematic on NFS, where they are upgraded to
7791 * POSIX locks, even though locally they are orthogonal to
/* LOCK_NB is masked out before comparing, it only selects blocking behaviour */
7801 .l_type = (operation & ~LOCK_NB) == LOCK_EX ? F_WRLCK : F_RDLCK,
7802 .l_whence = SEEK_SET,
7806 fd = open(p, O_CREAT|O_RDWR|O_NOFOLLOW|O_CLOEXEC|O_NOCTTY, 0600);
7810 r = fcntl(fd, (operation & LOCK_NB) ? F_OFD_SETLK : F_OFD_SETLKW, &fl);
7813 /* If the kernel is too old, use good old BSD locks */
7814 if (errno == EINVAL)
7815 r = flock(fd, operation);
7818 return errno == EAGAIN ? -EBUSY : -errno;
7821 /* If we acquired the lock, let's check if the file
7822 * still exists in the file system. If not, then the
7823 * previous exclusive owner removed it and then closed
7824 * it. In such a case our acquired lock is worthless,
7825 * hence try again. */
7830 if (st.st_nlink > 0)
7833 fd = safe_close(fd);
7838 ret->operation = operation;
/* Takes a lock on behalf of path 'p' by locking a companion file: the
 * lock file name is built from the part of 'p' preceding 'fn', followed
 * by ".#", 'fn' and ".lck", and is passed to make_lock_file() together
 * with 'operation' and 'ret'.
 * NOTE(review): 'fn' is presumably the last component of 'p'; it is
 * checked with filename_is_valid() -- confirm how it is derived. */
7846 int make_lock_file_for(const char *p, int operation, LockFile *ret) {
7854 if (!filename_is_valid(fn))
/* Room for p itself plus ".#" (2), ".lck" (4) and the trailing NUL (1) */
7857 t = newa(char, strlen(p) + 2 + 4 + 1);
7858 stpcpy(stpcpy(stpcpy(mempcpy(t, p, fn - p), ".#"), fn), ".lck");
7860 return make_lock_file(t, operation, ret);
/* Releases the lock described by 'f'. If the lock is held as LOCK_SH,
 * a non-blocking upgrade to an exclusive lock is attempted first
 * (F_OFD_SETLK, or flock(LOCK_EX|LOCK_NB) when fcntl() fails with
 * EINVAL); f->operation is set to LOCK_EX|LOCK_NB in that path. Only
 * when the lock is exclusive is the lock file itself removed with
 * unlink_noerrno(). Finally the fd is closed with safe_close(). */
7863 void release_lock_file(LockFile *f) {
7871 /* If we are the exclusive owner we can safely delete
7872 * the lock file itself. If we are not the exclusive
7873 * owner, we can try becoming it. */
7876 (f->operation & ~LOCK_NB) == LOCK_SH) {
7877 static const struct flock fl = {
7879 .l_whence = SEEK_SET,
7882 r = fcntl(f->fd, F_OFD_SETLK, &fl);
7883 if (r < 0 && errno == EINVAL)
7884 r = flock(f->fd, LOCK_EX|LOCK_NB);
7887 f->operation = LOCK_EX|LOCK_NB;
7890 if ((f->operation & ~LOCK_NB) == LOCK_EX)
7891 unlink_noerrno(f->path);
7897 f->fd = safe_close(f->fd);
/* Helper used by sparse_write() on the unprocessed rest of its buffer.
 * NOTE(review): presumably returns the number of consecutive NUL bytes
 * at the start of the 'sz' bytes at 'p' -- confirm. */
7901 static size_t nul_length(const uint8_t *p, size_t sz) {
/* Writes the 'sz' bytes at 'p' to 'fd', turning runs of NUL bytes into
 * holes. A run is skipped with lseek(SEEK_CUR) instead of being written
 * when it is longer than 'run_length', or when it sits at the very
 * beginning or the very end of the buffer. Pending non-skipped data
 * between 'w' and 'q' is flushed with write() before seeking and once
 * more at the end. Returns the distance of 'q' from the start of 'p'.
 * NOTE(review): write()/lseek() failures presumably return -errno --
 * confirm. */
7916 ssize_t sparse_write(int fd, const void *p, size_t sz, size_t run_length) {
7917 const uint8_t *q, *w, *e;
7925 n = nul_length(q, e - q);
7927 /* If there are more than the specified run length of
7928 * NUL bytes, or if this is the beginning or the end
7929 * of the buffer, then seek instead of write */
7930 if ((n > run_length) ||
7931 (n > 0 && q == p) ||
7932 (n > 0 && q + n >= e)) {
7934 l = write(fd, w, q - w);
7941 if (lseek(fd, n, SEEK_CUR) == (off_t) -1)
7953 l = write(fd, w, q - w);
7960 return q - (const uint8_t*) p;
7963 void sigkill_wait(pid_t *pid) {
7969 if (kill(*pid, SIGKILL) > 0)
7970 (void) wait_for_terminate(*pid, NULL);
/* Parses a syslog priority prefix of the form "<N>", "<NN>" or "<NNN>"
 * at the start of *p.
 *
 * p:             in/out; on success *p is advanced past the closing '>'.
 * priority:      in/out; with 'with_facility' it is overwritten by the
 *                full decimal value, otherwise only the level bits are
 *                replaced and the facility bits already in *priority
 *                are kept.
 * with_facility: whether a facility may be encoded in the prefix. If
 *                false, only a single digit 0..7 is accepted.
 *
 * Returns 1 if a prefix was parsed, 0 if *p does not start with a valid
 * prefix (in which case *p and *priority are left untouched).
 *
 * The digit count is derived from the position of the first '>' found
 * by strchr(), rather than by probing fixed offsets, so that short
 * inputs such as "<>" are never read beyond their terminating NUL. */
int syslog_parse_priority(const char **p, int *priority, bool with_facility) {
        int a = 0, b = 0, c = 0;
        const char *end;
        size_t k;

        assert(p);
        assert(*p);
        assert(priority);

        if ((*p)[0] != '<')
                return 0;

        end = strchr(*p, '>');
        if (!end)
                return 0;

        /* Index of the closing '>'; at least 1 since (*p)[0] is '<' */
        k = (size_t) (end - *p);

        if (k == 2)
                c = undecchar((*p)[1]);
        else if (k == 3) {
                b = undecchar((*p)[1]);
                c = undecchar((*p)[2]);
        } else if (k == 4) {
                a = undecchar((*p)[1]);
                b = undecchar((*p)[2]);
                c = undecchar((*p)[3]);
        } else
                return 0;

        /* undecchar() yields a negative value for non-digits */
        if (a < 0 || b < 0 || c < 0 ||
            (!with_facility && (a || b || c > 7)))
                return 0;

        if (with_facility)
                *priority = a*100 + b*10 + c;
        else
                *priority = (*priority & LOG_FACMASK) | c;

        /* Skip the prefix including the closing '>' */
        *p += k + 1;
        return 1;
}
/* Linear search for 'key' in the string array 'table' of 'len'
 * entries. Entries are compared with streq_ptr(), which copes with
 * NULL pointers.
 * NOTE(review): presumably returns the index of the first match and a
 * negative value if there is none -- confirm. */
8015 ssize_t string_table_lookup(const char * const *table, size_t len, const char *key) {
8021 for (i = 0; i < len; ++i)
8022 if (streq_ptr(table[i], key))
/* Closes all file descriptors attached to message 'mh': every control
 * message with level SOL_SOCKET and type SCM_RIGHTS is passed to
 * close_many(). The number of fds in a message is its payload size,
 * cmsg_len - CMSG_LEN(0), divided by sizeof(int). */
8028 void cmsg_close_all(struct msghdr *mh) {
8029 struct cmsghdr *cmsg;
8033 for (cmsg = CMSG_FIRSTHDR(mh); cmsg; cmsg = CMSG_NXTHDR(mh, cmsg))
8034 if (cmsg->cmsg_level == SOL_SOCKET && cmsg->cmsg_type == SCM_RIGHTS)
8035 close_many((int*) CMSG_DATA(cmsg), (cmsg->cmsg_len - CMSG_LEN(0)) / sizeof(int));
/* Renames 'oldpath' (relative to 'olddirfd') to 'newpath' (relative to
 * 'newdirfd') without replacing an existing 'newpath'.
 * First renameat2() with RENAME_NOREPLACE is tried. The fallbacks are
 * only used when it fails with EINVAL: a directory (per fstatat() with
 * AT_SYMLINK_NOFOLLOW) is moved with plain renameat(), returning 0 or
 * -errno; anything else is hard-linked to the new name with linkat()
 * and then the old name is removed with unlinkat(). If that removal
 * fails, the freshly created new link is removed again, with errno
 * saved beforehand so that the original failure is what gets reported.
 * NOTE(review): other renameat2()/linkat() failures presumably return
 * -errno -- confirm. */
8038 int rename_noreplace(int olddirfd, const char *oldpath, int newdirfd, const char *newpath) {
8042 ret = renameat2(olddirfd, oldpath, newdirfd, newpath, RENAME_NOREPLACE);
8046 /* Even though renameat2() exists since Linux 3.15, btrfs added
8047 * support for it later. If it is not implemented, fallback to another
8049 if (errno != EINVAL)
8052 /* The link()/unlink() fallback does not work on directories. But
8053 * renameat() without RENAME_NOREPLACE gives the same semantics on
8054 * directories, except when newpath is an *empty* directory. This is
8056 ret = fstatat(olddirfd, oldpath, &buf, AT_SYMLINK_NOFOLLOW);
8057 if (ret >= 0 && S_ISDIR(buf.st_mode)) {
8058 ret = renameat(olddirfd, oldpath, newdirfd, newpath);
8059 return ret >= 0 ? 0 : -errno;
8062 /* If it is not a directory, use the link()/unlink() fallback. */
8063 ret = linkat(olddirfd, oldpath, newdirfd, newpath, 0);
8067 ret = unlinkat(olddirfd, oldpath, 0);
8069 /* backup errno before the following unlinkat() alters it */
8071 (void) unlinkat(newdirfd, newpath, 0);
/* Produces a version of 's' that is safe to use as a shell word. 's'
 * is scanned for characters listed in SHELL_NEED_QUOTES; the part
 * before the first such character is copied verbatim with mempcpy(),
 * the rest is copied while checking each character against
 * SHELL_NEED_ESCAPE.
 * NOTE(review): presumably 's' is returned as a plain copy when nothing
 * needs quoting, escaped characters get a backslash prefix, and NULL is
 * returned on allocation failure -- confirm. */
8079 char *shell_maybe_quote(const char *s) {
8085 /* Encloses a string in double quotes if necessary to make it
8086 * OK as shell string. */
8088 for (p = s; *p; p++)
8091 strchr(SHELL_NEED_QUOTES, *p))
/* Worst case: opening quote (1), two bytes per input character,
 * closing quote (1) and the trailing NUL (1) */
8097 r = new(char, 1+strlen(s)*2+1+1);
8103 t = mempcpy(t, s, p - s);
8107 if (strchr(SHELL_NEED_ESCAPE, *p))
8119 int parse_mode(const char *s, mode_t *ret) {
8127 l = strtol(s, &x, 8);
8131 if (!x || x == s || *x)
8133 if (l < 0 || l > 07777)