1 /*-*- Mode: C; c-basic-offset: 8; indent-tabs-mode: nil -*-*/
4 This file is part of systemd.
6 Copyright 2010 Lennart Poettering
8 systemd is free software; you can redistribute it and/or modify it
9 under the terms of the GNU Lesser General Public License as published by
10 the Free Software Foundation; either version 2.1 of the License, or
11 (at your option) any later version.
13 systemd is distributed in the hope that it will be useful, but
14 WITHOUT ANY WARRANTY; without even the implied warranty of
15 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
16 Lesser General Public License for more details.
18 You should have received a copy of the GNU Lesser General Public License
19 along with systemd; If not, see <http://www.gnu.org/licenses/>.
33 #include <sys/resource.h>
34 #include <linux/sched.h>
35 #include <sys/types.h>
39 #include <sys/ioctl.h>
41 #include <linux/tiocl.h>
46 #include <sys/prctl.h>
47 #include <sys/utsname.h>
49 #include <netinet/ip.h>
58 #include <sys/mount.h>
59 #include <linux/magic.h>
63 #include <sys/personality.h>
64 #include <sys/xattr.h>
65 #include <sys/statvfs.h>
69 /* When we include libgen.h because we need dirname() we immediately
70 * undefine basename() since libgen.h defines it as a macro to the XDG
71 * version which is really broken. */
75 #ifdef HAVE_SYS_AUXV_H
88 #include "path-util.h"
89 #include "exit-status.h"
93 #include "device-nodes.h"
98 #include "sparse-endian.h"
101 char **saved_argv = NULL;
103 static volatile unsigned cached_columns = 0;
104 static volatile unsigned cached_lines = 0;
106 size_t page_size(void) {
107 static thread_local size_t pgsz = 0;
110 if (_likely_(pgsz > 0))
113 r = sysconf(_SC_PAGESIZE);
120 bool streq_ptr(const char *a, const char *b) {
122 /* Like streq(), but tries to make sense of NULL pointers */
133 char* endswith(const char *s, const char *postfix) {
140 pl = strlen(postfix);
143 return (char*) s + sl;
148 if (memcmp(s + sl - pl, postfix, pl) != 0)
151 return (char*) s + sl - pl;
154 char* first_word(const char *s, const char *word) {
161 /* Checks if the string starts with the specified word, either
162 * followed by NUL or by whitespace. Returns a pointer to the
163 * NUL or the first character after the whitespace. */
174 if (memcmp(s, word, wl) != 0)
181 if (!strchr(WHITESPACE, *p))
184 p += strspn(p, WHITESPACE);
188 static size_t cescape_char(char c, char *buf) {
189 char * buf_old = buf;
235 /* For special chars we prefer octal over
236 * hexadecimal encoding, simply because glib's
237 * g_strescape() does the same */
238 if ((c < ' ') || (c >= 127)) {
240 *(buf++) = octchar((unsigned char) c >> 6);
241 *(buf++) = octchar((unsigned char) c >> 3);
242 *(buf++) = octchar((unsigned char) c);
248 return buf - buf_old;
251 int close_nointr(int fd) {
258 * Just ignore EINTR; a retry loop is the wrong thing to do on
261 * http://lkml.indiana.edu/hypermail/linux/kernel/0509.1/0877.html
262 * https://bugzilla.gnome.org/show_bug.cgi?id=682819
263 * http://utcc.utoronto.ca/~cks/space/blog/unix/CloseEINTR
264 * https://sites.google.com/site/michaelsafyan/software-engineering/checkforeintrwheninvokingclosethinkagain
272 int safe_close(int fd) {
275 * Like close_nointr() but cannot fail. Guarantees errno is
276 * unchanged. Is a NOP with negative fds passed, and returns
277 * -1, so that it can be used in this syntax:
279 * fd = safe_close(fd);
285 /* The kernel might return pretty much any error code
286 * via close(), but the fd will be closed anyway. The
287 * only condition we want to check for here is whether
288 * the fd was invalid at all... */
290 assert_se(close_nointr(fd) != -EBADF);
296 void close_many(const int fds[], unsigned n_fd) {
299 assert(fds || n_fd <= 0);
301 for (i = 0; i < n_fd; i++)
305 int unlink_noerrno(const char *path) {
316 int parse_boolean(const char *v) {
319 if (streq(v, "1") || strcaseeq(v, "yes") || strcaseeq(v, "y") || strcaseeq(v, "true") || strcaseeq(v, "t") || strcaseeq(v, "on"))
321 else if (streq(v, "0") || strcaseeq(v, "no") || strcaseeq(v, "n") || strcaseeq(v, "false") || strcaseeq(v, "f") || strcaseeq(v, "off"))
327 int parse_pid(const char *s, pid_t* ret_pid) {
328 unsigned long ul = 0;
335 r = safe_atolu(s, &ul);
341 if ((unsigned long) pid != ul)
351 int parse_uid(const char *s, uid_t* ret_uid) {
352 unsigned long ul = 0;
359 r = safe_atolu(s, &ul);
365 if ((unsigned long) uid != ul)
368 /* Some libc APIs use UID_INVALID as special placeholder */
369 if (uid == (uid_t) 0xFFFFFFFF)
372 /* A long time ago UIDs where 16bit, hence explicitly avoid the 16bit -1 too */
373 if (uid == (uid_t) 0xFFFF)
380 int safe_atou(const char *s, unsigned *ret_u) {
388 l = strtoul(s, &x, 0);
390 if (!x || x == s || *x || errno)
391 return errno > 0 ? -errno : -EINVAL;
393 if ((unsigned long) (unsigned) l != l)
396 *ret_u = (unsigned) l;
400 int safe_atoi(const char *s, int *ret_i) {
408 l = strtol(s, &x, 0);
410 if (!x || x == s || *x || errno)
411 return errno > 0 ? -errno : -EINVAL;
413 if ((long) (int) l != l)
420 int safe_atou8(const char *s, uint8_t *ret) {
428 l = strtoul(s, &x, 0);
430 if (!x || x == s || *x || errno)
431 return errno > 0 ? -errno : -EINVAL;
433 if ((unsigned long) (uint8_t) l != l)
440 int safe_atou16(const char *s, uint16_t *ret) {
448 l = strtoul(s, &x, 0);
450 if (!x || x == s || *x || errno)
451 return errno > 0 ? -errno : -EINVAL;
453 if ((unsigned long) (uint16_t) l != l)
460 int safe_atoi16(const char *s, int16_t *ret) {
468 l = strtol(s, &x, 0);
470 if (!x || x == s || *x || errno)
471 return errno > 0 ? -errno : -EINVAL;
473 if ((long) (int16_t) l != l)
480 int safe_atollu(const char *s, long long unsigned *ret_llu) {
482 unsigned long long l;
488 l = strtoull(s, &x, 0);
490 if (!x || x == s || *x || errno)
491 return errno ? -errno : -EINVAL;
497 int safe_atolli(const char *s, long long int *ret_lli) {
505 l = strtoll(s, &x, 0);
507 if (!x || x == s || *x || errno)
508 return errno ? -errno : -EINVAL;
514 int safe_atod(const char *s, double *ret_d) {
522 loc = newlocale(LC_NUMERIC_MASK, "C", (locale_t) 0);
523 if (loc == (locale_t) 0)
527 d = strtod_l(s, &x, loc);
529 if (!x || x == s || *x || errno) {
531 return errno ? -errno : -EINVAL;
539 static size_t strcspn_escaped(const char *s, const char *reject) {
540 bool escaped = false;
543 for (n=0; s[n]; n++) {
546 else if (s[n] == '\\')
548 else if (strchr(reject, s[n]))
552 /* if s ends in \, return index of previous char */
556 /* Split a string into words. */
557 const char* split(const char **state, size_t *l, const char *separator, bool quoted) {
563 assert(**state == '\0');
567 current += strspn(current, separator);
573 if (quoted && strchr("\'\"", *current)) {
574 char quotechars[2] = {*current, '\0'};
576 *l = strcspn_escaped(current + 1, quotechars);
577 if (current[*l + 1] == '\0' ||
578 (current[*l + 2] && !strchr(separator, current[*l + 2]))) {
579 /* right quote missing or garbage at the end */
583 assert(current[*l + 1] == quotechars[0]);
584 *state = current++ + *l + 2;
586 *l = strcspn_escaped(current, separator);
587 if (current[*l] && !strchr(separator, current[*l])) {
588 /* unfinished escape */
592 *state = current + *l;
594 *l = strcspn(current, separator);
595 *state = current + *l;
601 int get_parent_of_pid(pid_t pid, pid_t *_ppid) {
603 _cleanup_free_ char *line = NULL;
615 p = procfs_file_alloca(pid, "stat");
616 r = read_one_line_file(p, &line);
620 /* Let's skip the pid and comm fields. The latter is enclosed
621 * in () but does not escape any () in its value, so let's
622 * skip over it manually */
624 p = strrchr(line, ')');
636 if ((long unsigned) (pid_t) ppid != ppid)
639 *_ppid = (pid_t) ppid;
644 int fchmod_umask(int fd, mode_t m) {
649 r = fchmod(fd, m & (~u)) < 0 ? -errno : 0;
655 char *truncate_nl(char *s) {
658 s[strcspn(s, NEWLINE)] = 0;
662 int get_process_state(pid_t pid) {
666 _cleanup_free_ char *line = NULL;
670 p = procfs_file_alloca(pid, "stat");
671 r = read_one_line_file(p, &line);
675 p = strrchr(line, ')');
681 if (sscanf(p, " %c", &state) != 1)
684 return (unsigned char) state;
687 int get_process_comm(pid_t pid, char **name) {
694 p = procfs_file_alloca(pid, "comm");
696 r = read_one_line_file(p, name);
703 int get_process_cmdline(pid_t pid, size_t max_length, bool comm_fallback, char **line) {
704 _cleanup_fclose_ FILE *f = NULL;
712 p = procfs_file_alloca(pid, "cmdline");
718 if (max_length == 0) {
719 size_t len = 0, allocated = 0;
721 while ((c = getc(f)) != EOF) {
723 if (!GREEDY_REALLOC(r, allocated, len+2)) {
728 r[len++] = isprint(c) ? c : ' ';
738 r = new(char, max_length);
744 while ((c = getc(f)) != EOF) {
766 size_t n = MIN(left-1, 3U);
773 /* Kernel threads have no argv[] */
775 _cleanup_free_ char *t = NULL;
783 h = get_process_comm(pid, &t);
787 r = strjoin("[", t, "]", NULL);
796 int is_kernel_thread(pid_t pid) {
808 p = procfs_file_alloca(pid, "cmdline");
813 count = fread(&c, 1, 1, f);
817 /* Kernel threads have an empty cmdline */
820 return eof ? 1 : -errno;
825 int get_process_capeff(pid_t pid, char **capeff) {
831 p = procfs_file_alloca(pid, "status");
833 return get_status_field(p, "\nCapEff:", capeff);
836 static int get_process_link_contents(const char *proc_file, char **name) {
842 r = readlink_malloc(proc_file, name);
844 return r == -ENOENT ? -ESRCH : r;
849 int get_process_exe(pid_t pid, char **name) {
856 p = procfs_file_alloca(pid, "exe");
857 r = get_process_link_contents(p, name);
861 d = endswith(*name, " (deleted)");
868 static int get_process_id(pid_t pid, const char *field, uid_t *uid) {
869 _cleanup_fclose_ FILE *f = NULL;
879 p = procfs_file_alloca(pid, "status");
884 FOREACH_LINE(line, f, return -errno) {
889 if (startswith(l, field)) {
891 l += strspn(l, WHITESPACE);
893 l[strcspn(l, WHITESPACE)] = 0;
895 return parse_uid(l, uid);
902 int get_process_uid(pid_t pid, uid_t *uid) {
903 return get_process_id(pid, "Uid:", uid);
906 int get_process_gid(pid_t pid, gid_t *gid) {
907 assert_cc(sizeof(uid_t) == sizeof(gid_t));
908 return get_process_id(pid, "Gid:", gid);
911 int get_process_cwd(pid_t pid, char **cwd) {
916 p = procfs_file_alloca(pid, "cwd");
918 return get_process_link_contents(p, cwd);
921 int get_process_root(pid_t pid, char **root) {
926 p = procfs_file_alloca(pid, "root");
928 return get_process_link_contents(p, root);
931 int get_process_environ(pid_t pid, char **env) {
932 _cleanup_fclose_ FILE *f = NULL;
933 _cleanup_free_ char *outcome = NULL;
936 size_t allocated = 0, sz = 0;
941 p = procfs_file_alloca(pid, "environ");
947 while ((c = fgetc(f)) != EOF) {
948 if (!GREEDY_REALLOC(outcome, allocated, sz + 5))
952 outcome[sz++] = '\n';
954 sz += cescape_char(c, outcome + sz);
964 char *strnappend(const char *s, const char *suffix, size_t b) {
972 return strndup(suffix, b);
981 if (b > ((size_t) -1) - a)
984 r = new(char, a+b+1);
989 memcpy(r+a, suffix, b);
995 char *strappend(const char *s, const char *suffix) {
996 return strnappend(s, suffix, suffix ? strlen(suffix) : 0);
999 int readlinkat_malloc(int fd, const char *p, char **ret) {
1014 n = readlinkat(fd, p, c, l-1);
1021 if ((size_t) n < l-1) {
1032 int readlink_malloc(const char *p, char **ret) {
1033 return readlinkat_malloc(AT_FDCWD, p, ret);
1036 int readlink_value(const char *p, char **ret) {
1037 _cleanup_free_ char *link = NULL;
1041 r = readlink_malloc(p, &link);
1045 value = basename(link);
1049 value = strdup(value);
1058 int readlink_and_make_absolute(const char *p, char **r) {
1059 _cleanup_free_ char *target = NULL;
1066 j = readlink_malloc(p, &target);
1070 k = file_in_same_dir(p, target);
1078 int readlink_and_canonicalize(const char *p, char **r) {
1085 j = readlink_and_make_absolute(p, &t);
1089 s = canonicalize_file_name(t);
1096 path_kill_slashes(*r);
1101 int reset_all_signal_handlers(void) {
1104 for (sig = 1; sig < _NSIG; sig++) {
1105 struct sigaction sa = {
1106 .sa_handler = SIG_DFL,
1107 .sa_flags = SA_RESTART,
1110 /* These two cannot be caught... */
1111 if (sig == SIGKILL || sig == SIGSTOP)
1114 /* On Linux the first two RT signals are reserved by
1115 * glibc, and sigaction() will return EINVAL for them. */
1116 if ((sigaction(sig, &sa, NULL) < 0))
1117 if (errno != EINVAL && r == 0)
1124 int reset_signal_mask(void) {
1127 if (sigemptyset(&ss) < 0)
1130 if (sigprocmask(SIG_SETMASK, &ss, NULL) < 0)
1136 char *strstrip(char *s) {
1139 /* Drops trailing whitespace. Modifies the string in
1140 * place. Returns pointer to first non-space character */
1142 s += strspn(s, WHITESPACE);
1144 for (e = strchr(s, 0); e > s; e --)
1145 if (!strchr(WHITESPACE, e[-1]))
1153 char *delete_chars(char *s, const char *bad) {
1156 /* Drops all whitespace, regardless where in the string */
1158 for (f = s, t = s; *f; f++) {
1159 if (strchr(bad, *f))
1170 char *file_in_same_dir(const char *path, const char *filename) {
1177 /* This removes the last component of path and appends
1178 * filename, unless the latter is absolute anyway or the
1181 if (path_is_absolute(filename))
1182 return strdup(filename);
1184 e = strrchr(path, '/');
1186 return strdup(filename);
1188 k = strlen(filename);
1189 ret = new(char, (e + 1 - path) + k + 1);
1193 memcpy(mempcpy(ret, path, e + 1 - path), filename, k + 1);
1197 int rmdir_parents(const char *path, const char *stop) {
1206 /* Skip trailing slashes */
1207 while (l > 0 && path[l-1] == '/')
1213 /* Skip last component */
1214 while (l > 0 && path[l-1] != '/')
1217 /* Skip trailing slashes */
1218 while (l > 0 && path[l-1] == '/')
1224 if (!(t = strndup(path, l)))
1227 if (path_startswith(stop, t)) {
1236 if (errno != ENOENT)
1243 char hexchar(int x) {
1244 static const char table[16] = "0123456789abcdef";
1246 return table[x & 15];
1249 int unhexchar(char c) {
1251 if (c >= '0' && c <= '9')
1254 if (c >= 'a' && c <= 'f')
1255 return c - 'a' + 10;
1257 if (c >= 'A' && c <= 'F')
1258 return c - 'A' + 10;
1263 char *hexmem(const void *p, size_t l) {
1267 z = r = malloc(l * 2 + 1);
1271 for (x = p; x < (const uint8_t*) p + l; x++) {
1272 *(z++) = hexchar(*x >> 4);
1273 *(z++) = hexchar(*x & 15);
1280 void *unhexmem(const char *p, size_t l) {
1286 z = r = malloc((l + 1) / 2 + 1);
1290 for (x = p; x < p + l; x += 2) {
1293 a = unhexchar(x[0]);
1295 b = unhexchar(x[1]);
1299 *(z++) = (uint8_t) a << 4 | (uint8_t) b;
1306 char octchar(int x) {
1307 return '0' + (x & 7);
1310 int unoctchar(char c) {
1312 if (c >= '0' && c <= '7')
1318 char decchar(int x) {
1319 return '0' + (x % 10);
1322 int undecchar(char c) {
1324 if (c >= '0' && c <= '9')
1330 char *cescape(const char *s) {
1336 /* Does C style string escaping. */
1338 r = new(char, strlen(s)*4 + 1);
1342 for (f = s, t = r; *f; f++)
1343 t += cescape_char(*f, t);
1350 char *cunescape_length_with_prefix(const char *s, size_t length, const char *prefix) {
1357 /* Undoes C style string escaping, and optionally prefixes it. */
1359 pl = prefix ? strlen(prefix) : 0;
1361 r = new(char, pl+length+1);
1366 memcpy(r, prefix, pl);
1368 for (f = s, t = r + pl; f < s + length; f++) {
1369 size_t remaining = s + length - f;
1370 assert(remaining > 0);
1372 if (*f != '\\') { /* a literal literal */
1377 if (--remaining == 0) { /* copy trailing backslash verbatim */
1418 /* This is an extension of the XDG syntax files */
1423 /* hexadecimal encoding */
1426 if (remaining >= 2) {
1427 a = unhexchar(f[1]);
1428 b = unhexchar(f[2]);
1431 if (a < 0 || b < 0 || (a == 0 && b == 0)) {
1432 /* Invalid escape code, let's take it literal then */
1436 *(t++) = (char) ((a << 4) | b);
1451 /* octal encoding */
1452 int a = -1, b = -1, c = -1;
1454 if (remaining >= 3) {
1455 a = unoctchar(f[0]);
1456 b = unoctchar(f[1]);
1457 c = unoctchar(f[2]);
1460 if (a < 0 || b < 0 || c < 0 || (a == 0 && b == 0 && c == 0)) {
1461 /* Invalid escape code, let's take it literal then */
1465 *(t++) = (char) ((a << 6) | (b << 3) | c);
1473 /* Invalid escape code, let's take it literal then */
1484 char *cunescape_length(const char *s, size_t length) {
1485 return cunescape_length_with_prefix(s, length, NULL);
1488 char *cunescape(const char *s) {
1491 return cunescape_length(s, strlen(s));
1494 char *xescape(const char *s, const char *bad) {
1498 /* Escapes all chars in bad, in addition to \ and all special
1499 * chars, in \xFF style escaping. May be reversed with
1502 r = new(char, strlen(s) * 4 + 1);
1506 for (f = s, t = r; *f; f++) {
1508 if ((*f < ' ') || (*f >= 127) ||
1509 (*f == '\\') || strchr(bad, *f)) {
1512 *(t++) = hexchar(*f >> 4);
1513 *(t++) = hexchar(*f);
1523 char *ascii_strlower(char *t) {
1528 for (p = t; *p; p++)
1529 if (*p >= 'A' && *p <= 'Z')
1530 *p = *p - 'A' + 'a';
1535 _pure_ static bool hidden_file_allow_backup(const char *filename) {
1539 filename[0] == '.' ||
1540 streq(filename, "lost+found") ||
1541 streq(filename, "aquota.user") ||
1542 streq(filename, "aquota.group") ||
1543 endswith(filename, ".rpmnew") ||
1544 endswith(filename, ".rpmsave") ||
1545 endswith(filename, ".rpmorig") ||
1546 endswith(filename, ".dpkg-old") ||
1547 endswith(filename, ".dpkg-new") ||
1548 endswith(filename, ".dpkg-tmp") ||
1549 endswith(filename, ".dpkg-dist") ||
1550 endswith(filename, ".dpkg-bak") ||
1551 endswith(filename, ".dpkg-backup") ||
1552 endswith(filename, ".dpkg-remove") ||
1553 endswith(filename, ".swp");
1556 bool hidden_file(const char *filename) {
1559 if (endswith(filename, "~"))
1562 return hidden_file_allow_backup(filename);
1565 int fd_nonblock(int fd, bool nonblock) {
1570 flags = fcntl(fd, F_GETFL, 0);
1575 nflags = flags | O_NONBLOCK;
1577 nflags = flags & ~O_NONBLOCK;
1579 if (nflags == flags)
1582 if (fcntl(fd, F_SETFL, nflags) < 0)
1588 int fd_cloexec(int fd, bool cloexec) {
1593 flags = fcntl(fd, F_GETFD, 0);
1598 nflags = flags | FD_CLOEXEC;
1600 nflags = flags & ~FD_CLOEXEC;
1602 if (nflags == flags)
1605 if (fcntl(fd, F_SETFD, nflags) < 0)
1611 _pure_ static bool fd_in_set(int fd, const int fdset[], unsigned n_fdset) {
1614 assert(n_fdset == 0 || fdset);
1616 for (i = 0; i < n_fdset; i++)
1623 int close_all_fds(const int except[], unsigned n_except) {
1624 _cleanup_closedir_ DIR *d = NULL;
1628 assert(n_except == 0 || except);
1630 d = opendir("/proc/self/fd");
1635 /* When /proc isn't available (for example in chroots)
1636 * the fallback is brute forcing through the fd
1639 assert_se(getrlimit(RLIMIT_NOFILE, &rl) >= 0);
1640 for (fd = 3; fd < (int) rl.rlim_max; fd ++) {
1642 if (fd_in_set(fd, except, n_except))
1645 if (close_nointr(fd) < 0)
1646 if (errno != EBADF && r == 0)
1653 while ((de = readdir(d))) {
1656 if (hidden_file(de->d_name))
1659 if (safe_atoi(de->d_name, &fd) < 0)
1660 /* Let's better ignore this, just in case */
1669 if (fd_in_set(fd, except, n_except))
1672 if (close_nointr(fd) < 0) {
1673 /* Valgrind has its own FD and doesn't want to have it closed */
1674 if (errno != EBADF && r == 0)
1682 bool chars_intersect(const char *a, const char *b) {
1685 /* Returns true if any of the chars in a are in b. */
1686 for (p = a; *p; p++)
1693 bool fstype_is_network(const char *fstype) {
1694 static const char table[] =
1708 x = startswith(fstype, "fuse.");
1712 return nulstr_contains(table, fstype);
1716 _cleanup_close_ int fd;
1718 fd = open_terminal("/dev/tty0", O_RDWR|O_NOCTTY|O_CLOEXEC);
1724 TIOCL_GETKMSGREDIRECT,
1728 if (ioctl(fd, TIOCLINUX, tiocl) < 0)
1731 vt = tiocl[0] <= 0 ? 1 : tiocl[0];
1734 if (ioctl(fd, VT_ACTIVATE, vt) < 0)
1740 int read_one_char(FILE *f, char *ret, usec_t t, bool *need_nl) {
1741 struct termios old_termios, new_termios;
1742 char c, line[LINE_MAX];
1747 if (tcgetattr(fileno(f), &old_termios) >= 0) {
1748 new_termios = old_termios;
1750 new_termios.c_lflag &= ~ICANON;
1751 new_termios.c_cc[VMIN] = 1;
1752 new_termios.c_cc[VTIME] = 0;
1754 if (tcsetattr(fileno(f), TCSADRAIN, &new_termios) >= 0) {
1757 if (t != USEC_INFINITY) {
1758 if (fd_wait_for_event(fileno(f), POLLIN, t) <= 0) {
1759 tcsetattr(fileno(f), TCSADRAIN, &old_termios);
1764 k = fread(&c, 1, 1, f);
1766 tcsetattr(fileno(f), TCSADRAIN, &old_termios);
1772 *need_nl = c != '\n';
1779 if (t != USEC_INFINITY) {
1780 if (fd_wait_for_event(fileno(f), POLLIN, t) <= 0)
1785 if (!fgets(line, sizeof(line), f))
1786 return errno ? -errno : -EIO;
1790 if (strlen(line) != 1)
1800 int ask_char(char *ret, const char *replies, const char *text, ...) {
1810 bool need_nl = true;
1813 fputs(ANSI_HIGHLIGHT_ON, stdout);
1820 fputs(ANSI_HIGHLIGHT_OFF, stdout);
1824 r = read_one_char(stdin, &c, USEC_INFINITY, &need_nl);
1827 if (r == -EBADMSG) {
1828 puts("Bad input, please try again.");
1839 if (strchr(replies, c)) {
1844 puts("Read unexpected character, please try again.");
1848 int ask_string(char **ret, const char *text, ...) {
1853 char line[LINE_MAX];
1857 fputs(ANSI_HIGHLIGHT_ON, stdout);
1864 fputs(ANSI_HIGHLIGHT_OFF, stdout);
1869 if (!fgets(line, sizeof(line), stdin))
1870 return errno ? -errno : -EIO;
1872 if (!endswith(line, "\n"))
1891 int reset_terminal_fd(int fd, bool switch_to_text) {
1892 struct termios termios;
1895 /* Set terminal to some sane defaults */
1899 /* We leave locked terminal attributes untouched, so that
1900 * Plymouth may set whatever it wants to set, and we don't
1901 * interfere with that. */
1903 /* Disable exclusive mode, just in case */
1904 ioctl(fd, TIOCNXCL);
1906 /* Switch to text mode */
1908 ioctl(fd, KDSETMODE, KD_TEXT);
1910 /* Enable console unicode mode */
1911 ioctl(fd, KDSKBMODE, K_UNICODE);
1913 if (tcgetattr(fd, &termios) < 0) {
1918 /* We only reset the stuff that matters to the software. How
1919 * hardware is set up we don't touch assuming that somebody
1920 * else will do that for us */
1922 termios.c_iflag &= ~(IGNBRK | BRKINT | ISTRIP | INLCR | IGNCR | IUCLC);
1923 termios.c_iflag |= ICRNL | IMAXBEL | IUTF8;
1924 termios.c_oflag |= ONLCR;
1925 termios.c_cflag |= CREAD;
1926 termios.c_lflag = ISIG | ICANON | IEXTEN | ECHO | ECHOE | ECHOK | ECHOCTL | ECHOPRT | ECHOKE;
1928 termios.c_cc[VINTR] = 03; /* ^C */
1929 termios.c_cc[VQUIT] = 034; /* ^\ */
1930 termios.c_cc[VERASE] = 0177;
1931 termios.c_cc[VKILL] = 025; /* ^X */
1932 termios.c_cc[VEOF] = 04; /* ^D */
1933 termios.c_cc[VSTART] = 021; /* ^Q */
1934 termios.c_cc[VSTOP] = 023; /* ^S */
1935 termios.c_cc[VSUSP] = 032; /* ^Z */
1936 termios.c_cc[VLNEXT] = 026; /* ^V */
1937 termios.c_cc[VWERASE] = 027; /* ^W */
1938 termios.c_cc[VREPRINT] = 022; /* ^R */
1939 termios.c_cc[VEOL] = 0;
1940 termios.c_cc[VEOL2] = 0;
1942 termios.c_cc[VTIME] = 0;
1943 termios.c_cc[VMIN] = 1;
1945 if (tcsetattr(fd, TCSANOW, &termios) < 0)
1949 /* Just in case, flush all crap out */
1950 tcflush(fd, TCIOFLUSH);
1955 int reset_terminal(const char *name) {
1956 _cleanup_close_ int fd = -1;
1958 fd = open_terminal(name, O_RDWR|O_NOCTTY|O_CLOEXEC);
1962 return reset_terminal_fd(fd, true);
1965 int open_terminal(const char *name, int mode) {
1970 * If a TTY is in the process of being closed opening it might
1971 * cause EIO. This is horribly awful, but unlikely to be
1972 * changed in the kernel. Hence we work around this problem by
1973 * retrying a couple of times.
1975 * https://bugs.launchpad.net/ubuntu/+source/linux/+bug/554172/comments/245
1978 assert(!(mode & O_CREAT));
1981 fd = open(name, mode, 0);
1988 /* Max 1s in total */
1992 usleep(50 * USEC_PER_MSEC);
2010 int flush_fd(int fd) {
2011 struct pollfd pollfd = {
2021 r = poll(&pollfd, 1, 0);
2031 l = read(fd, buf, sizeof(buf));
2037 if (errno == EAGAIN)
2046 int acquire_terminal(
2050 bool ignore_tiocstty_eperm,
2053 int fd = -1, notify = -1, r = 0, wd = -1;
2058 /* We use inotify to be notified when the tty is closed. We
2059 * create the watch before checking if we can actually acquire
2060 * it, so that we don't lose any event.
2062 * Note: strictly speaking this actually watches for the
2063 * device being closed, it does *not* really watch whether a
2064 * tty loses its controlling process. However, unless some
2065 * rogue process uses TIOCNOTTY on /dev/tty *after* closing
2066 * its tty otherwise this will not become a problem. As long
2067 * as the administrator makes sure not configure any service
2068 * on the same tty as an untrusted user this should not be a
2069 * problem. (Which he probably should not do anyway.) */
2071 if (timeout != USEC_INFINITY)
2072 ts = now(CLOCK_MONOTONIC);
2074 if (!fail && !force) {
2075 notify = inotify_init1(IN_CLOEXEC | (timeout != USEC_INFINITY ? IN_NONBLOCK : 0));
2081 wd = inotify_add_watch(notify, name, IN_CLOSE);
2089 struct sigaction sa_old, sa_new = {
2090 .sa_handler = SIG_IGN,
2091 .sa_flags = SA_RESTART,
2095 r = flush_fd(notify);
2100 /* We pass here O_NOCTTY only so that we can check the return
2101 * value TIOCSCTTY and have a reliable way to figure out if we
2102 * successfully became the controlling process of the tty */
2103 fd = open_terminal(name, O_RDWR|O_NOCTTY|O_CLOEXEC);
2107 /* Temporarily ignore SIGHUP, so that we don't get SIGHUP'ed
2108 * if we already own the tty. */
2109 assert_se(sigaction(SIGHUP, &sa_new, &sa_old) == 0);
2111 /* First, try to get the tty */
2112 if (ioctl(fd, TIOCSCTTY, force) < 0)
2115 assert_se(sigaction(SIGHUP, &sa_old, NULL) == 0);
2117 /* Sometimes it makes sense to ignore TIOCSCTTY
2118 * returning EPERM, i.e. when very likely we already
2119 * are have this controlling terminal. */
2120 if (r < 0 && r == -EPERM && ignore_tiocstty_eperm)
2123 if (r < 0 && (force || fail || r != -EPERM)) {
2132 assert(notify >= 0);
2135 union inotify_event_buffer buffer;
2136 struct inotify_event *e;
2139 if (timeout != USEC_INFINITY) {
2142 n = now(CLOCK_MONOTONIC);
2143 if (ts + timeout < n) {
2148 r = fd_wait_for_event(fd, POLLIN, ts + timeout - n);
2158 l = read(notify, &buffer, sizeof(buffer));
2160 if (errno == EINTR || errno == EAGAIN)
2167 FOREACH_INOTIFY_EVENT(e, buffer, l) {
2168 if (e->wd != wd || !(e->mask & IN_CLOSE)) {
2177 /* We close the tty fd here since if the old session
2178 * ended our handle will be dead. It's important that
2179 * we do this after sleeping, so that we don't enter
2180 * an endless loop. */
2181 fd = safe_close(fd);
2186 r = reset_terminal_fd(fd, true);
2188 log_warning_errno(r, "Failed to reset terminal: %m");
2199 int release_terminal(void) {
2200 static const struct sigaction sa_new = {
2201 .sa_handler = SIG_IGN,
2202 .sa_flags = SA_RESTART,
2205 _cleanup_close_ int fd = -1;
2206 struct sigaction sa_old;
2209 fd = open("/dev/tty", O_RDWR|O_NOCTTY|O_NDELAY|O_CLOEXEC);
2213 /* Temporarily ignore SIGHUP, so that we don't get SIGHUP'ed
2214 * by our own TIOCNOTTY */
2215 assert_se(sigaction(SIGHUP, &sa_new, &sa_old) == 0);
2217 if (ioctl(fd, TIOCNOTTY) < 0)
2220 assert_se(sigaction(SIGHUP, &sa_old, NULL) == 0);
2225 int sigaction_many(const struct sigaction *sa, ...) {
2230 while ((sig = va_arg(ap, int)) > 0)
2231 if (sigaction(sig, sa, NULL) < 0)
2238 int ignore_signals(int sig, ...) {
2239 struct sigaction sa = {
2240 .sa_handler = SIG_IGN,
2241 .sa_flags = SA_RESTART,
2246 if (sigaction(sig, &sa, NULL) < 0)
2250 while ((sig = va_arg(ap, int)) > 0)
2251 if (sigaction(sig, &sa, NULL) < 0)
2258 int default_signals(int sig, ...) {
2259 struct sigaction sa = {
2260 .sa_handler = SIG_DFL,
2261 .sa_flags = SA_RESTART,
2266 if (sigaction(sig, &sa, NULL) < 0)
2270 while ((sig = va_arg(ap, int)) > 0)
2271 if (sigaction(sig, &sa, NULL) < 0)
2278 void safe_close_pair(int p[]) {
2282 /* Special case pairs which use the same fd in both
2284 p[0] = p[1] = safe_close(p[0]);
2288 p[0] = safe_close(p[0]);
2289 p[1] = safe_close(p[1]);
2292 ssize_t loop_read(int fd, void *buf, size_t nbytes, bool do_poll) {
2299 while (nbytes > 0) {
2302 k = read(fd, p, nbytes);
2307 if (errno == EAGAIN && do_poll) {
2309 /* We knowingly ignore any return value here,
2310 * and expect that any error/EOF is reported
2313 fd_wait_for_event(fd, POLLIN, USEC_INFINITY);
2317 return n > 0 ? n : -errno;
2331 int loop_write(int fd, const void *buf, size_t nbytes, bool do_poll) {
2332 const uint8_t *p = buf;
2339 while (nbytes > 0) {
2342 k = write(fd, p, nbytes);
2347 if (errno == EAGAIN && do_poll) {
2348 /* We knowingly ignore any return value here,
2349 * and expect that any error/EOF is reported
2352 fd_wait_for_event(fd, POLLOUT, USEC_INFINITY);
2359 if (k == 0) /* Can't really happen */
2369 int parse_size(const char *t, off_t base, off_t *size) {
2371 /* Soo, sometimes we want to parse IEC binary suffxies, and
2372 * sometimes SI decimal suffixes. This function can parse
2373 * both. Which one is the right way depends on the
2374 * context. Wikipedia suggests that SI is customary for
2375 * hardrware metrics and network speeds, while IEC is
2376 * customary for most data sizes used by software and volatile
2377 * (RAM) memory. Hence be careful which one you pick!
2379 * In either case we use just K, M, G as suffix, and not Ki,
2380 * Mi, Gi or so (as IEC would suggest). That's because that's
2381 * frickin' ugly. But this means you really need to make sure
2382 * to document which base you are parsing when you use this
2387 unsigned long long factor;
2390 static const struct table iec[] = {
2391 { "E", 1024ULL*1024ULL*1024ULL*1024ULL*1024ULL*1024ULL },
2392 { "P", 1024ULL*1024ULL*1024ULL*1024ULL*1024ULL },
2393 { "T", 1024ULL*1024ULL*1024ULL*1024ULL },
2394 { "G", 1024ULL*1024ULL*1024ULL },
2395 { "M", 1024ULL*1024ULL },
2401 static const struct table si[] = {
2402 { "E", 1000ULL*1000ULL*1000ULL*1000ULL*1000ULL*1000ULL },
2403 { "P", 1000ULL*1000ULL*1000ULL*1000ULL*1000ULL },
2404 { "T", 1000ULL*1000ULL*1000ULL*1000ULL },
2405 { "G", 1000ULL*1000ULL*1000ULL },
2406 { "M", 1000ULL*1000ULL },
2412 const struct table *table;
2414 unsigned long long r = 0;
2415 unsigned n_entries, start_pos = 0;
2418 assert(base == 1000 || base == 1024);
2423 n_entries = ELEMENTSOF(si);
2426 n_entries = ELEMENTSOF(iec);
2432 unsigned long long l2;
2438 l = strtoll(p, &e, 10);
2451 if (*e >= '0' && *e <= '9') {
2454 /* strotoull itself would accept space/+/- */
2455 l2 = strtoull(e, &e2, 10);
2457 if (errno == ERANGE)
2460 /* Ignore failure. E.g. 10.M is valid */
2467 e += strspn(e, WHITESPACE);
2469 for (i = start_pos; i < n_entries; i++)
2470 if (startswith(e, table[i].suffix)) {
2471 unsigned long long tmp;
2472 if ((unsigned long long) l + (frac > 0) > ULLONG_MAX / table[i].factor)
2474 tmp = l * table[i].factor + (unsigned long long) (frac * table[i].factor);
2475 if (tmp > ULLONG_MAX - r)
2479 if ((unsigned long long) (off_t) r != r)
2482 p = e + strlen(table[i].suffix);
2498 int make_stdio(int fd) {
2503 r = dup2(fd, STDIN_FILENO);
2504 s = dup2(fd, STDOUT_FILENO);
2505 t = dup2(fd, STDERR_FILENO);
2510 if (r < 0 || s < 0 || t < 0)
2513 /* Explicitly unset O_CLOEXEC, since if fd was < 3, then
2514 * dup2() was a NOP and the bit hence possibly set. */
2515 fd_cloexec(STDIN_FILENO, false);
2516 fd_cloexec(STDOUT_FILENO, false);
2517 fd_cloexec(STDERR_FILENO, false);
2522 int make_null_stdio(void) {
2525 null_fd = open("/dev/null", O_RDWR|O_NOCTTY);
2529 return make_stdio(null_fd);
2532 bool is_device_path(const char *path) {
2534 /* Returns true on paths that refer to a device, either in
2535 * sysfs or in /dev */
2538 path_startswith(path, "/dev/") ||
2539 path_startswith(path, "/sys/");
2542 int dir_is_empty(const char *path) {
2543 _cleanup_closedir_ DIR *d;
2554 if (!de && errno != 0)
2560 if (!hidden_file(de->d_name))
2565 char* dirname_malloc(const char *path) {
2566 char *d, *dir, *dir2;
2583 int dev_urandom(void *p, size_t n) {
2584 static int have_syscall = -1;
2588 /* Gathers some randomness from the kernel. This call will
2589 * never block, and will always return some data from the
2590 * kernel, regardless if the random pool is fully initialized
2591 * or not. It thus makes no guarantee for the quality of the
2592 * returned entropy, but is good enough for or usual usecases
2593 * of seeding the hash functions for hashtable */
2595 /* Use the getrandom() syscall unless we know we don't have
2596 * it, or when the requested size is too large for it. */
2597 if (have_syscall != 0 || (size_t) (int) n != n) {
2598 r = getrandom(p, n, GRND_NONBLOCK);
2600 have_syscall = true;
2605 if (errno == ENOSYS)
2606 /* we lack the syscall, continue with
2607 * reading from /dev/urandom */
2608 have_syscall = false;
2609 else if (errno == EAGAIN)
2610 /* not enough entropy for now. Let's
2611 * remember to use the syscall the
2612 * next time, again, but also read
2613 * from /dev/urandom for now, which
2614 * doesn't care about the current
2615 * amount of entropy. */
2616 have_syscall = true;
2620 /* too short read? */
2624 fd = open("/dev/urandom", O_RDONLY|O_CLOEXEC|O_NOCTTY);
2626 return errno == ENOENT ? -ENOSYS : -errno;
2628 k = loop_read(fd, p, n, true);
2633 if ((size_t) k != n)
2639 void initialize_srand(void) {
2640 static bool srand_called = false;
2642 #ifdef HAVE_SYS_AUXV_H
2651 #ifdef HAVE_SYS_AUXV_H
2652 /* The kernel provides us with a bit of entropy in auxv, so
2653 * let's try to make use of that to seed the pseudo-random
2654 * generator. It's better than nothing... */
2656 auxv = (void*) getauxval(AT_RANDOM);
2658 x ^= *(unsigned*) auxv;
2661 x ^= (unsigned) now(CLOCK_REALTIME);
2662 x ^= (unsigned) gettid();
2665 srand_called = true;
2668 void random_bytes(void *p, size_t n) {
2672 r = dev_urandom(p, n);
2676 /* If some idiot made /dev/urandom unavailable to us, he'll
2677 * get a PRNG instead. */
2681 for (q = p; q < (uint8_t*) p + n; q ++)
2685 void rename_process(const char name[8]) {
2688 /* This is a like a poor man's setproctitle(). It changes the
2689 * comm field, argv[0], and also the glibc's internally used
2690 * name of the process. For the first one a limit of 16 chars
2691 * applies, to the second one usually one of 10 (i.e. length
2692 * of "/sbin/init"), to the third one one of 7 (i.e. length of
2693 * "systemd"). If you pass a longer string it will be
2696 prctl(PR_SET_NAME, name);
2698 if (program_invocation_name)
2699 strncpy(program_invocation_name, name, strlen(program_invocation_name));
2701 if (saved_argc > 0) {
2705 strncpy(saved_argv[0], name, strlen(saved_argv[0]));
2707 for (i = 1; i < saved_argc; i++) {
2711 memzero(saved_argv[i], strlen(saved_argv[i]));
2716 void sigset_add_many(sigset_t *ss, ...) {
2723 while ((sig = va_arg(ap, int)) > 0)
2724 assert_se(sigaddset(ss, sig) == 0);
2728 int sigprocmask_many(int how, ...) {
2733 assert_se(sigemptyset(&ss) == 0);
2736 while ((sig = va_arg(ap, int)) > 0)
2737 assert_se(sigaddset(&ss, sig) == 0);
2740 if (sigprocmask(how, &ss, NULL) < 0)
2746 char* gethostname_malloc(void) {
2749 assert_se(uname(&u) >= 0);
2751 if (!isempty(u.nodename) && !streq(u.nodename, "(none)"))
2752 return strdup(u.nodename);
2754 return strdup(u.sysname);
2757 bool hostname_is_set(void) {
2760 assert_se(uname(&u) >= 0);
2762 return !isempty(u.nodename) && !streq(u.nodename, "(none)");
2765 char *lookup_uid(uid_t uid) {
2768 _cleanup_free_ char *buf = NULL;
2769 struct passwd pwbuf, *pw = NULL;
2771 /* Shortcut things to avoid NSS lookups */
2773 return strdup("root");
2775 bufsize = sysconf(_SC_GETPW_R_SIZE_MAX);
2779 buf = malloc(bufsize);
2783 if (getpwuid_r(uid, &pwbuf, buf, bufsize, &pw) == 0 && pw)
2784 return strdup(pw->pw_name);
2786 if (asprintf(&name, UID_FMT, uid) < 0)
2792 char* getlogname_malloc(void) {
2796 if (isatty(STDIN_FILENO) && fstat(STDIN_FILENO, &st) >= 0)
2801 return lookup_uid(uid);
2804 char *getusername_malloc(void) {
2811 return lookup_uid(getuid());
2814 int getttyname_malloc(int fd, char **ret) {
2824 r = ttyname_r(fd, path, sizeof(path));
2829 p = startswith(path, "/dev/");
2830 c = strdup(p ?: path);
2847 int getttyname_harder(int fd, char **r) {
2851 k = getttyname_malloc(fd, &s);
2855 if (streq(s, "tty")) {
2857 return get_ctty(0, NULL, r);
2864 int get_ctty_devnr(pid_t pid, dev_t *d) {
2866 _cleanup_free_ char *line = NULL;
2868 unsigned long ttynr;
2872 p = procfs_file_alloca(pid, "stat");
2873 r = read_one_line_file(p, &line);
2877 p = strrchr(line, ')');
2887 "%*d " /* session */
2892 if (major(ttynr) == 0 && minor(ttynr) == 0)
2901 int get_ctty(pid_t pid, dev_t *_devnr, char **r) {
2902 char fn[sizeof("/dev/char/")-1 + 2*DECIMAL_STR_MAX(unsigned) + 1 + 1], *b = NULL;
2903 _cleanup_free_ char *s = NULL;
2910 k = get_ctty_devnr(pid, &devnr);
2914 sprintf(fn, "/dev/char/%u:%u", major(devnr), minor(devnr));
2916 k = readlink_malloc(fn, &s);
2922 /* This is an ugly hack */
2923 if (major(devnr) == 136) {
2924 asprintf(&b, "pts/%u", minor(devnr));
2928 /* Probably something like the ptys which have no
2929 * symlink in /dev/char. Let's return something
2930 * vaguely useful. */
2936 if (startswith(s, "/dev/"))
2938 else if (startswith(s, "../"))
2956 int rm_rf_children_dangerous(int fd, bool only_dirs, bool honour_sticky, struct stat *root_dev) {
2957 _cleanup_closedir_ DIR *d = NULL;
2962 /* This returns the first error we run into, but nevertheless
2963 * tries to go on. This closes the passed fd. */
2969 return errno == ENOENT ? 0 : -errno;
2974 bool is_dir, keep_around;
2981 if (errno != 0 && ret == 0)
2986 if (streq(de->d_name, ".") || streq(de->d_name, ".."))
2989 if (de->d_type == DT_UNKNOWN ||
2991 (de->d_type == DT_DIR && root_dev)) {
2992 if (fstatat(fd, de->d_name, &st, AT_SYMLINK_NOFOLLOW) < 0) {
2993 if (ret == 0 && errno != ENOENT)
2998 is_dir = S_ISDIR(st.st_mode);
3001 (st.st_uid == 0 || st.st_uid == getuid()) &&
3002 (st.st_mode & S_ISVTX);
3004 is_dir = de->d_type == DT_DIR;
3005 keep_around = false;
3011 /* if root_dev is set, remove subdirectories only, if device is same as dir */
3012 if (root_dev && st.st_dev != root_dev->st_dev)
3015 subdir_fd = openat(fd, de->d_name,
3016 O_RDONLY|O_NONBLOCK|O_DIRECTORY|O_CLOEXEC|O_NOFOLLOW|O_NOATIME);
3017 if (subdir_fd < 0) {
3018 if (ret == 0 && errno != ENOENT)
3023 r = rm_rf_children_dangerous(subdir_fd, only_dirs, honour_sticky, root_dev);
3024 if (r < 0 && ret == 0)
3028 if (unlinkat(fd, de->d_name, AT_REMOVEDIR) < 0) {
3029 if (ret == 0 && errno != ENOENT)
3033 } else if (!only_dirs && !keep_around) {
3035 if (unlinkat(fd, de->d_name, 0) < 0) {
3036 if (ret == 0 && errno != ENOENT)
3043 _pure_ static int is_temporary_fs(struct statfs *s) {
3046 return F_TYPE_EQUAL(s->f_type, TMPFS_MAGIC) ||
3047 F_TYPE_EQUAL(s->f_type, RAMFS_MAGIC);
3050 int is_fd_on_temporary_fs(int fd) {
3053 if (fstatfs(fd, &s) < 0)
3056 return is_temporary_fs(&s);
3059 int rm_rf_children(int fd, bool only_dirs, bool honour_sticky, struct stat *root_dev) {
3064 if (fstatfs(fd, &s) < 0) {
3069 /* We refuse to clean disk file systems with this call. This
3070 * is extra paranoia just to be sure we never ever remove
3072 if (!is_temporary_fs(&s)) {
3073 log_error("Attempted to remove disk file system, and we can't allow that.");
3078 return rm_rf_children_dangerous(fd, only_dirs, honour_sticky, root_dev);
3081 static int file_is_priv_sticky(const char *p) {
3086 if (lstat(p, &st) < 0)
3090 (st.st_uid == 0 || st.st_uid == getuid()) &&
3091 (st.st_mode & S_ISVTX);
3094 static int rm_rf_internal(const char *path, bool only_dirs, bool delete_root, bool honour_sticky, bool dangerous) {
3100 /* We refuse to clean the root file system with this
3101 * call. This is extra paranoia to never cause a really
3102 * seriously broken system. */
3103 if (path_equal(path, "/")) {
3104 log_error("Attempted to remove entire root file system, and we can't allow that.");
3108 fd = open(path, O_RDONLY|O_NONBLOCK|O_DIRECTORY|O_CLOEXEC|O_NOFOLLOW|O_NOATIME);
3111 if (errno != ENOTDIR && errno != ELOOP)
3115 if (statfs(path, &s) < 0)
3118 if (!is_temporary_fs(&s)) {
3119 log_error("Attempted to remove disk file system, and we can't allow that.");
3124 if (delete_root && !only_dirs)
3125 if (unlink(path) < 0 && errno != ENOENT)
3132 if (fstatfs(fd, &s) < 0) {
3137 if (!is_temporary_fs(&s)) {
3138 log_error("Attempted to remove disk file system, and we can't allow that.");
3144 r = rm_rf_children_dangerous(fd, only_dirs, honour_sticky, NULL);
3147 if (honour_sticky && file_is_priv_sticky(path) > 0)
3150 if (rmdir(path) < 0 && errno != ENOENT) {
3159 int rm_rf(const char *path, bool only_dirs, bool delete_root, bool honour_sticky) {
3160 return rm_rf_internal(path, only_dirs, delete_root, honour_sticky, false);
3163 int rm_rf_dangerous(const char *path, bool only_dirs, bool delete_root, bool honour_sticky) {
3164 return rm_rf_internal(path, only_dirs, delete_root, honour_sticky, true);
3167 int chmod_and_chown(const char *path, mode_t mode, uid_t uid, gid_t gid) {
3170 /* Under the assumption that we are running privileged we
3171 * first change the access mode and only then hand out
3172 * ownership to avoid a window where access is too open. */
3174 if (mode != MODE_INVALID)
3175 if (chmod(path, mode) < 0)
3178 if (uid != UID_INVALID || gid != GID_INVALID)
3179 if (chown(path, uid, gid) < 0)
3185 int fchmod_and_fchown(int fd, mode_t mode, uid_t uid, gid_t gid) {
3188 /* Under the assumption that we are running privileged we
3189 * first change the access mode and only then hand out
3190 * ownership to avoid a window where access is too open. */
3192 if (mode != MODE_INVALID)
3193 if (fchmod(fd, mode) < 0)
3196 if (uid != UID_INVALID || gid != GID_INVALID)
3197 if (fchown(fd, uid, gid) < 0)
3203 cpu_set_t* cpu_set_malloc(unsigned *ncpus) {
3207 /* Allocates the cpuset in the right size */
3210 if (!(r = CPU_ALLOC(n)))
3213 if (sched_getaffinity(0, CPU_ALLOC_SIZE(n), r) >= 0) {
3214 CPU_ZERO_S(CPU_ALLOC_SIZE(n), r);
3224 if (errno != EINVAL)
3231 int status_vprintf(const char *status, bool ellipse, bool ephemeral, const char *format, va_list ap) {
3232 static const char status_indent[] = " "; /* "[" STATUS "] " */
3233 _cleanup_free_ char *s = NULL;
3234 _cleanup_close_ int fd = -1;
3235 struct iovec iovec[6] = {};
3237 static bool prev_ephemeral;
3241 /* This is independent of logging, as status messages are
3242 * optional and go exclusively to the console. */
3244 if (vasprintf(&s, format, ap) < 0)
3247 fd = open_terminal("/dev/console", O_WRONLY|O_NOCTTY|O_CLOEXEC);
3260 sl = status ? sizeof(status_indent)-1 : 0;
3266 e = ellipsize(s, emax, 50);
3274 IOVEC_SET_STRING(iovec[n++], "\r" ANSI_ERASE_TO_END_OF_LINE);
3275 prev_ephemeral = ephemeral;
3278 if (!isempty(status)) {
3279 IOVEC_SET_STRING(iovec[n++], "[");
3280 IOVEC_SET_STRING(iovec[n++], status);
3281 IOVEC_SET_STRING(iovec[n++], "] ");
3283 IOVEC_SET_STRING(iovec[n++], status_indent);
3286 IOVEC_SET_STRING(iovec[n++], s);
3288 IOVEC_SET_STRING(iovec[n++], "\n");
3290 if (writev(fd, iovec, n) < 0)
3296 int status_printf(const char *status, bool ellipse, bool ephemeral, const char *format, ...) {
3302 va_start(ap, format);
3303 r = status_vprintf(status, ellipse, ephemeral, format, ap);
3309 char *replace_env(const char *format, char **env) {
3316 const char *e, *word = format;
3321 for (e = format; *e; e ++) {
3332 k = strnappend(r, word, e-word-1);
3342 } else if (*e == '$') {
3343 k = strnappend(r, word, e-word);
3360 t = strempty(strv_env_get_n(env, word+2, e-word-2));
3362 k = strappend(r, t);
3376 k = strnappend(r, word, e-word);
3388 char **replace_env_argv(char **argv, char **env) {
3390 unsigned k = 0, l = 0;
3392 l = strv_length(argv);
3394 ret = new(char*, l+1);
3398 STRV_FOREACH(i, argv) {
3400 /* If $FOO appears as single word, replace it by the split up variable */
3401 if ((*i)[0] == '$' && (*i)[1] != '{') {
3406 e = strv_env_get(env, *i+1);
3410 r = strv_split_quoted(&m, e, true);
3422 w = realloc(ret, sizeof(char*) * (l+1));
3432 memcpy(ret + k, m, q * sizeof(char*));
3440 /* If ${FOO} appears as part of a word, replace it by the variable as-is */
3441 ret[k] = replace_env(*i, env);
3453 int fd_columns(int fd) {
3454 struct winsize ws = {};
3456 if (ioctl(fd, TIOCGWINSZ, &ws) < 0)
3465 unsigned columns(void) {
3469 if (_likely_(cached_columns > 0))
3470 return cached_columns;
3473 e = getenv("COLUMNS");
3475 (void) safe_atoi(e, &c);
3478 c = fd_columns(STDOUT_FILENO);
3484 return cached_columns;
3487 int fd_lines(int fd) {
3488 struct winsize ws = {};
3490 if (ioctl(fd, TIOCGWINSZ, &ws) < 0)
3499 unsigned lines(void) {
3503 if (_likely_(cached_lines > 0))
3504 return cached_lines;
3507 e = getenv("LINES");
3509 (void) safe_atoi(e, &l);
3512 l = fd_lines(STDOUT_FILENO);
3518 return cached_lines;
3521 /* intended to be used as a SIGWINCH sighandler */
3522 void columns_lines_cache_reset(int signum) {
3528 static int cached_on_tty = -1;
3530 if (_unlikely_(cached_on_tty < 0))
3531 cached_on_tty = isatty(STDOUT_FILENO) > 0;
3533 return cached_on_tty;
3536 int files_same(const char *filea, const char *fileb) {
3539 if (stat(filea, &a) < 0)
3542 if (stat(fileb, &b) < 0)
3545 return a.st_dev == b.st_dev &&
3546 a.st_ino == b.st_ino;
3549 int running_in_chroot(void) {
3552 ret = files_same("/proc/1/root", "/");
3559 static char *ascii_ellipsize_mem(const char *s, size_t old_length, size_t new_length, unsigned percent) {
3564 assert(percent <= 100);
3565 assert(new_length >= 3);
3567 if (old_length <= 3 || old_length <= new_length)
3568 return strndup(s, old_length);
3570 r = new0(char, new_length+1);
3574 x = (new_length * percent) / 100;
3576 if (x > new_length - 3)
3584 s + old_length - (new_length - x - 3),
3585 new_length - x - 3);
3590 char *ellipsize_mem(const char *s, size_t old_length, size_t new_length, unsigned percent) {
3594 unsigned k, len, len2;
3597 assert(percent <= 100);
3598 assert(new_length >= 3);
3600 /* if no multibyte characters use ascii_ellipsize_mem for speed */
3601 if (ascii_is_valid(s))
3602 return ascii_ellipsize_mem(s, old_length, new_length, percent);
3604 if (old_length <= 3 || old_length <= new_length)
3605 return strndup(s, old_length);
3607 x = (new_length * percent) / 100;
3609 if (x > new_length - 3)
3613 for (i = s; k < x && i < s + old_length; i = utf8_next_char(i)) {
3616 c = utf8_encoded_to_unichar(i);
3619 k += unichar_iswide(c) ? 2 : 1;
3622 if (k > x) /* last character was wide and went over quota */
3625 for (j = s + old_length; k < new_length && j > i; ) {
3628 j = utf8_prev_char(j);
3629 c = utf8_encoded_to_unichar(j);
3632 k += unichar_iswide(c) ? 2 : 1;
3636 /* we don't actually need to ellipsize */
3638 return memdup(s, old_length + 1);
3640 /* make space for ellipsis */
3641 j = utf8_next_char(j);
3644 len2 = s + old_length - j;
3645 e = new(char, len + 3 + len2 + 1);
3650 printf("old_length=%zu new_length=%zu x=%zu len=%u len2=%u k=%u\n",
3651 old_length, new_length, x, len, len2, k);
3655 e[len] = 0xe2; /* tri-dot ellipsis: … */
3659 memcpy(e + len + 3, j, len2 + 1);
3664 char *ellipsize(const char *s, size_t length, unsigned percent) {
3665 return ellipsize_mem(s, strlen(s), length, percent);
3668 int touch_file(const char *path, bool parents, usec_t stamp, uid_t uid, gid_t gid, mode_t mode) {
3669 _cleanup_close_ int fd;
3675 mkdir_parents(path, 0755);
3677 fd = open(path, O_WRONLY|O_CREAT|O_CLOEXEC|O_NOCTTY, mode > 0 ? mode : 0644);
3682 r = fchmod(fd, mode);
3687 if (uid != UID_INVALID || gid != GID_INVALID) {
3688 r = fchown(fd, uid, gid);
3693 if (stamp != USEC_INFINITY) {
3694 struct timespec ts[2];
3696 timespec_store(&ts[0], stamp);
3698 r = futimens(fd, ts);
3700 r = futimens(fd, NULL);
3707 int touch(const char *path) {
3708 return touch_file(path, false, USEC_INFINITY, UID_INVALID, GID_INVALID, 0);
3711 char *unquote(const char *s, const char* quotes) {
3715 /* This is rather stupid, simply removes the heading and
3716 * trailing quotes if there is one. Doesn't care about
3717 * escaping or anything. We should make this smarter one
3724 if (strchr(quotes, s[0]) && s[l-1] == s[0])
3725 return strndup(s+1, l-2);
3730 char *normalize_env_assignment(const char *s) {
3731 _cleanup_free_ char *value = NULL;
3735 eq = strchr(s, '=');
3745 memmove(r, t, strlen(t) + 1);
3750 name = strndupa(s, eq - s);
3751 p = strdupa(eq + 1);
3753 value = unquote(strstrip(p), QUOTES);
3757 return strjoin(strstrip(name), "=", value, NULL);
3760 int wait_for_terminate(pid_t pid, siginfo_t *status) {
3771 if (waitid(P_PID, pid, status, WEXITED) < 0) {
3785 * < 0 : wait_for_terminate() failed to get the state of the
3786 * process, the process was terminated by a signal, or
3787 * failed for an unknown reason.
3788 * >=0 : The process terminated normally, and its exit code is
3791 * That is, success is indicated by a return value of zero, and an
3792 * error is indicated by a non-zero value.
3794 * A warning is emitted if the process terminates abnormally,
3795 * and also if it returns non-zero unless check_exit_code is true.
3797 int wait_for_terminate_and_warn(const char *name, pid_t pid, bool check_exit_code) {
3804 r = wait_for_terminate(pid, &status);
3806 return log_warning_errno(r, "Failed to wait for %s: %m", name);
3808 if (status.si_code == CLD_EXITED) {
3809 if (status.si_status != 0)
3810 log_full(check_exit_code ? LOG_WARNING : LOG_DEBUG,
3811 "%s failed with error code %i.", name, status.si_status);
3813 log_debug("%s succeeded.", name);
3815 return status.si_status;
3816 } else if (status.si_code == CLD_KILLED ||
3817 status.si_code == CLD_DUMPED) {
3819 log_warning("%s terminated by signal %s.", name, signal_to_string(status.si_status));
3823 log_warning("%s failed due to unknown reason.", name);
3827 noreturn void freeze(void) {
3829 /* Make sure nobody waits for us on a socket anymore */
3830 close_all_fds(NULL, 0);
3838 bool null_or_empty(struct stat *st) {
3841 if (S_ISREG(st->st_mode) && st->st_size <= 0)
3844 if (S_ISCHR(st->st_mode) || S_ISBLK(st->st_mode))
3850 int null_or_empty_path(const char *fn) {
3855 if (stat(fn, &st) < 0)
3858 return null_or_empty(&st);
3861 int null_or_empty_fd(int fd) {
3866 if (fstat(fd, &st) < 0)
3869 return null_or_empty(&st);
3872 DIR *xopendirat(int fd, const char *name, int flags) {
3876 assert(!(flags & O_CREAT));
3878 nfd = openat(fd, name, O_RDONLY|O_NONBLOCK|O_DIRECTORY|O_CLOEXEC|flags, 0);
3891 int signal_from_string_try_harder(const char *s) {
3895 signo = signal_from_string(s);
3897 if (startswith(s, "SIG"))
3898 return signal_from_string(s+3);
3903 static char *tag_to_udev_node(const char *tagvalue, const char *by) {
3904 _cleanup_free_ char *t = NULL, *u = NULL;
3907 u = unquote(tagvalue, "\"\'");
3911 enc_len = strlen(u) * 4 + 1;
3912 t = new(char, enc_len);
3916 if (encode_devnode_name(u, t, enc_len) < 0)
3919 return strjoin("/dev/disk/by-", by, "/", t, NULL);
3922 char *fstab_node_to_udev_node(const char *p) {
3925 if (startswith(p, "LABEL="))
3926 return tag_to_udev_node(p+6, "label");
3928 if (startswith(p, "UUID="))
3929 return tag_to_udev_node(p+5, "uuid");
3931 if (startswith(p, "PARTUUID="))
3932 return tag_to_udev_node(p+9, "partuuid");
3934 if (startswith(p, "PARTLABEL="))
3935 return tag_to_udev_node(p+10, "partlabel");
3940 bool tty_is_vc(const char *tty) {
3943 return vtnr_from_tty(tty) >= 0;
3946 bool tty_is_console(const char *tty) {
3949 if (startswith(tty, "/dev/"))
3952 return streq(tty, "console");
3955 int vtnr_from_tty(const char *tty) {
3960 if (startswith(tty, "/dev/"))
3963 if (!startswith(tty, "tty") )
3966 if (tty[3] < '0' || tty[3] > '9')
3969 r = safe_atoi(tty+3, &i);
3973 if (i < 0 || i > 63)
3979 char *resolve_dev_console(char **active) {
3982 /* Resolve where /dev/console is pointing to, if /sys is actually ours
3983 * (i.e. not read-only-mounted which is a sign for container setups) */
3985 if (path_is_read_only_fs("/sys") > 0)
3988 if (read_one_line_file("/sys/class/tty/console/active", active) < 0)
3991 /* If multiple log outputs are configured the last one is what
3992 * /dev/console points to */
3993 tty = strrchr(*active, ' ');
3999 if (streq(tty, "tty0")) {
4002 /* Get the active VC (e.g. tty1) */
4003 if (read_one_line_file("/sys/class/tty/tty0/active", &tmp) >= 0) {
4005 tty = *active = tmp;
4012 bool tty_is_vc_resolve(const char *tty) {
4013 _cleanup_free_ char *active = NULL;
4017 if (startswith(tty, "/dev/"))
4020 if (streq(tty, "console")) {
4021 tty = resolve_dev_console(&active);
4026 return tty_is_vc(tty);
4029 const char *default_term_for_tty(const char *tty) {
4032 return tty_is_vc_resolve(tty) ? "TERM=linux" : "TERM=vt220";
4035 bool dirent_is_file(const struct dirent *de) {
4038 if (hidden_file(de->d_name))
4041 if (de->d_type != DT_REG &&
4042 de->d_type != DT_LNK &&
4043 de->d_type != DT_UNKNOWN)
4049 bool dirent_is_file_with_suffix(const struct dirent *de, const char *suffix) {
4052 if (de->d_type != DT_REG &&
4053 de->d_type != DT_LNK &&
4054 de->d_type != DT_UNKNOWN)
4057 if (hidden_file_allow_backup(de->d_name))
4060 return endswith(de->d_name, suffix);
4063 static int do_execute(char **directories, usec_t timeout, char *argv[]) {
4064 _cleanup_hashmap_free_free_ Hashmap *pids = NULL;
4065 _cleanup_set_free_free_ Set *seen = NULL;
4068 /* We fork this all off from a child process so that we can
4069 * somewhat cleanly make use of SIGALRM to set a time limit */
4071 reset_all_signal_handlers();
4072 reset_signal_mask();
4074 assert_se(prctl(PR_SET_PDEATHSIG, SIGTERM) == 0);
4076 pids = hashmap_new(NULL);
4080 seen = set_new(&string_hash_ops);
4084 STRV_FOREACH(directory, directories) {
4085 _cleanup_closedir_ DIR *d;
4088 d = opendir(*directory);
4090 if (errno == ENOENT)
4093 return log_error_errno(errno, "Failed to open directory %s: %m", *directory);
4096 FOREACH_DIRENT(de, d, break) {
4097 _cleanup_free_ char *path = NULL;
4101 if (!dirent_is_file(de))
4104 if (set_contains(seen, de->d_name)) {
4105 log_debug("%1$s/%2$s skipped (%2$s was already seen).", *directory, de->d_name);
4109 r = set_put_strdup(seen, de->d_name);
4113 path = strjoin(*directory, "/", de->d_name, NULL);
4117 if (null_or_empty_path(path)) {
4118 log_debug("%s is empty (a mask).", path);
4121 log_debug("%s will be executed.", path);
4125 log_error_errno(errno, "Failed to fork: %m");
4127 } else if (pid == 0) {
4130 assert_se(prctl(PR_SET_PDEATHSIG, SIGTERM) == 0);
4140 return log_error_errno(errno, "Failed to execute %s: %m", path);
4143 log_debug("Spawned %s as " PID_FMT ".", path, pid);
4145 r = hashmap_put(pids, UINT_TO_PTR(pid), path);
4152 /* Abort execution of this process after the timout. We simply
4153 * rely on SIGALRM as default action terminating the process,
4154 * and turn on alarm(). */
4156 if (timeout != USEC_INFINITY)
4157 alarm((timeout + USEC_PER_SEC - 1) / USEC_PER_SEC);
4159 while (!hashmap_isempty(pids)) {
4160 _cleanup_free_ char *path = NULL;
4163 pid = PTR_TO_UINT(hashmap_first_key(pids));
4166 path = hashmap_remove(pids, UINT_TO_PTR(pid));
4169 wait_for_terminate_and_warn(path, pid, true);
4175 void execute_directories(const char* const* directories, usec_t timeout, char *argv[]) {
4179 char **dirs = (char**) directories;
4181 assert(!strv_isempty(dirs));
4183 name = basename(dirs[0]);
4184 assert(!isempty(name));
4186 /* Executes all binaries in the directories in parallel and waits
4187 * for them to finish. Optionally a timeout is applied. If a file
4188 * with the same name exists in more than one directory, the
4189 * earliest one wins. */
4191 executor_pid = fork();
4192 if (executor_pid < 0) {
4193 log_error_errno(errno, "Failed to fork: %m");
4196 } else if (executor_pid == 0) {
4197 r = do_execute(dirs, timeout, argv);
4198 _exit(r < 0 ? EXIT_FAILURE : EXIT_SUCCESS);
4201 wait_for_terminate_and_warn(name, executor_pid, true);
4204 int kill_and_sigcont(pid_t pid, int sig) {
4207 r = kill(pid, sig) < 0 ? -errno : 0;
4215 bool nulstr_contains(const char*nulstr, const char *needle) {
4221 NULSTR_FOREACH(i, nulstr)
4222 if (streq(i, needle))
4228 bool plymouth_running(void) {
4229 return access("/run/plymouth/pid", F_OK) >= 0;
4232 char* strshorten(char *s, size_t l) {
4241 static bool hostname_valid_char(char c) {
4243 (c >= 'a' && c <= 'z') ||
4244 (c >= 'A' && c <= 'Z') ||
4245 (c >= '0' && c <= '9') ||
4251 bool hostname_is_valid(const char *s) {
4258 /* Doesn't accept empty hostnames, hostnames with trailing or
4259 * leading dots, and hostnames with multiple dots in a
4260 * sequence. Also ensures that the length stays below
4263 for (p = s, dot = true; *p; p++) {
4270 if (!hostname_valid_char(*p))
4280 if (p-s > HOST_NAME_MAX)
4286 char* hostname_cleanup(char *s, bool lowercase) {
4290 for (p = s, d = s, dot = true; *p; p++) {
4297 } else if (hostname_valid_char(*p)) {
4298 *(d++) = lowercase ? tolower(*p) : *p;
4309 strshorten(s, HOST_NAME_MAX);
4314 bool machine_name_is_valid(const char *s) {
4316 if (!hostname_is_valid(s))
4319 /* Machine names should be useful hostnames, but also be
4320 * useful in unit names, hence we enforce a stricter length
4329 int pipe_eof(int fd) {
4330 struct pollfd pollfd = {
4332 .events = POLLIN|POLLHUP,
4337 r = poll(&pollfd, 1, 0);
4344 return pollfd.revents & POLLHUP;
4347 int fd_wait_for_event(int fd, int event, usec_t t) {
4349 struct pollfd pollfd = {
4357 r = ppoll(&pollfd, 1, t == USEC_INFINITY ? NULL : timespec_store(&ts, t), NULL);
4364 return pollfd.revents;
4367 int fopen_temporary(const char *path, FILE **_f, char **_temp_path) {
4376 r = tempfn_xxxxxx(path, &t);
4380 fd = mkostemp_safe(t, O_WRONLY|O_CLOEXEC);
4386 f = fdopen(fd, "we");
4399 int terminal_vhangup_fd(int fd) {
4402 if (ioctl(fd, TIOCVHANGUP) < 0)
4408 int terminal_vhangup(const char *name) {
4409 _cleanup_close_ int fd;
4411 fd = open_terminal(name, O_RDWR|O_NOCTTY|O_CLOEXEC);
4415 return terminal_vhangup_fd(fd);
4418 int vt_disallocate(const char *name) {
4422 /* Deallocate the VT if possible. If not possible
4423 * (i.e. because it is the active one), at least clear it
4424 * entirely (including the scrollback buffer) */
4426 if (!startswith(name, "/dev/"))
4429 if (!tty_is_vc(name)) {
4430 /* So this is not a VT. I guess we cannot deallocate
4431 * it then. But let's at least clear the screen */
4433 fd = open_terminal(name, O_RDWR|O_NOCTTY|O_CLOEXEC);
4438 "\033[r" /* clear scrolling region */
4439 "\033[H" /* move home */
4440 "\033[2J", /* clear screen */
4447 if (!startswith(name, "/dev/tty"))
4450 r = safe_atou(name+8, &u);
4457 /* Try to deallocate */
4458 fd = open_terminal("/dev/tty0", O_RDWR|O_NOCTTY|O_CLOEXEC);
4462 r = ioctl(fd, VT_DISALLOCATE, u);
4471 /* Couldn't deallocate, so let's clear it fully with
4473 fd = open_terminal(name, O_RDWR|O_NOCTTY|O_CLOEXEC);
4478 "\033[r" /* clear scrolling region */
4479 "\033[H" /* move home */
4480 "\033[3J", /* clear screen including scrollback, requires Linux 2.6.40 */
4487 int symlink_atomic(const char *from, const char *to) {
4488 _cleanup_free_ char *t = NULL;
4494 r = tempfn_random(to, &t);
4498 if (symlink(from, t) < 0)
4501 if (rename(t, to) < 0) {
4509 int mknod_atomic(const char *path, mode_t mode, dev_t dev) {
4510 _cleanup_free_ char *t = NULL;
4515 r = tempfn_random(path, &t);
4519 if (mknod(t, mode, dev) < 0)
4522 if (rename(t, path) < 0) {
4530 int mkfifo_atomic(const char *path, mode_t mode) {
4531 _cleanup_free_ char *t = NULL;
4536 r = tempfn_random(path, &t);
4540 if (mkfifo(t, mode) < 0)
4543 if (rename(t, path) < 0) {
4551 bool display_is_local(const char *display) {
4555 display[0] == ':' &&
4556 display[1] >= '0' &&
4560 int socket_from_display(const char *display, char **path) {
4567 if (!display_is_local(display))
4570 k = strspn(display+1, "0123456789");
4572 f = new(char, strlen("/tmp/.X11-unix/X") + k + 1);
4576 c = stpcpy(f, "/tmp/.X11-unix/X");
4577 memcpy(c, display+1, k);
4586 const char **username,
4587 uid_t *uid, gid_t *gid,
4589 const char **shell) {
4597 /* We enforce some special rules for uid=0: in order to avoid
4598 * NSS lookups for root we hardcode its data. */
4600 if (streq(*username, "root") || streq(*username, "0")) {
4618 if (parse_uid(*username, &u) >= 0) {
4622 /* If there are multiple users with the same id, make
4623 * sure to leave $USER to the configured value instead
4624 * of the first occurrence in the database. However if
4625 * the uid was configured by a numeric uid, then let's
4626 * pick the real username from /etc/passwd. */
4628 *username = p->pw_name;
4631 p = getpwnam(*username);
4635 return errno > 0 ? -errno : -ESRCH;
4647 *shell = p->pw_shell;
4652 char* uid_to_name(uid_t uid) {
4657 return strdup("root");
4661 return strdup(p->pw_name);
4663 if (asprintf(&r, UID_FMT, uid) < 0)
4669 char* gid_to_name(gid_t gid) {
4674 return strdup("root");
4678 return strdup(p->gr_name);
4680 if (asprintf(&r, GID_FMT, gid) < 0)
4686 int get_group_creds(const char **groupname, gid_t *gid) {
4692 /* We enforce some special rules for gid=0: in order to avoid
4693 * NSS lookups for root we hardcode its data. */
4695 if (streq(*groupname, "root") || streq(*groupname, "0")) {
4696 *groupname = "root";
4704 if (parse_gid(*groupname, &id) >= 0) {
4709 *groupname = g->gr_name;
4712 g = getgrnam(*groupname);
4716 return errno > 0 ? -errno : -ESRCH;
4724 int in_gid(gid_t gid) {
4726 int ngroups_max, r, i;
4728 if (getgid() == gid)
4731 if (getegid() == gid)
4734 ngroups_max = sysconf(_SC_NGROUPS_MAX);
4735 assert(ngroups_max > 0);
4737 gids = alloca(sizeof(gid_t) * ngroups_max);
4739 r = getgroups(ngroups_max, gids);
4743 for (i = 0; i < r; i++)
4750 int in_group(const char *name) {
4754 r = get_group_creds(&name, &gid);
4761 int glob_exists(const char *path) {
4762 _cleanup_globfree_ glob_t g = {};
4768 k = glob(path, GLOB_NOSORT|GLOB_BRACE, NULL, &g);
4770 if (k == GLOB_NOMATCH)
4772 else if (k == GLOB_NOSPACE)
4775 return !strv_isempty(g.gl_pathv);
4777 return errno ? -errno : -EIO;
4780 int glob_extend(char ***strv, const char *path) {
4781 _cleanup_globfree_ glob_t g = {};
4786 k = glob(path, GLOB_NOSORT|GLOB_BRACE, NULL, &g);
4788 if (k == GLOB_NOMATCH)
4790 else if (k == GLOB_NOSPACE)
4792 else if (k != 0 || strv_isempty(g.gl_pathv))
4793 return errno ? -errno : -EIO;
4795 STRV_FOREACH(p, g.gl_pathv) {
4796 k = strv_extend(strv, *p);
4804 int dirent_ensure_type(DIR *d, struct dirent *de) {
4810 if (de->d_type != DT_UNKNOWN)
4813 if (fstatat(dirfd(d), de->d_name, &st, AT_SYMLINK_NOFOLLOW) < 0)
4817 S_ISREG(st.st_mode) ? DT_REG :
4818 S_ISDIR(st.st_mode) ? DT_DIR :
4819 S_ISLNK(st.st_mode) ? DT_LNK :
4820 S_ISFIFO(st.st_mode) ? DT_FIFO :
4821 S_ISSOCK(st.st_mode) ? DT_SOCK :
4822 S_ISCHR(st.st_mode) ? DT_CHR :
4823 S_ISBLK(st.st_mode) ? DT_BLK :
4829 int get_files_in_directory(const char *path, char ***list) {
4830 _cleanup_closedir_ DIR *d = NULL;
4831 size_t bufsize = 0, n = 0;
4832 _cleanup_strv_free_ char **l = NULL;
4836 /* Returns all files in a directory in *list, and the number
4837 * of files as return value. If list is NULL returns only the
4849 if (!de && errno != 0)
4854 dirent_ensure_type(d, de);
4856 if (!dirent_is_file(de))
4860 /* one extra slot is needed for the terminating NULL */
4861 if (!GREEDY_REALLOC(l, bufsize, n + 2))
4864 l[n] = strdup(de->d_name);
4875 l = NULL; /* avoid freeing */
4881 char *strjoin(const char *x, ...) {
4895 t = va_arg(ap, const char *);
4900 if (n > ((size_t) -1) - l) {
4924 t = va_arg(ap, const char *);
4938 bool is_main_thread(void) {
4939 static thread_local int cached = 0;
4941 if (_unlikely_(cached == 0))
4942 cached = getpid() == gettid() ? 1 : -1;
4947 int block_get_whole_disk(dev_t d, dev_t *ret) {
4954 /* If it has a queue this is good enough for us */
4955 if (asprintf(&p, "/sys/dev/block/%u:%u/queue", major(d), minor(d)) < 0)
4958 r = access(p, F_OK);
4966 /* If it is a partition find the originating device */
4967 if (asprintf(&p, "/sys/dev/block/%u:%u/partition", major(d), minor(d)) < 0)
4970 r = access(p, F_OK);
4976 /* Get parent dev_t */
4977 if (asprintf(&p, "/sys/dev/block/%u:%u/../dev", major(d), minor(d)) < 0)
4980 r = read_one_line_file(p, &s);
4986 r = sscanf(s, "%u:%u", &m, &n);
4992 /* Only return this if it is really good enough for us. */
4993 if (asprintf(&p, "/sys/dev/block/%u:%u/queue", m, n) < 0)
4996 r = access(p, F_OK);
5000 *ret = makedev(m, n);
5007 static const char *const ioprio_class_table[] = {
5008 [IOPRIO_CLASS_NONE] = "none",
5009 [IOPRIO_CLASS_RT] = "realtime",
5010 [IOPRIO_CLASS_BE] = "best-effort",
5011 [IOPRIO_CLASS_IDLE] = "idle"
5014 DEFINE_STRING_TABLE_LOOKUP_WITH_FALLBACK(ioprio_class, int, INT_MAX);
5016 static const char *const sigchld_code_table[] = {
5017 [CLD_EXITED] = "exited",
5018 [CLD_KILLED] = "killed",
5019 [CLD_DUMPED] = "dumped",
5020 [CLD_TRAPPED] = "trapped",
5021 [CLD_STOPPED] = "stopped",
5022 [CLD_CONTINUED] = "continued",
5025 DEFINE_STRING_TABLE_LOOKUP(sigchld_code, int);
5027 static const char *const log_facility_unshifted_table[LOG_NFACILITIES] = {
5028 [LOG_FAC(LOG_KERN)] = "kern",
5029 [LOG_FAC(LOG_USER)] = "user",
5030 [LOG_FAC(LOG_MAIL)] = "mail",
5031 [LOG_FAC(LOG_DAEMON)] = "daemon",
5032 [LOG_FAC(LOG_AUTH)] = "auth",
5033 [LOG_FAC(LOG_SYSLOG)] = "syslog",
5034 [LOG_FAC(LOG_LPR)] = "lpr",
5035 [LOG_FAC(LOG_NEWS)] = "news",
5036 [LOG_FAC(LOG_UUCP)] = "uucp",
5037 [LOG_FAC(LOG_CRON)] = "cron",
5038 [LOG_FAC(LOG_AUTHPRIV)] = "authpriv",
5039 [LOG_FAC(LOG_FTP)] = "ftp",
5040 [LOG_FAC(LOG_LOCAL0)] = "local0",
5041 [LOG_FAC(LOG_LOCAL1)] = "local1",
5042 [LOG_FAC(LOG_LOCAL2)] = "local2",
5043 [LOG_FAC(LOG_LOCAL3)] = "local3",
5044 [LOG_FAC(LOG_LOCAL4)] = "local4",
5045 [LOG_FAC(LOG_LOCAL5)] = "local5",
5046 [LOG_FAC(LOG_LOCAL6)] = "local6",
5047 [LOG_FAC(LOG_LOCAL7)] = "local7"
5050 DEFINE_STRING_TABLE_LOOKUP_WITH_FALLBACK(log_facility_unshifted, int, LOG_FAC(~0));
5052 static const char *const log_level_table[] = {
5053 [LOG_EMERG] = "emerg",
5054 [LOG_ALERT] = "alert",
5055 [LOG_CRIT] = "crit",
5057 [LOG_WARNING] = "warning",
5058 [LOG_NOTICE] = "notice",
5059 [LOG_INFO] = "info",
5060 [LOG_DEBUG] = "debug"
5063 DEFINE_STRING_TABLE_LOOKUP_WITH_FALLBACK(log_level, int, LOG_DEBUG);
5065 static const char* const sched_policy_table[] = {
5066 [SCHED_OTHER] = "other",
5067 [SCHED_BATCH] = "batch",
5068 [SCHED_IDLE] = "idle",
5069 [SCHED_FIFO] = "fifo",
5073 DEFINE_STRING_TABLE_LOOKUP_WITH_FALLBACK(sched_policy, int, INT_MAX);
5075 static const char* const rlimit_table[_RLIMIT_MAX] = {
5076 [RLIMIT_CPU] = "LimitCPU",
5077 [RLIMIT_FSIZE] = "LimitFSIZE",
5078 [RLIMIT_DATA] = "LimitDATA",
5079 [RLIMIT_STACK] = "LimitSTACK",
5080 [RLIMIT_CORE] = "LimitCORE",
5081 [RLIMIT_RSS] = "LimitRSS",
5082 [RLIMIT_NOFILE] = "LimitNOFILE",
5083 [RLIMIT_AS] = "LimitAS",
5084 [RLIMIT_NPROC] = "LimitNPROC",
5085 [RLIMIT_MEMLOCK] = "LimitMEMLOCK",
5086 [RLIMIT_LOCKS] = "LimitLOCKS",
5087 [RLIMIT_SIGPENDING] = "LimitSIGPENDING",
5088 [RLIMIT_MSGQUEUE] = "LimitMSGQUEUE",
5089 [RLIMIT_NICE] = "LimitNICE",
5090 [RLIMIT_RTPRIO] = "LimitRTPRIO",
5091 [RLIMIT_RTTIME] = "LimitRTTIME"
5094 DEFINE_STRING_TABLE_LOOKUP(rlimit, int);
5096 static const char* const ip_tos_table[] = {
5097 [IPTOS_LOWDELAY] = "low-delay",
5098 [IPTOS_THROUGHPUT] = "throughput",
5099 [IPTOS_RELIABILITY] = "reliability",
5100 [IPTOS_LOWCOST] = "low-cost",
5103 DEFINE_STRING_TABLE_LOOKUP_WITH_FALLBACK(ip_tos, int, 0xff);
5105 static const char *const __signal_table[] = {
5122 [SIGSTKFLT] = "STKFLT", /* Linux on SPARC doesn't know SIGSTKFLT */
5133 [SIGVTALRM] = "VTALRM",
5135 [SIGWINCH] = "WINCH",
5141 DEFINE_PRIVATE_STRING_TABLE_LOOKUP(__signal, int);
5143 const char *signal_to_string(int signo) {
5144 static thread_local char buf[sizeof("RTMIN+")-1 + DECIMAL_STR_MAX(int) + 1];
5147 name = __signal_to_string(signo);
5151 if (signo >= SIGRTMIN && signo <= SIGRTMAX)
5152 snprintf(buf, sizeof(buf), "RTMIN+%d", signo - SIGRTMIN);
5154 snprintf(buf, sizeof(buf), "%d", signo);
5159 int signal_from_string(const char *s) {
5164 signo = __signal_from_string(s);
5168 if (startswith(s, "RTMIN+")) {
5172 if (safe_atou(s, &u) >= 0) {
5173 signo = (int) u + offset;
5174 if (signo > 0 && signo < _NSIG)
5180 bool kexec_loaded(void) {
5181 bool loaded = false;
5184 if (read_one_line_file("/sys/kernel/kexec_loaded", &s) >= 0) {
5192 int prot_from_flags(int flags) {
5194 switch (flags & O_ACCMODE) {
5203 return PROT_READ|PROT_WRITE;
5210 char *format_bytes(char *buf, size_t l, off_t t) {
5213 static const struct {
5217 { "E", 1024ULL*1024ULL*1024ULL*1024ULL*1024ULL*1024ULL },
5218 { "P", 1024ULL*1024ULL*1024ULL*1024ULL*1024ULL },
5219 { "T", 1024ULL*1024ULL*1024ULL*1024ULL },
5220 { "G", 1024ULL*1024ULL*1024ULL },
5221 { "M", 1024ULL*1024ULL },
5225 if (t == (off_t) -1)
5228 for (i = 0; i < ELEMENTSOF(table); i++) {
5230 if (t >= table[i].factor) {
5233 (unsigned long long) (t / table[i].factor),
5234 (unsigned long long) (((t*10ULL) / table[i].factor) % 10ULL),
5241 snprintf(buf, l, "%lluB", (unsigned long long) t);
5249 void* memdup(const void *p, size_t l) {
5262 int fd_inc_sndbuf(int fd, size_t n) {
5264 socklen_t l = sizeof(value);
5266 r = getsockopt(fd, SOL_SOCKET, SO_SNDBUF, &value, &l);
5267 if (r >= 0 && l == sizeof(value) && (size_t) value >= n*2)
5270 /* If we have the privileges we will ignore the kernel limit. */
5273 if (setsockopt(fd, SOL_SOCKET, SO_SNDBUFFORCE, &value, sizeof(value)) < 0)
5274 if (setsockopt(fd, SOL_SOCKET, SO_SNDBUF, &value, sizeof(value)) < 0)
5280 int fd_inc_rcvbuf(int fd, size_t n) {
5282 socklen_t l = sizeof(value);
5284 r = getsockopt(fd, SOL_SOCKET, SO_RCVBUF, &value, &l);
5285 if (r >= 0 && l == sizeof(value) && (size_t) value >= n*2)
5288 /* If we have the privileges we will ignore the kernel limit. */
5291 if (setsockopt(fd, SOL_SOCKET, SO_RCVBUFFORCE, &value, sizeof(value)) < 0)
5292 if (setsockopt(fd, SOL_SOCKET, SO_RCVBUF, &value, sizeof(value)) < 0)
5297 int fork_agent(pid_t *pid, const int except[], unsigned n_except, const char *path, ...) {
5298 bool stdout_is_tty, stderr_is_tty;
5299 pid_t parent_pid, agent_pid;
5300 sigset_t ss, saved_ss;
5308 /* Spawns a temporary TTY agent, making sure it goes away when
5311 parent_pid = getpid();
5313 /* First we temporarily block all signals, so that the new
5314 * child has them blocked initially. This way, we can be sure
5315 * that SIGTERMs are not lost we might send to the agent. */
5316 assert_se(sigfillset(&ss) >= 0);
5317 assert_se(sigprocmask(SIG_SETMASK, &ss, &saved_ss) >= 0);
5320 if (agent_pid < 0) {
5321 assert_se(sigprocmask(SIG_SETMASK, &saved_ss, NULL) >= 0);
5325 if (agent_pid != 0) {
5326 assert_se(sigprocmask(SIG_SETMASK, &saved_ss, NULL) >= 0);
5333 * Make sure the agent goes away when the parent dies */
5334 if (prctl(PR_SET_PDEATHSIG, SIGTERM) < 0)
5335 _exit(EXIT_FAILURE);
5337 /* Make sure we actually can kill the agent, if we need to, in
5338 * case somebody invoked us from a shell script that trapped
5339 * SIGTERM or so... */
5340 reset_all_signal_handlers();
5341 reset_signal_mask();
5343 /* Check whether our parent died before we were able
5344 * to set the death signal and unblock the signals */
5345 if (getppid() != parent_pid)
5346 _exit(EXIT_SUCCESS);
5348 /* Don't leak fds to the agent */
5349 close_all_fds(except, n_except);
5351 stdout_is_tty = isatty(STDOUT_FILENO);
5352 stderr_is_tty = isatty(STDERR_FILENO);
5354 if (!stdout_is_tty || !stderr_is_tty) {
5357 /* Detach from stdout/stderr. and reopen
5358 * /dev/tty for them. This is important to
5359 * ensure that when systemctl is started via
5360 * popen() or a similar call that expects to
5361 * read EOF we actually do generate EOF and
5362 * not delay this indefinitely by because we
5363 * keep an unused copy of stdin around. */
5364 fd = open("/dev/tty", O_WRONLY);
5366 log_error_errno(errno, "Failed to open /dev/tty: %m");
5367 _exit(EXIT_FAILURE);
5371 dup2(fd, STDOUT_FILENO);
5374 dup2(fd, STDERR_FILENO);
5380 /* Count arguments */
5382 for (n = 0; va_arg(ap, char*); n++)
5387 l = alloca(sizeof(char *) * (n + 1));
5389 /* Fill in arguments */
5391 for (i = 0; i <= n; i++)
5392 l[i] = va_arg(ap, char*);
5396 _exit(EXIT_FAILURE);
5399 int setrlimit_closest(int resource, const struct rlimit *rlim) {
5400 struct rlimit highest, fixed;
5404 if (setrlimit(resource, rlim) >= 0)
5410 /* So we failed to set the desired setrlimit, then let's try
5411 * to get as close as we can */
5412 assert_se(getrlimit(resource, &highest) == 0);
5414 fixed.rlim_cur = MIN(rlim->rlim_cur, highest.rlim_max);
5415 fixed.rlim_max = MIN(rlim->rlim_max, highest.rlim_max);
5417 if (setrlimit(resource, &fixed) < 0)
5423 int getenv_for_pid(pid_t pid, const char *field, char **_value) {
5424 _cleanup_fclose_ FILE *f = NULL;
5435 path = procfs_file_alloca(pid, "environ");
5437 f = fopen(path, "re");
5445 char line[LINE_MAX];
5448 for (i = 0; i < sizeof(line)-1; i++) {
5452 if (_unlikely_(c == EOF)) {
5462 if (memcmp(line, field, l) == 0 && line[l] == '=') {
5463 value = strdup(line + l + 1);
5477 bool http_etag_is_valid(const char *etag) {
5481 if (!endswith(etag, "\""))
5484 if (!startswith(etag, "\"") && !startswith(etag, "W/\""))
5490 bool http_url_is_valid(const char *url) {
5496 p = startswith(url, "http://");
5498 p = startswith(url, "https://");
5505 return ascii_is_valid(p);
5508 bool documentation_url_is_valid(const char *url) {
5514 if (http_url_is_valid(url))
5517 p = startswith(url, "file:/");
5519 p = startswith(url, "info:");
5521 p = startswith(url, "man:");
5526 return ascii_is_valid(p);
5529 bool in_initrd(void) {
5530 static int saved = -1;
5536 /* We make two checks here:
5538 * 1. the flag file /etc/initrd-release must exist
5539 * 2. the root file system must be a memory file system
5541 * The second check is extra paranoia, since misdetecting an
5542 * initrd can have bad bad consequences due the initrd
5543 * emptying when transititioning to the main systemd.
5546 saved = access("/etc/initrd-release", F_OK) >= 0 &&
5547 statfs("/", &s) >= 0 &&
5548 is_temporary_fs(&s);
5553 void warn_melody(void) {
5554 _cleanup_close_ int fd = -1;
5556 fd = open("/dev/console", O_WRONLY|O_CLOEXEC|O_NOCTTY);
5560 /* Yeah, this is synchronous. Kinda sucks. But well... */
5562 ioctl(fd, KIOCSOUND, (int)(1193180/440));
5563 usleep(125*USEC_PER_MSEC);
5565 ioctl(fd, KIOCSOUND, (int)(1193180/220));
5566 usleep(125*USEC_PER_MSEC);
5568 ioctl(fd, KIOCSOUND, (int)(1193180/220));
5569 usleep(125*USEC_PER_MSEC);
5571 ioctl(fd, KIOCSOUND, 0);
5574 int make_console_stdio(void) {
5577 /* Make /dev/console the controlling terminal and stdin/stdout/stderr */
5579 fd = acquire_terminal("/dev/console", false, true, true, USEC_INFINITY);
5581 return log_error_errno(fd, "Failed to acquire terminal: %m");
5585 return log_error_errno(r, "Failed to duplicate terminal fd: %m");
5590 int get_home_dir(char **_h) {
5598 /* Take the user specified one */
5599 e = secure_getenv("HOME");
5600 if (e && path_is_absolute(e)) {
5609 /* Hardcode home directory for root to avoid NSS */
5612 h = strdup("/root");
5620 /* Check the database... */
5624 return errno > 0 ? -errno : -ESRCH;
5626 if (!path_is_absolute(p->pw_dir))
5629 h = strdup(p->pw_dir);
5637 int get_shell(char **_s) {
5645 /* Take the user specified one */
5646 e = getenv("SHELL");
5656 /* Hardcode home directory for root to avoid NSS */
5659 s = strdup("/bin/sh");
5667 /* Check the database... */
5671 return errno > 0 ? -errno : -ESRCH;
5673 if (!path_is_absolute(p->pw_shell))
5676 s = strdup(p->pw_shell);
5684 bool filename_is_valid(const char *p) {
5698 if (strlen(p) > FILENAME_MAX)
5704 bool string_is_safe(const char *p) {
5710 for (t = p; *t; t++) {
5711 if (*t > 0 && *t < ' ')
5714 if (strchr("\\\"\'\0x7f", *t))
5722 * Check if a string contains control characters. If 'ok' is non-NULL
5723 * it may be a string containing additional CCs to be considered OK.
5725 bool string_has_cc(const char *p, const char *ok) {
5730 for (t = p; *t; t++) {
5731 if (ok && strchr(ok, *t))
5734 if (*t > 0 && *t < ' ')
5744 bool path_is_safe(const char *p) {
5749 if (streq(p, "..") || startswith(p, "../") || endswith(p, "/..") || strstr(p, "/../"))
5752 if (strlen(p) > PATH_MAX)
5755 /* The following two checks are not really dangerous, but hey, they still are confusing */
5756 if (streq(p, ".") || startswith(p, "./") || endswith(p, "/.") || strstr(p, "/./"))
5759 if (strstr(p, "//"))
5765 /* hey glibc, APIs with callbacks without a user pointer are so useless */
5766 void *xbsearch_r(const void *key, const void *base, size_t nmemb, size_t size,
5767 int (*compar) (const void *, const void *, void *), void *arg) {
5776 p = (void *)(((const char *) base) + (idx * size));
5777 comparison = compar(key, p, arg);
5780 else if (comparison > 0)
5788 void init_gettext(void) {
5789 setlocale(LC_ALL, "");
5790 textdomain(GETTEXT_PACKAGE);
5793 bool is_locale_utf8(void) {
5795 static int cached_answer = -1;
5797 if (cached_answer >= 0)
5800 if (!setlocale(LC_ALL, "")) {
5801 cached_answer = true;
5805 set = nl_langinfo(CODESET);
5807 cached_answer = true;
5811 if (streq(set, "UTF-8")) {
5812 cached_answer = true;
5816 /* For LC_CTYPE=="C" return true, because CTYPE is effectly
5817 * unset and everything can do to UTF-8 nowadays. */
5818 set = setlocale(LC_CTYPE, NULL);
5820 cached_answer = true;
5824 /* Check result, but ignore the result if C was set
5828 !getenv("LC_ALL") &&
5829 !getenv("LC_CTYPE") &&
5833 return (bool) cached_answer;
5836 const char *draw_special_char(DrawSpecialChar ch) {
5837 static const char *draw_table[2][_DRAW_SPECIAL_CHAR_MAX] = {
5840 [DRAW_TREE_VERTICAL] = "\342\224\202 ", /* │ */
5841 [DRAW_TREE_BRANCH] = "\342\224\234\342\224\200", /* ├─ */
5842 [DRAW_TREE_RIGHT] = "\342\224\224\342\224\200", /* └─ */
5843 [DRAW_TREE_SPACE] = " ", /* */
5844 [DRAW_TRIANGULAR_BULLET] = "\342\200\243", /* ‣ */
5845 [DRAW_BLACK_CIRCLE] = "\342\227\217", /* ● */
5846 [DRAW_ARROW] = "\342\206\222", /* → */
5847 [DRAW_DASH] = "\342\200\223", /* – */
5850 /* ASCII fallback */ {
5851 [DRAW_TREE_VERTICAL] = "| ",
5852 [DRAW_TREE_BRANCH] = "|-",
5853 [DRAW_TREE_RIGHT] = "`-",
5854 [DRAW_TREE_SPACE] = " ",
5855 [DRAW_TRIANGULAR_BULLET] = ">",
5856 [DRAW_BLACK_CIRCLE] = "*",
5857 [DRAW_ARROW] = "->",
5862 return draw_table[!is_locale_utf8()][ch];
5865 char *strreplace(const char *text, const char *old_string, const char *new_string) {
5868 size_t l, old_len, new_len;
5874 old_len = strlen(old_string);
5875 new_len = strlen(new_string);
5888 if (!startswith(f, old_string)) {
5894 nl = l - old_len + new_len;
5895 a = realloc(r, nl + 1);
5903 t = stpcpy(t, new_string);
5915 char *strip_tab_ansi(char **ibuf, size_t *_isz) {
5916 const char *i, *begin = NULL;
5921 } state = STATE_OTHER;
5923 size_t osz = 0, isz;
5929 /* Strips ANSI color and replaces TABs by 8 spaces */
5931 isz = _isz ? *_isz : strlen(*ibuf);
5933 f = open_memstream(&obuf, &osz);
5937 for (i = *ibuf; i < *ibuf + isz + 1; i++) {
5942 if (i >= *ibuf + isz) /* EOT */
5944 else if (*i == '\x1B')
5945 state = STATE_ESCAPE;
5946 else if (*i == '\t')
5953 if (i >= *ibuf + isz) { /* EOT */
5956 } else if (*i == '[') {
5957 state = STATE_BRACKET;
5962 state = STATE_OTHER;
5969 if (i >= *ibuf + isz || /* EOT */
5970 (!(*i >= '0' && *i <= '9') && *i != ';' && *i != 'm')) {
5973 state = STATE_OTHER;
5975 } else if (*i == 'm')
5976 state = STATE_OTHER;
5998 int on_ac_power(void) {
5999 bool found_offline = false, found_online = false;
6000 _cleanup_closedir_ DIR *d = NULL;
6002 d = opendir("/sys/class/power_supply");
6008 _cleanup_close_ int fd = -1, device = -1;
6014 if (!de && errno != 0)
6020 if (hidden_file(de->d_name))
6023 device = openat(dirfd(d), de->d_name, O_DIRECTORY|O_RDONLY|O_CLOEXEC|O_NOCTTY);
6025 if (errno == ENOENT || errno == ENOTDIR)
6031 fd = openat(device, "type", O_RDONLY|O_CLOEXEC|O_NOCTTY);
6033 if (errno == ENOENT)
6039 n = read(fd, contents, sizeof(contents));
6043 if (n != 6 || memcmp(contents, "Mains\n", 6))
6047 fd = openat(device, "online", O_RDONLY|O_CLOEXEC|O_NOCTTY);
6049 if (errno == ENOENT)
6055 n = read(fd, contents, sizeof(contents));
6059 if (n != 2 || contents[1] != '\n')
6062 if (contents[0] == '1') {
6063 found_online = true;
6065 } else if (contents[0] == '0')
6066 found_offline = true;
6071 return found_online || !found_offline;
6074 static int search_and_fopen_internal(const char *path, const char *mode, const char *root, char **search, FILE **_f) {
6081 if (!path_strv_resolve_uniq(search, root))
6084 STRV_FOREACH(i, search) {
6085 _cleanup_free_ char *p = NULL;
6089 p = strjoin(root, *i, "/", path, NULL);
6091 p = strjoin(*i, "/", path, NULL);
6101 if (errno != ENOENT)
6108 int search_and_fopen(const char *path, const char *mode, const char *root, const char **search, FILE **_f) {
6109 _cleanup_strv_free_ char **copy = NULL;
6115 if (path_is_absolute(path)) {
6118 f = fopen(path, mode);
6127 copy = strv_copy((char**) search);
6131 return search_and_fopen_internal(path, mode, root, copy, _f);
6134 int search_and_fopen_nulstr(const char *path, const char *mode, const char *root, const char *search, FILE **_f) {
6135 _cleanup_strv_free_ char **s = NULL;
6137 if (path_is_absolute(path)) {
6140 f = fopen(path, mode);
6149 s = strv_split_nulstr(search);
6153 return search_and_fopen_internal(path, mode, root, s, _f);
6156 char *strextend(char **x, ...) {
6163 l = f = *x ? strlen(*x) : 0;
6170 t = va_arg(ap, const char *);
6175 if (n > ((size_t) -1) - l) {
6184 r = realloc(*x, l+1);
6194 t = va_arg(ap, const char *);
6208 char *strrep(const char *s, unsigned n) {
6216 p = r = malloc(l * n + 1);
6220 for (i = 0; i < n; i++)
6227 void* greedy_realloc(void **p, size_t *allocated, size_t need, size_t size) {
6234 if (*allocated >= need)
6237 newalloc = MAX(need * 2, 64u / size);
6238 a = newalloc * size;
6240 /* check for overflows */
6241 if (a < size * need)
6249 *allocated = newalloc;
6253 void* greedy_realloc0(void **p, size_t *allocated, size_t need, size_t size) {
6262 q = greedy_realloc(p, allocated, need, size);
6266 if (*allocated > prev)
6267 memzero(q + prev * size, (*allocated - prev) * size);
6272 bool id128_is_valid(const char *s) {
6278 /* Simple formatted 128bit hex string */
6280 for (i = 0; i < l; i++) {
6283 if (!(c >= '0' && c <= '9') &&
6284 !(c >= 'a' && c <= 'z') &&
6285 !(c >= 'A' && c <= 'Z'))
6289 } else if (l == 36) {
6291 /* Formatted UUID */
6293 for (i = 0; i < l; i++) {
6296 if ((i == 8 || i == 13 || i == 18 || i == 23)) {
6300 if (!(c >= '0' && c <= '9') &&
6301 !(c >= 'a' && c <= 'z') &&
6302 !(c >= 'A' && c <= 'Z'))
6313 int split_pair(const char *s, const char *sep, char **l, char **r) {
6328 a = strndup(s, x - s);
6332 b = strdup(x + strlen(sep));
6344 int shall_restore_state(void) {
6345 _cleanup_free_ char *value = NULL;
6348 r = get_proc_cmdline_key("systemd.restore_state=", &value);
6354 return parse_boolean(value) != 0;
6357 int proc_cmdline(char **ret) {
6360 if (detect_container(NULL) > 0)
6361 return get_process_cmdline(1, 0, false, ret);
6363 return read_one_line_file("/proc/cmdline", ret);
6366 int parse_proc_cmdline(int (*parse_item)(const char *key, const char *value)) {
6367 _cleanup_free_ char *line = NULL;
6373 r = proc_cmdline(&line);
6379 _cleanup_free_ char *word = NULL;
6382 r = unquote_first_word(&p, &word, true);
6388 /* Filter out arguments that are intended only for the
6390 if (!in_initrd() && startswith(word, "rd."))
6393 value = strchr(word, '=');
6397 r = parse_item(word, value);
6405 int get_proc_cmdline_key(const char *key, char **value) {
6406 _cleanup_free_ char *line = NULL, *ret = NULL;
6413 r = proc_cmdline(&line);
6419 _cleanup_free_ char *word = NULL;
6422 r = unquote_first_word(&p, &word, true);
6428 /* Filter out arguments that are intended only for the
6430 if (!in_initrd() && startswith(word, "rd."))
6434 e = startswith(word, key);
6438 r = free_and_strdup(&ret, e);
6444 if (streq(word, key))
6458 int container_get_leader(const char *machine, pid_t *pid) {
6459 _cleanup_free_ char *s = NULL, *class = NULL;
6467 p = strjoina("/run/systemd/machines/", machine);
6468 r = parse_env_file(p, NEWLINE, "LEADER", &s, "CLASS", &class, NULL);
6476 if (!streq_ptr(class, "container"))
6479 r = parse_pid(s, &leader);
6489 int namespace_open(pid_t pid, int *pidns_fd, int *mntns_fd, int *netns_fd, int *root_fd) {
6490 _cleanup_close_ int pidnsfd = -1, mntnsfd = -1, netnsfd = -1;
6498 mntns = procfs_file_alloca(pid, "ns/mnt");
6499 mntnsfd = open(mntns, O_RDONLY|O_NOCTTY|O_CLOEXEC);
6507 pidns = procfs_file_alloca(pid, "ns/pid");
6508 pidnsfd = open(pidns, O_RDONLY|O_NOCTTY|O_CLOEXEC);
6516 netns = procfs_file_alloca(pid, "ns/net");
6517 netnsfd = open(netns, O_RDONLY|O_NOCTTY|O_CLOEXEC);
6525 root = procfs_file_alloca(pid, "root");
6526 rfd = open(root, O_RDONLY|O_NOCTTY|O_CLOEXEC|O_DIRECTORY);
6532 *pidns_fd = pidnsfd;
6535 *mntns_fd = mntnsfd;
6538 *netns_fd = netnsfd;
6543 pidnsfd = mntnsfd = netnsfd = -1;
6548 int namespace_enter(int pidns_fd, int mntns_fd, int netns_fd, int root_fd) {
6551 if (setns(pidns_fd, CLONE_NEWPID) < 0)
6555 if (setns(mntns_fd, CLONE_NEWNS) < 0)
6559 if (setns(netns_fd, CLONE_NEWNET) < 0)
6563 if (fchdir(root_fd) < 0)
6566 if (chroot(".") < 0)
6570 if (setresgid(0, 0, 0) < 0)
6573 if (setgroups(0, NULL) < 0)
6576 if (setresuid(0, 0, 0) < 0)
6582 bool pid_is_unwaited(pid_t pid) {
6583 /* Checks whether a PID is still valid at all, including a zombie */
6588 if (kill(pid, 0) >= 0)
6591 return errno != ESRCH;
6594 bool pid_is_alive(pid_t pid) {
6597 /* Checks whether a PID is still valid and not a zombie */
6602 r = get_process_state(pid);
6603 if (r == -ENOENT || r == 'Z')
6609 int getpeercred(int fd, struct ucred *ucred) {
6610 socklen_t n = sizeof(struct ucred);
6617 r = getsockopt(fd, SOL_SOCKET, SO_PEERCRED, &u, &n);
6621 if (n != sizeof(struct ucred))
6624 /* Check if the data is actually useful and not suppressed due
6625 * to namespacing issues */
6628 if (u.uid == UID_INVALID)
6630 if (u.gid == GID_INVALID)
6637 int getpeersec(int fd, char **ret) {
6649 r = getsockopt(fd, SOL_SOCKET, SO_PEERSEC, s, &n);
6653 if (errno != ERANGE)
6660 r = getsockopt(fd, SOL_SOCKET, SO_PEERSEC, s, &n);
6676 /* This is much like like mkostemp() but is subject to umask(). */
6677 int mkostemp_safe(char *pattern, int flags) {
6678 _cleanup_umask_ mode_t u;
6685 fd = mkostemp(pattern, flags);
6692 int open_tmpfile(const char *path, int flags) {
6699 /* Try O_TMPFILE first, if it is supported */
6700 fd = open(path, flags|O_TMPFILE, S_IRUSR|S_IWUSR);
6705 /* Fall back to unguessable name + unlinking */
6706 p = strjoina(path, "/systemd-tmp-XXXXXX");
6708 fd = mkostemp_safe(p, flags);
6716 int fd_warn_permissions(const char *path, int fd) {
6719 if (fstat(fd, &st) < 0)
6722 if (st.st_mode & 0111)
6723 log_warning("Configuration file %s is marked executable. Please remove executable permission bits. Proceeding anyway.", path);
6725 if (st.st_mode & 0002)
6726 log_warning("Configuration file %s is marked world-writable. Please remove world writability permission bits. Proceeding anyway.", path);
6728 if (getpid() == 1 && (st.st_mode & 0044) != 0044)
6729 log_warning("Configuration file %s is marked world-inaccessible. This has no effect as configuration data is accessible via APIs without restrictions. Proceeding anyway.", path);
6734 unsigned long personality_from_string(const char *p) {
6736 /* Parse a personality specifier. We introduce our own
6737 * identifiers that indicate specific ABIs, rather than just
6738 * hints regarding the register size, since we want to keep
6739 * things open for multiple locally supported ABIs for the
6740 * same register size. We try to reuse the ABI identifiers
6741 * used by libseccomp. */
6743 #if defined(__x86_64__)
6745 if (streq(p, "x86"))
6748 if (streq(p, "x86-64"))
6751 #elif defined(__i386__)
6753 if (streq(p, "x86"))
6757 /* personality(7) documents that 0xffffffffUL is used for
6758 * querying the current personality, hence let's use that here
6759 * as error indicator. */
6760 return 0xffffffffUL;
6763 const char* personality_to_string(unsigned long p) {
6765 #if defined(__x86_64__)
6767 if (p == PER_LINUX32)
6773 #elif defined(__i386__)
6782 uint64_t physical_memory(void) {
6785 /* We return this as uint64_t in case we are running as 32bit
6786 * process on a 64bit kernel with huge amounts of memory */
6788 mem = sysconf(_SC_PHYS_PAGES);
6791 return (uint64_t) mem * (uint64_t) page_size();
6794 void hexdump(FILE *f, const void *p, size_t s) {
6795 const uint8_t *b = p;
6798 assert(s == 0 || b);
6803 fprintf(f, "%04x ", n);
6805 for (i = 0; i < 16; i++) {
6810 fprintf(f, "%02x ", b[i]);
6818 for (i = 0; i < 16; i++) {
6823 fputc(isprint(b[i]) ? (char) b[i] : '.', f);
6837 int update_reboot_param_file(const char *param) {
6842 r = write_string_file(REBOOT_PARAM_FILE, param);
6844 log_error("Failed to write reboot param to "
6845 REBOOT_PARAM_FILE": %s", strerror(-r));
6847 unlink(REBOOT_PARAM_FILE);
6852 int umount_recursive(const char *prefix, int flags) {
6856 /* Try to umount everything recursively below a
6857 * directory. Also, take care of stacked mounts, and keep
6858 * unmounting them until they are gone. */
6861 _cleanup_fclose_ FILE *proc_self_mountinfo = NULL;
6866 proc_self_mountinfo = fopen("/proc/self/mountinfo", "re");
6867 if (!proc_self_mountinfo)
6871 _cleanup_free_ char *path = NULL, *p = NULL;
6874 k = fscanf(proc_self_mountinfo,
6875 "%*s " /* (1) mount id */
6876 "%*s " /* (2) parent id */
6877 "%*s " /* (3) major:minor */
6878 "%*s " /* (4) root */
6879 "%ms " /* (5) mount point */
6880 "%*s" /* (6) mount options */
6881 "%*[^-]" /* (7) optional fields */
6882 "- " /* (8) separator */
6883 "%*s " /* (9) file system type */
6884 "%*s" /* (10) mount source */
6885 "%*s" /* (11) mount options 2 */
6886 "%*[^\n]", /* some rubbish at the end */
6895 p = cunescape(path);
6899 if (!path_startswith(p, prefix))
6902 if (umount2(p, flags) < 0) {
6918 static int get_mount_flags(const char *path, unsigned long *flags) {
6921 if (statvfs(path, &buf) < 0)
6923 *flags = buf.f_flag;
6927 int bind_remount_recursive(const char *prefix, bool ro) {
6928 _cleanup_set_free_free_ Set *done = NULL;
6929 _cleanup_free_ char *cleaned = NULL;
6932 /* Recursively remount a directory (and all its submounts)
6933 * read-only or read-write. If the directory is already
6934 * mounted, we reuse the mount and simply mark it
6935 * MS_BIND|MS_RDONLY (or remove the MS_RDONLY for read-write
6936 * operation). If it isn't we first make it one. Afterwards we
6937 * apply MS_BIND|MS_RDONLY (or remove MS_RDONLY) to all
6938 * submounts we can access, too. When mounts are stacked on
6939 * the same mount point we only care for each individual
6940 * "top-level" mount on each point, as we cannot
6941 * influence/access the underlying mounts anyway. We do not
6942 * have any effect on future submounts that might get
6943 * propagated, they migt be writable. This includes future
6944 * submounts that have been triggered via autofs. */
6946 cleaned = strdup(prefix);
6950 path_kill_slashes(cleaned);
6952 done = set_new(&string_hash_ops);
6957 _cleanup_fclose_ FILE *proc_self_mountinfo = NULL;
6958 _cleanup_set_free_free_ Set *todo = NULL;
6959 bool top_autofs = false;
6961 unsigned long orig_flags;
6963 todo = set_new(&string_hash_ops);
6967 proc_self_mountinfo = fopen("/proc/self/mountinfo", "re");
6968 if (!proc_self_mountinfo)
6972 _cleanup_free_ char *path = NULL, *p = NULL, *type = NULL;
6975 k = fscanf(proc_self_mountinfo,
6976 "%*s " /* (1) mount id */
6977 "%*s " /* (2) parent id */
6978 "%*s " /* (3) major:minor */
6979 "%*s " /* (4) root */
6980 "%ms " /* (5) mount point */
6981 "%*s" /* (6) mount options (superblock) */
6982 "%*[^-]" /* (7) optional fields */
6983 "- " /* (8) separator */
6984 "%ms " /* (9) file system type */
6985 "%*s" /* (10) mount source */
6986 "%*s" /* (11) mount options (bind mount) */
6987 "%*[^\n]", /* some rubbish at the end */
6997 p = cunescape(path);
7001 /* Let's ignore autofs mounts. If they aren't
7002 * triggered yet, we want to avoid triggering
7003 * them, as we don't make any guarantees for
7004 * future submounts anyway. If they are
7005 * already triggered, then we will find
7006 * another entry for this. */
7007 if (streq(type, "autofs")) {
7008 top_autofs = top_autofs || path_equal(cleaned, p);
7012 if (path_startswith(p, cleaned) &&
7013 !set_contains(done, p)) {
7015 r = set_consume(todo, p);
7025 /* If we have no submounts to process anymore and if
7026 * the root is either already done, or an autofs, we
7028 if (set_isempty(todo) &&
7029 (top_autofs || set_contains(done, cleaned)))
7032 if (!set_contains(done, cleaned) &&
7033 !set_contains(todo, cleaned)) {
7034 /* The prefix directory itself is not yet a
7035 * mount, make it one. */
7036 if (mount(cleaned, cleaned, NULL, MS_BIND|MS_REC, NULL) < 0)
7040 (void) get_mount_flags(cleaned, &orig_flags);
7041 orig_flags &= ~MS_RDONLY;
7043 if (mount(NULL, prefix, NULL, orig_flags|MS_BIND|MS_REMOUNT|(ro ? MS_RDONLY : 0), NULL) < 0)
7046 x = strdup(cleaned);
7050 r = set_consume(done, x);
7055 while ((x = set_steal_first(todo))) {
7057 r = set_consume(done, x);
7063 /* Try to reuse the original flag set, but
7064 * don't care for errors, in case of
7065 * obstructed mounts */
7067 (void) get_mount_flags(x, &orig_flags);
7068 orig_flags &= ~MS_RDONLY;
7070 if (mount(NULL, x, NULL, orig_flags|MS_BIND|MS_REMOUNT|(ro ? MS_RDONLY : 0), NULL) < 0) {
7072 /* Deal with mount points that are
7073 * obstructed by a later mount */
7075 if (errno != ENOENT)
7083 int fflush_and_check(FILE *f) {
7090 return errno ? -errno : -EIO;
7095 int tempfn_xxxxxx(const char *p, char **ret) {
7107 * /foo/bar/.#waldoXXXXXX
7111 if (!filename_is_valid(fn))
7114 t = new(char, strlen(p) + 2 + 6 + 1);
7118 strcpy(stpcpy(stpcpy(mempcpy(t, p, fn - p), ".#"), fn), "XXXXXX");
7120 *ret = path_kill_slashes(t);
7124 int tempfn_random(const char *p, char **ret) {
7138 * /foo/bar/.#waldobaa2a261115984a9
7142 if (!filename_is_valid(fn))
7145 t = new(char, strlen(p) + 2 + 16 + 1);
7149 x = stpcpy(stpcpy(mempcpy(t, p, fn - p), ".#"), fn);
7152 for (i = 0; i < 16; i++) {
7153 *(x++) = hexchar(u & 0xF);
7159 *ret = path_kill_slashes(t);
7163 int tempfn_random_child(const char *p, char **ret) {
7174 * /foo/bar/waldo/.#3c2b6219aa75d7d0
7177 t = new(char, strlen(p) + 3 + 16 + 1);
7181 x = stpcpy(stpcpy(t, p), "/.#");
7184 for (i = 0; i < 16; i++) {
7185 *(x++) = hexchar(u & 0xF);
7191 *ret = path_kill_slashes(t);
7195 /* make sure the hostname is not "localhost" */
7196 bool is_localhost(const char *hostname) {
7199 /* This tries to identify local host and domain names
7200 * described in RFC6761 plus the redhatism of .localdomain */
7202 return streq(hostname, "localhost") ||
7203 streq(hostname, "localhost.") ||
7204 streq(hostname, "localdomain.") ||
7205 streq(hostname, "localdomain") ||
7206 endswith(hostname, ".localhost") ||
7207 endswith(hostname, ".localhost.") ||
7208 endswith(hostname, ".localdomain") ||
7209 endswith(hostname, ".localdomain.");
7212 int take_password_lock(const char *root) {
7214 struct flock flock = {
7216 .l_whence = SEEK_SET,
7224 /* This is roughly the same as lckpwdf(), but not as awful. We
7225 * don't want to use alarm() and signals, hence we implement
7226 * our own trivial version of this.
7228 * Note that shadow-utils also takes per-database locks in
7229 * addition to lckpwdf(). However, we don't given that they
7230 * are redundant as they they invoke lckpwdf() first and keep
7231 * it during everything they do. The per-database locks are
7232 * awfully racy, and thus we just won't do them. */
7235 path = strjoina(root, "/etc/.pwd.lock");
7237 path = "/etc/.pwd.lock";
7239 fd = open(path, O_WRONLY|O_CREAT|O_CLOEXEC|O_NOCTTY|O_NOFOLLOW, 0600);
7243 r = fcntl(fd, F_SETLKW, &flock);
7252 int is_symlink(const char *path) {
7255 if (lstat(path, &info) < 0)
7258 return !!S_ISLNK(info.st_mode);
7261 int is_dir(const char* path, bool follow) {
7266 r = stat(path, &st);
7268 r = lstat(path, &st);
7272 return !!S_ISDIR(st.st_mode);
7275 int unquote_first_word(const char **p, char **ret, bool relax) {
7276 _cleanup_free_ char *s = NULL;
7277 size_t allocated = 0, sz = 0;
7284 SINGLE_QUOTE_ESCAPE,
7286 DOUBLE_QUOTE_ESCAPE,
7294 /* Parses the first word of a string, and returns it in
7295 * *ret. Removes all quotes in the process. When parsing fails
7296 * (because of an uneven number of quotes or similar), leaves
7297 * the pointer *p at the first invalid character. */
7307 else if (strchr(WHITESPACE, c))
7317 state = SINGLE_QUOTE;
7319 state = VALUE_ESCAPE;
7321 state = DOUBLE_QUOTE;
7322 else if (strchr(WHITESPACE, c))
7325 if (!GREEDY_REALLOC(s, allocated, sz+2))
7340 if (!GREEDY_REALLOC(s, allocated, sz+2))
7353 } else if (c == '\'')
7356 state = SINGLE_QUOTE_ESCAPE;
7358 if (!GREEDY_REALLOC(s, allocated, sz+2))
7366 case SINGLE_QUOTE_ESCAPE:
7373 if (!GREEDY_REALLOC(s, allocated, sz+2))
7377 state = SINGLE_QUOTE;
7386 state = DOUBLE_QUOTE_ESCAPE;
7388 if (!GREEDY_REALLOC(s, allocated, sz+2))
7396 case DOUBLE_QUOTE_ESCAPE:
7403 if (!GREEDY_REALLOC(s, allocated, sz+2))
7407 state = DOUBLE_QUOTE;
7413 if (!strchr(WHITESPACE, c))
7435 int unquote_many_words(const char **p, ...) {
7440 /* Parses a number of words from a string, stripping any
7441 * quotes if necessary. */
7445 /* Count how many words are expected */
7448 if (!va_arg(ap, char **))
7457 /* Read all words into a temporary array */
7458 l = newa0(char*, n);
7459 for (c = 0; c < n; c++) {
7461 r = unquote_first_word(p, &l[c], false);
7465 for (j = 0; j < c; j++)
7475 /* If we managed to parse all words, return them in the passed
7478 for (i = 0; i < n; i++) {
7481 v = va_arg(ap, char **);
7491 int free_and_strdup(char **p, const char *s) {
7496 /* Replaces a string pointer with an strdup()ed new string,
7497 * possibly freeing the old one. */
7512 int sethostname_idempotent(const char *s) {
7514 char buf[HOST_NAME_MAX + 1] = {};
7518 r = gethostname(buf, sizeof(buf));
7525 r = sethostname(s, strlen(s));
7532 int ptsname_malloc(int fd, char **ret) {
7545 if (ptsname_r(fd, c, l) == 0) {
7549 if (errno != ERANGE) {
7559 int openpt_in_namespace(pid_t pid, int flags) {
7560 _cleanup_close_ int pidnsfd = -1, mntnsfd = -1, rootfd = -1;
7561 _cleanup_close_pair_ int pair[2] = { -1, -1 };
7563 struct cmsghdr cmsghdr;
7564 uint8_t buf[CMSG_SPACE(sizeof(int))];
7566 struct msghdr mh = {
7567 .msg_control = &control,
7568 .msg_controllen = sizeof(control),
7570 struct cmsghdr *cmsg;
7577 r = namespace_open(pid, &pidnsfd, &mntnsfd, NULL, &rootfd);
7581 if (socketpair(AF_UNIX, SOCK_DGRAM, 0, pair) < 0)
7591 pair[0] = safe_close(pair[0]);
7593 r = namespace_enter(pidnsfd, mntnsfd, -1, rootfd);
7595 _exit(EXIT_FAILURE);
7597 master = posix_openpt(flags);
7599 _exit(EXIT_FAILURE);
7601 cmsg = CMSG_FIRSTHDR(&mh);
7602 cmsg->cmsg_level = SOL_SOCKET;
7603 cmsg->cmsg_type = SCM_RIGHTS;
7604 cmsg->cmsg_len = CMSG_LEN(sizeof(int));
7605 memcpy(CMSG_DATA(cmsg), &master, sizeof(int));
7607 mh.msg_controllen = cmsg->cmsg_len;
7609 if (sendmsg(pair[1], &mh, MSG_NOSIGNAL) < 0)
7610 _exit(EXIT_FAILURE);
7612 _exit(EXIT_SUCCESS);
7615 pair[1] = safe_close(pair[1]);
7617 r = wait_for_terminate(child, &si);
7620 if (si.si_code != CLD_EXITED || si.si_status != EXIT_SUCCESS)
7623 if (recvmsg(pair[0], &mh, MSG_NOSIGNAL|MSG_CMSG_CLOEXEC) < 0)
7626 for (cmsg = CMSG_FIRSTHDR(&mh); cmsg; cmsg = CMSG_NXTHDR(&mh, cmsg))
7627 if (cmsg->cmsg_level == SOL_SOCKET && cmsg->cmsg_type == SCM_RIGHTS) {
7631 fds = (int*) CMSG_DATA(cmsg);
7632 n_fds = (cmsg->cmsg_len - CMSG_LEN(0)) / sizeof(int);
7635 close_many(fds, n_fds);
7645 ssize_t fgetxattrat_fake(int dirfd, const char *filename, const char *attribute, void *value, size_t size, int flags) {
7646 _cleanup_close_ int fd = -1;
7649 /* The kernel doesn't have a fgetxattrat() command, hence let's emulate one */
7651 fd = openat(dirfd, filename, O_RDONLY|O_CLOEXEC|O_NOCTTY|O_NOATIME|(flags & AT_SYMLINK_NOFOLLOW ? O_NOFOLLOW : 0));
7655 l = fgetxattr(fd, attribute, value, size);
7662 static int parse_crtime(le64_t le, usec_t *usec) {
7668 if (u == 0 || u == (uint64_t) -1)
7675 int fd_getcrtime(int fd, usec_t *usec) {
7682 /* Until Linux gets a real concept of birthtime/creation time,
7683 * let's fake one with xattrs */
7685 n = fgetxattr(fd, "user.crtime_usec", &le, sizeof(le));
7688 if (n != sizeof(le))
7691 return parse_crtime(le, usec);
7694 int fd_getcrtime_at(int dirfd, const char *name, usec_t *usec, int flags) {
7698 n = fgetxattrat_fake(dirfd, name, "user.crtime_usec", &le, sizeof(le), flags);
7701 if (n != sizeof(le))
7704 return parse_crtime(le, usec);
7707 int path_getcrtime(const char *p, usec_t *usec) {
7714 n = getxattr(p, "user.crtime_usec", &le, sizeof(le));
7717 if (n != sizeof(le))
7720 return parse_crtime(le, usec);
7723 int fd_setcrtime(int fd, usec_t usec) {
7729 usec = now(CLOCK_REALTIME);
7731 le = htole64((uint64_t) usec);
7732 if (fsetxattr(fd, "user.crtime_usec", &le, sizeof(le), 0) < 0)
7738 int same_fd(int a, int b) {
7739 struct stat sta, stb;
7746 /* Compares two file descriptors. Note that semantics are
7747 * quite different depending on whether we have kcmp() or we
7748 * don't. If we have kcmp() this will only return true for
7749 * dup()ed file descriptors, but not otherwise. If we don't
7750 * have kcmp() this will also return true for two fds of the same
7751 * file, created by separate open() calls. Since we use this
7752 * call mostly for filtering out duplicates in the fd store
7753 * this difference hopefully doesn't matter too much. */
7758 /* Try to use kcmp() if we have it. */
7760 r = kcmp(pid, pid, KCMP_FILE, a, b);
7765 if (errno != ENOSYS)
7768 /* We don't have kcmp(), use fstat() instead. */
7769 if (fstat(a, &sta) < 0)
7772 if (fstat(b, &stb) < 0)
7775 if ((sta.st_mode & S_IFMT) != (stb.st_mode & S_IFMT))
7778 /* We consider all device fds different, since two device fds
7779 * might refer to quite different device contexts even though
7780 * they share the same inode and backing dev_t. */
7782 if (S_ISCHR(sta.st_mode) || S_ISBLK(sta.st_mode))
7785 if (sta.st_dev != stb.st_dev || sta.st_ino != stb.st_ino)
7788 /* The fds refer to the same inode on disk, let's also check
7789 * if they have the same fd flags. This is useful to
7790 * distuingish the read and write side of a pipe created with
7792 fa = fcntl(a, F_GETFL);
7796 fb = fcntl(b, F_GETFL);
7803 int chattr_fd(int fd, bool b, unsigned mask) {
7804 unsigned old_attr, new_attr;
7811 if (ioctl(fd, FS_IOC_GETFLAGS, &old_attr) < 0)
7815 new_attr = old_attr | mask;
7817 new_attr = old_attr & ~mask;
7819 if (new_attr == old_attr)
7822 if (ioctl(fd, FS_IOC_SETFLAGS, &new_attr) < 0)
7828 int chattr_path(const char *p, bool b, unsigned mask) {
7829 _cleanup_close_ int fd = -1;
7836 fd = open(p, O_RDONLY|O_CLOEXEC|O_NOCTTY|O_NOFOLLOW);
7840 return chattr_fd(fd, b, mask);
7843 int read_attr_fd(int fd, unsigned *ret) {
7846 if (ioctl(fd, FS_IOC_GETFLAGS, ret) < 0)
7852 int read_attr_path(const char *p, unsigned *ret) {
7853 _cleanup_close_ int fd = -1;
7858 fd = open(p, O_RDONLY|O_CLOEXEC|O_NOCTTY|O_NOFOLLOW);
7862 return read_attr_fd(fd, ret);
7865 int make_lock_file(const char *p, int operation, LockFile *ret) {
7866 _cleanup_close_ int fd = -1;
7867 _cleanup_free_ char *t = NULL;
7871 * We use UNPOSIX locks if they are available. They have nice
7872 * semantics, and are mostly compatible with NFS. However,
7873 * they are only available on new kernels. When we detect we
7874 * are running on an older kernel, then we fall back to good
7875 * old BSD locks. They also have nice semantics, but are
7876 * slightly problematic on NFS, where they are upgraded to
7877 * POSIX locks, even though locally they are orthogonal to
7887 .l_type = (operation & ~LOCK_NB) == LOCK_EX ? F_WRLCK : F_RDLCK,
7888 .l_whence = SEEK_SET,
7892 fd = open(p, O_CREAT|O_RDWR|O_NOFOLLOW|O_CLOEXEC|O_NOCTTY, 0600);
7896 r = fcntl(fd, (operation & LOCK_NB) ? F_OFD_SETLK : F_OFD_SETLKW, &fl);
7899 /* If the kernel is too old, use good old BSD locks */
7900 if (errno == EINVAL)
7901 r = flock(fd, operation);
7904 return errno == EAGAIN ? -EBUSY : -errno;
7907 /* If we acquired the lock, let's check if the file
7908 * still exists in the file system. If not, then the
7909 * previous exclusive owner removed it and then closed
7910 * it. In such a case our acquired lock is worthless,
7911 * hence try again. */
7916 if (st.st_nlink > 0)
7919 fd = safe_close(fd);
7924 ret->operation = operation;
7932 int make_lock_file_for(const char *p, int operation, LockFile *ret) {
7940 if (!filename_is_valid(fn))
7943 t = newa(char, strlen(p) + 2 + 4 + 1);
7944 stpcpy(stpcpy(stpcpy(mempcpy(t, p, fn - p), ".#"), fn), ".lck");
7946 return make_lock_file(t, operation, ret);
7949 void release_lock_file(LockFile *f) {
7957 /* If we are the exclusive owner we can safely delete
7958 * the lock file itself. If we are not the exclusive
7959 * owner, we can try becoming it. */
7962 (f->operation & ~LOCK_NB) == LOCK_SH) {
7963 static const struct flock fl = {
7965 .l_whence = SEEK_SET,
7968 r = fcntl(f->fd, F_OFD_SETLK, &fl);
7969 if (r < 0 && errno == EINVAL)
7970 r = flock(f->fd, LOCK_EX|LOCK_NB);
7973 f->operation = LOCK_EX|LOCK_NB;
7976 if ((f->operation & ~LOCK_NB) == LOCK_EX)
7977 unlink_noerrno(f->path);
7983 f->fd = safe_close(f->fd);
7987 static size_t nul_length(const uint8_t *p, size_t sz) {
8002 ssize_t sparse_write(int fd, const void *p, size_t sz, size_t run_length) {
8003 const uint8_t *q, *w, *e;
8011 n = nul_length(q, e - q);
8013 /* If there are more than the specified run length of
8014 * NUL bytes, or if this is the beginning or the end
8015 * of the buffer, then seek instead of write */
8016 if ((n > run_length) ||
8017 (n > 0 && q == p) ||
8018 (n > 0 && q + n >= e)) {
8020 l = write(fd, w, q - w);
8027 if (lseek(fd, n, SEEK_CUR) == (off_t) -1)
8039 l = write(fd, w, q - w);
8046 return q - (const uint8_t*) p;
8049 void sigkill_wait(pid_t *pid) {
8055 if (kill(*pid, SIGKILL) > 0)
8056 (void) wait_for_terminate(*pid, NULL);
8059 int syslog_parse_priority(const char **p, int *priority, bool with_facility) {
8060 int a = 0, b = 0, c = 0;
8070 if (!strchr(*p, '>'))
8073 if ((*p)[2] == '>') {
8074 c = undecchar((*p)[1]);
8076 } else if ((*p)[3] == '>') {
8077 b = undecchar((*p)[1]);
8078 c = undecchar((*p)[2]);
8080 } else if ((*p)[4] == '>') {
8081 a = undecchar((*p)[1]);
8082 b = undecchar((*p)[2]);
8083 c = undecchar((*p)[3]);
8088 if (a < 0 || b < 0 || c < 0 ||
8089 (!with_facility && (a || b || c > 7)))
8093 *priority = a*100 + b*10 + c;
8095 *priority = (*priority & LOG_FACMASK) | c;
8101 ssize_t string_table_lookup(const char * const *table, size_t len, const char *key) {
8107 for (i = 0; i < len; ++i)
8108 if (streq_ptr(table[i], key))
8114 void cmsg_close_all(struct msghdr *mh) {
8115 struct cmsghdr *cmsg;
8119 for (cmsg = CMSG_FIRSTHDR(mh); cmsg; cmsg = CMSG_NXTHDR(mh, cmsg))
8120 if (cmsg->cmsg_level == SOL_SOCKET && cmsg->cmsg_type == SCM_RIGHTS)
8121 close_many((int*) CMSG_DATA(cmsg), (cmsg->cmsg_len - CMSG_LEN(0)) / sizeof(int));