1 /*-*- Mode: C; c-basic-offset: 8; indent-tabs-mode: nil -*-*/
4 This file is part of systemd.
6 Copyright 2011 Lennart Poettering
8 systemd is free software; you can redistribute it and/or modify it
9 under the terms of the GNU Lesser General Public License as published by
10 the Free Software Foundation; either version 2.1 of the License, or
11 (at your option) any later version.
13 systemd is distributed in the hope that it will be useful, but
14 WITHOUT ANY WARRANTY; without even the implied warranty of
15 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
16 Lesser General Public License for more details.
18 You should have received a copy of the GNU Lesser General Public License
19 along with systemd; If not, see <http://www.gnu.org/licenses/>.
26 #include <sys/inotify.h>
29 #include "sd-journal.h"
30 #include "journal-def.h"
31 #include "journal-file.h"
34 #include "path-util.h"
37 #include "journal-internal.h"
39 #define JOURNAL_FILES_MAX 1024
41 static void detach_location(sd_journal *j) {
47 j->current_file = NULL;
50 HASHMAP_FOREACH(f, j->files, i)
51 f->current_offset = 0;
54 static void reset_location(sd_journal *j) {
58 zero(j->current_location);
61 static void init_location(Location *l, LocationType type, JournalFile *f, Object *o) {
63 assert(type == LOCATION_DISCRETE || type == LOCATION_SEEK);
65 assert(o->object.type == OBJECT_ENTRY);
68 l->seqnum = le64toh(o->entry.seqnum);
69 l->seqnum_id = f->header->seqnum_id;
70 l->realtime = le64toh(o->entry.realtime);
71 l->monotonic = le64toh(o->entry.monotonic);
72 l->boot_id = o->entry.boot_id;
73 l->xor_hash = le64toh(o->entry.xor_hash);
75 l->seqnum_set = l->realtime_set = l->monotonic_set = l->xor_hash_set = true;
78 static void set_location(sd_journal *j, LocationType type, JournalFile *f, Object *o, uint64_t offset) {
80 assert(type == LOCATION_DISCRETE || type == LOCATION_SEEK);
84 init_location(&j->current_location, type, f, o);
89 f->current_offset = offset;
92 static int match_is_valid(const void *data, size_t size) {
100 if (startswith(data, "__"))
104 for (p = b; p < b + size; p++) {
112 if (*p >= 'A' && *p <= 'Z')
115 if (*p >= '0' && *p <= '9')
124 static bool same_field(const void *_a, size_t s, const void *_b, size_t t) {
125 const uint8_t *a = _a, *b = _b;
128 for (j = 0; j < s && j < t; j++) {
140 static Match *match_new(Match *p, MatchType t) {
151 LIST_PREPEND(Match, matches, p->matches, m);
157 static void match_free(Match *m) {
161 match_free(m->matches);
164 LIST_REMOVE(Match, matches, m->parent->matches, m);
170 static void match_free_if_empty(Match *m) {
179 _public_ int sd_journal_add_match(sd_journal *j, const void *data, size_t size) {
180 Match *l2, *l3, *add_here = NULL, *m;
192 if (!match_is_valid(data, size))
198 * level 3: concrete matches */
201 j->level0 = match_new(NULL, MATCH_OR_TERM);
207 j->level1 = match_new(j->level0, MATCH_AND_TERM);
212 assert(j->level0->type == MATCH_OR_TERM);
213 assert(j->level1->type == MATCH_AND_TERM);
215 le_hash = htole64(hash64(data, size));
217 LIST_FOREACH(matches, l2, j->level1->matches) {
218 assert(l2->type == MATCH_OR_TERM);
220 LIST_FOREACH(matches, l3, l2->matches) {
221 assert(l3->type == MATCH_DISCRETE);
223 /* Exactly the same match already? Then ignore
225 if (l3->le_hash == le_hash &&
227 memcmp(l3->data, data, size) == 0)
230 /* Same field? Then let's add this to this OR term */
231 if (same_field(data, size, l3->data, l3->size)) {
242 add_here = match_new(j->level1, MATCH_OR_TERM);
247 m = match_new(add_here, MATCH_DISCRETE);
251 m->le_hash = le_hash;
253 m->data = memdup(data, size);
263 match_free_if_empty(add_here);
266 match_free_if_empty(j->level1);
269 match_free_if_empty(j->level0);
274 _public_ int sd_journal_add_disjunction(sd_journal *j) {
285 if (!j->level1->matches)
288 m = match_new(j->level0, MATCH_AND_TERM);
296 static char *match_make_string(Match *m) {
299 bool enclose = false;
304 if (m->type == MATCH_DISCRETE)
305 return strndup(m->data, m->size);
308 LIST_FOREACH(matches, i, m->matches) {
311 t = match_make_string(i);
318 k = strjoin(p, m->type == MATCH_OR_TERM ? " OR " : " AND ", t, NULL);
335 r = strjoin("(", p, ")", NULL);
343 char *journal_make_match_string(sd_journal *j) {
346 return match_make_string(j->level0);
349 _public_ void sd_journal_flush_matches(sd_journal *j) {
355 match_free(j->level0);
357 j->level0 = j->level1 = NULL;
362 static int compare_entry_order(JournalFile *af, Object *_ao,
363 JournalFile *bf, uint64_t bp) {
373 /* The mmap cache might invalidate the object from the first
374 * file if we look at the one from the second file. Hence
375 * temporarily copy the header of the first one, and look at
377 ao = alloca(offsetof(EntryObject, items));
378 memcpy(ao, _ao, offsetof(EntryObject, items));
380 r = journal_file_move_to_object(bf, OBJECT_ENTRY, bp, &bo);
382 return strcmp(af->path, bf->path);
384 /* We operate on two different files here, hence we can access
385 * two objects at the same time, which we normally can't.
387 * If contents and timestamps match, these entries are
388 * identical, even if the seqnum does not match */
390 if (sd_id128_equal(ao->entry.boot_id, bo->entry.boot_id) &&
391 ao->entry.monotonic == bo->entry.monotonic &&
392 ao->entry.realtime == bo->entry.realtime &&
393 ao->entry.xor_hash == bo->entry.xor_hash)
396 if (sd_id128_equal(af->header->seqnum_id, bf->header->seqnum_id)) {
398 /* If this is from the same seqnum source, compare
400 a = le64toh(ao->entry.seqnum);
401 b = le64toh(bo->entry.seqnum);
408 /* Wow! This is weird, different data but the same
409 * seqnums? Something is borked, but let's make the
410 * best of it and compare by time. */
413 if (sd_id128_equal(ao->entry.boot_id, bo->entry.boot_id)) {
415 /* If the boot id matches compare monotonic time */
416 a = le64toh(ao->entry.monotonic);
417 b = le64toh(bo->entry.monotonic);
425 /* Otherwise compare UTC time */
426 a = le64toh(ao->entry.realtime);
427 b = le64toh(bo->entry.realtime);
434 /* Finally, compare by contents */
435 a = le64toh(ao->entry.xor_hash);
436 b = le64toh(bo->entry.xor_hash);
446 static int compare_with_location(JournalFile *af, Object *ao, Location *l) {
452 assert(l->type == LOCATION_DISCRETE || l->type == LOCATION_SEEK);
454 if (l->monotonic_set &&
455 sd_id128_equal(ao->entry.boot_id, l->boot_id) &&
457 le64toh(ao->entry.realtime) == l->realtime &&
459 le64toh(ao->entry.xor_hash) == l->xor_hash)
463 sd_id128_equal(af->header->seqnum_id, l->seqnum_id)) {
465 a = le64toh(ao->entry.seqnum);
473 if (l->monotonic_set &&
474 sd_id128_equal(ao->entry.boot_id, l->boot_id)) {
476 a = le64toh(ao->entry.monotonic);
478 if (a < l->monotonic)
480 if (a > l->monotonic)
484 if (l->realtime_set) {
486 a = le64toh(ao->entry.realtime);
494 if (l->xor_hash_set) {
495 a = le64toh(ao->entry.xor_hash);
506 static int next_for_match(
510 uint64_t after_offset,
511 direction_t direction,
523 if (m->type == MATCH_DISCRETE) {
526 r = journal_file_find_data_object_with_hash(f, m->data, m->size, le64toh(m->le_hash), NULL, &dp);
530 return journal_file_move_to_entry_by_offset_for_data(f, dp, after_offset, direction, ret, offset);
532 } else if (m->type == MATCH_OR_TERM) {
535 /* Find the earliest match beyond after_offset */
537 LIST_FOREACH(matches, i, m->matches) {
540 r = next_for_match(j, i, f, after_offset, direction, NULL, &cp);
544 if (np == 0 || (direction == DIRECTION_DOWN ? np > cp : np < cp))
549 } else if (m->type == MATCH_AND_TERM) {
551 bool continue_looking;
553 /* Always jump to the next matching entry and repeat
554 * this until we find an offset that matches for all
562 continue_looking = false;
564 LIST_FOREACH(matches, i, m->matches) {
568 limit = after_offset;
569 else if (direction == DIRECTION_DOWN)
570 limit = MAX(np, after_offset);
572 limit = MIN(np, after_offset);
574 r = next_for_match(j, i, f, limit, direction, NULL, &cp);
578 if ((direction == DIRECTION_DOWN ? cp >= after_offset : cp <= after_offset) &&
579 (np == 0 || (direction == DIRECTION_DOWN ? cp > np : np < cp))) {
581 continue_looking = true;
585 } while (continue_looking);
591 r = journal_file_move_to_object(f, OBJECT_ENTRY, np, &n);
603 static int find_location_for_match(
607 direction_t direction,
617 if (m->type == MATCH_DISCRETE) {
620 r = journal_file_find_data_object_with_hash(f, m->data, m->size, le64toh(m->le_hash), NULL, &dp);
624 /* FIXME: missing: find by monotonic */
626 if (j->current_location.type == LOCATION_HEAD)
627 return journal_file_next_entry_for_data(f, NULL, 0, dp, DIRECTION_DOWN, ret, offset);
628 if (j->current_location.type == LOCATION_TAIL)
629 return journal_file_next_entry_for_data(f, NULL, 0, dp, DIRECTION_UP, ret, offset);
630 if (j->current_location.seqnum_set && sd_id128_equal(j->current_location.seqnum_id, f->header->seqnum_id))
631 return journal_file_move_to_entry_by_seqnum_for_data(f, dp, j->current_location.seqnum, direction, ret, offset);
632 if (j->current_location.monotonic_set) {
633 r = journal_file_move_to_entry_by_monotonic_for_data(f, dp, j->current_location.boot_id, j->current_location.monotonic, direction, ret, offset);
637 if (j->current_location.realtime_set)
638 return journal_file_move_to_entry_by_realtime_for_data(f, dp, j->current_location.realtime, direction, ret, offset);
640 return journal_file_next_entry_for_data(f, NULL, 0, dp, direction, ret, offset);
642 } else if (m->type == MATCH_OR_TERM) {
647 /* Find the earliest match */
649 LIST_FOREACH(matches, i, m->matches) {
652 r = find_location_for_match(j, i, f, direction, NULL, &cp);
656 if (np == 0 || (direction == DIRECTION_DOWN ? np > cp : np < cp))
664 r = journal_file_move_to_object(f, OBJECT_ENTRY, np, &n);
679 assert(m->type == MATCH_AND_TERM);
681 /* First jump to the last match, and then find the
682 * next one where all matches match */
687 LIST_FOREACH(matches, i, m->matches) {
690 r = find_location_for_match(j, i, f, direction, NULL, &cp);
694 if (np == 0 || (direction == DIRECTION_DOWN ? np < cp : np > cp))
698 return next_for_match(j, m, f, np, direction, ret, offset);
702 static int find_location_with_matches(
705 direction_t direction,
717 /* No matches is simple */
719 if (j->current_location.type == LOCATION_HEAD)
720 return journal_file_next_entry(f, NULL, 0, DIRECTION_DOWN, ret, offset);
721 if (j->current_location.type == LOCATION_TAIL)
722 return journal_file_next_entry(f, NULL, 0, DIRECTION_UP, ret, offset);
723 if (j->current_location.seqnum_set && sd_id128_equal(j->current_location.seqnum_id, f->header->seqnum_id))
724 return journal_file_move_to_entry_by_seqnum(f, j->current_location.seqnum, direction, ret, offset);
725 if (j->current_location.monotonic_set) {
726 r = journal_file_move_to_entry_by_monotonic(f, j->current_location.boot_id, j->current_location.monotonic, direction, ret, offset);
730 if (j->current_location.realtime_set)
731 return journal_file_move_to_entry_by_realtime(f, j->current_location.realtime, direction, ret, offset);
733 return journal_file_next_entry(f, NULL, 0, direction, ret, offset);
735 return find_location_for_match(j, j->level0, f, direction, ret, offset);
738 static int next_with_matches(
741 direction_t direction,
756 /* No matches is easy. We simply advance the file
759 return journal_file_next_entry(f, c, cp, direction, ret, offset);
761 /* If we have a match then we look for the next matching entry
762 * with an offset at least one step larger */
763 return next_for_match(j, j->level0, f, direction == DIRECTION_DOWN ? cp+1 : cp-1, direction, ret, offset);
766 static int next_beyond_location(sd_journal *j, JournalFile *f, direction_t direction, Object **ret, uint64_t *offset) {
774 if (f->current_offset > 0) {
775 cp = f->current_offset;
777 r = journal_file_move_to_object(f, OBJECT_ENTRY, cp, &c);
781 r = next_with_matches(j, f, direction, &c, &cp);
785 r = find_location_with_matches(j, f, direction, &c, &cp);
790 /* OK, we found the spot, now let's advance until an entry
791 * that is actually different from what we were previously
792 * looking at. This is necessary to handle entries which exist
793 * in two (or more) journal files, and which shall all be
794 * suppressed but one. */
799 if (j->current_location.type == LOCATION_DISCRETE) {
802 k = compare_with_location(f, c, &j->current_location);
803 if (direction == DIRECTION_DOWN)
818 r = next_with_matches(j, f, direction, &c, &cp);
824 static int real_journal_next(sd_journal *j, direction_t direction) {
825 JournalFile *f, *new_file = NULL;
826 uint64_t new_offset = 0;
835 HASHMAP_FOREACH(f, j->files, i) {
838 r = next_beyond_location(j, f, direction, &o, &p);
840 log_debug("Can't iterate through %s, ignoring: %s", f->path, strerror(-r));
850 k = compare_entry_order(f, o, new_file, new_offset);
852 if (direction == DIRECTION_DOWN)
867 r = journal_file_move_to_object(new_file, OBJECT_ENTRY, new_offset, &o);
871 set_location(j, LOCATION_DISCRETE, new_file, o, new_offset);
876 _public_ int sd_journal_next(sd_journal *j) {
877 return real_journal_next(j, DIRECTION_DOWN);
880 _public_ int sd_journal_previous(sd_journal *j) {
881 return real_journal_next(j, DIRECTION_UP);
884 static int real_journal_next_skip(sd_journal *j, direction_t direction, uint64_t skip) {
891 /* If this is not a discrete skip, then at least
892 * resolve the current location */
893 if (j->current_location.type != LOCATION_DISCRETE)
894 return real_journal_next(j, direction);
900 r = real_journal_next(j, direction);
914 _public_ int sd_journal_next_skip(sd_journal *j, uint64_t skip) {
915 return real_journal_next_skip(j, DIRECTION_DOWN, skip);
918 _public_ int sd_journal_previous_skip(sd_journal *j, uint64_t skip) {
919 return real_journal_next_skip(j, DIRECTION_UP, skip);
922 _public_ int sd_journal_get_cursor(sd_journal *j, char **cursor) {
925 char bid[33], sid[33];
932 if (!j->current_file || j->current_file->current_offset <= 0)
933 return -EADDRNOTAVAIL;
935 r = journal_file_move_to_object(j->current_file, OBJECT_ENTRY, j->current_file->current_offset, &o);
939 sd_id128_to_string(j->current_file->header->seqnum_id, sid);
940 sd_id128_to_string(o->entry.boot_id, bid);
943 "s=%s;i=%llx;b=%s;m=%llx;t=%llx;x=%llx",
944 sid, (unsigned long long) le64toh(o->entry.seqnum),
945 bid, (unsigned long long) le64toh(o->entry.monotonic),
946 (unsigned long long) le64toh(o->entry.realtime),
947 (unsigned long long) le64toh(o->entry.xor_hash)) < 0)
953 _public_ int sd_journal_seek_cursor(sd_journal *j, const char *cursor) {
957 unsigned long long seqnum, monotonic, realtime, xor_hash;
959 seqnum_id_set = false,
962 monotonic_set = false,
963 realtime_set = false,
964 xor_hash_set = false;
965 sd_id128_t seqnum_id, boot_id;
972 FOREACH_WORD_SEPARATOR(w, l, cursor, ";", state) {
976 if (l < 2 || w[1] != '=')
979 item = strndup(w, l);
986 seqnum_id_set = true;
987 k = sd_id128_from_string(item+2, &seqnum_id);
992 if (sscanf(item+2, "%llx", &seqnum) != 1)
998 k = sd_id128_from_string(item+2, &boot_id);
1002 monotonic_set = true;
1003 if (sscanf(item+2, "%llx", &monotonic) != 1)
1008 realtime_set = true;
1009 if (sscanf(item+2, "%llx", &realtime) != 1)
1014 xor_hash_set = true;
1015 if (sscanf(item+2, "%llx", &xor_hash) != 1)
1026 if ((!seqnum_set || !seqnum_id_set) &&
1027 (!monotonic_set || !boot_id_set) &&
1033 j->current_location.type = LOCATION_SEEK;
1036 j->current_location.realtime = (uint64_t) realtime;
1037 j->current_location.realtime_set = true;
1040 if (seqnum_set && seqnum_id_set) {
1041 j->current_location.seqnum = (uint64_t) seqnum;
1042 j->current_location.seqnum_id = seqnum_id;
1043 j->current_location.seqnum_set = true;
1046 if (monotonic_set && boot_id_set) {
1047 j->current_location.monotonic = (uint64_t) monotonic;
1048 j->current_location.boot_id = boot_id;
1049 j->current_location.monotonic_set = true;
1053 j->current_location.xor_hash = (uint64_t) xor_hash;
1054 j->current_location.xor_hash_set = true;
1060 _public_ int sd_journal_seek_monotonic_usec(sd_journal *j, sd_id128_t boot_id, uint64_t usec) {
1065 j->current_location.type = LOCATION_SEEK;
1066 j->current_location.boot_id = boot_id;
1067 j->current_location.monotonic = usec;
1068 j->current_location.monotonic_set = true;
1073 _public_ int sd_journal_seek_realtime_usec(sd_journal *j, uint64_t usec) {
1078 j->current_location.type = LOCATION_SEEK;
1079 j->current_location.realtime = usec;
1080 j->current_location.realtime_set = true;
1085 _public_ int sd_journal_seek_head(sd_journal *j) {
1090 j->current_location.type = LOCATION_HEAD;
1095 _public_ int sd_journal_seek_tail(sd_journal *j) {
1100 j->current_location.type = LOCATION_TAIL;
1105 static int add_file(sd_journal *j, const char *prefix, const char *filename) {
1114 if ((j->flags & SD_JOURNAL_SYSTEM_ONLY) &&
1115 !(streq(filename, "system.journal") ||
1116 streq(filename, "system.journal~") ||
1117 (startswith(filename, "system@") &&
1118 (endswith(filename, ".journal") || endswith(filename, ".journal~")))))
1121 path = strjoin(prefix, "/", filename, NULL);
1125 if (hashmap_get(j->files, path)) {
1130 if (hashmap_size(j->files) >= JOURNAL_FILES_MAX) {
1131 log_debug("Too many open journal files, not adding %s, ignoring.", path);
1136 r = journal_file_open(path, O_RDONLY, 0, false, false, NULL, j->mmap, NULL, &f);
1140 if (errno == ENOENT)
1146 /* journal_file_dump(f); */
1148 r = hashmap_put(j->files, f->path, f);
1150 journal_file_close(f);
1154 j->current_invalidate_counter ++;
1156 log_debug("File %s got added.", f->path);
1161 static int remove_file(sd_journal *j, const char *prefix, const char *filename) {
1169 path = strjoin(prefix, "/", filename, NULL);
1173 f = hashmap_get(j->files, path);
1178 hashmap_remove(j->files, f->path);
1179 journal_file_close(f);
1181 j->current_invalidate_counter ++;
1183 log_debug("File %s got removed.", f->path);
1187 static int add_directory(sd_journal *j, const char *prefix, const char *dirname) {
1198 if ((j->flags & SD_JOURNAL_LOCAL_ONLY) &&
1199 (sd_id128_from_string(dirname, &id) < 0 ||
1200 sd_id128_get_machine(&mid) < 0 ||
1201 !sd_id128_equal(id, mid)))
1204 path = strjoin(prefix, "/", dirname, NULL);
1210 log_debug("Failed to open %s: %m", path);
1213 if (errno == ENOENT)
1218 m = hashmap_get(j->directories_by_path, path);
1220 m = new0(Directory, 1);
1230 if (hashmap_put(j->directories_by_path, m->path, m) < 0) {
1237 j->current_invalidate_counter ++;
1239 log_debug("Directory %s got added.", m->path);
1241 } else if (m->is_root) {
1248 if (m->wd <= 0 && j->inotify_fd >= 0) {
1250 m->wd = inotify_add_watch(j->inotify_fd, m->path,
1251 IN_CREATE|IN_MOVED_TO|IN_MODIFY|IN_ATTRIB|IN_DELETE|
1252 IN_DELETE_SELF|IN_MOVE_SELF|IN_UNMOUNT|
1255 if (m->wd > 0 && hashmap_put(j->directories_by_wd, INT_TO_PTR(m->wd), m) < 0)
1256 inotify_rm_watch(j->inotify_fd, m->wd);
1261 union dirent_storage buf;
1263 r = readdir_r(d, &buf.de, &de);
1267 if (dirent_is_file_with_suffix(de, ".journal") ||
1268 dirent_is_file_with_suffix(de, ".journal~")) {
1269 r = add_file(j, m->path, de->d_name);
1271 log_debug("Failed to add file %s/%s: %s", m->path, de->d_name, strerror(-r));
1280 static int add_root_directory(sd_journal *j, const char *p) {
1288 if ((j->flags & SD_JOURNAL_RUNTIME_ONLY) &&
1289 !path_startswith(p, "/run"))
1296 m = hashmap_get(j->directories_by_path, p);
1298 m = new0(Directory, 1);
1305 m->path = strdup(p);
1312 if (hashmap_put(j->directories_by_path, m->path, m) < 0) {
1319 j->current_invalidate_counter ++;
1321 log_debug("Root directory %s got added.", m->path);
1323 } else if (!m->is_root) {
1328 if (m->wd <= 0 && j->inotify_fd >= 0) {
1330 m->wd = inotify_add_watch(j->inotify_fd, m->path,
1331 IN_CREATE|IN_MOVED_TO|IN_MODIFY|IN_ATTRIB|IN_DELETE|
1334 if (m->wd > 0 && hashmap_put(j->directories_by_wd, INT_TO_PTR(m->wd), m) < 0)
1335 inotify_rm_watch(j->inotify_fd, m->wd);
1340 union dirent_storage buf;
1343 r = readdir_r(d, &buf.de, &de);
1347 if (dirent_is_file_with_suffix(de, ".journal") ||
1348 dirent_is_file_with_suffix(de, ".journal~")) {
1349 r = add_file(j, m->path, de->d_name);
1351 log_debug("Failed to add file %s/%s: %s", m->path, de->d_name, strerror(-r));
1353 } else if ((de->d_type == DT_DIR || de->d_type == DT_LNK || de->d_type == DT_UNKNOWN) &&
1354 sd_id128_from_string(de->d_name, &id) >= 0) {
1356 r = add_directory(j, m->path, de->d_name);
1358 log_debug("Failed to add directory %s/%s: %s", m->path, de->d_name, strerror(-r));
1367 static int remove_directory(sd_journal *j, Directory *d) {
1371 hashmap_remove(j->directories_by_wd, INT_TO_PTR(d->wd));
1373 if (j->inotify_fd >= 0)
1374 inotify_rm_watch(j->inotify_fd, d->wd);
1377 hashmap_remove(j->directories_by_path, d->path);
1380 log_debug("Root directory %s got removed.", d->path);
1382 log_debug("Directory %s got removed.", d->path);
1390 static int add_search_paths(sd_journal *j) {
1392 const char search_paths[] =
1393 "/run/log/journal\0"
1394 "/var/log/journal\0";
1399 /* We ignore most errors here, since the idea is to only open
1400 * what's actually accessible, and ignore the rest. */
1402 NULSTR_FOREACH(p, search_paths)
1403 add_root_directory(j, p);
1408 static int allocate_inotify(sd_journal *j) {
1411 if (j->inotify_fd < 0) {
1412 j->inotify_fd = inotify_init1(IN_NONBLOCK|IN_CLOEXEC);
1413 if (j->inotify_fd < 0)
1417 if (!j->directories_by_wd) {
1418 j->directories_by_wd = hashmap_new(trivial_hash_func, trivial_compare_func);
1419 if (!j->directories_by_wd)
1426 static sd_journal *journal_new(int flags, const char *path) {
1429 j = new0(sd_journal, 1);
1437 j->path = strdup(path);
1444 j->files = hashmap_new(string_hash_func, string_compare_func);
1451 j->directories_by_path = hashmap_new(string_hash_func, string_compare_func);
1452 if (!j->directories_by_path) {
1453 hashmap_free(j->files);
1459 j->mmap = mmap_cache_new();
1461 hashmap_free(j->files);
1462 hashmap_free(j->directories_by_path);
1471 _public_ int sd_journal_open(sd_journal **ret, int flags) {
1478 if (flags & ~(SD_JOURNAL_LOCAL_ONLY|
1479 SD_JOURNAL_RUNTIME_ONLY|
1480 SD_JOURNAL_SYSTEM_ONLY))
1483 j = journal_new(flags, NULL);
1487 r = add_search_paths(j);
1495 sd_journal_close(j);
1500 _public_ int sd_journal_open_directory(sd_journal **ret, const char *path, int flags) {
1507 if (!path || !path_is_absolute(path))
1513 j = journal_new(flags, path);
1517 r = add_root_directory(j, path);
1525 sd_journal_close(j);
1530 _public_ void sd_journal_close(sd_journal *j) {
1537 while ((f = hashmap_steal_first(j->files)))
1538 journal_file_close(f);
1540 hashmap_free(j->files);
1542 while ((d = hashmap_first(j->directories_by_path)))
1543 remove_directory(j, d);
1545 while ((d = hashmap_first(j->directories_by_wd)))
1546 remove_directory(j, d);
1548 hashmap_free(j->directories_by_path);
1549 hashmap_free(j->directories_by_wd);
1551 if (j->inotify_fd >= 0)
1552 close_nointr_nofail(j->inotify_fd);
1554 sd_journal_flush_matches(j);
1557 mmap_cache_unref(j->mmap);
1563 _public_ int sd_journal_get_realtime_usec(sd_journal *j, uint64_t *ret) {
1573 f = j->current_file;
1575 return -EADDRNOTAVAIL;
1577 if (f->current_offset <= 0)
1578 return -EADDRNOTAVAIL;
1580 r = journal_file_move_to_object(f, OBJECT_ENTRY, f->current_offset, &o);
1584 *ret = le64toh(o->entry.realtime);
1588 _public_ int sd_journal_get_monotonic_usec(sd_journal *j, uint64_t *ret, sd_id128_t *ret_boot_id) {
1597 f = j->current_file;
1599 return -EADDRNOTAVAIL;
1601 if (f->current_offset <= 0)
1602 return -EADDRNOTAVAIL;
1604 r = journal_file_move_to_object(f, OBJECT_ENTRY, f->current_offset, &o);
1609 *ret_boot_id = o->entry.boot_id;
1611 r = sd_id128_get_boot(&id);
1615 if (!sd_id128_equal(id, o->entry.boot_id))
1620 *ret = le64toh(o->entry.monotonic);
1625 static bool field_is_valid(const char *field) {
1633 if (startswith(field, "__"))
1636 for (p = field; *p; p++) {
1641 if (*p >= 'A' && *p <= 'Z')
1644 if (*p >= '0' && *p <= '9')
1653 _public_ int sd_journal_get_data(sd_journal *j, const char *field, const void **data, size_t *size) {
1656 size_t field_length;
1669 if (!field_is_valid(field))
1672 f = j->current_file;
1674 return -EADDRNOTAVAIL;
1676 if (f->current_offset <= 0)
1677 return -EADDRNOTAVAIL;
1679 r = journal_file_move_to_object(f, OBJECT_ENTRY, f->current_offset, &o);
1683 field_length = strlen(field);
1685 n = journal_file_entry_n_items(o);
1686 for (i = 0; i < n; i++) {
1691 p = le64toh(o->entry.items[i].object_offset);
1692 le_hash = o->entry.items[i].hash;
1693 r = journal_file_move_to_object(f, OBJECT_DATA, p, &o);
1697 if (le_hash != o->data.hash)
1700 l = le64toh(o->object.size) - offsetof(Object, data.payload);
1702 if (o->object.flags & OBJECT_COMPRESSED) {
1705 if (uncompress_startswith(o->data.payload, l,
1706 &f->compress_buffer, &f->compress_buffer_size,
1707 field, field_length, '=')) {
1711 if (!uncompress_blob(o->data.payload, l,
1712 &f->compress_buffer, &f->compress_buffer_size, &rsize))
1715 *data = f->compress_buffer;
1716 *size = (size_t) rsize;
1721 return -EPROTONOSUPPORT;
1724 } else if (l >= field_length+1 &&
1725 memcmp(o->data.payload, field, field_length) == 0 &&
1726 o->data.payload[field_length] == '=') {
1730 if ((uint64_t) t != l)
1733 *data = o->data.payload;
1739 r = journal_file_move_to_object(f, OBJECT_ENTRY, f->current_offset, &o);
1747 _public_ int sd_journal_enumerate_data(sd_journal *j, const void **data, size_t *size) {
1762 f = j->current_file;
1764 return -EADDRNOTAVAIL;
1766 if (f->current_offset <= 0)
1767 return -EADDRNOTAVAIL;
1769 r = journal_file_move_to_object(f, OBJECT_ENTRY, f->current_offset, &o);
1773 n = journal_file_entry_n_items(o);
1774 if (j->current_field >= n)
1777 p = le64toh(o->entry.items[j->current_field].object_offset);
1778 le_hash = o->entry.items[j->current_field].hash;
1779 r = journal_file_move_to_object(f, OBJECT_DATA, p, &o);
1783 if (le_hash != o->data.hash)
1786 l = le64toh(o->object.size) - offsetof(Object, data.payload);
1789 /* We can't read objects larger than 4G on a 32bit machine */
1790 if ((uint64_t) t != l)
1793 if (o->object.flags & OBJECT_COMPRESSED) {
1797 if (!uncompress_blob(o->data.payload, l, &f->compress_buffer, &f->compress_buffer_size, &rsize))
1800 *data = f->compress_buffer;
1801 *size = (size_t) rsize;
1803 return -EPROTONOSUPPORT;
1806 *data = o->data.payload;
1810 j->current_field ++;
1815 _public_ void sd_journal_restart_data(sd_journal *j) {
1819 j->current_field = 0;
1822 _public_ int sd_journal_get_fd(sd_journal *j) {
1828 if (j->inotify_fd >= 0)
1829 return j->inotify_fd;
1831 r = allocate_inotify(j);
1835 /* Iterate through all dirs again, to add them to the
1838 r = add_root_directory(j, j->path);
1840 r = add_search_paths(j);
1844 return j->inotify_fd;
1847 static void process_inotify_event(sd_journal *j, struct inotify_event *e) {
1854 /* Is this a subdirectory we watch? */
1855 d = hashmap_get(j->directories_by_wd, INT_TO_PTR(e->wd));
1859 if (!(e->mask & IN_ISDIR) && e->len > 0 &&
1860 (endswith(e->name, ".journal") ||
1861 endswith(e->name, ".journal~"))) {
1863 /* Event for a journal file */
1865 if (e->mask & (IN_CREATE|IN_MOVED_TO|IN_MODIFY|IN_ATTRIB)) {
1866 r = add_file(j, d->path, e->name);
1868 log_debug("Failed to add file %s/%s: %s", d->path, e->name, strerror(-r));
1870 } else if (e->mask & (IN_DELETE|IN_UNMOUNT)) {
1872 r = remove_file(j, d->path, e->name);
1874 log_debug("Failed to remove file %s/%s: %s", d->path, e->name, strerror(-r));
1877 } else if (!d->is_root && e->len == 0) {
1879 /* Event for a subdirectory */
1881 if (e->mask & (IN_DELETE_SELF|IN_MOVE_SELF|IN_UNMOUNT)) {
1882 r = remove_directory(j, d);
1884 log_debug("Failed to remove directory %s: %s", d->path, strerror(-r));
1888 } else if (d->is_root && (e->mask & IN_ISDIR) && e->len > 0 && sd_id128_from_string(e->name, &id) >= 0) {
1890 /* Event for root directory */
1892 if (e->mask & (IN_CREATE|IN_MOVED_TO|IN_MODIFY|IN_ATTRIB)) {
1893 r = add_directory(j, d->path, e->name);
1895 log_debug("Failed to add directory %s/%s: %s", d->path, e->name, strerror(-r));
1902 if (e->mask & IN_IGNORED)
1905 log_warning("Unknown inotify event.");
1908 static int determine_change(sd_journal *j) {
1913 b = j->current_invalidate_counter != j->last_invalidate_counter;
1914 j->last_invalidate_counter = j->current_invalidate_counter;
1916 return b ? SD_JOURNAL_INVALIDATE : SD_JOURNAL_APPEND;
1919 _public_ int sd_journal_process(sd_journal *j) {
1920 uint8_t buffer[sizeof(struct inotify_event) + FILENAME_MAX] _alignas_(struct inotify_event);
1921 bool got_something = false;
1927 struct inotify_event *e;
1930 l = read(j->inotify_fd, buffer, sizeof(buffer));
1932 if (errno == EAGAIN || errno == EINTR)
1933 return got_something ? determine_change(j) : SD_JOURNAL_NOP;
1938 got_something = true;
1940 e = (struct inotify_event*) buffer;
1944 process_inotify_event(j, e);
1946 step = sizeof(struct inotify_event) + e->len;
1947 assert(step <= (size_t) l);
1949 e = (struct inotify_event*) ((uint8_t*) e + step);
1954 return determine_change(j);
1957 _public_ int sd_journal_wait(sd_journal *j, uint64_t timeout_usec) {
1962 if (j->inotify_fd < 0) {
1964 /* This is the first invocation, hence create the
1966 r = sd_journal_get_fd(j);
1970 /* The journal might have changed since the context
1971 * object was created and we weren't watching before,
1972 * hence don't wait for anything, and return
1974 return determine_change(j);
1978 r = fd_wait_for_event(j->inotify_fd, POLLIN, timeout_usec);
1979 } while (r == -EINTR);
1984 return sd_journal_process(j);
1987 _public_ int sd_journal_get_cutoff_realtime_usec(sd_journal *j, uint64_t *from, uint64_t *to) {
1998 HASHMAP_FOREACH(f, j->files, i) {
2001 r = journal_file_get_cutoff_realtime_usec(f, &fr, &t);
2017 *from = MIN(fr, *from);
2023 return first ? 0 : 1;
2026 _public_ int sd_journal_get_cutoff_monotonic_usec(sd_journal *j, sd_id128_t boot_id, uint64_t *from, uint64_t *to) {
2037 HASHMAP_FOREACH(f, j->files, i) {
2040 r = journal_file_get_cutoff_monotonic_usec(f, boot_id, &fr, &t);
2056 *from = MIN(fr, *from);
2062 return first ? 0 : 1;
2065 void journal_print_header(sd_journal *j) {
2068 bool newline = false;
2072 HASHMAP_FOREACH(f, j->files, i) {
2078 journal_file_print_header(f);
2082 _public_ int sd_journal_get_usage(sd_journal *j, uint64_t *bytes) {
2092 HASHMAP_FOREACH(f, j->files, i) {
2095 if (fstat(f->fd, &st) < 0)
2098 sum += (uint64_t) st.st_blocks * 512ULL;
2105 /* _public_ int sd_journal_query_unique(sd_journal *j, const char *field) { */
2107 /* return -EINVAL; */
2109 /* return -EINVAL; */
2111 /* return -ENOTSUP; */
2114 /* _public_ int sd_journal_enumerate_unique(sd_journal *j, const void **data, size_t *l) { */
2116 /* return -EINVAL; */
2118 /* return -EINVAL; */
2120 /* return -EINVAL; */
2122 /* return -ENOTSUP; */
2125 /* _public_ void sd_journal_restart_unique(sd_journal *j) { */