hashmap: drop assert(h) from hashmap_next()

[elogind.git] / src / shared / hashmap.c
diff --git a/src/shared/hashmap.c b/src/shared/hashmap.c

index f06fce6ef30ed585fd753deec15ad0ee1668363f..8225b8ebccd5e742eea1f90b42091c1c48238254 100644 (file)
--- a/src/shared/hashmap.c
+++ b/src/shared/hashmap.c
@@ -24,13 +24,10 @@
  #include <string.h>
  #include <errno.h>
  
-#ifdef HAVE_SYS_AUXV_H
-#include <sys/auxv.h>
-#endif
-
  #include "util.h"
  #include "hashmap.h"
  #include "macro.h"
+#include "siphash24.h"
  
  #define INITIAL_N_BUCKETS 31
  
@@ -42,16 +39,15 @@ struct hashmap_entry {
  };
  
  struct Hashmap {
-        hash_func_t hash_func;
-        compare_func_t compare_func;
+        const struct hash_ops *hash_ops;
  
          struct hashmap_entry *iterate_list_head, *iterate_list_tail;
  
          struct hashmap_entry ** buckets;
          unsigned n_buckets, n_entries;
  
-        unsigned random_xor;
-        bool from_pool;
+        uint8_t hash_key[HASH_KEY_SIZE];
+        bool from_pool:1;
  };
  
  struct pool {
@@ -66,13 +62,14 @@ static void *first_hashmap_tile = NULL;
  static struct pool *first_entry_pool = NULL;
  static void *first_entry_tile = NULL;
  
-static void* allocate_tile(struct pool **first_pool, void **first_tile, size_t tile_size) {
+static void* allocate_tile(struct pool **first_pool, void **first_tile, size_t tile_size, unsigned at_least) {
          unsigned i;
  
          /* When a tile is released we add it to the list and simply
           * place the next pointer at its offset 0. */
  
          assert(tile_size >= sizeof(void*));
+        assert(at_least > 0);
  
          if (*first_tile) {
                  void *r;
@@ -88,7 +85,7 @@ static void* allocate_tile(struct pool **first_pool, void **first_tile, size_t t
                  struct pool *p;
  
                  n = *first_pool ? (*first_pool)->n_tiles : 0;
-                n = MAX(512U, n * 2);
+                n = MAX(at_least, n * 2);
                  size = PAGE_ALIGN(ALIGN(sizeof(struct pool)) + n*tile_size);
                  n = (size - ALIGN(sizeof(struct pool))) / tile_size;
  
@@ -133,69 +130,112 @@ __attribute__((destructor)) static void cleanup_pool(void) {
  
  #endif
  
-unsigned string_hash_func(const void *p) {
-        unsigned hash = 5381;
-        const signed char *c;
-
-        /* DJB's hash function */
-
-        for (c = p; *c; c++)
-                hash = (hash << 5) + hash + (unsigned) *c;
-
-        return hash;
+unsigned long string_hash_func(const void *p, const uint8_t hash_key[HASH_KEY_SIZE]) {
+        uint64_t u;
+        siphash24((uint8_t*) &u, p, strlen(p), hash_key);
+        return (unsigned long) u;
  }
  
  int string_compare_func(const void *a, const void *b) {
          return strcmp(a, b);
  }
  
-unsigned trivial_hash_func(const void *p) {
-        return PTR_TO_UINT(p);
+const struct hash_ops string_hash_ops = {
+        .hash = string_hash_func,
+        .compare = string_compare_func
+};
+
+unsigned long trivial_hash_func(const void *p, const uint8_t hash_key[HASH_KEY_SIZE]) {
+        uint64_t u;
+        siphash24((uint8_t*) &u, &p, sizeof(p), hash_key);
+        return (unsigned long) u;
  }
  
  int trivial_compare_func(const void *a, const void *b) {
          return a < b ? -1 : (a > b ? 1 : 0);
  }
  
-unsigned uint64_hash_func(const void *p) {
-        uint64_t u;
-
-        assert_cc(sizeof(uint64_t) == 2*sizeof(unsigned));
-
-        u = *(const uint64_t*) p;
+const struct hash_ops trivial_hash_ops = {
+        .hash = trivial_hash_func,
+        .compare = trivial_compare_func
+};
  
-        return (unsigned) ((u >> 32) ^ u);
+unsigned long uint64_hash_func(const void *p, const uint8_t hash_key[HASH_KEY_SIZE]) {
+        uint64_t u;
+        siphash24((uint8_t*) &u, p, sizeof(uint64_t), hash_key);
+        return (unsigned long) u;
  }
  
  int uint64_compare_func(const void *_a, const void *_b) {
          uint64_t a, b;
-
          a = *(const uint64_t*) _a;
          b = *(const uint64_t*) _b;
+        return a < b ? -1 : (a > b ? 1 : 0);
+}
  
+const struct hash_ops uint64_hash_ops = {
+        .hash = uint64_hash_func,
+        .compare = uint64_compare_func
+};
+
+#if SIZEOF_DEV_T != 8
+unsigned long devt_hash_func(const void *p, const uint8_t hash_key[HASH_KEY_SIZE]) {
+        uint64_t u;
+        siphash24((uint8_t*) &u, p, sizeof(dev_t), hash_key);
+        return (unsigned long) u;
+}
+
+int devt_compare_func(const void *_a, const void *_b) {
+        dev_t a, b;
+        a = *(const dev_t*) _a;
+        b = *(const dev_t*) _b;
          return a < b ? -1 : (a > b ? 1 : 0);
  }
  
+const struct hash_ops devt_hash_ops = {
+        .hash = devt_hash_func,
+        .compare = devt_compare_func
+};
+#endif
+
  static unsigned bucket_hash(Hashmap *h, const void *p) {
-        return (h->hash_func(p) ^ h->random_xor) % h->n_buckets;
+        return (unsigned) (h->hash_ops->hash(p, h->hash_key) % h->n_buckets);
  }
  
-Hashmap *hashmap_new(hash_func_t hash_func, compare_func_t compare_func) {
+static void get_hash_key(uint8_t hash_key[HASH_KEY_SIZE], bool reuse_is_ok) {
+        static uint8_t current[HASH_KEY_SIZE];
+        static bool current_initialized = false;
+
+        /* Returns a hash function key to use. In order to keep things
+         * fast we will not generate a new key each time we allocate a
+         * new hash table. Instead, we'll just reuse the most recently
+         * generated one, except if we never generated one or when we
+         * are rehashing an entire hash table because we reached a
+         * fill level */
+
+        if (!current_initialized || !reuse_is_ok) {
+                random_bytes(current, sizeof(current));
+                current_initialized = true;
+        }
+
+        memcpy(hash_key, current, sizeof(current));
+}
+
+Hashmap *hashmap_new(const struct hash_ops *hash_ops) {
          bool b;
          Hashmap *h;
          size_t size;
-        void *auxv;
  
          b = is_main_thread();
  
          size = ALIGN(sizeof(Hashmap)) + INITIAL_N_BUCKETS * sizeof(struct hashmap_entry*);
  
          if (b) {
-                h = allocate_tile(&first_hashmap_pool, &first_hashmap_tile, size);
+                h = allocate_tile(&first_hashmap_pool, &first_hashmap_tile, size, 8);
                  if (!h)
                          return NULL;
  
-                memset(h, 0, size);
+                memzero(h, size);
          } else {
                  h = malloc0(size);
  
@@ -203,8 +243,7 @@ Hashmap *hashmap_new(hash_func_t hash_func, compare_func_t compare_func) {
                          return NULL;
          }
  
-        h->hash_func = hash_func ? hash_func : trivial_hash_func;
-        h->compare_func = compare_func ? compare_func : trivial_compare_func;
+        h->hash_ops = hash_ops ? hash_ops : &trivial_hash_ops;
  
          h->n_buckets = INITIAL_N_BUCKETS;
          h->n_entries = 0;
@@ -214,23 +253,12 @@ Hashmap *hashmap_new(hash_func_t hash_func, compare_func_t compare_func) {
  
          h->from_pool = b;
  
-        /* Let's randomize our hash functions a bit so that they are
-         * harder to guess for clients. For this, start out by cheaply
-         * using some bits the kernel passed into the process using
-         * the auxiliary vector. If the hashmap grows later on we will
-         * rehash everything using a new random XOR mask from
-         * /dev/random. */
-#ifdef HAVE_SYS_AUXV_H
-        auxv = (void*) getauxval(AT_RANDOM);
-        h->random_xor = auxv ? *(unsigned*) auxv : random_u();
-#else
-        h->random_xor = random_u();
-#endif
+        get_hash_key(h->hash_key, true);
  
          return h;
  }
  
-int hashmap_ensure_allocated(Hashmap **h, hash_func_t hash_func, compare_func_t compare_func) {
+int hashmap_ensure_allocated(Hashmap **h, const struct hash_ops *hash_ops) {
          Hashmap *q;
  
          assert(h);
@@ -238,7 +266,7 @@ int hashmap_ensure_allocated(Hashmap **h, hash_func_t hash_func, compare_func_t
          if (*h)
                  return 0;
  
-        q = hashmap_new(hash_func, compare_func);
+        q = hashmap_new(hash_ops);
          if (!q)
                  return -ENOMEM;
  
@@ -396,7 +424,7 @@ static struct hashmap_entry *hash_scan(Hashmap *h, unsigned hash, const void *ke
          assert(hash < h->n_buckets);
  
          for (e = h->buckets[hash]; e; e = e->bucket_next)
-                if (h->compare_func(e->key, key) == 0)
+                if (h->hash_ops->compare(e->key, key) == 0)
                          return e;
  
          return NULL;
@@ -404,7 +432,8 @@ static struct hashmap_entry *hash_scan(Hashmap *h, unsigned hash, const void *ke
  
  static bool resize_buckets(Hashmap *h) {
          struct hashmap_entry **n, *i;
-        unsigned m, nxor;
+        unsigned m;
+        uint8_t nkey[HASH_KEY_SIZE];
  
          assert(h);
  
@@ -419,15 +448,15 @@ static bool resize_buckets(Hashmap *h) {
          if (!n)
                  return false;
  
-        /* Let's use a different randomized xor value for the
+        /* Let's use a different randomized hash key for the
           * extension, so that people cannot guess what we are using
           * here forever */
-        nxor = random_u();
+        get_hash_key(nkey, false);
  
          for (i = h->iterate_list_head; i; i = i->iterate_next) {
-                unsigned hash, x;
+                unsigned long old_bucket, new_bucket;
  
-                hash = h->hash_func(i->key);
+                old_bucket = h->hash_ops->hash(i->key, h->hash_key) % h->n_buckets;
  
                  /* First, drop from old bucket table */
                  if (i->bucket_next)
@@ -436,16 +465,16 @@ static bool resize_buckets(Hashmap *h) {
                  if (i->bucket_previous)
                          i->bucket_previous->bucket_next = i->bucket_next;
                  else
-                        h->buckets[(hash ^ h->random_xor) % h->n_buckets] = i->bucket_next;
+                        h->buckets[old_bucket] = i->bucket_next;
  
                  /* Then, add to new backet table */
-                x = (hash ^ nxor) % m;
+                new_bucket = h->hash_ops->hash(i->key, nkey) % m;
  
-                i->bucket_next = n[x];
+                i->bucket_next = n[new_bucket];
                  i->bucket_previous = NULL;
-                if (n[x])
-                        n[x]->bucket_previous = i;
-                n[x] = i;
+                if (n[new_bucket])
+                        n[new_bucket]->bucket_previous = i;
+                n[new_bucket] = i;
          }
  
          if (h->buckets != (struct hashmap_entry**) ((uint8_t*) h + ALIGN(sizeof(Hashmap))))
@@ -453,30 +482,22 @@ static bool resize_buckets(Hashmap *h) {
  
          h->buckets = n;
          h->n_buckets = m;
-        h->random_xor = nxor;
+
+        memcpy(h->hash_key, nkey, HASH_KEY_SIZE);
  
          return true;
  }
  
-int hashmap_put(Hashmap *h, const void *key, void *value) {
-        struct hashmap_entry *e;
-        unsigned hash;
-
-        assert(h);
+static int __hashmap_put(Hashmap *h, const void *key, void *value, unsigned hash) {
+        /* For when we know no such entry exists yet */
  
-        hash = bucket_hash(h, key);
-        e = hash_scan(h, hash, key);
-        if (e) {
-                if (e->value == value)
-                        return 0;
-                return -EEXIST;
-        }
+        struct hashmap_entry *e;
  
          if (resize_buckets(h))
                  hash = bucket_hash(h, key);
  
          if (h->from_pool)
-                e = allocate_tile(&first_entry_pool, &first_entry_tile, sizeof(struct hashmap_entry));
+                e = allocate_tile(&first_entry_pool, &first_entry_tile, sizeof(struct hashmap_entry), 64U);
          else
                  e = new(struct hashmap_entry, 1);
  
@@ -491,6 +512,23 @@ int hashmap_put(Hashmap *h, const void *key, void *value) {
          return 1;
  }
  
+int hashmap_put(Hashmap *h, const void *key, void *value) {
+        struct hashmap_entry *e;
+        unsigned hash;
+
+        assert(h);
+
+        hash = bucket_hash(h, key);
+        e = hash_scan(h, hash, key);
+        if (e) {
+                if (e->value == value)
+                        return 0;
+                return -EEXIST;
+        }
+
+        return __hashmap_put(h, key, value, hash);
+}
+
  int hashmap_replace(Hashmap *h, const void *key, void *value) {
          struct hashmap_entry *e;
          unsigned hash;
@@ -505,7 +543,7 @@ int hashmap_replace(Hashmap *h, const void *key, void *value) {
                  return 0;
          }
  
-        return hashmap_put(h, key, value);
+        return __hashmap_put(h, key, value, hash);
  }
  
  int hashmap_update(Hashmap *h, const void *key, void *value) {
@@ -585,6 +623,34 @@ void* hashmap_remove(Hashmap *h, const void *key) {
          return data;
  }
  
+void* hashmap_remove2(Hashmap *h, const void *key, void **rkey) {
+        struct hashmap_entry *e;
+        unsigned hash;
+        void *data;
+
+        if (!h) {
+                if (rkey)
+                        *rkey = NULL;
+                return NULL;
+        }
+
+        hash = bucket_hash(h, key);
+        e = hash_scan(h, hash, key);
+        if (!e) {
+                if (rkey)
+                        *rkey = NULL;
+                return NULL;
+        }
+
+        data = e->value;
+        if (rkey)
+                *rkey = (void*) e->key;
+
+        remove_entry(h, e);
+
+        return data;
+}
+
  int hashmap_remove_and_put(Hashmap *h, const void *old_key, const void *new_key, void *value) {
          struct hashmap_entry *e;
          unsigned old_hash, new_hash;
@@ -695,59 +761,6 @@ at_end:
          return NULL;
  }
  
-void *hashmap_iterate_backwards(Hashmap *h, Iterator *i, const void **key) {
-        struct hashmap_entry *e;
-
-        assert(i);
-
-        if (!h)
-                goto at_beginning;
-
-        if (*i == ITERATOR_FIRST)
-                goto at_beginning;
-
-        if (*i == ITERATOR_LAST && !h->iterate_list_tail)
-                goto at_beginning;
-
-        e = *i == ITERATOR_LAST ? h->iterate_list_tail : (struct hashmap_entry*) *i;
-
-        if (e->iterate_previous)
-                *i = (Iterator) e->iterate_previous;
-        else
-                *i = ITERATOR_FIRST;
-
-        if (key)
-                *key = e->key;
-
-        return e->value;
-
-at_beginning:
-        *i = ITERATOR_FIRST;
-
-        if (key)
-                *key = NULL;
-
-        return NULL;
-}
-
-void *hashmap_iterate_skip(Hashmap *h, const void *key, Iterator *i) {
-        unsigned hash;
-        struct hashmap_entry *e;
-
-        if (!h)
-                return NULL;
-
-        hash = bucket_hash(h, key);
-
-        e = hash_scan(h, hash, key);
-        if (!e)
-                return NULL;
-
-        *i = (Iterator) e;
-
-        return e->value;
-}
-
  void* hashmap_first(Hashmap *h) {
  
          if (!h)
@@ -770,17 +783,6 @@ void* hashmap_first_key(Hashmap *h) {
          return (void*) h->iterate_list_head->key;
  }
  
-void* hashmap_last(Hashmap *h) {
-
-        if (!h)
-                return NULL;
-
-        if (!h->iterate_list_tail)
-                return NULL;
-
-        return h->iterate_list_tail->value;
-}
-
  void* hashmap_steal_first(Hashmap *h) {
          void *data;
  
@@ -884,15 +886,15 @@ int hashmap_move_one(Hashmap *h, Hashmap *other, const void *key) {
          unsigned h_hash, other_hash;
          struct hashmap_entry *e;
  
-        if (!other)
-                return 0;
-
          assert(h);
  
          h_hash = bucket_hash(h, key);
          if (hash_scan(h, h_hash, key))
                  return -EEXIST;
  
+        if (!other)
+                return -ENOENT;
+
          other_hash = bucket_hash(other, key);
          e = hash_scan(other, other_hash, key);
          if (!e)
@@ -909,7 +911,7 @@ Hashmap *hashmap_copy(Hashmap *h) {
  
          assert(h);
  
-        copy = hashmap_new(h->hash_func, h->compare_func);
+        copy = hashmap_new(h->hash_ops);
          if (!copy)
                  return NULL;
  
@@ -943,7 +945,6 @@ void *hashmap_next(Hashmap *h, const void *key) {
          unsigned hash;
          struct hashmap_entry *e;
  
-        assert(h);
          assert(key);
  
          if (!h)