1 /* SPDX-License-Identifier: LGPL-2.1+ */
2 /***
3 Copyright © 2014 Michal Schmidt
4 ***/
5
6 #include <errno.h>
7 #include <stdint.h>
8 #include <stdlib.h>
9 #include <string.h>
10
11 #include "alloc-util.h"
12 #include "hashmap.h"
13 #include "fileio.h"
14 #include "macro.h"
15 #include "mempool.h"
16 #include "process-util.h"
17 #include "random-util.h"
18 #include "set.h"
19 #include "siphash24.h"
20 #include "string-util.h"
21 #include "strv.h"
22 #include "util.h"
23
24 #if ENABLE_DEBUG_HASHMAP
25 #include <pthread.h>
26 #include "list.h"
27 #endif
28
29 /*
30 * Implementation of hashmaps.
31 * Addressing: open
32 * - uses less RAM compared to closed addressing (chaining), because
33 * our entries are small (especially in Sets, which tend to contain
34 * the majority of entries in systemd).
35 * Collision resolution: Robin Hood
36 * - tends to equalize displacement of entries from their optimal buckets.
37 * Probe sequence: linear
38 * - though theoretically worse than random probing/uniform hashing/double
39 * hashing, it is good for cache locality.
40 *
41 * References:
42 * Celis, P. 1986. Robin Hood Hashing.
43  * Ph.D. Dissertation. University of Waterloo, Waterloo, Ont., Canada.
44 * https://cs.uwaterloo.ca/research/tr/1986/CS-86-14.pdf
45 * - The results are derived for random probing. Suggests deletion with
46 * tombstones and two mean-centered search methods. None of that works
47 * well for linear probing.
48 *
49 * Janson, S. 2005. Individual displacements for linear probing hashing with different insertion policies.
50 * ACM Trans. Algorithms 1, 2 (October 2005), 177-213.
51 * DOI=10.1145/1103963.1103964 http://doi.acm.org/10.1145/1103963.1103964
52 * http://www.math.uu.se/~svante/papers/sj157.pdf
53 * - Applies to Robin Hood with linear probing. Contains remarks on
54 * the unsuitability of mean-centered search with linear probing.
55 *
56 * Viola, A. 2005. Exact distribution of individual displacements in linear probing hashing.
57 * ACM Trans. Algorithms 1, 2 (October 2005), 214-242.
58 * DOI=10.1145/1103963.1103965 http://doi.acm.org/10.1145/1103963.1103965
59 * - Similar to Janson. Note that Viola writes about C_{m,n} (number of probes
60 * in a successful search), and Janson writes about displacement. C = d + 1.
61 *
62 * Goossaert, E. 2013. Robin Hood hashing: backward shift deletion.
63 * http://codecapsule.com/2013/11/17/robin-hood-hashing-backward-shift-deletion/
64 * - Explanation of backward shift deletion with pictures.
65 *
66 * Khuong, P. 2013. The Other Robin Hood Hashing.
67 * http://www.pvk.ca/Blog/2013/11/26/the-other-robin-hood-hashing/
68 * - Short summary of random vs. linear probing, and tombstones vs. backward shift.
69 */
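
/*
 * Illustrative example (not part of the build; bucket contents are made up):
 * how the Distance from Initial Bucket (DIB) drives a Robin Hood insertion
 * with linear probing, as implemented by hashmap_put_robin_hood() below.
 *
 *   state:  [0] A dib=0   [1] B dib=1   [2] C dib=0   [3] free
 *   insert X, which hashes to bucket 0:
 *     bucket 0: A's dib 0 is not < X's distance 0 -> keep probing
 *     bucket 1: B's dib 1 is not < X's distance 1 -> keep probing
 *     bucket 2: C's dib 0 < X's distance 2        -> X takes bucket 2 (dib 2),
 *                                                    C is displaced
 *     bucket 3: free                              -> C is stored with dib 1
 */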
70
71 /*
72 * XXX Ideas for improvement:
73 * For unordered hashmaps, randomize iteration order, similarly to Perl:
74 * http://blog.booking.com/hardening-perls-hash-function.html
75 */
76
77 /* INV_KEEP_FREE = 1 / (1 - max_load_factor)
78 * e.g. 1 / (1 - 0.8) = 5 ... keep one fifth of the buckets free. */
79 #define INV_KEEP_FREE 5U
80
81 /* Fields common to entries of all hashmap/set types */
82 struct hashmap_base_entry {
83 const void *key;
84 };
85
86 /* Entry types for specific hashmap/set types
87 * hashmap_base_entry must be at the beginning of each entry struct. */
88
89 struct plain_hashmap_entry {
90 struct hashmap_base_entry b;
91 void *value;
92 };
93
94 struct ordered_hashmap_entry {
95 struct plain_hashmap_entry p;
96 unsigned iterate_next, iterate_previous;
97 };
98
99 struct set_entry {
100 struct hashmap_base_entry b;
101 };
102
103 /* In several functions it is advantageous to have the hash table extended
104 * virtually by a couple of additional buckets. We reserve special index values
105 * for these "swap" buckets. */
106 #define _IDX_SWAP_BEGIN (UINT_MAX - 3)
107 #define IDX_PUT (_IDX_SWAP_BEGIN + 0)
108 #define IDX_TMP (_IDX_SWAP_BEGIN + 1)
109 #define _IDX_SWAP_END (_IDX_SWAP_BEGIN + 2)
110
111 #define IDX_FIRST (UINT_MAX - 1) /* special index for freshly initialized iterators */
112 #define IDX_NIL UINT_MAX /* special index value meaning "none" or "end" */
113
114 assert_cc(IDX_FIRST == _IDX_SWAP_END);
115 assert_cc(IDX_FIRST == _IDX_ITERATOR_FIRST);
116
117 /* Storage space for the "swap" buckets.
118  * All entry types can fit into an ordered_hashmap_entry. */
119 struct swap_entries {
120 struct ordered_hashmap_entry e[_IDX_SWAP_END - _IDX_SWAP_BEGIN];
121 };
122
123 /* Distance from Initial Bucket */
124 typedef uint8_t dib_raw_t;
125 #define DIB_RAW_OVERFLOW ((dib_raw_t)0xfdU) /* indicates DIB value is greater than representable */
126 #define DIB_RAW_REHASH ((dib_raw_t)0xfeU) /* entry yet to be rehashed during in-place resize */
127 #define DIB_RAW_FREE ((dib_raw_t)0xffU) /* a free bucket */
128 #define DIB_RAW_INIT ((char)DIB_RAW_FREE) /* a byte to memset a DIB store with when initializing */
129
130 #define DIB_FREE UINT_MAX
131
132 #if ENABLE_DEBUG_HASHMAP
133 struct hashmap_debug_info {
134 LIST_FIELDS(struct hashmap_debug_info, debug_list);
135 unsigned max_entries; /* high watermark of n_entries */
136
137 /* who allocated this hashmap */
138 int line;
139 const char *file;
140 const char *func;
141
142 /* fields to detect modification while iterating */
143 unsigned put_count; /* counts puts into the hashmap */
144 unsigned rem_count; /* counts removals from hashmap */
145 unsigned last_rem_idx; /* remembers last removal index */
146 };
147
148 /* Tracks all existing hashmaps. Get at it from gdb. See sd_dump_hashmaps.py */
149 static LIST_HEAD(struct hashmap_debug_info, hashmap_debug_list);
150 static pthread_mutex_t hashmap_debug_list_mutex = PTHREAD_MUTEX_INITIALIZER;
151
152 #define HASHMAP_DEBUG_FIELDS struct hashmap_debug_info debug;
153
154 #else /* !ENABLE_DEBUG_HASHMAP */
155 #define HASHMAP_DEBUG_FIELDS
156 #endif /* ENABLE_DEBUG_HASHMAP */
157
158 enum HashmapType {
159 HASHMAP_TYPE_PLAIN,
160 HASHMAP_TYPE_ORDERED,
161 HASHMAP_TYPE_SET,
162 _HASHMAP_TYPE_MAX
163 };
164
165 struct _packed_ indirect_storage {
166 void *storage; /* where buckets and DIBs are stored */
167 uint8_t hash_key[HASH_KEY_SIZE]; /* hash key; changes during resize */
168
169 unsigned n_entries; /* number of stored entries */
170 unsigned n_buckets; /* number of buckets */
171
172 unsigned idx_lowest_entry; /* Index below which all buckets are free.
173 Makes "while(hashmap_steal_first())" loops
174 O(n) instead of O(n^2) for unordered hashmaps. */
175 uint8_t _pad[3]; /* padding for the whole HashmapBase */
176 /* The bitfields in HashmapBase complete the alignment of the whole thing. */
177 };
178
179 struct direct_storage {
180 /* This gives us 39 bytes on 64bit, or 35 bytes on 32bit.
181 * That's room for 4 set_entries + 4 DIB bytes + 3 unused bytes on 64bit,
182 * or 7 set_entries + 7 DIB bytes + 0 unused bytes on 32bit. */
183 uint8_t storage[sizeof(struct indirect_storage)];
184 };
185
186 #define DIRECT_BUCKETS(entry_t) \
187 (sizeof(struct direct_storage) / (sizeof(entry_t) + sizeof(dib_raw_t)))
188
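/* Worked example of the macro above (sizes depend on the target ABI; the figures
 * below assume the common 64-bit case from the direct_storage comment): the union
 * provides sizeof(struct indirect_storage) = 39 bytes, a set bucket costs
 * sizeof(struct set_entry) + sizeof(dib_raw_t) = 8 + 1 = 9 bytes, so
 * DIRECT_BUCKETS(struct set_entry) = 39 / 9 = 4; an ordered bucket costs
 * 24 + 1 = 25 bytes, so DIRECT_BUCKETS(struct ordered_hashmap_entry) = 1. */
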
189 /* We should be able to store at least one entry directly. */
190 assert_cc(DIRECT_BUCKETS(struct ordered_hashmap_entry) >= 1);
191
192 /* We have 3 bits for n_direct_entries. */
193 assert_cc(DIRECT_BUCKETS(struct set_entry) < (1 << 3));
194
195 /* Hashmaps with directly stored entries all use this shared hash key.
196 * It's no big deal if the key is guessed, because there can be only
197 * a handful of directly stored entries in a hashmap. When a hashmap
198 * outgrows direct storage, it gets its own key for indirect storage. */
199 static uint8_t shared_hash_key[HASH_KEY_SIZE];
200 static bool shared_hash_key_initialized;
201
202 /* Fields that all hashmap/set types must have */
203 struct HashmapBase {
204 const struct hash_ops *hash_ops; /* hash and compare ops to use */
205
206 union _packed_ {
207 struct indirect_storage indirect; /* if has_indirect */
208 struct direct_storage direct; /* if !has_indirect */
209 };
210
211 enum HashmapType type:2; /* HASHMAP_TYPE_* */
212 bool has_indirect:1; /* whether indirect storage is used */
213 unsigned n_direct_entries:3; /* Number of entries in direct storage.
214 * Only valid if !has_indirect. */
215 bool from_pool:1; /* whether was allocated from mempool */
216 bool dirty:1; /* whether dirtied since last iterated_cache_get() */
217 bool cached:1; /* whether this hashmap is being cached */
218 HASHMAP_DEBUG_FIELDS /* optional hashmap_debug_info */
219 };
220
221 /* Specific hash types
222 * HashmapBase must be at the beginning of each hashmap struct. */
223
224 struct Hashmap {
225 struct HashmapBase b;
226 };
227
228 struct OrderedHashmap {
229 struct HashmapBase b;
230 unsigned iterate_list_head, iterate_list_tail;
231 };
232
233 struct Set {
234 struct HashmapBase b;
235 };
236
237 typedef struct CacheMem {
238 const void **ptr;
239 size_t n_populated, n_allocated;
240 bool active:1;
241 } CacheMem;
242
243 struct IteratedCache {
244 HashmapBase *hashmap;
245 CacheMem keys, values;
246 };
247
248 DEFINE_MEMPOOL(hashmap_pool, Hashmap, 8);
249 DEFINE_MEMPOOL(ordered_hashmap_pool, OrderedHashmap, 8);
250 /* No need for a separate Set pool */
251 assert_cc(sizeof(Hashmap) == sizeof(Set));
252
253 struct hashmap_type_info {
254 size_t head_size;
255 size_t entry_size;
256 struct mempool *mempool;
257 unsigned n_direct_buckets;
258 };
259
260 static const struct hashmap_type_info hashmap_type_info[_HASHMAP_TYPE_MAX] = {
261 [HASHMAP_TYPE_PLAIN] = {
262 .head_size = sizeof(Hashmap),
263 .entry_size = sizeof(struct plain_hashmap_entry),
264 .mempool = &hashmap_pool,
265 .n_direct_buckets = DIRECT_BUCKETS(struct plain_hashmap_entry),
266 },
267 [HASHMAP_TYPE_ORDERED] = {
268 .head_size = sizeof(OrderedHashmap),
269 .entry_size = sizeof(struct ordered_hashmap_entry),
270 .mempool = &ordered_hashmap_pool,
271 .n_direct_buckets = DIRECT_BUCKETS(struct ordered_hashmap_entry),
272 },
273 [HASHMAP_TYPE_SET] = {
274 .head_size = sizeof(Set),
275 .entry_size = sizeof(struct set_entry),
276 .mempool = &hashmap_pool,
277 .n_direct_buckets = DIRECT_BUCKETS(struct set_entry),
278 },
279 };
280
281 #if VALGRIND
282 __attribute__((destructor)) static void cleanup_pools(void) {
283 _cleanup_free_ char *t = NULL;
284 int r;
285
286 /* Be nice to valgrind */
287
288 /* The pool is only allocated by the main thread, but the memory can
289 * be passed to other threads. Let's clean up if we are the main thread
290 * and no other threads are live. */
291 if (!is_main_thread())
292 return;
293
294 r = get_proc_field("/proc/self/status", "Threads", WHITESPACE, &t);
295 if (r < 0 || !streq(t, "1"))
296 return;
297
298 mempool_drop(&hashmap_pool);
299 mempool_drop(&ordered_hashmap_pool);
300 }
301 #endif
302
303 static unsigned n_buckets(HashmapBase *h) {
304 return h->has_indirect ? h->indirect.n_buckets
305 : hashmap_type_info[h->type].n_direct_buckets;
306 }
307
308 static unsigned n_entries(HashmapBase *h) {
309 return h->has_indirect ? h->indirect.n_entries
310 : h->n_direct_entries;
311 }
312
313 static void n_entries_inc(HashmapBase *h) {
314 if (h->has_indirect)
315 h->indirect.n_entries++;
316 else
317 h->n_direct_entries++;
318 }
319
320 static void n_entries_dec(HashmapBase *h) {
321 if (h->has_indirect)
322 h->indirect.n_entries--;
323 else
324 h->n_direct_entries--;
325 }
326
327 static void *storage_ptr(HashmapBase *h) {
328 return h->has_indirect ? h->indirect.storage
329 : h->direct.storage;
330 }
331
332 static uint8_t *hash_key(HashmapBase *h) {
333 return h->has_indirect ? h->indirect.hash_key
334 : shared_hash_key;
335 }
336
337 static unsigned base_bucket_hash(HashmapBase *h, const void *p) {
338 struct siphash state;
339 uint64_t hash;
340
341 siphash24_init(&state, hash_key(h));
342
343 h->hash_ops->hash(p, &state);
344
345 hash = siphash24_finalize(&state);
346
347 return (unsigned) (hash % n_buckets(h));
348 }
349 #define bucket_hash(h, p) base_bucket_hash(HASHMAP_BASE(h), p)
350
351 static inline void base_set_dirty(HashmapBase *h) {
352 h->dirty = true;
353 }
354 #define hashmap_set_dirty(h) base_set_dirty(HASHMAP_BASE(h))
355
356 static void get_hash_key(uint8_t hash_key[HASH_KEY_SIZE], bool reuse_is_ok) {
357 static uint8_t current[HASH_KEY_SIZE];
358 static bool current_initialized = false;
359
360 /* Returns a hash function key to use. In order to keep things
361 * fast we will not generate a new key each time we allocate a
362 * new hash table. Instead, we'll just reuse the most recently
363 * generated one, except if we never generated one or when we
364 * are rehashing an entire hash table because we reached a
365          * fill level limit. */
366
367 if (!current_initialized || !reuse_is_ok) {
368 random_bytes(current, sizeof(current));
369 current_initialized = true;
370 }
371
372 memcpy(hash_key, current, sizeof(current));
373 }
374
375 static struct hashmap_base_entry *bucket_at(HashmapBase *h, unsigned idx) {
376 return (struct hashmap_base_entry*)
377 ((uint8_t*) storage_ptr(h) + idx * hashmap_type_info[h->type].entry_size);
378 }
379
380 static struct plain_hashmap_entry *plain_bucket_at(Hashmap *h, unsigned idx) {
381 return (struct plain_hashmap_entry*) bucket_at(HASHMAP_BASE(h), idx);
382 }
383
384 static struct ordered_hashmap_entry *ordered_bucket_at(OrderedHashmap *h, unsigned idx) {
385 return (struct ordered_hashmap_entry*) bucket_at(HASHMAP_BASE(h), idx);
386 }
387
388 static struct set_entry *set_bucket_at(Set *h, unsigned idx) {
389 return (struct set_entry*) bucket_at(HASHMAP_BASE(h), idx);
390 }
391
392 static struct ordered_hashmap_entry *bucket_at_swap(struct swap_entries *swap, unsigned idx) {
393 return &swap->e[idx - _IDX_SWAP_BEGIN];
394 }
395
396 /* Returns a pointer to the bucket at index idx.
397 * Understands real indexes and swap indexes, hence "_virtual". */
398 static struct hashmap_base_entry *bucket_at_virtual(HashmapBase *h, struct swap_entries *swap,
399 unsigned idx) {
400 if (idx < _IDX_SWAP_BEGIN)
401 return bucket_at(h, idx);
402
403 if (idx < _IDX_SWAP_END)
404 return &bucket_at_swap(swap, idx)->p.b;
405
406 assert_not_reached("Invalid index");
407 }
408
409 static dib_raw_t *dib_raw_ptr(HashmapBase *h) {
410 return (dib_raw_t*)
411 ((uint8_t*) storage_ptr(h) + hashmap_type_info[h->type].entry_size * n_buckets(h));
412 }
413
414 static unsigned bucket_distance(HashmapBase *h, unsigned idx, unsigned from) {
415 return idx >= from ? idx - from
416 : n_buckets(h) + idx - from;
417 }
418
419 static unsigned bucket_calculate_dib(HashmapBase *h, unsigned idx, dib_raw_t raw_dib) {
420 unsigned initial_bucket;
421
422 if (raw_dib == DIB_RAW_FREE)
423 return DIB_FREE;
424
425 if (_likely_(raw_dib < DIB_RAW_OVERFLOW))
426 return raw_dib;
427
428 /*
429 * Having an overflow DIB value is very unlikely. The hash function
430 * would have to be bad. For example, in a table of size 2^24 filled
431 * to load factor 0.9 the maximum observed DIB is only about 60.
432 * In theory (assuming I used Maxima correctly), for an infinite size
433 * hash table with load factor 0.8 the probability of a given entry
434 * having DIB > 40 is 1.9e-8.
435 * This returns the correct DIB value by recomputing the hash value in
436 * the unlikely case. XXX Hitting this case could be a hint to rehash.
437 */
438 initial_bucket = bucket_hash(h, bucket_at(h, idx)->key);
439 return bucket_distance(h, idx, initial_bucket);
440 }
441
442 static void bucket_set_dib(HashmapBase *h, unsigned idx, unsigned dib) {
443 dib_raw_ptr(h)[idx] = dib != DIB_FREE ? MIN(dib, DIB_RAW_OVERFLOW) : DIB_RAW_FREE;
444 }
445
446 static unsigned skip_free_buckets(HashmapBase *h, unsigned idx) {
447 dib_raw_t *dibs;
448
449 dibs = dib_raw_ptr(h);
450
451 for ( ; idx < n_buckets(h); idx++)
452 if (dibs[idx] != DIB_RAW_FREE)
453 return idx;
454
455 return IDX_NIL;
456 }
457
458 static void bucket_mark_free(HashmapBase *h, unsigned idx) {
459 memzero(bucket_at(h, idx), hashmap_type_info[h->type].entry_size);
460 bucket_set_dib(h, idx, DIB_FREE);
461 }
462
463 static void bucket_move_entry(HashmapBase *h, struct swap_entries *swap,
464 unsigned from, unsigned to) {
465 struct hashmap_base_entry *e_from, *e_to;
466
467 assert(from != to);
468
469 e_from = bucket_at_virtual(h, swap, from);
470 e_to = bucket_at_virtual(h, swap, to);
471
472 memcpy(e_to, e_from, hashmap_type_info[h->type].entry_size);
473
474 if (h->type == HASHMAP_TYPE_ORDERED) {
475 OrderedHashmap *lh = (OrderedHashmap*) h;
476 struct ordered_hashmap_entry *le, *le_to;
477
478 le_to = (struct ordered_hashmap_entry*) e_to;
479
480 if (le_to->iterate_next != IDX_NIL) {
481 le = (struct ordered_hashmap_entry*)
482 bucket_at_virtual(h, swap, le_to->iterate_next);
483 le->iterate_previous = to;
484 }
485
486 if (le_to->iterate_previous != IDX_NIL) {
487 le = (struct ordered_hashmap_entry*)
488 bucket_at_virtual(h, swap, le_to->iterate_previous);
489 le->iterate_next = to;
490 }
491
492 if (lh->iterate_list_head == from)
493 lh->iterate_list_head = to;
494 if (lh->iterate_list_tail == from)
495 lh->iterate_list_tail = to;
496 }
497 }
498
499 static unsigned next_idx(HashmapBase *h, unsigned idx) {
500 return (idx + 1U) % n_buckets(h);
501 }
502
503 static unsigned prev_idx(HashmapBase *h, unsigned idx) {
504 return (n_buckets(h) + idx - 1U) % n_buckets(h);
505 }
506
507 static void *entry_value(HashmapBase *h, struct hashmap_base_entry *e) {
508 switch (h->type) {
509
510 case HASHMAP_TYPE_PLAIN:
511 case HASHMAP_TYPE_ORDERED:
512 return ((struct plain_hashmap_entry*)e)->value;
513
514 case HASHMAP_TYPE_SET:
515 return (void*) e->key;
516
517 default:
518 assert_not_reached("Unknown hashmap type");
519 }
520 }
521
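/* Illustrative example (entries and indices are made up): backward shift deletion
 * as performed by base_remove_entry() below. Suppose:
 *
 *   [0] A dib=0   [1] B dib=0   [2] C dib=1   [3] D dib=1   [4] free
 *
 * Removing B at bucket 1: the stop bucket is 4 (the first bucket after it that is
 * free or has dib == 0), so C and D each shift one bucket back and their DIBs drop
 * by one:
 *
 *   [0] A dib=0   [1] C dib=0   [2] D dib=0   [3] free      [4] free
 *
 * No tombstones are needed, which keeps later lookups short. */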
522 static void base_remove_entry(HashmapBase *h, unsigned idx) {
523 unsigned left, right, prev, dib;
524 dib_raw_t raw_dib, *dibs;
525
526 dibs = dib_raw_ptr(h);
527 assert(dibs[idx] != DIB_RAW_FREE);
528
529 #if ENABLE_DEBUG_HASHMAP
530 h->debug.rem_count++;
531 h->debug.last_rem_idx = idx;
532 #endif
533
534 left = idx;
535 /* Find the stop bucket ("right"). It is either free or has DIB == 0. */
536 for (right = next_idx(h, left); ; right = next_idx(h, right)) {
537 raw_dib = dibs[right];
538 if (IN_SET(raw_dib, 0, DIB_RAW_FREE))
539 break;
540
541 /* The buckets are not supposed to be all occupied and with DIB > 0.
542 * That would mean we could make everyone better off by shifting them
543 * backward. This scenario is impossible. */
544 assert(left != right);
545 }
546
547 if (h->type == HASHMAP_TYPE_ORDERED) {
548 OrderedHashmap *lh = (OrderedHashmap*) h;
549 struct ordered_hashmap_entry *le = ordered_bucket_at(lh, idx);
550
551 if (le->iterate_next != IDX_NIL)
552 ordered_bucket_at(lh, le->iterate_next)->iterate_previous = le->iterate_previous;
553 else
554 lh->iterate_list_tail = le->iterate_previous;
555
556 if (le->iterate_previous != IDX_NIL)
557 ordered_bucket_at(lh, le->iterate_previous)->iterate_next = le->iterate_next;
558 else
559 lh->iterate_list_head = le->iterate_next;
560 }
561
562 /* Now shift all buckets in the interval (left, right) one step backwards */
563 for (prev = left, left = next_idx(h, left); left != right;
564 prev = left, left = next_idx(h, left)) {
565 dib = bucket_calculate_dib(h, left, dibs[left]);
566 assert(dib != 0);
567 bucket_move_entry(h, NULL, left, prev);
568 bucket_set_dib(h, prev, dib - 1);
569 }
570
571 bucket_mark_free(h, prev);
572 n_entries_dec(h);
573 base_set_dirty(h);
574 }
575 #define remove_entry(h, idx) base_remove_entry(HASHMAP_BASE(h), idx)
576
577 static unsigned hashmap_iterate_in_insertion_order(OrderedHashmap *h, Iterator *i) {
578 struct ordered_hashmap_entry *e;
579 unsigned idx;
580
581 assert(h);
582 assert(i);
583
584 if (i->idx == IDX_NIL)
585 goto at_end;
586
587 if (i->idx == IDX_FIRST && h->iterate_list_head == IDX_NIL)
588 goto at_end;
589
590 if (i->idx == IDX_FIRST) {
591 idx = h->iterate_list_head;
592 e = ordered_bucket_at(h, idx);
593 } else {
594 idx = i->idx;
595 e = ordered_bucket_at(h, idx);
596 /*
597 * We allow removing the current entry while iterating, but removal may cause
598 * a backward shift. The next entry may thus move one bucket to the left.
599 * To detect when it happens, we remember the key pointer of the entry we were
600 * going to iterate next. If it does not match, there was a backward shift.
601 */
602 if (e->p.b.key != i->next_key) {
603 idx = prev_idx(HASHMAP_BASE(h), idx);
604 e = ordered_bucket_at(h, idx);
605 }
606 assert(e->p.b.key == i->next_key);
607 }
608
609 #if ENABLE_DEBUG_HASHMAP
610 i->prev_idx = idx;
611 #endif
612
613 if (e->iterate_next != IDX_NIL) {
614 struct ordered_hashmap_entry *n;
615 i->idx = e->iterate_next;
616 n = ordered_bucket_at(h, i->idx);
617 i->next_key = n->p.b.key;
618 } else
619 i->idx = IDX_NIL;
620
621 return idx;
622
623 at_end:
624 i->idx = IDX_NIL;
625 return IDX_NIL;
626 }
627
628 static unsigned hashmap_iterate_in_internal_order(HashmapBase *h, Iterator *i) {
629 unsigned idx;
630
631 assert(h);
632 assert(i);
633
634 if (i->idx == IDX_NIL)
635 goto at_end;
636
637 if (i->idx == IDX_FIRST) {
638 /* fast forward to the first occupied bucket */
639 if (h->has_indirect) {
640 i->idx = skip_free_buckets(h, h->indirect.idx_lowest_entry);
641 h->indirect.idx_lowest_entry = i->idx;
642 } else
643 i->idx = skip_free_buckets(h, 0);
644
645 if (i->idx == IDX_NIL)
646 goto at_end;
647 } else {
648 struct hashmap_base_entry *e;
649
650 assert(i->idx > 0);
651
652 e = bucket_at(h, i->idx);
653 /*
654 * We allow removing the current entry while iterating, but removal may cause
655 * a backward shift. The next entry may thus move one bucket to the left.
656 * To detect when it happens, we remember the key pointer of the entry we were
657 * going to iterate next. If it does not match, there was a backward shift.
658 */
659 if (e->key != i->next_key)
660 e = bucket_at(h, --i->idx);
661
662 assert(e->key == i->next_key);
663 }
664
665 idx = i->idx;
666 #if ENABLE_DEBUG_HASHMAP
667 i->prev_idx = idx;
668 #endif
669
670 i->idx = skip_free_buckets(h, i->idx + 1);
671 if (i->idx != IDX_NIL)
672 i->next_key = bucket_at(h, i->idx)->key;
673 else
674 i->idx = IDX_NIL;
675
676 return idx;
677
678 at_end:
679 i->idx = IDX_NIL;
680 return IDX_NIL;
681 }
682
683 static unsigned hashmap_iterate_entry(HashmapBase *h, Iterator *i) {
684 if (!h) {
685 i->idx = IDX_NIL;
686 return IDX_NIL;
687 }
688
689 #if ENABLE_DEBUG_HASHMAP
690 if (i->idx == IDX_FIRST) {
691 i->put_count = h->debug.put_count;
692 i->rem_count = h->debug.rem_count;
693 } else {
694 /* While iterating, must not add any new entries */
695 assert(i->put_count == h->debug.put_count);
696 /* ... or remove entries other than the current one */
697 assert(i->rem_count == h->debug.rem_count ||
698 (i->rem_count == h->debug.rem_count - 1 &&
699 i->prev_idx == h->debug.last_rem_idx));
700 /* Reset our removals counter */
701 i->rem_count = h->debug.rem_count;
702 }
703 #endif
704
705 return h->type == HASHMAP_TYPE_ORDERED ? hashmap_iterate_in_insertion_order((OrderedHashmap*) h, i)
706 : hashmap_iterate_in_internal_order(h, i);
707 }
708
709 bool internal_hashmap_iterate(HashmapBase *h, Iterator *i, void **value, const void **key) {
710 struct hashmap_base_entry *e;
711 void *data;
712 unsigned idx;
713
714 idx = hashmap_iterate_entry(h, i);
715 if (idx == IDX_NIL) {
716 if (value)
717 *value = NULL;
718 if (key)
719 *key = NULL;
720
721 return false;
722 }
723
724 e = bucket_at(h, idx);
725 data = entry_value(h, e);
726 if (value)
727 *value = data;
728 if (key)
729 *key = e->key;
730
731 return true;
732 }
733
734 bool set_iterate(Set *s, Iterator *i, void **value) {
735 return internal_hashmap_iterate(HASHMAP_BASE(s), i, value, NULL);
736 }
737
738 #define HASHMAP_FOREACH_IDX(idx, h, i) \
739 for ((i) = ITERATOR_FIRST, (idx) = hashmap_iterate_entry((h), &(i)); \
740 (idx != IDX_NIL); \
741 (idx) = hashmap_iterate_entry((h), &(i)))
742
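/* Usage sketch for the IteratedCache API defined in this file (illustrative only;
 * error handling is trimmed and do_something() is a placeholder). A caller creates
 * the cache once and re-reads it as needed; iterated_cache_get(), defined further
 * below, rebuilds the flat key/value arrays only when the hashmap was dirtied in
 * the meantime or the arrays were newly activated:
 *
 *   IteratedCache *c = internal_hashmap_iterated_cache_new(HASHMAP_BASE(h));
 *   const void **keys, **values;
 *   unsigned n;
 *
 *   if (c && iterated_cache_get(c, &keys, &values, &n) >= 0)
 *           for (unsigned j = 0; j < n; j++)
 *                   do_something(keys[j], values[j]);
 */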
743 IteratedCache *internal_hashmap_iterated_cache_new(HashmapBase *h) {
744 IteratedCache *cache;
745
746 assert(h);
747 assert(!h->cached);
748
749 if (h->cached)
750 return NULL;
751
752 cache = new0(IteratedCache, 1);
753 if (!cache)
754 return NULL;
755
756 cache->hashmap = h;
757 h->cached = true;
758
759 return cache;
760 }
761
762 static void reset_direct_storage(HashmapBase *h) {
763 const struct hashmap_type_info *hi = &hashmap_type_info[h->type];
764 void *p;
765
766 assert(!h->has_indirect);
767
768 p = mempset(h->direct.storage, 0, hi->entry_size * hi->n_direct_buckets);
769 memset(p, DIB_RAW_INIT, sizeof(dib_raw_t) * hi->n_direct_buckets);
770 }
771
772 static struct HashmapBase *hashmap_base_new(const struct hash_ops *hash_ops, enum HashmapType type HASHMAP_DEBUG_PARAMS) {
773 HashmapBase *h;
774 const struct hashmap_type_info *hi = &hashmap_type_info[type];
775 bool use_pool;
776
777 use_pool = is_main_thread();
778
779 h = use_pool ? mempool_alloc0_tile(hi->mempool) : malloc0(hi->head_size);
780
781 if (!h)
782 return NULL;
783
784 h->type = type;
785 h->from_pool = use_pool;
786 h->hash_ops = hash_ops ? hash_ops : &trivial_hash_ops;
787
788 if (type == HASHMAP_TYPE_ORDERED) {
789 OrderedHashmap *lh = (OrderedHashmap*)h;
790 lh->iterate_list_head = lh->iterate_list_tail = IDX_NIL;
791 }
792
793 reset_direct_storage(h);
794
795 if (!shared_hash_key_initialized) {
796 random_bytes(shared_hash_key, sizeof(shared_hash_key));
797                 shared_hash_key_initialized = true;
798 }
799
800 #if ENABLE_DEBUG_HASHMAP
801 h->debug.func = func;
802 h->debug.file = file;
803 h->debug.line = line;
804 assert_se(pthread_mutex_lock(&hashmap_debug_list_mutex) == 0);
805 LIST_PREPEND(debug_list, hashmap_debug_list, &h->debug);
806 assert_se(pthread_mutex_unlock(&hashmap_debug_list_mutex) == 0);
807 #endif
808
809 return h;
810 }
811
812 Hashmap *internal_hashmap_new(const struct hash_ops *hash_ops HASHMAP_DEBUG_PARAMS) {
813 return (Hashmap*) hashmap_base_new(hash_ops, HASHMAP_TYPE_PLAIN HASHMAP_DEBUG_PASS_ARGS);
814 }
815
816 OrderedHashmap *internal_ordered_hashmap_new(const struct hash_ops *hash_ops HASHMAP_DEBUG_PARAMS) {
817 return (OrderedHashmap*) hashmap_base_new(hash_ops, HASHMAP_TYPE_ORDERED HASHMAP_DEBUG_PASS_ARGS);
818 }
819
820 Set *internal_set_new(const struct hash_ops *hash_ops HASHMAP_DEBUG_PARAMS) {
821 return (Set*) hashmap_base_new(hash_ops, HASHMAP_TYPE_SET HASHMAP_DEBUG_PASS_ARGS);
822 }
823
824 static int hashmap_base_ensure_allocated(HashmapBase **h, const struct hash_ops *hash_ops,
825 enum HashmapType type HASHMAP_DEBUG_PARAMS) {
826 HashmapBase *q;
827
828 assert(h);
829
830 if (*h)
831 return 0;
832
833 q = hashmap_base_new(hash_ops, type HASHMAP_DEBUG_PASS_ARGS);
834 if (!q)
835 return -ENOMEM;
836
837 *h = q;
838 return 0;
839 }
840
841 int internal_hashmap_ensure_allocated(Hashmap **h, const struct hash_ops *hash_ops HASHMAP_DEBUG_PARAMS) {
842 return hashmap_base_ensure_allocated((HashmapBase**)h, hash_ops, HASHMAP_TYPE_PLAIN HASHMAP_DEBUG_PASS_ARGS);
843 }
844
845 int internal_ordered_hashmap_ensure_allocated(OrderedHashmap **h, const struct hash_ops *hash_ops HASHMAP_DEBUG_PARAMS) {
846 return hashmap_base_ensure_allocated((HashmapBase**)h, hash_ops, HASHMAP_TYPE_ORDERED HASHMAP_DEBUG_PASS_ARGS);
847 }
848
849 int internal_set_ensure_allocated(Set **s, const struct hash_ops *hash_ops HASHMAP_DEBUG_PARAMS) {
850 return hashmap_base_ensure_allocated((HashmapBase**)s, hash_ops, HASHMAP_TYPE_SET HASHMAP_DEBUG_PASS_ARGS);
851 }
852
853 static void hashmap_free_no_clear(HashmapBase *h) {
854 assert(!h->has_indirect);
855 assert(!h->n_direct_entries);
856
857 #if ENABLE_DEBUG_HASHMAP
858 assert_se(pthread_mutex_lock(&hashmap_debug_list_mutex) == 0);
859 LIST_REMOVE(debug_list, hashmap_debug_list, &h->debug);
860 assert_se(pthread_mutex_unlock(&hashmap_debug_list_mutex) == 0);
861 #endif
862
863 if (h->from_pool)
864 mempool_free_tile(hashmap_type_info[h->type].mempool, h);
865 else
866 free(h);
867 }
868
869 HashmapBase *internal_hashmap_free(HashmapBase *h) {
870
871 /* Free the hashmap, but nothing in it */
872
873 if (h) {
874 internal_hashmap_clear(h);
875 hashmap_free_no_clear(h);
876 }
877
878 return NULL;
879 }
880
881 HashmapBase *internal_hashmap_free_free(HashmapBase *h) {
882
883 /* Free the hashmap and all data objects in it, but not the
884 * keys */
885
886 if (h) {
887 internal_hashmap_clear_free(h);
888 hashmap_free_no_clear(h);
889 }
890
891 return NULL;
892 }
893
894 Hashmap *hashmap_free_free_free(Hashmap *h) {
895
896 /* Free the hashmap and all data and key objects in it */
897
898 if (h) {
899 hashmap_clear_free_free(h);
900 hashmap_free_no_clear(HASHMAP_BASE(h));
901 }
902
903 return NULL;
904 }
905
906 void internal_hashmap_clear(HashmapBase *h) {
907 if (!h)
908 return;
909
910 if (h->has_indirect) {
911 free(h->indirect.storage);
912 h->has_indirect = false;
913 }
914
915 h->n_direct_entries = 0;
916 reset_direct_storage(h);
917
918 if (h->type == HASHMAP_TYPE_ORDERED) {
919 OrderedHashmap *lh = (OrderedHashmap*) h;
920 lh->iterate_list_head = lh->iterate_list_tail = IDX_NIL;
921 }
922
923 base_set_dirty(h);
924 }
925
926 void internal_hashmap_clear_free(HashmapBase *h) {
927 unsigned idx;
928
929 if (!h)
930 return;
931
932 for (idx = skip_free_buckets(h, 0); idx != IDX_NIL;
933 idx = skip_free_buckets(h, idx + 1))
934 free(entry_value(h, bucket_at(h, idx)));
935
936 internal_hashmap_clear(h);
937 }
938
939 void hashmap_clear_free_free(Hashmap *h) {
940 unsigned idx;
941
942 if (!h)
943 return;
944
945 for (idx = skip_free_buckets(HASHMAP_BASE(h), 0); idx != IDX_NIL;
946 idx = skip_free_buckets(HASHMAP_BASE(h), idx + 1)) {
947 struct plain_hashmap_entry *e = plain_bucket_at(h, idx);
948 free((void*)e->b.key);
949 free(e->value);
950 }
951
952 internal_hashmap_clear(HASHMAP_BASE(h));
953 }
954
955 static int resize_buckets(HashmapBase *h, unsigned entries_add);
956
957 /*
958 * Finds an empty bucket to put an entry into, starting the scan at 'idx'.
959 * Performs Robin Hood swaps as it goes. The entry to put must be placed
960 * by the caller into swap slot IDX_PUT.
961 * If used for in-place resizing, may leave a displaced entry in swap slot
962 * IDX_PUT. Caller must rehash it next.
963 * Returns: true if it left a displaced entry to rehash next in IDX_PUT,
964 * false otherwise.
965 */
966 static bool hashmap_put_robin_hood(HashmapBase *h, unsigned idx,
967 struct swap_entries *swap) {
968 dib_raw_t raw_dib, *dibs;
969 unsigned dib, distance;
970
971 #if ENABLE_DEBUG_HASHMAP
972 h->debug.put_count++;
973 #endif
974
975 dibs = dib_raw_ptr(h);
976
977 for (distance = 0; ; distance++) {
978 raw_dib = dibs[idx];
979 if (IN_SET(raw_dib, DIB_RAW_FREE, DIB_RAW_REHASH)) {
980 if (raw_dib == DIB_RAW_REHASH)
981 bucket_move_entry(h, swap, idx, IDX_TMP);
982
983 if (h->has_indirect && h->indirect.idx_lowest_entry > idx)
984 h->indirect.idx_lowest_entry = idx;
985
986 bucket_set_dib(h, idx, distance);
987 bucket_move_entry(h, swap, IDX_PUT, idx);
988 if (raw_dib == DIB_RAW_REHASH) {
989 bucket_move_entry(h, swap, IDX_TMP, IDX_PUT);
990 return true;
991 }
992
993 return false;
994 }
995
996 dib = bucket_calculate_dib(h, idx, raw_dib);
997
998 if (dib < distance) {
999 /* Found a wealthier entry. Go Robin Hood! */
1000 bucket_set_dib(h, idx, distance);
1001
1002 /* swap the entries */
1003 bucket_move_entry(h, swap, idx, IDX_TMP);
1004 bucket_move_entry(h, swap, IDX_PUT, idx);
1005 bucket_move_entry(h, swap, IDX_TMP, IDX_PUT);
1006
1007 distance = dib;
1008 }
1009
1010 idx = next_idx(h, idx);
1011 }
1012 }
1013
1014 /*
1015 * Puts an entry into a hashmap, boldly - no check whether key already exists.
1016 * The caller must place the entry (only its key and value, not link indexes)
1017 * in swap slot IDX_PUT.
1018 * Caller must ensure: the key does not exist yet in the hashmap.
1019 * that resize is not needed if !may_resize.
1020 * Returns: 1 if entry was put successfully.
1021 * -ENOMEM if may_resize==true and resize failed with -ENOMEM.
1022 * Cannot return -ENOMEM if !may_resize.
1023 */
1024 static int hashmap_base_put_boldly(HashmapBase *h, unsigned idx,
1025 struct swap_entries *swap, bool may_resize) {
1026 struct ordered_hashmap_entry *new_entry;
1027 int r;
1028
1029 assert(idx < n_buckets(h));
1030
1031 new_entry = bucket_at_swap(swap, IDX_PUT);
1032
1033 if (may_resize) {
1034 r = resize_buckets(h, 1);
1035 if (r < 0)
1036 return r;
1037 if (r > 0)
1038 idx = bucket_hash(h, new_entry->p.b.key);
1039 }
1040 assert(n_entries(h) < n_buckets(h));
1041
1042 if (h->type == HASHMAP_TYPE_ORDERED) {
1043 OrderedHashmap *lh = (OrderedHashmap*) h;
1044
1045 new_entry->iterate_next = IDX_NIL;
1046 new_entry->iterate_previous = lh->iterate_list_tail;
1047
1048 if (lh->iterate_list_tail != IDX_NIL) {
1049 struct ordered_hashmap_entry *old_tail;
1050
1051 old_tail = ordered_bucket_at(lh, lh->iterate_list_tail);
1052 assert(old_tail->iterate_next == IDX_NIL);
1053 old_tail->iterate_next = IDX_PUT;
1054 }
1055
1056 lh->iterate_list_tail = IDX_PUT;
1057 if (lh->iterate_list_head == IDX_NIL)
1058 lh->iterate_list_head = IDX_PUT;
1059 }
1060
1061 assert_se(hashmap_put_robin_hood(h, idx, swap) == false);
1062
1063 n_entries_inc(h);
1064 #if ENABLE_DEBUG_HASHMAP
1065 h->debug.max_entries = MAX(h->debug.max_entries, n_entries(h));
1066 #endif
1067
1068 base_set_dirty(h);
1069
1070 return 1;
1071 }
1072 #define hashmap_put_boldly(h, idx, swap, may_resize) \
1073 hashmap_base_put_boldly(HASHMAP_BASE(h), idx, swap, may_resize)
1074
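/* Sketch of the in-place resize/rehash performed below (description only, following
 * the code as written): after the storage is enlarged, every previously occupied
 * bucket keeps its entry but has its DIB replaced by DIB_RAW_REHASH. Each marked
 * bucket is then rehashed with the new hash key: if the entry already sits in its
 * new home bucket, its DIB simply becomes 0; otherwise it is moved out through the
 * IDX_PUT swap slot and re-inserted Robin Hood style, which may in turn displace
 * another not-yet-rehashed entry into IDX_PUT to be placed next. */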
1075 /*
1076 * Returns 0 if resize is not needed.
1077 * 1 if successfully resized.
1078 * -ENOMEM on allocation failure.
1079 */
1080 static int resize_buckets(HashmapBase *h, unsigned entries_add) {
1081 struct swap_entries swap;
1082 void *new_storage;
1083 dib_raw_t *old_dibs, *new_dibs;
1084 const struct hashmap_type_info *hi;
1085 unsigned idx, optimal_idx;
1086 unsigned old_n_buckets, new_n_buckets, n_rehashed, new_n_entries;
1087 uint8_t new_shift;
1088 bool rehash_next;
1089
1090 assert(h);
1091
1092 hi = &hashmap_type_info[h->type];
1093 new_n_entries = n_entries(h) + entries_add;
1094
1095 /* overflow? */
1096 if (_unlikely_(new_n_entries < entries_add))
1097 return -ENOMEM;
1098
1099 /* For direct storage we allow 100% load, because it's tiny. */
1100 if (!h->has_indirect && new_n_entries <= hi->n_direct_buckets)
1101 return 0;
1102
1103 /*
1104 * Load factor = n/m = 1 - (1/INV_KEEP_FREE).
1105 * From it follows: m = n + n/(INV_KEEP_FREE - 1)
1106 */
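        /* e.g. with INV_KEEP_FREE == 5 and 100 entries: m = 100 + 100/4 = 125 buckets,
         * i.e. a load factor of at most 100/125 = 0.8 once resized. */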
1107 new_n_buckets = new_n_entries + new_n_entries / (INV_KEEP_FREE - 1);
1108 /* overflow? */
1109 if (_unlikely_(new_n_buckets < new_n_entries))
1110 return -ENOMEM;
1111
1112 if (_unlikely_(new_n_buckets > UINT_MAX / (hi->entry_size + sizeof(dib_raw_t))))
1113 return -ENOMEM;
1114
1115 old_n_buckets = n_buckets(h);
1116
1117 if (_likely_(new_n_buckets <= old_n_buckets))
1118 return 0;
1119
1120 new_shift = log2u_round_up(MAX(
1121 new_n_buckets * (hi->entry_size + sizeof(dib_raw_t)),
1122 2 * sizeof(struct direct_storage)));
1123
1124 /* Realloc storage (buckets and DIB array). */
1125 new_storage = realloc(h->has_indirect ? h->indirect.storage : NULL,
1126 1U << new_shift);
1127 if (!new_storage)
1128 return -ENOMEM;
1129
1130 /* Must upgrade direct to indirect storage. */
1131 if (!h->has_indirect) {
1132 memcpy(new_storage, h->direct.storage,
1133 old_n_buckets * (hi->entry_size + sizeof(dib_raw_t)));
1134 h->indirect.n_entries = h->n_direct_entries;
1135 h->indirect.idx_lowest_entry = 0;
1136 h->n_direct_entries = 0;
1137 }
1138
1139 /* Get a new hash key. If we've just upgraded to indirect storage,
1140 * allow reusing a previously generated key. It's still a different key
1141 * from the shared one that we used for direct storage. */
1142 get_hash_key(h->indirect.hash_key, !h->has_indirect);
1143
1144 h->has_indirect = true;
1145 h->indirect.storage = new_storage;
1146 h->indirect.n_buckets = (1U << new_shift) /
1147 (hi->entry_size + sizeof(dib_raw_t));
1148
1149 old_dibs = (dib_raw_t*)((uint8_t*) new_storage + hi->entry_size * old_n_buckets);
1150 new_dibs = dib_raw_ptr(h);
1151
1152 /*
1153 * Move the DIB array to the new place, replacing valid DIB values with
1154 * DIB_RAW_REHASH to indicate all of the used buckets need rehashing.
1155 * Note: Overlap is not possible, because we have at least doubled the
1156 * number of buckets and dib_raw_t is smaller than any entry type.
1157 */
1158 for (idx = 0; idx < old_n_buckets; idx++) {
1159 assert(old_dibs[idx] != DIB_RAW_REHASH);
1160 new_dibs[idx] = old_dibs[idx] == DIB_RAW_FREE ? DIB_RAW_FREE
1161 : DIB_RAW_REHASH;
1162 }
1163
1164 /* Zero the area of newly added entries (including the old DIB area) */
1165 memzero(bucket_at(h, old_n_buckets),
1166 (n_buckets(h) - old_n_buckets) * hi->entry_size);
1167
1168 /* The upper half of the new DIB array needs initialization */
1169 memset(&new_dibs[old_n_buckets], DIB_RAW_INIT,
1170 (n_buckets(h) - old_n_buckets) * sizeof(dib_raw_t));
1171
1172 /* Rehash entries that need it */
1173 n_rehashed = 0;
1174 for (idx = 0; idx < old_n_buckets; idx++) {
1175 if (new_dibs[idx] != DIB_RAW_REHASH)
1176 continue;
1177
1178 optimal_idx = bucket_hash(h, bucket_at(h, idx)->key);
1179
1180 /*
1181 * Not much to do if by luck the entry hashes to its current
1182 * location. Just set its DIB.
1183 */
1184 if (optimal_idx == idx) {
1185 new_dibs[idx] = 0;
1186 n_rehashed++;
1187 continue;
1188 }
1189
1190 new_dibs[idx] = DIB_RAW_FREE;
1191 bucket_move_entry(h, &swap, idx, IDX_PUT);
1192 /* bucket_move_entry does not clear the source */
1193 memzero(bucket_at(h, idx), hi->entry_size);
1194
1195 do {
1196 /*
1197 * Find the new bucket for the current entry. This may make
1198 * another entry homeless and load it into IDX_PUT.
1199 */
1200 rehash_next = hashmap_put_robin_hood(h, optimal_idx, &swap);
1201 n_rehashed++;
1202
1203 /* Did the current entry displace another one? */
1204 if (rehash_next)
1205 optimal_idx = bucket_hash(h, bucket_at_swap(&swap, IDX_PUT)->p.b.key);
1206 } while (rehash_next);
1207 }
1208
1209 assert(n_rehashed == n_entries(h));
1210
1211 return 1;
1212 }
1213
1214 /*
1215 * Finds an entry with a matching key
1216 * Returns: index of the found entry, or IDX_NIL if not found.
1217 */
1218 static unsigned base_bucket_scan(HashmapBase *h, unsigned idx, const void *key) {
1219 struct hashmap_base_entry *e;
1220 unsigned dib, distance;
1221 dib_raw_t *dibs = dib_raw_ptr(h);
1222
1223 assert(idx < n_buckets(h));
1224
1225 for (distance = 0; ; distance++) {
1226 if (dibs[idx] == DIB_RAW_FREE)
1227 return IDX_NIL;
1228
1229 dib = bucket_calculate_dib(h, idx, dibs[idx]);
1230
1231 if (dib < distance)
1232 return IDX_NIL;
1233 if (dib == distance) {
1234 e = bucket_at(h, idx);
1235 if (h->hash_ops->compare(e->key, key) == 0)
1236 return idx;
1237 }
1238
1239 idx = next_idx(h, idx);
1240 }
1241 }
1242 #define bucket_scan(h, idx, key) base_bucket_scan(HASHMAP_BASE(h), idx, key)
1243
1244 int hashmap_put(Hashmap *h, const void *key, void *value) {
1245 struct swap_entries swap;
1246 struct plain_hashmap_entry *e;
1247 unsigned hash, idx;
1248
1249 assert(h);
1250
1251 hash = bucket_hash(h, key);
1252 idx = bucket_scan(h, hash, key);
1253 if (idx != IDX_NIL) {
1254 e = plain_bucket_at(h, idx);
1255 if (e->value == value)
1256 return 0;
1257 return -EEXIST;
1258 }
1259
1260 e = &bucket_at_swap(&swap, IDX_PUT)->p;
1261 e->b.key = key;
1262 e->value = value;
1263 return hashmap_put_boldly(h, hash, &swap, true);
1264 }
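
/* Return values of hashmap_put() above, as implemented: 1 if a new entry was stored,
 * 0 if the key was already present with the very same value, -EEXIST if it is present
 * with a different value, -ENOMEM if a needed resize failed. Callers that only care
 * whether the key is taken can check for -EEXIST explicitly, e.g. (illustrative only):
 *
 *   r = hashmap_put(h, key, value);
 *   if (r == -EEXIST)
 *           log_debug("key already mapped to a different value");
 *   else if (r < 0)
 *           return r;
 */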
1265
1266 int set_put(Set *s, const void *key) {
1267 struct swap_entries swap;
1268 struct hashmap_base_entry *e;
1269 unsigned hash, idx;
1270
1271 assert(s);
1272
1273 hash = bucket_hash(s, key);
1274 idx = bucket_scan(s, hash, key);
1275 if (idx != IDX_NIL)
1276 return 0;
1277
1278 e = &bucket_at_swap(&swap, IDX_PUT)->p.b;
1279 e->key = key;
1280 return hashmap_put_boldly(s, hash, &swap, true);
1281 }
1282
1283 int hashmap_replace(Hashmap *h, const void *key, void *value) {
1284 struct swap_entries swap;
1285 struct plain_hashmap_entry *e;
1286 unsigned hash, idx;
1287
1288 assert(h);
1289
1290 hash = bucket_hash(h, key);
1291 idx = bucket_scan(h, hash, key);
1292 if (idx != IDX_NIL) {
1293 e = plain_bucket_at(h, idx);
1294 #if ENABLE_DEBUG_HASHMAP
1295 /* Although the key is equal, the key pointer may have changed,
1296 * and this would break our assumption for iterating. So count
1297 * this operation as incompatible with iteration. */
1298 if (e->b.key != key) {
1299 h->b.debug.put_count++;
1300 h->b.debug.rem_count++;
1301 h->b.debug.last_rem_idx = idx;
1302 }
1303 #endif
1304 e->b.key = key;
1305 e->value = value;
1306 hashmap_set_dirty(h);
1307
1308 return 0;
1309 }
1310
1311 e = &bucket_at_swap(&swap, IDX_PUT)->p;
1312 e->b.key = key;
1313 e->value = value;
1314 return hashmap_put_boldly(h, hash, &swap, true);
1315 }
1316
1317 int hashmap_update(Hashmap *h, const void *key, void *value) {
1318 struct plain_hashmap_entry *e;
1319 unsigned hash, idx;
1320
1321 assert(h);
1322
1323 hash = bucket_hash(h, key);
1324 idx = bucket_scan(h, hash, key);
1325 if (idx == IDX_NIL)
1326 return -ENOENT;
1327
1328 e = plain_bucket_at(h, idx);
1329 e->value = value;
1330 hashmap_set_dirty(h);
1331
1332 return 0;
1333 }
1334
1335 void *internal_hashmap_get(HashmapBase *h, const void *key) {
1336 struct hashmap_base_entry *e;
1337 unsigned hash, idx;
1338
1339 if (!h)
1340 return NULL;
1341
1342 hash = bucket_hash(h, key);
1343 idx = bucket_scan(h, hash, key);
1344 if (idx == IDX_NIL)
1345 return NULL;
1346
1347 e = bucket_at(h, idx);
1348 return entry_value(h, e);
1349 }
1350
1351 void *hashmap_get2(Hashmap *h, const void *key, void **key2) {
1352 struct plain_hashmap_entry *e;
1353 unsigned hash, idx;
1354
1355 if (!h)
1356 return NULL;
1357
1358 hash = bucket_hash(h, key);
1359 idx = bucket_scan(h, hash, key);
1360 if (idx == IDX_NIL)
1361 return NULL;
1362
1363 e = plain_bucket_at(h, idx);
1364 if (key2)
1365 *key2 = (void*) e->b.key;
1366
1367 return e->value;
1368 }
1369
1370 bool internal_hashmap_contains(HashmapBase *h, const void *key) {
1371 unsigned hash;
1372
1373 if (!h)
1374 return false;
1375
1376 hash = bucket_hash(h, key);
1377 return bucket_scan(h, hash, key) != IDX_NIL;
1378 }
1379
1380 void *internal_hashmap_remove(HashmapBase *h, const void *key) {
1381 struct hashmap_base_entry *e;
1382 unsigned hash, idx;
1383 void *data;
1384
1385 if (!h)
1386 return NULL;
1387
1388 hash = bucket_hash(h, key);
1389 idx = bucket_scan(h, hash, key);
1390 if (idx == IDX_NIL)
1391 return NULL;
1392
1393 e = bucket_at(h, idx);
1394 data = entry_value(h, e);
1395 remove_entry(h, idx);
1396
1397 return data;
1398 }
1399
1400 void *hashmap_remove2(Hashmap *h, const void *key, void **rkey) {
1401 struct plain_hashmap_entry *e;
1402 unsigned hash, idx;
1403 void *data;
1404
1405 if (!h) {
1406 if (rkey)
1407 *rkey = NULL;
1408 return NULL;
1409 }
1410
1411 hash = bucket_hash(h, key);
1412 idx = bucket_scan(h, hash, key);
1413 if (idx == IDX_NIL) {
1414 if (rkey)
1415 *rkey = NULL;
1416 return NULL;
1417 }
1418
1419 e = plain_bucket_at(h, idx);
1420 data = e->value;
1421 if (rkey)
1422 *rkey = (void*) e->b.key;
1423
1424 remove_entry(h, idx);
1425
1426 return data;
1427 }
1428
1429 int hashmap_remove_and_put(Hashmap *h, const void *old_key, const void *new_key, void *value) {
1430 struct swap_entries swap;
1431 struct plain_hashmap_entry *e;
1432 unsigned old_hash, new_hash, idx;
1433
1434 if (!h)
1435 return -ENOENT;
1436
1437 old_hash = bucket_hash(h, old_key);
1438 idx = bucket_scan(h, old_hash, old_key);
1439 if (idx == IDX_NIL)
1440 return -ENOENT;
1441
1442 new_hash = bucket_hash(h, new_key);
1443 if (bucket_scan(h, new_hash, new_key) != IDX_NIL)
1444 return -EEXIST;
1445
1446 remove_entry(h, idx);
1447
1448 e = &bucket_at_swap(&swap, IDX_PUT)->p;
1449 e->b.key = new_key;
1450 e->value = value;
1451 assert_se(hashmap_put_boldly(h, new_hash, &swap, false) == 1);
1452
1453 return 0;
1454 }
1455
1456 int set_remove_and_put(Set *s, const void *old_key, const void *new_key) {
1457 struct swap_entries swap;
1458 struct hashmap_base_entry *e;
1459 unsigned old_hash, new_hash, idx;
1460
1461 if (!s)
1462 return -ENOENT;
1463
1464 old_hash = bucket_hash(s, old_key);
1465 idx = bucket_scan(s, old_hash, old_key);
1466 if (idx == IDX_NIL)
1467 return -ENOENT;
1468
1469 new_hash = bucket_hash(s, new_key);
1470 if (bucket_scan(s, new_hash, new_key) != IDX_NIL)
1471 return -EEXIST;
1472
1473 remove_entry(s, idx);
1474
1475 e = &bucket_at_swap(&swap, IDX_PUT)->p.b;
1476 e->key = new_key;
1477 assert_se(hashmap_put_boldly(s, new_hash, &swap, false) == 1);
1478
1479 return 0;
1480 }
1481
1482 int hashmap_remove_and_replace(Hashmap *h, const void *old_key, const void *new_key, void *value) {
1483 struct swap_entries swap;
1484 struct plain_hashmap_entry *e;
1485 unsigned old_hash, new_hash, idx_old, idx_new;
1486
1487 if (!h)
1488 return -ENOENT;
1489
1490 old_hash = bucket_hash(h, old_key);
1491 idx_old = bucket_scan(h, old_hash, old_key);
1492 if (idx_old == IDX_NIL)
1493 return -ENOENT;
1494
1495 old_key = bucket_at(HASHMAP_BASE(h), idx_old)->key;
1496
1497 new_hash = bucket_hash(h, new_key);
1498 idx_new = bucket_scan(h, new_hash, new_key);
1499 if (idx_new != IDX_NIL)
1500 if (idx_old != idx_new) {
1501 remove_entry(h, idx_new);
1502 /* Compensate for a possible backward shift. */
1503 if (old_key != bucket_at(HASHMAP_BASE(h), idx_old)->key)
1504 idx_old = prev_idx(HASHMAP_BASE(h), idx_old);
1505 assert(old_key == bucket_at(HASHMAP_BASE(h), idx_old)->key);
1506 }
1507
1508 remove_entry(h, idx_old);
1509
1510 e = &bucket_at_swap(&swap, IDX_PUT)->p;
1511 e->b.key = new_key;
1512 e->value = value;
1513 assert_se(hashmap_put_boldly(h, new_hash, &swap, false) == 1);
1514
1515 return 0;
1516 }
1517
1518 void *hashmap_remove_value(Hashmap *h, const void *key, void *value) {
1519 struct plain_hashmap_entry *e;
1520 unsigned hash, idx;
1521
1522 if (!h)
1523 return NULL;
1524
1525 hash = bucket_hash(h, key);
1526 idx = bucket_scan(h, hash, key);
1527 if (idx == IDX_NIL)
1528 return NULL;
1529
1530 e = plain_bucket_at(h, idx);
1531 if (e->value != value)
1532 return NULL;
1533
1534 remove_entry(h, idx);
1535
1536 return value;
1537 }
1538
1539 static unsigned find_first_entry(HashmapBase *h) {
1540 Iterator i = ITERATOR_FIRST;
1541
1542 if (!h || !n_entries(h))
1543 return IDX_NIL;
1544
1545 return hashmap_iterate_entry(h, &i);
1546 }
1547
1548 void *internal_hashmap_first(HashmapBase *h) {
1549 unsigned idx;
1550
1551 idx = find_first_entry(h);
1552 if (idx == IDX_NIL)
1553 return NULL;
1554
1555 return entry_value(h, bucket_at(h, idx));
1556 }
1557
1558 void *internal_hashmap_first_key(HashmapBase *h) {
1559 struct hashmap_base_entry *e;
1560 unsigned idx;
1561
1562 idx = find_first_entry(h);
1563 if (idx == IDX_NIL)
1564 return NULL;
1565
1566 e = bucket_at(h, idx);
1567 return (void*) e->key;
1568 }
1569
1570 void *internal_hashmap_steal_first(HashmapBase *h) {
1571 struct hashmap_base_entry *e;
1572 void *data;
1573 unsigned idx;
1574
1575 idx = find_first_entry(h);
1576 if (idx == IDX_NIL)
1577 return NULL;
1578
1579 e = bucket_at(h, idx);
1580 data = entry_value(h, e);
1581 remove_entry(h, idx);
1582
1583 return data;
1584 }
1585
1586 void *internal_hashmap_steal_first_key(HashmapBase *h) {
1587 struct hashmap_base_entry *e;
1588 void *key;
1589 unsigned idx;
1590
1591 idx = find_first_entry(h);
1592 if (idx == IDX_NIL)
1593 return NULL;
1594
1595 e = bucket_at(h, idx);
1596 key = (void*) e->key;
1597 remove_entry(h, idx);
1598
1599 return key;
1600 }
1601
1602 unsigned internal_hashmap_size(HashmapBase *h) {
1603
1604 if (!h)
1605 return 0;
1606
1607 return n_entries(h);
1608 }
1609
1610 unsigned internal_hashmap_buckets(HashmapBase *h) {
1611
1612 if (!h)
1613 return 0;
1614
1615 return n_buckets(h);
1616 }
1617
1618 int internal_hashmap_merge(Hashmap *h, Hashmap *other) {
1619 Iterator i;
1620 unsigned idx;
1621
1622 assert(h);
1623
1624 HASHMAP_FOREACH_IDX(idx, HASHMAP_BASE(other), i) {
1625 struct plain_hashmap_entry *pe = plain_bucket_at(other, idx);
1626 int r;
1627
1628 r = hashmap_put(h, pe->b.key, pe->value);
1629 if (r < 0 && r != -EEXIST)
1630 return r;
1631 }
1632
1633 return 0;
1634 }
1635
1636 int set_merge(Set *s, Set *other) {
1637 Iterator i;
1638 unsigned idx;
1639
1640 assert(s);
1641
1642 HASHMAP_FOREACH_IDX(idx, HASHMAP_BASE(other), i) {
1643 struct set_entry *se = set_bucket_at(other, idx);
1644 int r;
1645
1646 r = set_put(s, se->b.key);
1647 if (r < 0)
1648 return r;
1649 }
1650
1651 return 0;
1652 }
1653
1654 int internal_hashmap_reserve(HashmapBase *h, unsigned entries_add) {
1655 int r;
1656
1657 assert(h);
1658
1659 r = resize_buckets(h, entries_add);
1660 if (r < 0)
1661 return r;
1662
1663 return 0;
1664 }
1665
1666 /*
1667 * The same as hashmap_merge(), but every new item from other is moved to h.
1668 * Keys already in h are skipped and stay in other.
1669 * Returns: 0 on success.
1670 * -ENOMEM on alloc failure, in which case no move has been done.
1671 */
1672 int internal_hashmap_move(HashmapBase *h, HashmapBase *other) {
1673 struct swap_entries swap;
1674 struct hashmap_base_entry *e, *n;
1675 Iterator i;
1676 unsigned idx;
1677 int r;
1678
1679 assert(h);
1680
1681 if (!other)
1682 return 0;
1683
1684 assert(other->type == h->type);
1685
1686 /*
1687 * This reserves buckets for the worst case, where none of other's
1688 * entries are yet present in h. This is preferable to risking
1689          * an allocation failure in the middle of the move and having to
1690 * rollback or return a partial result.
1691 */
1692 r = resize_buckets(h, n_entries(other));
1693 if (r < 0)
1694 return r;
1695
1696 HASHMAP_FOREACH_IDX(idx, other, i) {
1697 unsigned h_hash;
1698
1699 e = bucket_at(other, idx);
1700 h_hash = bucket_hash(h, e->key);
1701 if (bucket_scan(h, h_hash, e->key) != IDX_NIL)
1702 continue;
1703
1704 n = &bucket_at_swap(&swap, IDX_PUT)->p.b;
1705 n->key = e->key;
1706 if (h->type != HASHMAP_TYPE_SET)
1707 ((struct plain_hashmap_entry*) n)->value =
1708 ((struct plain_hashmap_entry*) e)->value;
1709 assert_se(hashmap_put_boldly(h, h_hash, &swap, false) == 1);
1710
1711 remove_entry(other, idx);
1712 }
1713
1714 return 0;
1715 }
1716
1717 int internal_hashmap_move_one(HashmapBase *h, HashmapBase *other, const void *key) {
1718 struct swap_entries swap;
1719 unsigned h_hash, other_hash, idx;
1720 struct hashmap_base_entry *e, *n;
1721 int r;
1722
1723 assert(h);
1724
1725 h_hash = bucket_hash(h, key);
1726 if (bucket_scan(h, h_hash, key) != IDX_NIL)
1727 return -EEXIST;
1728
1729 if (!other)
1730 return -ENOENT;
1731
1732 assert(other->type == h->type);
1733
1734 other_hash = bucket_hash(other, key);
1735 idx = bucket_scan(other, other_hash, key);
1736 if (idx == IDX_NIL)
1737 return -ENOENT;
1738
1739 e = bucket_at(other, idx);
1740
1741 n = &bucket_at_swap(&swap, IDX_PUT)->p.b;
1742 n->key = e->key;
1743 if (h->type != HASHMAP_TYPE_SET)
1744 ((struct plain_hashmap_entry*) n)->value =
1745 ((struct plain_hashmap_entry*) e)->value;
1746 r = hashmap_put_boldly(h, h_hash, &swap, true);
1747 if (r < 0)
1748 return r;
1749
1750 remove_entry(other, idx);
1751 return 0;
1752 }
1753
1754 HashmapBase *internal_hashmap_copy(HashmapBase *h) {
1755 HashmapBase *copy;
1756 int r;
1757
1758 assert(h);
1759
1760 copy = hashmap_base_new(h->hash_ops, h->type HASHMAP_DEBUG_SRC_ARGS);
1761 if (!copy)
1762 return NULL;
1763
1764 switch (h->type) {
1765 case HASHMAP_TYPE_PLAIN:
1766 case HASHMAP_TYPE_ORDERED:
1767 r = hashmap_merge((Hashmap*)copy, (Hashmap*)h);
1768 break;
1769 case HASHMAP_TYPE_SET:
1770 r = set_merge((Set*)copy, (Set*)h);
1771 break;
1772 default:
1773 assert_not_reached("Unknown hashmap type");
1774 }
1775
1776 if (r < 0) {
1777 internal_hashmap_free(copy);
1778 return NULL;
1779 }
1780
1781 return copy;
1782 }
1783
1784 char **internal_hashmap_get_strv(HashmapBase *h) {
1785 char **sv;
1786 Iterator i;
1787 unsigned idx, n;
1788
1789 sv = new(char*, n_entries(h)+1);
1790 if (!sv)
1791 return NULL;
1792
1793 n = 0;
1794 HASHMAP_FOREACH_IDX(idx, h, i)
1795 sv[n++] = entry_value(h, bucket_at(h, idx));
1796 sv[n] = NULL;
1797
1798 return sv;
1799 }
1800
1801 void *ordered_hashmap_next(OrderedHashmap *h, const void *key) {
1802 struct ordered_hashmap_entry *e;
1803 unsigned hash, idx;
1804
1805 if (!h)
1806 return NULL;
1807
1808 hash = bucket_hash(h, key);
1809 idx = bucket_scan(h, hash, key);
1810 if (idx == IDX_NIL)
1811 return NULL;
1812
1813 e = ordered_bucket_at(h, idx);
1814 if (e->iterate_next == IDX_NIL)
1815 return NULL;
1816 return ordered_bucket_at(h, e->iterate_next)->p.value;
1817 }
1818
1819 int set_consume(Set *s, void *value) {
1820 int r;
1821
1822 assert(s);
1823 assert(value);
1824
1825 r = set_put(s, value);
1826 if (r <= 0)
1827 free(value);
1828
1829 return r;
1830 }
1831
1832 int set_put_strdup(Set *s, const char *p) {
1833 char *c;
1834
1835 assert(s);
1836 assert(p);
1837
1838 if (set_contains(s, (char*) p))
1839 return 0;
1840
1841 c = strdup(p);
1842 if (!c)
1843 return -ENOMEM;
1844
1845 return set_consume(s, c);
1846 }
1847
1848 int set_put_strdupv(Set *s, char **l) {
1849 int n = 0, r;
1850 char **i;
1851
1852 assert(s);
1853
1854 STRV_FOREACH(i, l) {
1855 r = set_put_strdup(s, *i);
1856 if (r < 0)
1857 return r;
1858
1859 n += r;
1860 }
1861
1862 return n;
1863 }
1864
1865 int set_put_strsplit(Set *s, const char *v, const char *separators, ExtractFlags flags) {
1866 const char *p = v;
1867 int r;
1868
1869 assert(s);
1870 assert(v);
1871
1872 for (;;) {
1873 char *word;
1874
1875 r = extract_first_word(&p, &word, separators, flags);
1876 if (r <= 0)
1877 return r;
1878
1879 r = set_consume(s, word);
1880 if (r < 0)
1881 return r;
1882 }
1883 }
1884
1885 /* Expand the cachemem if needed; returns true if newly (re)activated, false otherwise, -ENOMEM on allocation failure. */
1886 static int cachemem_maintain(CacheMem *mem, unsigned size) {
1887 assert(mem);
1888
1889 if (!GREEDY_REALLOC(mem->ptr, mem->n_allocated, size)) {
1890 if (size > 0)
1891 return -ENOMEM;
1892 }
1893
1894 if (!mem->active) {
1895 mem->active = true;
1896 return true;
1897 }
1898
1899 return false;
1900 }
1901
1902 int iterated_cache_get(IteratedCache *cache, const void ***res_keys, const void ***res_values, unsigned *res_n_entries) {
1903 bool sync_keys = false, sync_values = false;
1904 unsigned size;
1905 int r;
1906
1907 assert(cache);
1908 assert(cache->hashmap);
1909
1910 size = n_entries(cache->hashmap);
1911
1912 if (res_keys) {
1913 r = cachemem_maintain(&cache->keys, size);
1914 if (r < 0)
1915 return r;
1916
1917 sync_keys = r;
1918 } else
1919 cache->keys.active = false;
1920
1921 if (res_values) {
1922 r = cachemem_maintain(&cache->values, size);
1923 if (r < 0)
1924 return r;
1925
1926 sync_values = r;
1927 } else
1928 cache->values.active = false;
1929
1930 if (cache->hashmap->dirty) {
1931 if (cache->keys.active)
1932 sync_keys = true;
1933 if (cache->values.active)
1934 sync_values = true;
1935
1936 cache->hashmap->dirty = false;
1937 }
1938
1939 if (sync_keys || sync_values) {
1940 unsigned i, idx;
1941 Iterator iter;
1942
1943 i = 0;
1944 HASHMAP_FOREACH_IDX(idx, cache->hashmap, iter) {
1945 struct hashmap_base_entry *e;
1946
1947 e = bucket_at(cache->hashmap, idx);
1948
1949 if (sync_keys)
1950 cache->keys.ptr[i] = e->key;
1951 if (sync_values)
1952 cache->values.ptr[i] = entry_value(cache->hashmap, e);
1953 i++;
1954 }
1955 }
1956
1957 if (res_keys)
1958 *res_keys = cache->keys.ptr;
1959 if (res_values)
1960 *res_values = cache->values.ptr;
1961 if (res_n_entries)
1962 *res_n_entries = size;
1963
1964 return 0;
1965 }
1966
1967 IteratedCache *iterated_cache_free(IteratedCache *cache) {
1968 if (cache) {
1969 free(cache->keys.ptr);
1970 free(cache->values.ptr);
1971 free(cache);
1972 }
1973
1974 return NULL;
1975 }