1 /*-*- Mode: C; c-basic-offset: 8; indent-tabs-mode: nil -*-*/
2
3 /***
4 This file is part of systemd.
5
6 Copyright 2010 Lennart Poettering
7 Copyright 2014 Michal Schmidt
8
9 systemd is free software; you can redistribute it and/or modify it
10 under the terms of the GNU Lesser General Public License as published by
11 the Free Software Foundation; either version 2.1 of the License, or
12 (at your option) any later version.
13
14 systemd is distributed in the hope that it will be useful, but
15 WITHOUT ANY WARRANTY; without even the implied warranty of
16 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
17 Lesser General Public License for more details.
18
19 You should have received a copy of the GNU Lesser General Public License
20 along with systemd; If not, see <http://www.gnu.org/licenses/>.
21 ***/
22
23 #include <errno.h>
24 #include <pthread.h>
25 #include <stdlib.h>
26
27 #include "alloc-util.h"
28 #include "hashmap.h"
29 #include "macro.h"
30 #include "mempool.h"
31 #include "process-util.h"
32 #include "random-util.h"
33 #include "set.h"
34 #include "siphash24.h"
35 #include "strv.h"
36 #include "util.h"
37
38 #ifdef ENABLE_DEBUG_HASHMAP
39 #include "list.h"
40 #endif
41
42 /*
43 * Implementation of hashmaps.
44 * Addressing: open
45 * - uses less RAM compared to closed addressing (chaining), because
46 * our entries are small (especially in Sets, which tend to contain
47 * the majority of entries in systemd).
48 * Collision resolution: Robin Hood
49 * - tends to equalize displacement of entries from their optimal buckets.
50 * Probe sequence: linear
51 * - though theoretically worse than random probing/uniform hashing/double
52 * hashing, it is good for cache locality.
53 *
54 * References:
55 * Celis, P. 1986. Robin Hood Hashing.
56 * Ph.D. Dissertation. University of Waterloo, Waterloo, Ont., Canada, Canada.
57 * https://cs.uwaterloo.ca/research/tr/1986/CS-86-14.pdf
58 * - The results are derived for random probing. Suggests deletion with
59 * tombstones and two mean-centered search methods. None of that works
60 * well for linear probing.
61 *
62 * Janson, S. 2005. Individual displacements for linear probing hashing with different insertion policies.
63 * ACM Trans. Algorithms 1, 2 (October 2005), 177-213.
64 * DOI=10.1145/1103963.1103964 http://doi.acm.org/10.1145/1103963.1103964
65 * http://www.math.uu.se/~svante/papers/sj157.pdf
66 * - Applies to Robin Hood with linear probing. Contains remarks on
67 * the unsuitability of mean-centered search with linear probing.
68 *
69 * Viola, A. 2005. Exact distribution of individual displacements in linear probing hashing.
70 * ACM Trans. Algorithms 1, 2 (October 2005), 214-242.
71 * DOI=10.1145/1103963.1103965 http://doi.acm.org/10.1145/1103963.1103965
72 * - Similar to Janson. Note that Viola writes about C_{m,n} (number of probes
73 * in a successful search), and Janson writes about displacement. C = d + 1.
74 *
75 * Goossaert, E. 2013. Robin Hood hashing: backward shift deletion.
76 * http://codecapsule.com/2013/11/17/robin-hood-hashing-backward-shift-deletion/
77 * - Explanation of backward shift deletion with pictures.
78 *
79 * Khuong, P. 2013. The Other Robin Hood Hashing.
80 * http://www.pvk.ca/Blog/2013/11/26/the-other-robin-hood-hashing/
81 * - Short summary of random vs. linear probing, and tombstones vs. backward shift.
82 */
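/*
 * An illustrative trace of the Robin Hood rule (a sketch, not taken from the
 * papers above; the insertion loop in hashmap_put_robin_hood() below follows
 * this rule): while probing, compare the displacement (DIB) of the entry
 * being inserted with the DIB of the entry already stored in the bucket, and
 * whenever the stored entry is "richer" (smaller DIB), swap the two and
 * continue with the evicted entry. E.g., with buckets and DIBs
 *
 *     idx:  0    1    2    3
 *     key:  A    B    C    -      DIB(A)=0, DIB(B)=0, DIB(C)=1
 *
 * inserting D that hashes to bucket 1 probes idx 1 (distance 0 vs. stored
 * DIB 0, keep going), idx 2 (distance 1 vs. stored DIB 1, keep going),
 * idx 3 (free) and lands there with DIB 2. Had C been stored with DIB 0,
 * D would have displaced C at idx 2 (both then ending up with DIB 1),
 * keeping displacements equalized.
 */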
83
84 /*
85 * XXX Ideas for improvement:
86 * For unordered hashmaps, randomize iteration order, similarly to Perl:
87 * http://blog.booking.com/hardening-perls-hash-function.html
88 */
89
90 /* INV_KEEP_FREE = 1 / (1 - max_load_factor)
91 * e.g. 1 / (1 - 0.8) = 5 ... keep one fifth of the buckets free. */
92 #define INV_KEEP_FREE 5U
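/*
 * Worked example (values follow directly from the two lines above): with
 * INV_KEEP_FREE = 5 the maximum load factor is 1 - 1/5 = 0.8. resize_buckets()
 * below sizes the table as m = n + n/(INV_KEEP_FREE - 1), so e.g. n = 100
 * entries need m = 100 + 100/4 = 125 buckets, i.e. 100/125 = 0.8 load and
 * 25 buckets (one fifth) stay free.
 */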
93
94 /* Fields common to entries of all hashmap/set types */
95 struct hashmap_base_entry {
96 const void *key;
97 };
98
99 /* Entry types for specific hashmap/set types
100 * hashmap_base_entry must be at the beginning of each entry struct. */
101
102 struct plain_hashmap_entry {
103 struct hashmap_base_entry b;
104 void *value;
105 };
106
107 struct ordered_hashmap_entry {
108 struct plain_hashmap_entry p;
109 unsigned iterate_next, iterate_previous;
110 };
111
112 struct set_entry {
113 struct hashmap_base_entry b;
114 };
115
116 /* In several functions it is advantageous to have the hash table extended
117 * virtually by a couple of additional buckets. We reserve special index values
118 * for these "swap" buckets. */
119 #define _IDX_SWAP_BEGIN (UINT_MAX - 3)
120 #define IDX_PUT (_IDX_SWAP_BEGIN + 0)
121 #define IDX_TMP (_IDX_SWAP_BEGIN + 1)
122 #define _IDX_SWAP_END (_IDX_SWAP_BEGIN + 2)
123
124 #define IDX_FIRST (UINT_MAX - 1) /* special index for freshly initialized iterators */
125 #define IDX_NIL UINT_MAX /* special index value meaning "none" or "end" */
126
127 assert_cc(IDX_FIRST == _IDX_SWAP_END);
128 assert_cc(IDX_FIRST == _IDX_ITERATOR_FIRST);
129
130 /* Storage space for the "swap" buckets.
131 * All entry types can fit into an ordered_hashmap_entry. */
132 struct swap_entries {
133 struct ordered_hashmap_entry e[_IDX_SWAP_END - _IDX_SWAP_BEGIN];
134 };
135
136 /* Distance from Initial Bucket */
137 typedef uint8_t dib_raw_t;
138 #define DIB_RAW_OVERFLOW ((dib_raw_t)0xfdU) /* indicates DIB value is greater than representable */
139 #define DIB_RAW_REHASH ((dib_raw_t)0xfeU) /* entry yet to be rehashed during in-place resize */
140 #define DIB_RAW_FREE ((dib_raw_t)0xffU) /* a free bucket */
141 #define DIB_RAW_INIT ((char)DIB_RAW_FREE) /* a byte to memset a DIB store with when initializing */
142
143 #define DIB_FREE UINT_MAX
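/*
 * Example of the encoding above: an entry whose key hashes to bucket 5 but
 * which ended up stored in bucket 7 has DIB 2, stored directly as the raw
 * byte 0x02. Raw values 0x00..0xfc hold the DIB itself; a displacement of
 * 0xfd (253) or more cannot be represented and is stored as DIB_RAW_OVERFLOW,
 * in which case bucket_calculate_dib() below recomputes the real distance
 * from the key's hash. DIB_FREE is the "cooked" (unsigned) value used for
 * free buckets once the raw byte has been decoded.
 */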
144
145 #ifdef ENABLE_DEBUG_HASHMAP
146 struct hashmap_debug_info {
147 LIST_FIELDS(struct hashmap_debug_info, debug_list);
148 unsigned max_entries; /* high watermark of n_entries */
149
150 /* who allocated this hashmap */
151 int line;
152 const char *file;
153 const char *func;
154
155 /* fields to detect modification while iterating */
156 unsigned put_count; /* counts puts into the hashmap */
157 unsigned rem_count; /* counts removals from hashmap */
158 unsigned last_rem_idx; /* remembers last removal index */
159 };
160
161 /* Tracks all existing hashmaps. Get at it from gdb. See sd_dump_hashmaps.py */
162 static LIST_HEAD(struct hashmap_debug_info, hashmap_debug_list);
163 static pthread_mutex_t hashmap_debug_list_mutex = PTHREAD_MUTEX_INITIALIZER;
164
165 #define HASHMAP_DEBUG_FIELDS struct hashmap_debug_info debug;
166
167 #else /* !ENABLE_DEBUG_HASHMAP */
168 #define HASHMAP_DEBUG_FIELDS
169 #endif /* ENABLE_DEBUG_HASHMAP */
170
171 enum HashmapType {
172 HASHMAP_TYPE_PLAIN,
173 HASHMAP_TYPE_ORDERED,
174 HASHMAP_TYPE_SET,
175 _HASHMAP_TYPE_MAX
176 };
177
178 struct _packed_ indirect_storage {
179 char *storage; /* where buckets and DIBs are stored */
180 uint8_t hash_key[HASH_KEY_SIZE]; /* hash key; changes during resize */
181
182 unsigned n_entries; /* number of stored entries */
183 unsigned n_buckets; /* number of buckets */
184
185 unsigned idx_lowest_entry; /* Index below which all buckets are free.
186 Makes "while(hashmap_steal_first())" loops
187 O(n) instead of O(n^2) for unordered hashmaps. */
188 uint8_t _pad[3]; /* padding for the whole HashmapBase */
189 /* The bitfields in HashmapBase complete the alignment of the whole thing. */
190 };
191
192 struct direct_storage {
193 /* This gives us 39 bytes on 64bit, or 35 bytes on 32bit.
194 * That's room for 4 set_entries + 4 DIB bytes + 3 unused bytes on 64bit,
195 * or 7 set_entries + 7 DIB bytes + 0 unused bytes on 32bit. */
196 char storage[sizeof(struct indirect_storage)];
197 };
198
199 #define DIRECT_BUCKETS(entry_t) \
200 (sizeof(struct direct_storage) / (sizeof(entry_t) + sizeof(dib_raw_t)))
201
202 /* We should be able to store at least one entry directly. */
203 assert_cc(DIRECT_BUCKETS(struct ordered_hashmap_entry) >= 1);
204
205 /* We have 3 bits for n_direct_entries. */
206 assert_cc(DIRECT_BUCKETS(struct set_entry) < (1 << 3));
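/*
 * Worked example of DIRECT_BUCKETS(), using the 64bit sizes quoted in the
 * direct_storage comment below (39 bytes of storage, 8-byte pointers,
 * 4-byte unsigned): a set_entry is a single key pointer, so
 * 39 / (8 + 1 DIB byte) = 4 direct buckets; an ordered_hashmap_entry is
 * key + value + two unsigned link indexes = 24 bytes, so 39 / (24 + 1) = 1
 * direct bucket, which is exactly what the two compile-time assertions
 * above require.
 */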
207
208 /* Hashmaps with directly stored entries all use this shared hash key.
209 * It's no big deal if the key is guessed, because there can be only
210 * a handful of directly stored entries in a hashmap. When a hashmap
211 * outgrows direct storage, it gets its own key for indirect storage. */
212 static uint8_t shared_hash_key[HASH_KEY_SIZE];
213 static bool shared_hash_key_initialized;
214
215 /* Fields that all hashmap/set types must have */
216 struct HashmapBase {
217 const struct hash_ops *hash_ops; /* hash and compare ops to use */
218
219 union _packed_ {
220 struct indirect_storage indirect; /* if has_indirect */
221 struct direct_storage direct; /* if !has_indirect */
222 };
223
224 enum HashmapType type:2; /* HASHMAP_TYPE_* */
225 bool has_indirect:1; /* whether indirect storage is used */
226 unsigned n_direct_entries:3; /* Number of entries in direct storage.
227 * Only valid if !has_indirect. */
228 bool from_pool:1; /* whether was allocated from mempool */
229 HASHMAP_DEBUG_FIELDS /* optional hashmap_debug_info */
230 };
231
232 /* Specific hash types
233 * HashmapBase must be at the beginning of each hashmap struct. */
234
235 struct Hashmap {
236 struct HashmapBase b;
237 };
238
239 struct OrderedHashmap {
240 struct HashmapBase b;
241 unsigned iterate_list_head, iterate_list_tail;
242 };
243
244 struct Set {
245 struct HashmapBase b;
246 };
247
248 DEFINE_MEMPOOL(hashmap_pool, Hashmap, 8);
249 DEFINE_MEMPOOL(ordered_hashmap_pool, OrderedHashmap, 8);
250 /* No need for a separate Set pool */
251 assert_cc(sizeof(Hashmap) == sizeof(Set));
252
253 struct hashmap_type_info {
254 size_t head_size;
255 size_t entry_size;
256 struct mempool *mempool;
257 unsigned n_direct_buckets;
258 };
259
260 static const struct hashmap_type_info hashmap_type_info[_HASHMAP_TYPE_MAX] = {
261 [HASHMAP_TYPE_PLAIN] = {
262 .head_size = sizeof(Hashmap),
263 .entry_size = sizeof(struct plain_hashmap_entry),
264 .mempool = &hashmap_pool,
265 .n_direct_buckets = DIRECT_BUCKETS(struct plain_hashmap_entry),
266 },
267 [HASHMAP_TYPE_ORDERED] = {
268 .head_size = sizeof(OrderedHashmap),
269 .entry_size = sizeof(struct ordered_hashmap_entry),
270 .mempool = &ordered_hashmap_pool,
271 .n_direct_buckets = DIRECT_BUCKETS(struct ordered_hashmap_entry),
272 },
273 [HASHMAP_TYPE_SET] = {
274 .head_size = sizeof(Set),
275 .entry_size = sizeof(struct set_entry),
276 .mempool = &hashmap_pool,
277 .n_direct_buckets = DIRECT_BUCKETS(struct set_entry),
278 },
279 };
280
281 void string_hash_func(const void *p, struct siphash *state) {
282 siphash24_compress(p, strlen(p) + 1, state);
283 }
284
285 int string_compare_func(const void *a, const void *b) {
286 return strcmp(a, b);
287 }
288
289 const struct hash_ops string_hash_ops = {
290 .hash = string_hash_func,
291 .compare = string_compare_func
292 };
293
294 void trivial_hash_func(const void *p, struct siphash *state) {
295 siphash24_compress(&p, sizeof(p), state);
296 }
297
298 int trivial_compare_func(const void *a, const void *b) {
299 return a < b ? -1 : (a > b ? 1 : 0);
300 }
301
302 const struct hash_ops trivial_hash_ops = {
303 .hash = trivial_hash_func,
304 .compare = trivial_compare_func
305 };
306
307 void uint64_hash_func(const void *p, struct siphash *state) {
308 siphash24_compress(p, sizeof(uint64_t), state);
309 }
310
311 int uint64_compare_func(const void *_a, const void *_b) {
312 uint64_t a, b;
313 a = *(const uint64_t*) _a;
314 b = *(const uint64_t*) _b;
315 return a < b ? -1 : (a > b ? 1 : 0);
316 }
317
318 const struct hash_ops uint64_hash_ops = {
319 .hash = uint64_hash_func,
320 .compare = uint64_compare_func
321 };
322
323 #if SIZEOF_DEV_T != 8
324 void devt_hash_func(const void *p, struct siphash *state) {
325 siphash24_compress(p, sizeof(dev_t), state);
326 }
327
328 int devt_compare_func(const void *_a, const void *_b) {
329 dev_t a, b;
330 a = *(const dev_t*) _a;
331 b = *(const dev_t*) _b;
332 return a < b ? -1 : (a > b ? 1 : 0);
333 }
334
335 const struct hash_ops devt_hash_ops = {
336 .hash = devt_hash_func,
337 .compare = devt_compare_func
338 };
339 #endif
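/*
 * The hash_ops instances above cover the common key types. As a minimal
 * sketch (the key type and names here are hypothetical, not part of this
 * file), the same pattern extends to any padding-free fixed-size struct key:
 *
 *     struct foo_key { uint32_t a; uint32_t b; };
 *
 *     static void foo_key_hash_func(const void *p, struct siphash *state) {
 *             siphash24_compress(p, sizeof(struct foo_key), state);
 *     }
 *
 *     static int foo_key_compare_func(const void *a, const void *b) {
 *             return memcmp(a, b, sizeof(struct foo_key));
 *     }
 *
 *     static const struct hash_ops foo_key_hash_ops = {
 *             .hash = foo_key_hash_func,
 *             .compare = foo_key_compare_func,
 *     };
 *
 * Hashing and comparing the raw struct bytes is only safe because this
 * two-uint32_t example has no padding.
 */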
340
341 static unsigned n_buckets(HashmapBase *h) {
342 return h->has_indirect ? h->indirect.n_buckets
343 : hashmap_type_info[h->type].n_direct_buckets;
344 }
345
346 static unsigned n_entries(HashmapBase *h) {
347 return h->has_indirect ? h->indirect.n_entries
348 : h->n_direct_entries;
349 }
350
351 static void n_entries_inc(HashmapBase *h) {
352 if (h->has_indirect)
353 h->indirect.n_entries++;
354 else
355 h->n_direct_entries++;
356 }
357
358 static void n_entries_dec(HashmapBase *h) {
359 if (h->has_indirect)
360 h->indirect.n_entries--;
361 else
362 h->n_direct_entries--;
363 }
364
365 static char *storage_ptr(HashmapBase *h) {
366 return h->has_indirect ? h->indirect.storage
367 : h->direct.storage;
368 }
369
370 static uint8_t *hash_key(HashmapBase *h) {
371 return h->has_indirect ? h->indirect.hash_key
372 : shared_hash_key;
373 }
374
375 static unsigned base_bucket_hash(HashmapBase *h, const void *p) {
376 struct siphash state;
377 uint64_t hash;
378
379 siphash24_init(&state, hash_key(h));
380
381 h->hash_ops->hash(p, &state);
382
383 hash = siphash24_finalize(&state);
384
385 return (unsigned) (hash % n_buckets(h));
386 }
387 #define bucket_hash(h, p) base_bucket_hash(HASHMAP_BASE(h), p)
388
389 static void get_hash_key(uint8_t hash_key[HASH_KEY_SIZE], bool reuse_is_ok) {
390 static uint8_t current[HASH_KEY_SIZE];
391 static bool current_initialized = false;
392
393 /* Returns a hash function key to use. In order to keep things
394 * fast we will not generate a new key each time we allocate a
395 * new hash table. Instead, we'll just reuse the most recently
396 * generated one, except if we never generated one or when we
397 * are rehashing an entire hash table because we reached a
398 * fill level limit. */
399
400 if (!current_initialized || !reuse_is_ok) {
401 random_bytes(current, sizeof(current));
402 current_initialized = true;
403 }
404
405 memcpy(hash_key, current, sizeof(current));
406 }
407
408 static struct hashmap_base_entry *bucket_at(HashmapBase *h, unsigned idx) {
409 return (struct hashmap_base_entry*)
410 (storage_ptr(h) + idx * hashmap_type_info[h->type].entry_size);
411 }
412
413 static struct plain_hashmap_entry *plain_bucket_at(Hashmap *h, unsigned idx) {
414 return (struct plain_hashmap_entry*) bucket_at(HASHMAP_BASE(h), idx);
415 }
416
417 static struct ordered_hashmap_entry *ordered_bucket_at(OrderedHashmap *h, unsigned idx) {
418 return (struct ordered_hashmap_entry*) bucket_at(HASHMAP_BASE(h), idx);
419 }
420
421 static struct set_entry *set_bucket_at(Set *h, unsigned idx) {
422 return (struct set_entry*) bucket_at(HASHMAP_BASE(h), idx);
423 }
424
425 static struct ordered_hashmap_entry *bucket_at_swap(struct swap_entries *swap, unsigned idx) {
426 return &swap->e[idx - _IDX_SWAP_BEGIN];
427 }
428
429 /* Returns a pointer to the bucket at index idx.
430 * Understands real indexes and swap indexes, hence "_virtual". */
431 static struct hashmap_base_entry *bucket_at_virtual(HashmapBase *h, struct swap_entries *swap,
432 unsigned idx) {
433 if (idx < _IDX_SWAP_BEGIN)
434 return bucket_at(h, idx);
435
436 if (idx < _IDX_SWAP_END)
437 return &bucket_at_swap(swap, idx)->p.b;
438
439 assert_not_reached("Invalid index");
440 }
441
442 static dib_raw_t *dib_raw_ptr(HashmapBase *h) {
443 return (dib_raw_t*)
444 (storage_ptr(h) + hashmap_type_info[h->type].entry_size * n_buckets(h));
445 }
446
447 static unsigned bucket_distance(HashmapBase *h, unsigned idx, unsigned from) {
448 return idx >= from ? idx - from
449 : n_buckets(h) + idx - from;
450 }
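/*
 * Example: in a table of n_buckets = 8, an entry that hashes to bucket 6
 * ("from") but is stored in bucket 1 ("idx") has wrapped around the end of
 * the array, so the distance is 8 + 1 - 6 = 3, matching the three linear
 * probing steps 6 -> 7 -> 0 -> 1.
 */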
451
452 static unsigned bucket_calculate_dib(HashmapBase *h, unsigned idx, dib_raw_t raw_dib) {
453 unsigned initial_bucket;
454
455 if (raw_dib == DIB_RAW_FREE)
456 return DIB_FREE;
457
458 if (_likely_(raw_dib < DIB_RAW_OVERFLOW))
459 return raw_dib;
460
461 /*
462 * Having an overflow DIB value is very unlikely. The hash function
463 * would have to be bad. For example, in a table of size 2^24 filled
464 * to load factor 0.9 the maximum observed DIB is only about 60.
465 * In theory (assuming I used Maxima correctly), for an infinite size
466 * hash table with load factor 0.8 the probability of a given entry
467 * having DIB > 40 is 1.9e-8.
468 * This returns the correct DIB value by recomputing the hash value in
469 * the unlikely case. XXX Hitting this case could be a hint to rehash.
470 */
471 initial_bucket = bucket_hash(h, bucket_at(h, idx)->key);
472 return bucket_distance(h, idx, initial_bucket);
473 }
474
475 static void bucket_set_dib(HashmapBase *h, unsigned idx, unsigned dib) {
476 dib_raw_ptr(h)[idx] = dib != DIB_FREE ? MIN(dib, DIB_RAW_OVERFLOW) : DIB_RAW_FREE;
477 }
478
479 static unsigned skip_free_buckets(HashmapBase *h, unsigned idx) {
480 dib_raw_t *dibs;
481
482 dibs = dib_raw_ptr(h);
483
484 for ( ; idx < n_buckets(h); idx++)
485 if (dibs[idx] != DIB_RAW_FREE)
486 return idx;
487
488 return IDX_NIL;
489 }
490
491 static void bucket_mark_free(HashmapBase *h, unsigned idx) {
492 memzero(bucket_at(h, idx), hashmap_type_info[h->type].entry_size);
493 bucket_set_dib(h, idx, DIB_FREE);
494 }
495
496 static void bucket_move_entry(HashmapBase *h, struct swap_entries *swap,
497 unsigned from, unsigned to) {
498 struct hashmap_base_entry *e_from, *e_to;
499
500 assert(from != to);
501
502 e_from = bucket_at_virtual(h, swap, from);
503 e_to = bucket_at_virtual(h, swap, to);
504
505 memcpy(e_to, e_from, hashmap_type_info[h->type].entry_size);
506
507 if (h->type == HASHMAP_TYPE_ORDERED) {
508 OrderedHashmap *lh = (OrderedHashmap*) h;
509 struct ordered_hashmap_entry *le, *le_to;
510
511 le_to = (struct ordered_hashmap_entry*) e_to;
512
513 if (le_to->iterate_next != IDX_NIL) {
514 le = (struct ordered_hashmap_entry*)
515 bucket_at_virtual(h, swap, le_to->iterate_next);
516 le->iterate_previous = to;
517 }
518
519 if (le_to->iterate_previous != IDX_NIL) {
520 le = (struct ordered_hashmap_entry*)
521 bucket_at_virtual(h, swap, le_to->iterate_previous);
522 le->iterate_next = to;
523 }
524
525 if (lh->iterate_list_head == from)
526 lh->iterate_list_head = to;
527 if (lh->iterate_list_tail == from)
528 lh->iterate_list_tail = to;
529 }
530 }
531
532 static unsigned next_idx(HashmapBase *h, unsigned idx) {
533 return (idx + 1U) % n_buckets(h);
534 }
535
536 static unsigned prev_idx(HashmapBase *h, unsigned idx) {
537 return (n_buckets(h) + idx - 1U) % n_buckets(h);
538 }
539
540 static void *entry_value(HashmapBase *h, struct hashmap_base_entry *e) {
541 switch (h->type) {
542
543 case HASHMAP_TYPE_PLAIN:
544 case HASHMAP_TYPE_ORDERED:
545 return ((struct plain_hashmap_entry*)e)->value;
546
547 case HASHMAP_TYPE_SET:
548 return (void*) e->key;
549
550 default:
551 assert_not_reached("Unknown hashmap type");
552 }
553 }
554
555 static void base_remove_entry(HashmapBase *h, unsigned idx) {
556 unsigned left, right, prev, dib;
557 dib_raw_t raw_dib, *dibs;
558
559 dibs = dib_raw_ptr(h);
560 assert(dibs[idx] != DIB_RAW_FREE);
561
562 #ifdef ENABLE_DEBUG_HASHMAP
563 h->debug.rem_count++;
564 h->debug.last_rem_idx = idx;
565 #endif
566
567 left = idx;
568 /* Find the stop bucket ("right"). It is either free or has DIB == 0. */
569 for (right = next_idx(h, left); ; right = next_idx(h, right)) {
570 raw_dib = dibs[right];
571 if (raw_dib == 0 || raw_dib == DIB_RAW_FREE)
572 break;
573
574 /* The buckets are not supposed to be all occupied and with DIB > 0.
575 * That would mean we could make everyone better off by shifting them
576 * backward. This scenario is impossible. */
577 assert(left != right);
578 }
579
580 if (h->type == HASHMAP_TYPE_ORDERED) {
581 OrderedHashmap *lh = (OrderedHashmap*) h;
582 struct ordered_hashmap_entry *le = ordered_bucket_at(lh, idx);
583
584 if (le->iterate_next != IDX_NIL)
585 ordered_bucket_at(lh, le->iterate_next)->iterate_previous = le->iterate_previous;
586 else
587 lh->iterate_list_tail = le->iterate_previous;
588
589 if (le->iterate_previous != IDX_NIL)
590 ordered_bucket_at(lh, le->iterate_previous)->iterate_next = le->iterate_next;
591 else
592 lh->iterate_list_head = le->iterate_next;
593 }
594
595 /* Now shift all buckets in the interval (left, right) one step backwards */
596 for (prev = left, left = next_idx(h, left); left != right;
597 prev = left, left = next_idx(h, left)) {
598 dib = bucket_calculate_dib(h, left, dibs[left]);
599 assert(dib != 0);
600 bucket_move_entry(h, NULL, left, prev);
601 bucket_set_dib(h, prev, dib - 1);
602 }
603
604 bucket_mark_free(h, prev);
605 n_entries_dec(h);
606 }
607 #define remove_entry(h, idx) base_remove_entry(HASHMAP_BASE(h), idx)
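/*
 * Illustration of the backward shift performed by base_remove_entry() (a
 * sketch consistent with the Goossaert reference above): suppose buckets
 * 3..6 hold A(DIB 0), B(DIB 1), C(DIB 1), D(DIB 2) and bucket 7 is free or
 * holds an entry with DIB 0. Removing A at bucket 3 finds the stop bucket at
 * 7, then shifts B, C and D one slot to the left while decrementing each DIB
 * by one, and finally marks bucket 6 free. No tombstones are ever left
 * behind, so lookups never have to skip over deleted slots.
 */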
608
609 static unsigned hashmap_iterate_in_insertion_order(OrderedHashmap *h, Iterator *i) {
610 struct ordered_hashmap_entry *e;
611 unsigned idx;
612
613 assert(h);
614 assert(i);
615
616 if (i->idx == IDX_NIL)
617 goto at_end;
618
619 if (i->idx == IDX_FIRST && h->iterate_list_head == IDX_NIL)
620 goto at_end;
621
622 if (i->idx == IDX_FIRST) {
623 idx = h->iterate_list_head;
624 e = ordered_bucket_at(h, idx);
625 } else {
626 idx = i->idx;
627 e = ordered_bucket_at(h, idx);
628 /*
629 * We allow removing the current entry while iterating, but removal may cause
630 * a backward shift. The next entry may thus move one bucket to the left.
631 * To detect when it happens, we remember the key pointer of the entry we were
632 * going to iterate next. If it does not match, there was a backward shift.
633 */
634 if (e->p.b.key != i->next_key) {
635 idx = prev_idx(HASHMAP_BASE(h), idx);
636 e = ordered_bucket_at(h, idx);
637 }
638 assert(e->p.b.key == i->next_key);
639 }
640
641 #ifdef ENABLE_DEBUG_HASHMAP
642 i->prev_idx = idx;
643 #endif
644
645 if (e->iterate_next != IDX_NIL) {
646 struct ordered_hashmap_entry *n;
647 i->idx = e->iterate_next;
648 n = ordered_bucket_at(h, i->idx);
649 i->next_key = n->p.b.key;
650 } else
651 i->idx = IDX_NIL;
652
653 return idx;
654
655 at_end:
656 i->idx = IDX_NIL;
657 return IDX_NIL;
658 }
659
660 static unsigned hashmap_iterate_in_internal_order(HashmapBase *h, Iterator *i) {
661 unsigned idx;
662
663 assert(h);
664 assert(i);
665
666 if (i->idx == IDX_NIL)
667 goto at_end;
668
669 if (i->idx == IDX_FIRST) {
670 /* fast forward to the first occupied bucket */
671 if (h->has_indirect) {
672 i->idx = skip_free_buckets(h, h->indirect.idx_lowest_entry);
673 h->indirect.idx_lowest_entry = i->idx;
674 } else
675 i->idx = skip_free_buckets(h, 0);
676
677 if (i->idx == IDX_NIL)
678 goto at_end;
679 } else {
680 struct hashmap_base_entry *e;
681
682 assert(i->idx > 0);
683
684 e = bucket_at(h, i->idx);
685 /*
686 * We allow removing the current entry while iterating, but removal may cause
687 * a backward shift. The next entry may thus move one bucket to the left.
688 * To detect when it happens, we remember the key pointer of the entry we were
689 * going to iterate next. If it does not match, there was a backward shift.
690 */
691 if (e->key != i->next_key)
692 e = bucket_at(h, --i->idx);
693
694 assert(e->key == i->next_key);
695 }
696
697 idx = i->idx;
698 #ifdef ENABLE_DEBUG_HASHMAP
699 i->prev_idx = idx;
700 #endif
701
702 i->idx = skip_free_buckets(h, i->idx + 1);
703 if (i->idx != IDX_NIL)
704 i->next_key = bucket_at(h, i->idx)->key;
705 else
706 i->idx = IDX_NIL;
707
708 return idx;
709
710 at_end:
711 i->idx = IDX_NIL;
712 return IDX_NIL;
713 }
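/*
 * Why the next_key check in the two iterators above is sufficient, as a
 * small trace: suppose the iterator has just returned the entry in bucket 3
 * and remembered the key stored in bucket 4 as next_key. If the caller now
 * removes the bucket-3 entry, the backward shift may slide the remembered
 * entry from bucket 4 into bucket 3. On the next step the key found at
 * i->idx no longer matches next_key, so the iterator steps back one bucket,
 * finds the remembered key there and continues without skipping or repeating
 * an entry. Removing anything other than the current entry while iterating
 * is not supported (and is caught by the ENABLE_DEBUG_HASHMAP checks below).
 */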
714
715 static unsigned hashmap_iterate_entry(HashmapBase *h, Iterator *i) {
716 if (!h) {
717 i->idx = IDX_NIL;
718 return IDX_NIL;
719 }
720
721 #ifdef ENABLE_DEBUG_HASHMAP
722 if (i->idx == IDX_FIRST) {
723 i->put_count = h->debug.put_count;
724 i->rem_count = h->debug.rem_count;
725 } else {
726 /* While iterating, must not add any new entries */
727 assert(i->put_count == h->debug.put_count);
728 /* ... or remove entries other than the current one */
729 assert(i->rem_count == h->debug.rem_count ||
730 (i->rem_count == h->debug.rem_count - 1 &&
731 i->prev_idx == h->debug.last_rem_idx));
732 /* Reset our removals counter */
733 i->rem_count = h->debug.rem_count;
734 }
735 #endif
736
737 return h->type == HASHMAP_TYPE_ORDERED ? hashmap_iterate_in_insertion_order((OrderedHashmap*) h, i)
738 : hashmap_iterate_in_internal_order(h, i);
739 }
740
741 bool internal_hashmap_iterate(HashmapBase *h, Iterator *i, void **value, const void **key) {
742 struct hashmap_base_entry *e;
743 void *data;
744 unsigned idx;
745
746 idx = hashmap_iterate_entry(h, i);
747 if (idx == IDX_NIL) {
748 if (value)
749 *value = NULL;
750 if (key)
751 *key = NULL;
752
753 return false;
754 }
755
756 e = bucket_at(h, idx);
757 data = entry_value(h, e);
758 if (value)
759 *value = data;
760 if (key)
761 *key = e->key;
762
763 return true;
764 }
765
766 bool set_iterate(Set *s, Iterator *i, void **value) {
767 return internal_hashmap_iterate(HASHMAP_BASE(s), i, value, NULL);
768 }
769
770 #define HASHMAP_FOREACH_IDX(idx, h, i) \
771 for ((i) = ITERATOR_FIRST, (idx) = hashmap_iterate_entry((h), &(i)); \
772 (idx != IDX_NIL); \
773 (idx) = hashmap_iterate_entry((h), &(i)))
774
775 static void reset_direct_storage(HashmapBase *h) {
776 const struct hashmap_type_info *hi = &hashmap_type_info[h->type];
777 void *p;
778
779 assert(!h->has_indirect);
780
781 p = mempset(h->direct.storage, 0, hi->entry_size * hi->n_direct_buckets);
782 memset(p, DIB_RAW_INIT, sizeof(dib_raw_t) * hi->n_direct_buckets);
783 }
784
785 static struct HashmapBase *hashmap_base_new(const struct hash_ops *hash_ops, enum HashmapType type HASHMAP_DEBUG_PARAMS) {
786 HashmapBase *h;
787 const struct hashmap_type_info *hi = &hashmap_type_info[type];
788 bool use_pool;
789
790 use_pool = is_main_thread();
791
792 h = use_pool ? mempool_alloc0_tile(hi->mempool) : malloc0(hi->head_size);
793
794 if (!h)
795 return NULL;
796
797 h->type = type;
798 h->from_pool = use_pool;
799 h->hash_ops = hash_ops ? hash_ops : &trivial_hash_ops;
800
801 if (type == HASHMAP_TYPE_ORDERED) {
802 OrderedHashmap *lh = (OrderedHashmap*)h;
803 lh->iterate_list_head = lh->iterate_list_tail = IDX_NIL;
804 }
805
806 reset_direct_storage(h);
807
808 if (!shared_hash_key_initialized) {
809 random_bytes(shared_hash_key, sizeof(shared_hash_key));
810                 shared_hash_key_initialized = true;
811 }
812
813 #ifdef ENABLE_DEBUG_HASHMAP
814 h->debug.func = func;
815 h->debug.file = file;
816 h->debug.line = line;
817 assert_se(pthread_mutex_lock(&hashmap_debug_list_mutex) == 0);
818 LIST_PREPEND(debug_list, hashmap_debug_list, &h->debug);
819 assert_se(pthread_mutex_unlock(&hashmap_debug_list_mutex) == 0);
820 #endif
821
822 return h;
823 }
824
825 Hashmap *internal_hashmap_new(const struct hash_ops *hash_ops HASHMAP_DEBUG_PARAMS) {
826 return (Hashmap*) hashmap_base_new(hash_ops, HASHMAP_TYPE_PLAIN HASHMAP_DEBUG_PASS_ARGS);
827 }
828
829 OrderedHashmap *internal_ordered_hashmap_new(const struct hash_ops *hash_ops HASHMAP_DEBUG_PARAMS) {
830 return (OrderedHashmap*) hashmap_base_new(hash_ops, HASHMAP_TYPE_ORDERED HASHMAP_DEBUG_PASS_ARGS);
831 }
832
833 Set *internal_set_new(const struct hash_ops *hash_ops HASHMAP_DEBUG_PARAMS) {
834 return (Set*) hashmap_base_new(hash_ops, HASHMAP_TYPE_SET HASHMAP_DEBUG_PASS_ARGS);
835 }
836
837 static int hashmap_base_ensure_allocated(HashmapBase **h, const struct hash_ops *hash_ops,
838 enum HashmapType type HASHMAP_DEBUG_PARAMS) {
839 HashmapBase *q;
840
841 assert(h);
842
843 if (*h)
844 return 0;
845
846 q = hashmap_base_new(hash_ops, type HASHMAP_DEBUG_PASS_ARGS);
847 if (!q)
848 return -ENOMEM;
849
850 *h = q;
851 return 0;
852 }
853
854 int internal_hashmap_ensure_allocated(Hashmap **h, const struct hash_ops *hash_ops HASHMAP_DEBUG_PARAMS) {
855 return hashmap_base_ensure_allocated((HashmapBase**)h, hash_ops, HASHMAP_TYPE_PLAIN HASHMAP_DEBUG_PASS_ARGS);
856 }
857
858 int internal_ordered_hashmap_ensure_allocated(OrderedHashmap **h, const struct hash_ops *hash_ops HASHMAP_DEBUG_PARAMS) {
859 return hashmap_base_ensure_allocated((HashmapBase**)h, hash_ops, HASHMAP_TYPE_ORDERED HASHMAP_DEBUG_PASS_ARGS);
860 }
861
862 int internal_set_ensure_allocated(Set **s, const struct hash_ops *hash_ops HASHMAP_DEBUG_PARAMS) {
863 return hashmap_base_ensure_allocated((HashmapBase**)s, hash_ops, HASHMAP_TYPE_SET HASHMAP_DEBUG_PASS_ARGS);
864 }
865
866 static void hashmap_free_no_clear(HashmapBase *h) {
867 assert(!h->has_indirect);
868 assert(!h->n_direct_entries);
869
870 #ifdef ENABLE_DEBUG_HASHMAP
871 assert_se(pthread_mutex_lock(&hashmap_debug_list_mutex) == 0);
872 LIST_REMOVE(debug_list, hashmap_debug_list, &h->debug);
873 assert_se(pthread_mutex_unlock(&hashmap_debug_list_mutex) == 0);
874 #endif
875
876 if (h->from_pool)
877 mempool_free_tile(hashmap_type_info[h->type].mempool, h);
878 else
879 free(h);
880 }
881
882 HashmapBase *internal_hashmap_free(HashmapBase *h) {
883
884 /* Free the hashmap, but nothing in it */
885
886 if (h) {
887 internal_hashmap_clear(h);
888 hashmap_free_no_clear(h);
889 }
890
891 return NULL;
892 }
893
894 HashmapBase *internal_hashmap_free_free(HashmapBase *h) {
895
896 /* Free the hashmap and all data objects in it, but not the
897 * keys */
898
899 if (h) {
900 internal_hashmap_clear_free(h);
901 hashmap_free_no_clear(h);
902 }
903
904 return NULL;
905 }
906
907 Hashmap *hashmap_free_free_free(Hashmap *h) {
908
909 /* Free the hashmap and all data and key objects in it */
910
911 if (h) {
912 hashmap_clear_free_free(h);
913 hashmap_free_no_clear(HASHMAP_BASE(h));
914 }
915
916 return NULL;
917 }
918
919 void internal_hashmap_clear(HashmapBase *h) {
920 if (!h)
921 return;
922
923 if (h->has_indirect) {
924 free(h->indirect.storage);
925 h->has_indirect = false;
926 }
927
928 h->n_direct_entries = 0;
929 reset_direct_storage(h);
930
931 if (h->type == HASHMAP_TYPE_ORDERED) {
932 OrderedHashmap *lh = (OrderedHashmap*) h;
933 lh->iterate_list_head = lh->iterate_list_tail = IDX_NIL;
934 }
935 }
936
937 void internal_hashmap_clear_free(HashmapBase *h) {
938 unsigned idx;
939
940 if (!h)
941 return;
942
943 for (idx = skip_free_buckets(h, 0); idx != IDX_NIL;
944 idx = skip_free_buckets(h, idx + 1))
945 free(entry_value(h, bucket_at(h, idx)));
946
947 internal_hashmap_clear(h);
948 }
949
950 void hashmap_clear_free_free(Hashmap *h) {
951 unsigned idx;
952
953 if (!h)
954 return;
955
956 for (idx = skip_free_buckets(HASHMAP_BASE(h), 0); idx != IDX_NIL;
957 idx = skip_free_buckets(HASHMAP_BASE(h), idx + 1)) {
958 struct plain_hashmap_entry *e = plain_bucket_at(h, idx);
959 free((void*)e->b.key);
960 free(e->value);
961 }
962
963 internal_hashmap_clear(HASHMAP_BASE(h));
964 }
965
966 static int resize_buckets(HashmapBase *h, unsigned entries_add);
967
968 /*
969 * Finds an empty bucket to put an entry into, starting the scan at 'idx'.
970 * Performs Robin Hood swaps as it goes. The entry to put must be placed
971 * by the caller into swap slot IDX_PUT.
972 * If used for in-place resizing, may leave a displaced entry in swap slot
973 * IDX_PUT. Caller must rehash it next.
974 * Returns: true if it left a displaced entry to rehash next in IDX_PUT,
975 * false otherwise.
976 */
977 static bool hashmap_put_robin_hood(HashmapBase *h, unsigned idx,
978 struct swap_entries *swap) {
979 dib_raw_t raw_dib, *dibs;
980 unsigned dib, distance;
981
982 #ifdef ENABLE_DEBUG_HASHMAP
983 h->debug.put_count++;
984 #endif
985
986 dibs = dib_raw_ptr(h);
987
988 for (distance = 0; ; distance++) {
989 raw_dib = dibs[idx];
990 if (raw_dib == DIB_RAW_FREE || raw_dib == DIB_RAW_REHASH) {
991 if (raw_dib == DIB_RAW_REHASH)
992 bucket_move_entry(h, swap, idx, IDX_TMP);
993
994 if (h->has_indirect && h->indirect.idx_lowest_entry > idx)
995 h->indirect.idx_lowest_entry = idx;
996
997 bucket_set_dib(h, idx, distance);
998 bucket_move_entry(h, swap, IDX_PUT, idx);
999 if (raw_dib == DIB_RAW_REHASH) {
1000 bucket_move_entry(h, swap, IDX_TMP, IDX_PUT);
1001 return true;
1002 }
1003
1004 return false;
1005 }
1006
1007 dib = bucket_calculate_dib(h, idx, raw_dib);
1008
1009 if (dib < distance) {
1010 /* Found a wealthier entry. Go Robin Hood! */
1011 bucket_set_dib(h, idx, distance);
1012
1013 /* swap the entries */
1014 bucket_move_entry(h, swap, idx, IDX_TMP);
1015 bucket_move_entry(h, swap, IDX_PUT, idx);
1016 bucket_move_entry(h, swap, IDX_TMP, IDX_PUT);
1017
1018 distance = dib;
1019 }
1020
1021 idx = next_idx(h, idx);
1022 }
1023 }
1024
1025 /*
1026 * Puts an entry into a hashmap, boldly - no check whether key already exists.
1027 * The caller must place the entry (only its key and value, not link indexes)
1028 * in swap slot IDX_PUT.
1029  * Caller must ensure: the key does not exist yet in the hashmap,
1030  *                     and that resize is not needed if !may_resize.
1031 * Returns: 1 if entry was put successfully.
1032 * -ENOMEM if may_resize==true and resize failed with -ENOMEM.
1033 * Cannot return -ENOMEM if !may_resize.
1034 */
1035 static int hashmap_base_put_boldly(HashmapBase *h, unsigned idx,
1036 struct swap_entries *swap, bool may_resize) {
1037 struct ordered_hashmap_entry *new_entry;
1038 int r;
1039
1040 assert(idx < n_buckets(h));
1041
1042 new_entry = bucket_at_swap(swap, IDX_PUT);
1043
1044 if (may_resize) {
1045 r = resize_buckets(h, 1);
1046 if (r < 0)
1047 return r;
1048 if (r > 0)
1049 idx = bucket_hash(h, new_entry->p.b.key);
1050 }
1051 assert(n_entries(h) < n_buckets(h));
1052
1053 if (h->type == HASHMAP_TYPE_ORDERED) {
1054 OrderedHashmap *lh = (OrderedHashmap*) h;
1055
1056 new_entry->iterate_next = IDX_NIL;
1057 new_entry->iterate_previous = lh->iterate_list_tail;
1058
1059 if (lh->iterate_list_tail != IDX_NIL) {
1060 struct ordered_hashmap_entry *old_tail;
1061
1062 old_tail = ordered_bucket_at(lh, lh->iterate_list_tail);
1063 assert(old_tail->iterate_next == IDX_NIL);
1064 old_tail->iterate_next = IDX_PUT;
1065 }
1066
1067 lh->iterate_list_tail = IDX_PUT;
1068 if (lh->iterate_list_head == IDX_NIL)
1069 lh->iterate_list_head = IDX_PUT;
1070 }
1071
1072 assert_se(hashmap_put_robin_hood(h, idx, swap) == false);
1073
1074 n_entries_inc(h);
1075 #ifdef ENABLE_DEBUG_HASHMAP
1076 h->debug.max_entries = MAX(h->debug.max_entries, n_entries(h));
1077 #endif
1078
1079 return 1;
1080 }
1081 #define hashmap_put_boldly(h, idx, swap, may_resize) \
1082 hashmap_base_put_boldly(HASHMAP_BASE(h), idx, swap, may_resize)
1083
1084 /*
1085 * Returns 0 if resize is not needed.
1086 * 1 if successfully resized.
1087 * -ENOMEM on allocation failure.
1088 */
1089 static int resize_buckets(HashmapBase *h, unsigned entries_add) {
1090 struct swap_entries swap;
1091 char *new_storage;
1092 dib_raw_t *old_dibs, *new_dibs;
1093 const struct hashmap_type_info *hi;
1094 unsigned idx, optimal_idx;
1095 unsigned old_n_buckets, new_n_buckets, n_rehashed, new_n_entries;
1096 uint8_t new_shift;
1097 bool rehash_next;
1098
1099 assert(h);
1100
1101 hi = &hashmap_type_info[h->type];
1102 new_n_entries = n_entries(h) + entries_add;
1103
1104 /* overflow? */
1105 if (_unlikely_(new_n_entries < entries_add))
1106 return -ENOMEM;
1107
1108 /* For direct storage we allow 100% load, because it's tiny. */
1109 if (!h->has_indirect && new_n_entries <= hi->n_direct_buckets)
1110 return 0;
1111
1112 /*
1113 * Load factor = n/m = 1 - (1/INV_KEEP_FREE).
1114  * From this it follows: m = n + n/(INV_KEEP_FREE - 1)
1115 */
1116 new_n_buckets = new_n_entries + new_n_entries / (INV_KEEP_FREE - 1);
1117 /* overflow? */
1118 if (_unlikely_(new_n_buckets < new_n_entries))
1119 return -ENOMEM;
1120
1121 if (_unlikely_(new_n_buckets > UINT_MAX / (hi->entry_size + sizeof(dib_raw_t))))
1122 return -ENOMEM;
1123
1124 old_n_buckets = n_buckets(h);
1125
1126 if (_likely_(new_n_buckets <= old_n_buckets))
1127 return 0;
1128
1129 new_shift = log2u_round_up(MAX(
1130 new_n_buckets * (hi->entry_size + sizeof(dib_raw_t)),
1131 2 * sizeof(struct direct_storage)));
1132
1133 /* Realloc storage (buckets and DIB array). */
1134 new_storage = realloc(h->has_indirect ? h->indirect.storage : NULL,
1135 1U << new_shift);
1136 if (!new_storage)
1137 return -ENOMEM;
1138
1139 /* Must upgrade direct to indirect storage. */
1140 if (!h->has_indirect) {
1141 memcpy(new_storage, h->direct.storage,
1142 old_n_buckets * (hi->entry_size + sizeof(dib_raw_t)));
1143 h->indirect.n_entries = h->n_direct_entries;
1144 h->indirect.idx_lowest_entry = 0;
1145 h->n_direct_entries = 0;
1146 }
1147
1148 /* Get a new hash key. If we've just upgraded to indirect storage,
1149 * allow reusing a previously generated key. It's still a different key
1150 * from the shared one that we used for direct storage. */
1151 get_hash_key(h->indirect.hash_key, !h->has_indirect);
1152
1153 h->has_indirect = true;
1154 h->indirect.storage = new_storage;
1155 h->indirect.n_buckets = (1U << new_shift) /
1156 (hi->entry_size + sizeof(dib_raw_t));
1157
1158 old_dibs = (dib_raw_t*)(new_storage + hi->entry_size * old_n_buckets);
1159 new_dibs = dib_raw_ptr(h);
1160
1161 /*
1162 * Move the DIB array to the new place, replacing valid DIB values with
1163 * DIB_RAW_REHASH to indicate all of the used buckets need rehashing.
1164 * Note: Overlap is not possible, because we have at least doubled the
1165 * number of buckets and dib_raw_t is smaller than any entry type.
1166 */
1167 for (idx = 0; idx < old_n_buckets; idx++) {
1168 assert(old_dibs[idx] != DIB_RAW_REHASH);
1169 new_dibs[idx] = old_dibs[idx] == DIB_RAW_FREE ? DIB_RAW_FREE
1170 : DIB_RAW_REHASH;
1171 }
1172
1173 /* Zero the area of newly added entries (including the old DIB area) */
1174 memzero(bucket_at(h, old_n_buckets),
1175 (n_buckets(h) - old_n_buckets) * hi->entry_size);
1176
1177 /* The upper half of the new DIB array needs initialization */
1178 memset(&new_dibs[old_n_buckets], DIB_RAW_INIT,
1179 (n_buckets(h) - old_n_buckets) * sizeof(dib_raw_t));
1180
1181 /* Rehash entries that need it */
1182 n_rehashed = 0;
1183 for (idx = 0; idx < old_n_buckets; idx++) {
1184 if (new_dibs[idx] != DIB_RAW_REHASH)
1185 continue;
1186
1187 optimal_idx = bucket_hash(h, bucket_at(h, idx)->key);
1188
1189 /*
1190 * Not much to do if by luck the entry hashes to its current
1191 * location. Just set its DIB.
1192 */
1193 if (optimal_idx == idx) {
1194 new_dibs[idx] = 0;
1195 n_rehashed++;
1196 continue;
1197 }
1198
1199 new_dibs[idx] = DIB_RAW_FREE;
1200 bucket_move_entry(h, &swap, idx, IDX_PUT);
1201 /* bucket_move_entry does not clear the source */
1202 memzero(bucket_at(h, idx), hi->entry_size);
1203
1204 do {
1205 /*
1206 * Find the new bucket for the current entry. This may make
1207 * another entry homeless and load it into IDX_PUT.
1208 */
1209 rehash_next = hashmap_put_robin_hood(h, optimal_idx, &swap);
1210 n_rehashed++;
1211
1212 /* Did the current entry displace another one? */
1213 if (rehash_next)
1214 optimal_idx = bucket_hash(h, bucket_at_swap(&swap, IDX_PUT)->p.b.key);
1215 } while (rehash_next);
1216 }
1217
1218 assert(n_rehashed == n_entries(h));
1219
1220 return 1;
1221 }
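/*
 * Worked example of the sizing logic above, for a plain Hashmap on 64bit
 * (8-byte pointers, so entry_size = 16 plus one DIB byte per bucket, and the
 * 39-byte direct_storage quoted earlier): growing from the 2 direct buckets
 * to 3 entries gives new_n_buckets = 3 + 3/4 = 3. The storage size is then
 * rounded up to a power of two, new_shift = log2u_round_up(MAX(3*17, 2*39))
 * = log2u_round_up(78) = 7, i.e. 128 bytes, which actually yields
 * 128 / 17 = 7 indirect buckets, so several further insertions fit before
 * the next reallocation.
 */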
1222
1223 /*
1224 * Finds an entry with a matching key
1225 * Returns: index of the found entry, or IDX_NIL if not found.
1226 */
1227 static unsigned base_bucket_scan(HashmapBase *h, unsigned idx, const void *key) {
1228 struct hashmap_base_entry *e;
1229 unsigned dib, distance;
1230 dib_raw_t *dibs = dib_raw_ptr(h);
1231
1232 assert(idx < n_buckets(h));
1233
1234 for (distance = 0; ; distance++) {
1235 if (dibs[idx] == DIB_RAW_FREE)
1236 return IDX_NIL;
1237
1238 dib = bucket_calculate_dib(h, idx, dibs[idx]);
1239
1240 if (dib < distance)
1241 return IDX_NIL;
1242 if (dib == distance) {
1243 e = bucket_at(h, idx);
1244 if (h->hash_ops->compare(e->key, key) == 0)
1245 return idx;
1246 }
1247
1248 idx = next_idx(h, idx);
1249 }
1250 }
1251 #define bucket_scan(h, idx, key) base_bucket_scan(HASHMAP_BASE(h), idx, key)
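/*
 * The "dib < distance" early exit above is what makes unsuccessful lookups
 * cheap: under the Robin Hood invariant an entry is never stored behind a
 * bucket whose occupant is closer to its own home bucket than the probed key
 * would be, so the first "richer" entry encountered proves the key is
 * absent. E.g. when looking up a key that hashes to bucket 3, finding an
 * entry with DIB 0 in bucket 4 (i.e. an entry that belongs to bucket 4)
 * already rules the key out.
 */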
1252
1253 int hashmap_put(Hashmap *h, const void *key, void *value) {
1254 struct swap_entries swap;
1255 struct plain_hashmap_entry *e;
1256 unsigned hash, idx;
1257
1258 assert(h);
1259
1260 hash = bucket_hash(h, key);
1261 idx = bucket_scan(h, hash, key);
1262 if (idx != IDX_NIL) {
1263 e = plain_bucket_at(h, idx);
1264 if (e->value == value)
1265 return 0;
1266 return -EEXIST;
1267 }
1268
1269 e = &bucket_at_swap(&swap, IDX_PUT)->p;
1270 e->b.key = key;
1271 e->value = value;
1272 return hashmap_put_boldly(h, hash, &swap, true);
1273 }
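/*
 * Return value semantics of hashmap_put(), as a minimal usage sketch
 * (assuming h was created with string_hash_ops and that v and other_v are
 * distinct pointers; the names are for illustration only):
 *
 *     r = hashmap_put(h, "key", v);        returns 1: newly inserted
 *     r = hashmap_put(h, "key", v);        returns 0: same key, same value
 *     r = hashmap_put(h, "key", other_v);  returns -EEXIST: value differs
 *
 * hashmap_replace() below overwrites the existing value (and key pointer)
 * instead of failing, and hashmap_update() only succeeds for keys that are
 * already present.
 */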
1274
1275 int set_put(Set *s, const void *key) {
1276 struct swap_entries swap;
1277 struct hashmap_base_entry *e;
1278 unsigned hash, idx;
1279
1280 assert(s);
1281
1282 hash = bucket_hash(s, key);
1283 idx = bucket_scan(s, hash, key);
1284 if (idx != IDX_NIL)
1285 return 0;
1286
1287 e = &bucket_at_swap(&swap, IDX_PUT)->p.b;
1288 e->key = key;
1289 return hashmap_put_boldly(s, hash, &swap, true);
1290 }
1291
1292 int hashmap_replace(Hashmap *h, const void *key, void *value) {
1293 struct swap_entries swap;
1294 struct plain_hashmap_entry *e;
1295 unsigned hash, idx;
1296
1297 assert(h);
1298
1299 hash = bucket_hash(h, key);
1300 idx = bucket_scan(h, hash, key);
1301 if (idx != IDX_NIL) {
1302 e = plain_bucket_at(h, idx);
1303 #ifdef ENABLE_DEBUG_HASHMAP
1304 /* Although the key is equal, the key pointer may have changed,
1305 * and this would break our assumption for iterating. So count
1306 * this operation as incompatible with iteration. */
1307 if (e->b.key != key) {
1308 h->b.debug.put_count++;
1309 h->b.debug.rem_count++;
1310 h->b.debug.last_rem_idx = idx;
1311 }
1312 #endif
1313 e->b.key = key;
1314 e->value = value;
1315 return 0;
1316 }
1317
1318 e = &bucket_at_swap(&swap, IDX_PUT)->p;
1319 e->b.key = key;
1320 e->value = value;
1321 return hashmap_put_boldly(h, hash, &swap, true);
1322 }
1323
1324 int hashmap_update(Hashmap *h, const void *key, void *value) {
1325 struct plain_hashmap_entry *e;
1326 unsigned hash, idx;
1327
1328 assert(h);
1329
1330 hash = bucket_hash(h, key);
1331 idx = bucket_scan(h, hash, key);
1332 if (idx == IDX_NIL)
1333 return -ENOENT;
1334
1335 e = plain_bucket_at(h, idx);
1336 e->value = value;
1337 return 0;
1338 }
1339
1340 void *internal_hashmap_get(HashmapBase *h, const void *key) {
1341 struct hashmap_base_entry *e;
1342 unsigned hash, idx;
1343
1344 if (!h)
1345 return NULL;
1346
1347 hash = bucket_hash(h, key);
1348 idx = bucket_scan(h, hash, key);
1349 if (idx == IDX_NIL)
1350 return NULL;
1351
1352 e = bucket_at(h, idx);
1353 return entry_value(h, e);
1354 }
1355
1356 void *hashmap_get2(Hashmap *h, const void *key, void **key2) {
1357 struct plain_hashmap_entry *e;
1358 unsigned hash, idx;
1359
1360 if (!h)
1361 return NULL;
1362
1363 hash = bucket_hash(h, key);
1364 idx = bucket_scan(h, hash, key);
1365 if (idx == IDX_NIL)
1366 return NULL;
1367
1368 e = plain_bucket_at(h, idx);
1369 if (key2)
1370 *key2 = (void*) e->b.key;
1371
1372 return e->value;
1373 }
1374
1375 bool internal_hashmap_contains(HashmapBase *h, const void *key) {
1376 unsigned hash;
1377
1378 if (!h)
1379 return false;
1380
1381 hash = bucket_hash(h, key);
1382 return bucket_scan(h, hash, key) != IDX_NIL;
1383 }
1384
1385 void *internal_hashmap_remove(HashmapBase *h, const void *key) {
1386 struct hashmap_base_entry *e;
1387 unsigned hash, idx;
1388 void *data;
1389
1390 if (!h)
1391 return NULL;
1392
1393 hash = bucket_hash(h, key);
1394 idx = bucket_scan(h, hash, key);
1395 if (idx == IDX_NIL)
1396 return NULL;
1397
1398 e = bucket_at(h, idx);
1399 data = entry_value(h, e);
1400 remove_entry(h, idx);
1401
1402 return data;
1403 }
1404
1405 void *hashmap_remove2(Hashmap *h, const void *key, void **rkey) {
1406 struct plain_hashmap_entry *e;
1407 unsigned hash, idx;
1408 void *data;
1409
1410 if (!h) {
1411 if (rkey)
1412 *rkey = NULL;
1413 return NULL;
1414 }
1415
1416 hash = bucket_hash(h, key);
1417 idx = bucket_scan(h, hash, key);
1418 if (idx == IDX_NIL) {
1419 if (rkey)
1420 *rkey = NULL;
1421 return NULL;
1422 }
1423
1424 e = plain_bucket_at(h, idx);
1425 data = e->value;
1426 if (rkey)
1427 *rkey = (void*) e->b.key;
1428
1429 remove_entry(h, idx);
1430
1431 return data;
1432 }
1433
1434 int hashmap_remove_and_put(Hashmap *h, const void *old_key, const void *new_key, void *value) {
1435 struct swap_entries swap;
1436 struct plain_hashmap_entry *e;
1437 unsigned old_hash, new_hash, idx;
1438
1439 if (!h)
1440 return -ENOENT;
1441
1442 old_hash = bucket_hash(h, old_key);
1443 idx = bucket_scan(h, old_hash, old_key);
1444 if (idx == IDX_NIL)
1445 return -ENOENT;
1446
1447 new_hash = bucket_hash(h, new_key);
1448 if (bucket_scan(h, new_hash, new_key) != IDX_NIL)
1449 return -EEXIST;
1450
1451 remove_entry(h, idx);
1452
1453 e = &bucket_at_swap(&swap, IDX_PUT)->p;
1454 e->b.key = new_key;
1455 e->value = value;
1456 assert_se(hashmap_put_boldly(h, new_hash, &swap, false) == 1);
1457
1458 return 0;
1459 }
1460
1461 int set_remove_and_put(Set *s, const void *old_key, const void *new_key) {
1462 struct swap_entries swap;
1463 struct hashmap_base_entry *e;
1464 unsigned old_hash, new_hash, idx;
1465
1466 if (!s)
1467 return -ENOENT;
1468
1469 old_hash = bucket_hash(s, old_key);
1470 idx = bucket_scan(s, old_hash, old_key);
1471 if (idx == IDX_NIL)
1472 return -ENOENT;
1473
1474 new_hash = bucket_hash(s, new_key);
1475 if (bucket_scan(s, new_hash, new_key) != IDX_NIL)
1476 return -EEXIST;
1477
1478 remove_entry(s, idx);
1479
1480 e = &bucket_at_swap(&swap, IDX_PUT)->p.b;
1481 e->key = new_key;
1482 assert_se(hashmap_put_boldly(s, new_hash, &swap, false) == 1);
1483
1484 return 0;
1485 }
1486
1487 int hashmap_remove_and_replace(Hashmap *h, const void *old_key, const void *new_key, void *value) {
1488 struct swap_entries swap;
1489 struct plain_hashmap_entry *e;
1490 unsigned old_hash, new_hash, idx_old, idx_new;
1491
1492 if (!h)
1493 return -ENOENT;
1494
1495 old_hash = bucket_hash(h, old_key);
1496 idx_old = bucket_scan(h, old_hash, old_key);
1497 if (idx_old == IDX_NIL)
1498 return -ENOENT;
1499
1500 old_key = bucket_at(HASHMAP_BASE(h), idx_old)->key;
1501
1502 new_hash = bucket_hash(h, new_key);
1503 idx_new = bucket_scan(h, new_hash, new_key);
1504 if (idx_new != IDX_NIL)
1505 if (idx_old != idx_new) {
1506 remove_entry(h, idx_new);
1507 /* Compensate for a possible backward shift. */
1508 if (old_key != bucket_at(HASHMAP_BASE(h), idx_old)->key)
1509 idx_old = prev_idx(HASHMAP_BASE(h), idx_old);
1510 assert(old_key == bucket_at(HASHMAP_BASE(h), idx_old)->key);
1511 }
1512
1513 remove_entry(h, idx_old);
1514
1515 e = &bucket_at_swap(&swap, IDX_PUT)->p;
1516 e->b.key = new_key;
1517 e->value = value;
1518 assert_se(hashmap_put_boldly(h, new_hash, &swap, false) == 1);
1519
1520 return 0;
1521 }
1522
1523 void *hashmap_remove_value(Hashmap *h, const void *key, void *value) {
1524 struct plain_hashmap_entry *e;
1525 unsigned hash, idx;
1526
1527 if (!h)
1528 return NULL;
1529
1530 hash = bucket_hash(h, key);
1531 idx = bucket_scan(h, hash, key);
1532 if (idx == IDX_NIL)
1533 return NULL;
1534
1535 e = plain_bucket_at(h, idx);
1536 if (e->value != value)
1537 return NULL;
1538
1539 remove_entry(h, idx);
1540
1541 return value;
1542 }
1543
1544 static unsigned find_first_entry(HashmapBase *h) {
1545 Iterator i = ITERATOR_FIRST;
1546
1547 if (!h || !n_entries(h))
1548 return IDX_NIL;
1549
1550 return hashmap_iterate_entry(h, &i);
1551 }
1552
1553 void *internal_hashmap_first(HashmapBase *h) {
1554 unsigned idx;
1555
1556 idx = find_first_entry(h);
1557 if (idx == IDX_NIL)
1558 return NULL;
1559
1560 return entry_value(h, bucket_at(h, idx));
1561 }
1562
1563 void *internal_hashmap_first_key(HashmapBase *h) {
1564 struct hashmap_base_entry *e;
1565 unsigned idx;
1566
1567 idx = find_first_entry(h);
1568 if (idx == IDX_NIL)
1569 return NULL;
1570
1571 e = bucket_at(h, idx);
1572 return (void*) e->key;
1573 }
1574
1575 void *internal_hashmap_steal_first(HashmapBase *h) {
1576 struct hashmap_base_entry *e;
1577 void *data;
1578 unsigned idx;
1579
1580 idx = find_first_entry(h);
1581 if (idx == IDX_NIL)
1582 return NULL;
1583
1584 e = bucket_at(h, idx);
1585 data = entry_value(h, e);
1586 remove_entry(h, idx);
1587
1588 return data;
1589 }
1590
1591 void *internal_hashmap_steal_first_key(HashmapBase *h) {
1592 struct hashmap_base_entry *e;
1593 void *key;
1594 unsigned idx;
1595
1596 idx = find_first_entry(h);
1597 if (idx == IDX_NIL)
1598 return NULL;
1599
1600 e = bucket_at(h, idx);
1601 key = (void*) e->key;
1602 remove_entry(h, idx);
1603
1604 return key;
1605 }
1606
1607 unsigned internal_hashmap_size(HashmapBase *h) {
1608
1609 if (!h)
1610 return 0;
1611
1612 return n_entries(h);
1613 }
1614
1615 unsigned internal_hashmap_buckets(HashmapBase *h) {
1616
1617 if (!h)
1618 return 0;
1619
1620 return n_buckets(h);
1621 }
1622
1623 int internal_hashmap_merge(Hashmap *h, Hashmap *other) {
1624 Iterator i;
1625 unsigned idx;
1626
1627 assert(h);
1628
1629 HASHMAP_FOREACH_IDX(idx, HASHMAP_BASE(other), i) {
1630 struct plain_hashmap_entry *pe = plain_bucket_at(other, idx);
1631 int r;
1632
1633 r = hashmap_put(h, pe->b.key, pe->value);
1634 if (r < 0 && r != -EEXIST)
1635 return r;
1636 }
1637
1638 return 0;
1639 }
1640
1641 int set_merge(Set *s, Set *other) {
1642 Iterator i;
1643 unsigned idx;
1644
1645 assert(s);
1646
1647 HASHMAP_FOREACH_IDX(idx, HASHMAP_BASE(other), i) {
1648 struct set_entry *se = set_bucket_at(other, idx);
1649 int r;
1650
1651 r = set_put(s, se->b.key);
1652 if (r < 0)
1653 return r;
1654 }
1655
1656 return 0;
1657 }
1658
1659 int internal_hashmap_reserve(HashmapBase *h, unsigned entries_add) {
1660 int r;
1661
1662 assert(h);
1663
1664 r = resize_buckets(h, entries_add);
1665 if (r < 0)
1666 return r;
1667
1668 return 0;
1669 }
1670
1671 /*
1672 * The same as hashmap_merge(), but every new item from other is moved to h.
1673 * Keys already in h are skipped and stay in other.
1674 * Returns: 0 on success.
1675 * -ENOMEM on alloc failure, in which case no move has been done.
1676 */
1677 int internal_hashmap_move(HashmapBase *h, HashmapBase *other) {
1678 struct swap_entries swap;
1679 struct hashmap_base_entry *e, *n;
1680 Iterator i;
1681 unsigned idx;
1682 int r;
1683
1684 assert(h);
1685
1686 if (!other)
1687 return 0;
1688
1689 assert(other->type == h->type);
1690
1691 /*
1692 * This reserves buckets for the worst case, where none of other's
1693 * entries are yet present in h. This is preferable to risking
1694 * an allocation failure in the middle of the moving and having to
1695 * rollback or return a partial result.
1696 */
1697 r = resize_buckets(h, n_entries(other));
1698 if (r < 0)
1699 return r;
1700
1701 HASHMAP_FOREACH_IDX(idx, other, i) {
1702 unsigned h_hash;
1703
1704 e = bucket_at(other, idx);
1705 h_hash = bucket_hash(h, e->key);
1706 if (bucket_scan(h, h_hash, e->key) != IDX_NIL)
1707 continue;
1708
1709 n = &bucket_at_swap(&swap, IDX_PUT)->p.b;
1710 n->key = e->key;
1711 if (h->type != HASHMAP_TYPE_SET)
1712 ((struct plain_hashmap_entry*) n)->value =
1713 ((struct plain_hashmap_entry*) e)->value;
1714 assert_se(hashmap_put_boldly(h, h_hash, &swap, false) == 1);
1715
1716 remove_entry(other, idx);
1717 }
1718
1719 return 0;
1720 }
1721
1722 int internal_hashmap_move_one(HashmapBase *h, HashmapBase *other, const void *key) {
1723 struct swap_entries swap;
1724 unsigned h_hash, other_hash, idx;
1725 struct hashmap_base_entry *e, *n;
1726 int r;
1727
1728 assert(h);
1729
1730 h_hash = bucket_hash(h, key);
1731 if (bucket_scan(h, h_hash, key) != IDX_NIL)
1732 return -EEXIST;
1733
1734 if (!other)
1735 return -ENOENT;
1736
1737 assert(other->type == h->type);
1738
1739 other_hash = bucket_hash(other, key);
1740 idx = bucket_scan(other, other_hash, key);
1741 if (idx == IDX_NIL)
1742 return -ENOENT;
1743
1744 e = bucket_at(other, idx);
1745
1746 n = &bucket_at_swap(&swap, IDX_PUT)->p.b;
1747 n->key = e->key;
1748 if (h->type != HASHMAP_TYPE_SET)
1749 ((struct plain_hashmap_entry*) n)->value =
1750 ((struct plain_hashmap_entry*) e)->value;
1751 r = hashmap_put_boldly(h, h_hash, &swap, true);
1752 if (r < 0)
1753 return r;
1754
1755 remove_entry(other, idx);
1756 return 0;
1757 }
1758
1759 HashmapBase *internal_hashmap_copy(HashmapBase *h) {
1760 HashmapBase *copy;
1761 int r;
1762
1763 assert(h);
1764
1765 copy = hashmap_base_new(h->hash_ops, h->type HASHMAP_DEBUG_SRC_ARGS);
1766 if (!copy)
1767 return NULL;
1768
1769 switch (h->type) {
1770 case HASHMAP_TYPE_PLAIN:
1771 case HASHMAP_TYPE_ORDERED:
1772 r = hashmap_merge((Hashmap*)copy, (Hashmap*)h);
1773 break;
1774 case HASHMAP_TYPE_SET:
1775 r = set_merge((Set*)copy, (Set*)h);
1776 break;
1777 default:
1778 assert_not_reached("Unknown hashmap type");
1779 }
1780
1781 if (r < 0) {
1782 internal_hashmap_free(copy);
1783 return NULL;
1784 }
1785
1786 return copy;
1787 }
1788
1789 char **internal_hashmap_get_strv(HashmapBase *h) {
1790 char **sv;
1791 Iterator i;
1792 unsigned idx, n;
1793
1794 sv = new(char*, n_entries(h)+1);
1795 if (!sv)
1796 return NULL;
1797
1798 n = 0;
1799 HASHMAP_FOREACH_IDX(idx, h, i)
1800 sv[n++] = entry_value(h, bucket_at(h, idx));
1801 sv[n] = NULL;
1802
1803 return sv;
1804 }
1805
1806 void *ordered_hashmap_next(OrderedHashmap *h, const void *key) {
1807 struct ordered_hashmap_entry *e;
1808 unsigned hash, idx;
1809
1810 if (!h)
1811 return NULL;
1812
1813 hash = bucket_hash(h, key);
1814 idx = bucket_scan(h, hash, key);
1815 if (idx == IDX_NIL)
1816 return NULL;
1817
1818 e = ordered_bucket_at(h, idx);
1819 if (e->iterate_next == IDX_NIL)
1820 return NULL;
1821 return ordered_bucket_at(h, e->iterate_next)->p.value;
1822 }
1823
1824 int set_consume(Set *s, void *value) {
1825 int r;
1826
1827 r = set_put(s, value);
1828 if (r <= 0)
1829 free(value);
1830
1831 return r;
1832 }
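/*
 * Ownership rule of set_consume(), sketched (s is assumed to use
 * string_hash_ops; the names are illustrative only): the value is freed
 * unless it was newly inserted, so the caller must not touch it afterwards:
 *
 *     char *v = strdup("foo");
 *     if (!v)
 *             return -ENOMEM;
 *     r = set_consume(s, v);   frees v on failure or if an equal string
 *                              was already present; on r > 0 the set owns v
 *     if (r < 0)
 *             return r;
 *
 * set_put_strdup() below wraps exactly this pattern and additionally maps
 * -EEXIST to 0.
 */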
1833
1834 int set_put_strdup(Set *s, const char *p) {
1835 char *c;
1836 int r;
1837
1838 assert(s);
1839 assert(p);
1840
1841 c = strdup(p);
1842 if (!c)
1843 return -ENOMEM;
1844
1845 r = set_consume(s, c);
1846 if (r == -EEXIST)
1847 return 0;
1848
1849 return r;
1850 }
1851
1852 int set_put_strdupv(Set *s, char **l) {
1853 int n = 0, r;
1854 char **i;
1855
1856 STRV_FOREACH(i, l) {
1857 r = set_put_strdup(s, *i);
1858 if (r < 0)
1859 return r;
1860
1861 n += r;
1862 }
1863
1864 return n;
1865 }