1 /*-*- Mode: C; c-basic-offset: 8; indent-tabs-mode: nil -*-*/
2
3 /***
4 This file is part of systemd.
5
6 Copyright 2010 Lennart Poettering
7 Copyright 2014 Michal Schmidt
8
9 systemd is free software; you can redistribute it and/or modify it
10 under the terms of the GNU Lesser General Public License as published by
11 the Free Software Foundation; either version 2.1 of the License, or
12 (at your option) any later version.
13
14 systemd is distributed in the hope that it will be useful, but
15 WITHOUT ANY WARRANTY; without even the implied warranty of
16 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
17 Lesser General Public License for more details.
18
19 You should have received a copy of the GNU Lesser General Public License
20 along with systemd; If not, see <http://www.gnu.org/licenses/>.
21 ***/
22
23 #include <errno.h>
24 #include <stdint.h>
25 #include <stdlib.h>
26 #include <string.h>
27
28 #include "alloc-util.h"
29 #include "hashmap.h"
30 #include "macro.h"
31 #include "mempool.h"
32 #include "process-util.h"
33 #include "random-util.h"
34 #include "set.h"
35 #include "siphash24.h"
36 #include "strv.h"
37 #include "util.h"
38
39 #ifdef ENABLE_DEBUG_HASHMAP
40 #include "list.h"
41 #endif
42
43 /*
44 * Implementation of hashmaps.
45 * Addressing: open
46 * - uses less RAM compared to closed addressing (chaining), because
47 * our entries are small (especially in Sets, which tend to contain
48 * the majority of entries in systemd).
49 * Collision resolution: Robin Hood
50 * - tends to equalize displacement of entries from their optimal buckets.
51 * Probe sequence: linear
52 * - though theoretically worse than random probing/uniform hashing/double
53 * hashing, it is good for cache locality.
54 *
55 * References:
56 * Celis, P. 1986. Robin Hood Hashing.
57 * Ph.D. Dissertation. University of Waterloo, Waterloo, Ont., Canada, Canada.
58 * https://cs.uwaterloo.ca/research/tr/1986/CS-86-14.pdf
59 * - The results are derived for random probing. Suggests deletion with
60 * tombstones and two mean-centered search methods. None of that works
61 * well for linear probing.
62 *
63 * Janson, S. 2005. Individual displacements for linear probing hashing with different insertion policies.
64 * ACM Trans. Algorithms 1, 2 (October 2005), 177-213.
65 * DOI=10.1145/1103963.1103964 http://doi.acm.org/10.1145/1103963.1103964
66 * http://www.math.uu.se/~svante/papers/sj157.pdf
67 * - Applies to Robin Hood with linear probing. Contains remarks on
68 * the unsuitability of mean-centered search with linear probing.
69 *
70 * Viola, A. 2005. Exact distribution of individual displacements in linear probing hashing.
71 * ACM Trans. Algorithms 1, 2 (October 2005), 214-242.
72 * DOI=10.1145/1103963.1103965 http://doi.acm.org/10.1145/1103963.1103965
73 * - Similar to Janson. Note that Viola writes about C_{m,n} (number of probes
74 * in a successful search), and Janson writes about displacement. C = d + 1.
75 *
76 * Goossaert, E. 2013. Robin Hood hashing: backward shift deletion.
77 * http://codecapsule.com/2013/11/17/robin-hood-hashing-backward-shift-deletion/
78 * - Explanation of backward shift deletion with pictures.
79 *
80 * Khuong, P. 2013. The Other Robin Hood Hashing.
81 * http://www.pvk.ca/Blog/2013/11/26/the-other-robin-hood-hashing/
82 * - Short summary of random vs. linear probing, and tombstones vs. backward shift.
83 */
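/*
 * Worked example of the Robin Hood rule above (illustrative only, not taken
 * from the references): suppose an insertion probe reaches bucket 7 with the
 * new entry already displaced by 3 buckets from its optimal position
 * (distance = 3), while the entry currently stored in bucket 7 has a DIB of
 * only 1. Because 1 < 3, the resident entry is the "richer" one: the new
 * entry takes bucket 7 and records DIB = 3, and probing continues at bucket 8
 * with the displaced entry, whose distance restarts at 1. This swap rule is
 * what keeps the displacements of all entries close to each other; see
 * hashmap_put_robin_hood() below for the real implementation.
 */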
84
85 /*
86 * XXX Ideas for improvement:
87 * For unordered hashmaps, randomize iteration order, similarly to Perl:
88 * http://blog.booking.com/hardening-perls-hash-function.html
89 */
90
91 /* INV_KEEP_FREE = 1 / (1 - max_load_factor)
92 * e.g. 1 / (1 - 0.8) = 5 ... keep one fifth of the buckets free. */
93 #define INV_KEEP_FREE 5U
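/* Worked example (illustrative): with INV_KEEP_FREE = 5 the target load factor
 * is 1 - 1/5 = 0.8, and resize_buckets() below computes the minimum bucket
 * count as m = n + n/(INV_KEEP_FREE - 1); for n = 100 entries that is
 * m = 100 + 100/4 = 125 buckets, i.e. one fifth of them stay free. */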
94
95 /* Fields common to entries of all hashmap/set types */
96 struct hashmap_base_entry {
97 const void *key;
98 };
99
100 /* Entry types for specific hashmap/set types
101 * hashmap_base_entry must be at the beginning of each entry struct. */
102
103 struct plain_hashmap_entry {
104 struct hashmap_base_entry b;
105 void *value;
106 };
107
108 struct ordered_hashmap_entry {
109 struct plain_hashmap_entry p;
110 unsigned iterate_next, iterate_previous;
111 };
112
113 struct set_entry {
114 struct hashmap_base_entry b;
115 };
116
117 /* In several functions it is advantageous to have the hash table extended
118 * virtually by a couple of additional buckets. We reserve special index values
119 * for these "swap" buckets. */
120 #define _IDX_SWAP_BEGIN (UINT_MAX - 3)
121 #define IDX_PUT (_IDX_SWAP_BEGIN + 0)
122 #define IDX_TMP (_IDX_SWAP_BEGIN + 1)
123 #define _IDX_SWAP_END (_IDX_SWAP_BEGIN + 2)
124
125 #define IDX_FIRST (UINT_MAX - 1) /* special index for freshly initialized iterators */
126 #define IDX_NIL UINT_MAX /* special index value meaning "none" or "end" */
127
128 assert_cc(IDX_FIRST == _IDX_SWAP_END);
129 assert_cc(IDX_FIRST == _IDX_ITERATOR_FIRST);
130
131 /* Storage space for the "swap" buckets.
132 * All entry types can fit into an ordered_hashmap_entry. */
133 struct swap_entries {
134 struct ordered_hashmap_entry e[_IDX_SWAP_END - _IDX_SWAP_BEGIN];
135 };
136
137 /* Distance from Initial Bucket */
138 typedef uint8_t dib_raw_t;
139 #define DIB_RAW_OVERFLOW ((dib_raw_t)0xfdU) /* indicates DIB value is greater than representable */
140 #define DIB_RAW_REHASH ((dib_raw_t)0xfeU) /* entry yet to be rehashed during in-place resize */
141 #define DIB_RAW_FREE ((dib_raw_t)0xffU) /* a free bucket */
142 #define DIB_RAW_INIT ((char)DIB_RAW_FREE) /* a byte to memset a DIB store with when initializing */
143
144 #define DIB_FREE UINT_MAX
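/* Example of the encoding above (illustrative): raw values below
 * DIB_RAW_OVERFLOW are literal DIBs, so a stored 5 simply means "displaced by
 * 5 buckets". A displacement of, say, 300 does not fit, so bucket_set_dib()
 * clamps it to DIB_RAW_OVERFLOW and bucket_calculate_dib() later recomputes
 * the true distance from the key's hash when it is actually needed. */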
145
146 #ifdef ENABLE_DEBUG_HASHMAP
147 struct hashmap_debug_info {
148 LIST_FIELDS(struct hashmap_debug_info, debug_list);
149 unsigned max_entries; /* high watermark of n_entries */
150
151 /* who allocated this hashmap */
152 int line;
153 const char *file;
154 const char *func;
155
156 /* fields to detect modification while iterating */
157 unsigned put_count; /* counts puts into the hashmap */
158 unsigned rem_count; /* counts removals from hashmap */
159 unsigned last_rem_idx; /* remembers last removal index */
160 };
161
162 /* Tracks all existing hashmaps. Get at it from gdb. See sd_dump_hashmaps.py */
163 static LIST_HEAD(struct hashmap_debug_info, hashmap_debug_list);
164 static pthread_mutex_t hashmap_debug_list_mutex = PTHREAD_MUTEX_INITIALIZER;
165
166 #define HASHMAP_DEBUG_FIELDS struct hashmap_debug_info debug;
167
168 #else /* !ENABLE_DEBUG_HASHMAP */
169 #define HASHMAP_DEBUG_FIELDS
170 #endif /* ENABLE_DEBUG_HASHMAP */
171
172 enum HashmapType {
173 HASHMAP_TYPE_PLAIN,
174 HASHMAP_TYPE_ORDERED,
175 HASHMAP_TYPE_SET,
176 _HASHMAP_TYPE_MAX
177 };
178
179 struct _packed_ indirect_storage {
180 char *storage; /* where buckets and DIBs are stored */
181 uint8_t hash_key[HASH_KEY_SIZE]; /* hash key; changes during resize */
182
183 unsigned n_entries; /* number of stored entries */
184 unsigned n_buckets; /* number of buckets */
185
186 unsigned idx_lowest_entry; /* Index below which all buckets are free.
187 Makes "while(hashmap_steal_first())" loops
188 O(n) instead of O(n^2) for unordered hashmaps. */
189 uint8_t _pad[3]; /* padding for the whole HashmapBase */
190 /* The bitfields in HashmapBase complete the alignment of the whole thing. */
191 };
192
193 struct direct_storage {
194 /* This gives us 39 bytes on 64bit, or 35 bytes on 32bit.
195 * That's room for 4 set_entries + 4 DIB bytes + 3 unused bytes on 64bit,
196 * or 7 set_entries + 7 DIB bytes + 0 unused bytes on 32bit. */
197 char storage[sizeof(struct indirect_storage)];
198 };
199
200 #define DIRECT_BUCKETS(entry_t) \
201 (sizeof(struct direct_storage) / (sizeof(entry_t) + sizeof(dib_raw_t)))
202
203 /* We should be able to store at least one entry directly. */
204 assert_cc(DIRECT_BUCKETS(struct ordered_hashmap_entry) >= 1);
205
206 /* We have 3 bits for n_direct_entries. */
207 assert_cc(DIRECT_BUCKETS(struct set_entry) < (1 << 3));
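/* Worked example for the two assertions above (illustrative, using the 64-bit
 * sizes from the struct direct_storage comment below): the direct storage is
 * 39 bytes; a set_entry plus its DIB byte is 8 + 1 = 9 bytes, so
 * DIRECT_BUCKETS(struct set_entry) = 39 / 9 = 4, which is < 8; an
 * ordered_hashmap_entry plus its DIB byte is 24 + 1 = 25 bytes, which still
 * leaves room for 1 direct bucket. */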
208
209 /* Hashmaps with directly stored entries all use this shared hash key.
210 * It's no big deal if the key is guessed, because there can be only
211 * a handful of directly stored entries in a hashmap. When a hashmap
212 * outgrows direct storage, it gets its own key for indirect storage. */
213 static uint8_t shared_hash_key[HASH_KEY_SIZE];
214 static bool shared_hash_key_initialized;
215
216 /* Fields that all hashmap/set types must have */
217 struct HashmapBase {
218 const struct hash_ops *hash_ops; /* hash and compare ops to use */
219
220 union _packed_ {
221 struct indirect_storage indirect; /* if has_indirect */
222 struct direct_storage direct; /* if !has_indirect */
223 };
224
225 enum HashmapType type:2; /* HASHMAP_TYPE_* */
226 bool has_indirect:1; /* whether indirect storage is used */
227 unsigned n_direct_entries:3; /* Number of entries in direct storage.
228 * Only valid if !has_indirect. */
229 bool from_pool:1; /* whether was allocated from mempool */
230 HASHMAP_DEBUG_FIELDS /* optional hashmap_debug_info */
231 };
232
233 /* Specific hash types
234 * HashmapBase must be at the beginning of each hashmap struct. */
235
236 struct Hashmap {
237 struct HashmapBase b;
238 };
239
240 struct OrderedHashmap {
241 struct HashmapBase b;
242 unsigned iterate_list_head, iterate_list_tail;
243 };
244
245 struct Set {
246 struct HashmapBase b;
247 };
248
249 DEFINE_MEMPOOL(hashmap_pool, Hashmap, 8);
250 DEFINE_MEMPOOL(ordered_hashmap_pool, OrderedHashmap, 8);
251 /* No need for a separate Set pool */
252 assert_cc(sizeof(Hashmap) == sizeof(Set));
253
254 struct hashmap_type_info {
255 size_t head_size;
256 size_t entry_size;
257 struct mempool *mempool;
258 unsigned n_direct_buckets;
259 };
260
261 static const struct hashmap_type_info hashmap_type_info[_HASHMAP_TYPE_MAX] = {
262 [HASHMAP_TYPE_PLAIN] = {
263 .head_size = sizeof(Hashmap),
264 .entry_size = sizeof(struct plain_hashmap_entry),
265 .mempool = &hashmap_pool,
266 .n_direct_buckets = DIRECT_BUCKETS(struct plain_hashmap_entry),
267 },
268 [HASHMAP_TYPE_ORDERED] = {
269 .head_size = sizeof(OrderedHashmap),
270 .entry_size = sizeof(struct ordered_hashmap_entry),
271 .mempool = &ordered_hashmap_pool,
272 .n_direct_buckets = DIRECT_BUCKETS(struct ordered_hashmap_entry),
273 },
274 [HASHMAP_TYPE_SET] = {
275 .head_size = sizeof(Set),
276 .entry_size = sizeof(struct set_entry),
277 .mempool = &hashmap_pool,
278 .n_direct_buckets = DIRECT_BUCKETS(struct set_entry),
279 },
280 };
281
282 void string_hash_func(const void *p, struct siphash *state) {
283 siphash24_compress(p, strlen(p) + 1, state);
284 }
285
286 int string_compare_func(const void *a, const void *b) {
287 return strcmp(a, b);
288 }
289
290 const struct hash_ops string_hash_ops = {
291 .hash = string_hash_func,
292 .compare = string_compare_func
293 };
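/* Usage sketch (illustrative only; assumes the hashmap_new()/hashmap_put()/
 * hashmap_get()/hashmap_free() wrappers declared in hashmap.h and the
 * INT_TO_PTR()/PTR_TO_INT() helpers):
 *
 *         Hashmap *m;
 *         int r;
 *
 *         m = hashmap_new(&string_hash_ops);
 *         if (!m)
 *                 return -ENOMEM;
 *
 *         r = hashmap_put(m, "answer", INT_TO_PTR(42));
 *         if (r < 0)
 *                 return r;
 *
 *         assert_se(PTR_TO_INT(hashmap_get(m, "answer")) == 42);
 *         m = hashmap_free(m);
 */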
294
295 void trivial_hash_func(const void *p, struct siphash *state) {
296 siphash24_compress(&p, sizeof(p), state);
297 }
298
299 int trivial_compare_func(const void *a, const void *b) {
300 return a < b ? -1 : (a > b ? 1 : 0);
301 }
302
303 const struct hash_ops trivial_hash_ops = {
304 .hash = trivial_hash_func,
305 .compare = trivial_compare_func
306 };
307
308 void uint64_hash_func(const void *p, struct siphash *state) {
309 siphash24_compress(p, sizeof(uint64_t), state);
310 }
311
312 int uint64_compare_func(const void *_a, const void *_b) {
313 uint64_t a, b;
314 a = *(const uint64_t*) _a;
315 b = *(const uint64_t*) _b;
316 return a < b ? -1 : (a > b ? 1 : 0);
317 }
318
319 const struct hash_ops uint64_hash_ops = {
320 .hash = uint64_hash_func,
321 .compare = uint64_compare_func
322 };
323
324 #if SIZEOF_DEV_T != 8
325 void devt_hash_func(const void *p, struct siphash *state) {
326 siphash24_compress(p, sizeof(dev_t), state);
327 }
328
329 int devt_compare_func(const void *_a, const void *_b) {
330 dev_t a, b;
331 a = *(const dev_t*) _a;
332 b = *(const dev_t*) _b;
333 return a < b ? -1 : (a > b ? 1 : 0);
334 }
335
336 const struct hash_ops devt_hash_ops = {
337 .hash = devt_hash_func,
338 .compare = devt_compare_func
339 };
340 #endif
341
342 static unsigned n_buckets(HashmapBase *h) {
343 return h->has_indirect ? h->indirect.n_buckets
344 : hashmap_type_info[h->type].n_direct_buckets;
345 }
346
347 static unsigned n_entries(HashmapBase *h) {
348 return h->has_indirect ? h->indirect.n_entries
349 : h->n_direct_entries;
350 }
351
352 static void n_entries_inc(HashmapBase *h) {
353 if (h->has_indirect)
354 h->indirect.n_entries++;
355 else
356 h->n_direct_entries++;
357 }
358
359 static void n_entries_dec(HashmapBase *h) {
360 if (h->has_indirect)
361 h->indirect.n_entries--;
362 else
363 h->n_direct_entries--;
364 }
365
366 static char *storage_ptr(HashmapBase *h) {
367 return h->has_indirect ? h->indirect.storage
368 : h->direct.storage;
369 }
370
371 static uint8_t *hash_key(HashmapBase *h) {
372 return h->has_indirect ? h->indirect.hash_key
373 : shared_hash_key;
374 }
375
376 static unsigned base_bucket_hash(HashmapBase *h, const void *p) {
377 struct siphash state;
378 uint64_t hash;
379
380 siphash24_init(&state, hash_key(h));
381
382 h->hash_ops->hash(p, &state);
383
384 hash = siphash24_finalize(&state);
385
386 return (unsigned) (hash % n_buckets(h));
387 }
388 #define bucket_hash(h, p) base_bucket_hash(HASHMAP_BASE(h), p)
389
390 static void get_hash_key(uint8_t hash_key[HASH_KEY_SIZE], bool reuse_is_ok) {
391 static uint8_t current[HASH_KEY_SIZE];
392 static bool current_initialized = false;
393
394 /* Returns a hash function key to use. In order to keep things
395 * fast we will not generate a new key each time we allocate a
396 * new hash table. Instead, we'll just reuse the most recently
397 * generated one, except if we never generated one or when we
398 * are rehashing an entire hash table because we reached a
399 * fill level that forces a resize and a full rehash. */
400
401 if (!current_initialized || !reuse_is_ok) {
402 random_bytes(current, sizeof(current));
403 current_initialized = true;
404 }
405
406 memcpy(hash_key, current, sizeof(current));
407 }
408
409 static struct hashmap_base_entry *bucket_at(HashmapBase *h, unsigned idx) {
410 return (struct hashmap_base_entry*)
411 (storage_ptr(h) + idx * hashmap_type_info[h->type].entry_size);
412 }
413
414 static struct plain_hashmap_entry *plain_bucket_at(Hashmap *h, unsigned idx) {
415 return (struct plain_hashmap_entry*) bucket_at(HASHMAP_BASE(h), idx);
416 }
417
418 static struct ordered_hashmap_entry *ordered_bucket_at(OrderedHashmap *h, unsigned idx) {
419 return (struct ordered_hashmap_entry*) bucket_at(HASHMAP_BASE(h), idx);
420 }
421
422 static struct set_entry *set_bucket_at(Set *h, unsigned idx) {
423 return (struct set_entry*) bucket_at(HASHMAP_BASE(h), idx);
424 }
425
426 static struct ordered_hashmap_entry *bucket_at_swap(struct swap_entries *swap, unsigned idx) {
427 return &swap->e[idx - _IDX_SWAP_BEGIN];
428 }
429
430 /* Returns a pointer to the bucket at index idx.
431 * Understands real indexes and swap indexes, hence "_virtual". */
432 static struct hashmap_base_entry *bucket_at_virtual(HashmapBase *h, struct swap_entries *swap,
433 unsigned idx) {
434 if (idx < _IDX_SWAP_BEGIN)
435 return bucket_at(h, idx);
436
437 if (idx < _IDX_SWAP_END)
438 return &bucket_at_swap(swap, idx)->p.b;
439
440 assert_not_reached("Invalid index");
441 }
442
443 static dib_raw_t *dib_raw_ptr(HashmapBase *h) {
444 return (dib_raw_t*)
445 (storage_ptr(h) + hashmap_type_info[h->type].entry_size * n_buckets(h));
446 }
447
448 static unsigned bucket_distance(HashmapBase *h, unsigned idx, unsigned from) {
449 return idx >= from ? idx - from
450 : n_buckets(h) + idx - from;
451 }
452
453 static unsigned bucket_calculate_dib(HashmapBase *h, unsigned idx, dib_raw_t raw_dib) {
454 unsigned initial_bucket;
455
456 if (raw_dib == DIB_RAW_FREE)
457 return DIB_FREE;
458
459 if (_likely_(raw_dib < DIB_RAW_OVERFLOW))
460 return raw_dib;
461
462 /*
463 * Having an overflow DIB value is very unlikely. The hash function
464 * would have to be bad. For example, in a table of size 2^24 filled
465 * to load factor 0.9 the maximum observed DIB is only about 60.
466 * In theory (assuming I used Maxima correctly), for an infinite size
467 * hash table with load factor 0.8 the probability of a given entry
468 * having DIB > 40 is 1.9e-8.
469 * This returns the correct DIB value by recomputing the hash value in
470 * the unlikely case. XXX Hitting this case could be a hint to rehash.
471 */
472 initial_bucket = bucket_hash(h, bucket_at(h, idx)->key);
473 return bucket_distance(h, idx, initial_bucket);
474 }
475
476 static void bucket_set_dib(HashmapBase *h, unsigned idx, unsigned dib) {
477 dib_raw_ptr(h)[idx] = dib != DIB_FREE ? MIN(dib, DIB_RAW_OVERFLOW) : DIB_RAW_FREE;
478 }
479
480 static unsigned skip_free_buckets(HashmapBase *h, unsigned idx) {
481 dib_raw_t *dibs;
482
483 dibs = dib_raw_ptr(h);
484
485 for ( ; idx < n_buckets(h); idx++)
486 if (dibs[idx] != DIB_RAW_FREE)
487 return idx;
488
489 return IDX_NIL;
490 }
491
492 static void bucket_mark_free(HashmapBase *h, unsigned idx) {
493 memzero(bucket_at(h, idx), hashmap_type_info[h->type].entry_size);
494 bucket_set_dib(h, idx, DIB_FREE);
495 }
496
497 static void bucket_move_entry(HashmapBase *h, struct swap_entries *swap,
498 unsigned from, unsigned to) {
499 struct hashmap_base_entry *e_from, *e_to;
500
501 assert(from != to);
502
503 e_from = bucket_at_virtual(h, swap, from);
504 e_to = bucket_at_virtual(h, swap, to);
505
506 memcpy(e_to, e_from, hashmap_type_info[h->type].entry_size);
507
508 if (h->type == HASHMAP_TYPE_ORDERED) {
509 OrderedHashmap *lh = (OrderedHashmap*) h;
510 struct ordered_hashmap_entry *le, *le_to;
511
512 le_to = (struct ordered_hashmap_entry*) e_to;
513
514 if (le_to->iterate_next != IDX_NIL) {
515 le = (struct ordered_hashmap_entry*)
516 bucket_at_virtual(h, swap, le_to->iterate_next);
517 le->iterate_previous = to;
518 }
519
520 if (le_to->iterate_previous != IDX_NIL) {
521 le = (struct ordered_hashmap_entry*)
522 bucket_at_virtual(h, swap, le_to->iterate_previous);
523 le->iterate_next = to;
524 }
525
526 if (lh->iterate_list_head == from)
527 lh->iterate_list_head = to;
528 if (lh->iterate_list_tail == from)
529 lh->iterate_list_tail = to;
530 }
531 }
532
533 static unsigned next_idx(HashmapBase *h, unsigned idx) {
534 return (idx + 1U) % n_buckets(h);
535 }
536
537 static unsigned prev_idx(HashmapBase *h, unsigned idx) {
538 return (n_buckets(h) + idx - 1U) % n_buckets(h);
539 }
540
541 static void *entry_value(HashmapBase *h, struct hashmap_base_entry *e) {
542 switch (h->type) {
543
544 case HASHMAP_TYPE_PLAIN:
545 case HASHMAP_TYPE_ORDERED:
546 return ((struct plain_hashmap_entry*)e)->value;
547
548 case HASHMAP_TYPE_SET:
549 return (void*) e->key;
550
551 default:
552 assert_not_reached("Unknown hashmap type");
553 }
554 }
555
556 static void base_remove_entry(HashmapBase *h, unsigned idx) {
557 unsigned left, right, prev, dib;
558 dib_raw_t raw_dib, *dibs;
559
560 dibs = dib_raw_ptr(h);
561 assert(dibs[idx] != DIB_RAW_FREE);
562
563 #ifdef ENABLE_DEBUG_HASHMAP
564 h->debug.rem_count++;
565 h->debug.last_rem_idx = idx;
566 #endif
567
568 left = idx;
569 /* Find the stop bucket ("right"). It is either free or has DIB == 0. */
570 for (right = next_idx(h, left); ; right = next_idx(h, right)) {
571 raw_dib = dibs[right];
572 if (raw_dib == 0 || raw_dib == DIB_RAW_FREE)
573 break;
574
575 /* The buckets cannot all be occupied with DIB > 0: that would mean
576 * every entry could be made better off by shifting the whole run
577 * backward, which is impossible, so a stop bucket must exist. */
578 assert(left != right);
579 }
580
581 if (h->type == HASHMAP_TYPE_ORDERED) {
582 OrderedHashmap *lh = (OrderedHashmap*) h;
583 struct ordered_hashmap_entry *le = ordered_bucket_at(lh, idx);
584
585 if (le->iterate_next != IDX_NIL)
586 ordered_bucket_at(lh, le->iterate_next)->iterate_previous = le->iterate_previous;
587 else
588 lh->iterate_list_tail = le->iterate_previous;
589
590 if (le->iterate_previous != IDX_NIL)
591 ordered_bucket_at(lh, le->iterate_previous)->iterate_next = le->iterate_next;
592 else
593 lh->iterate_list_head = le->iterate_next;
594 }
595
596 /* Now shift all buckets in the interval (left, right) one step backwards */
597 for (prev = left, left = next_idx(h, left); left != right;
598 prev = left, left = next_idx(h, left)) {
599 dib = bucket_calculate_dib(h, left, dibs[left]);
600 assert(dib != 0);
601 bucket_move_entry(h, NULL, left, prev);
602 bucket_set_dib(h, prev, dib - 1);
603 }
604
605 bucket_mark_free(h, prev);
606 n_entries_dec(h);
607 }
608 #define remove_entry(h, idx) base_remove_entry(HASHMAP_BASE(h), idx)
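/* Worked example of the backward shift above (illustrative): say the entry in
 * bucket 5 is removed while buckets 5, 6, 7 hold entries with DIBs 1, 1, 2 and
 * bucket 8 is the stop bucket (free or DIB == 0). The entries from buckets 6
 * and 7 are moved back to buckets 5 and 6 with their DIBs reduced to 0 and 1,
 * and bucket 7 is marked free. No tombstone is left behind; this is the
 * "backward shift deletion" from the Goossaert reference at the top of this
 * file. */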
609
610 static unsigned hashmap_iterate_in_insertion_order(OrderedHashmap *h, Iterator *i) {
611 struct ordered_hashmap_entry *e;
612 unsigned idx;
613
614 assert(h);
615 assert(i);
616
617 if (i->idx == IDX_NIL)
618 goto at_end;
619
620 if (i->idx == IDX_FIRST && h->iterate_list_head == IDX_NIL)
621 goto at_end;
622
623 if (i->idx == IDX_FIRST) {
624 idx = h->iterate_list_head;
625 e = ordered_bucket_at(h, idx);
626 } else {
627 idx = i->idx;
628 e = ordered_bucket_at(h, idx);
629 /*
630 * We allow removing the current entry while iterating, but removal may cause
631 * a backward shift. The next entry may thus move one bucket to the left.
632 * To detect when it happens, we remember the key pointer of the entry we were
633 * going to iterate next. If it does not match, there was a backward shift.
634 */
635 if (e->p.b.key != i->next_key) {
636 idx = prev_idx(HASHMAP_BASE(h), idx);
637 e = ordered_bucket_at(h, idx);
638 }
639 assert(e->p.b.key == i->next_key);
640 }
641
642 #ifdef ENABLE_DEBUG_HASHMAP
643 i->prev_idx = idx;
644 #endif
645
646 if (e->iterate_next != IDX_NIL) {
647 struct ordered_hashmap_entry *n;
648 i->idx = e->iterate_next;
649 n = ordered_bucket_at(h, i->idx);
650 i->next_key = n->p.b.key;
651 } else
652 i->idx = IDX_NIL;
653
654 return idx;
655
656 at_end:
657 i->idx = IDX_NIL;
658 return IDX_NIL;
659 }
660
661 static unsigned hashmap_iterate_in_internal_order(HashmapBase *h, Iterator *i) {
662 unsigned idx;
663
664 assert(h);
665 assert(i);
666
667 if (i->idx == IDX_NIL)
668 goto at_end;
669
670 if (i->idx == IDX_FIRST) {
671 /* fast forward to the first occupied bucket */
672 if (h->has_indirect) {
673 i->idx = skip_free_buckets(h, h->indirect.idx_lowest_entry);
674 h->indirect.idx_lowest_entry = i->idx;
675 } else
676 i->idx = skip_free_buckets(h, 0);
677
678 if (i->idx == IDX_NIL)
679 goto at_end;
680 } else {
681 struct hashmap_base_entry *e;
682
683 assert(i->idx > 0);
684
685 e = bucket_at(h, i->idx);
686 /*
687 * We allow removing the current entry while iterating, but removal may cause
688 * a backward shift. The next entry may thus move one bucket to the left.
689 * To detect when it happens, we remember the key pointer of the entry we were
690 * going to iterate next. If it does not match, there was a backward shift.
691 */
692 if (e->key != i->next_key)
693 e = bucket_at(h, --i->idx);
694
695 assert(e->key == i->next_key);
696 }
697
698 idx = i->idx;
699 #ifdef ENABLE_DEBUG_HASHMAP
700 i->prev_idx = idx;
701 #endif
702
703 i->idx = skip_free_buckets(h, i->idx + 1);
704 if (i->idx != IDX_NIL)
705 i->next_key = bucket_at(h, i->idx)->key;
706 else
707 i->idx = IDX_NIL;
708
709 return idx;
710
711 at_end:
712 i->idx = IDX_NIL;
713 return IDX_NIL;
714 }
715
716 static unsigned hashmap_iterate_entry(HashmapBase *h, Iterator *i) {
717 if (!h) {
718 i->idx = IDX_NIL;
719 return IDX_NIL;
720 }
721
722 #ifdef ENABLE_DEBUG_HASHMAP
723 if (i->idx == IDX_FIRST) {
724 i->put_count = h->debug.put_count;
725 i->rem_count = h->debug.rem_count;
726 } else {
727 /* While iterating, must not add any new entries */
728 assert(i->put_count == h->debug.put_count);
729 /* ... or remove entries other than the current one */
730 assert(i->rem_count == h->debug.rem_count ||
731 (i->rem_count == h->debug.rem_count - 1 &&
732 i->prev_idx == h->debug.last_rem_idx));
733 /* Reset our removals counter */
734 i->rem_count = h->debug.rem_count;
735 }
736 #endif
737
738 return h->type == HASHMAP_TYPE_ORDERED ? hashmap_iterate_in_insertion_order((OrderedHashmap*) h, i)
739 : hashmap_iterate_in_internal_order(h, i);
740 }
741
742 bool internal_hashmap_iterate(HashmapBase *h, Iterator *i, void **value, const void **key) {
743 struct hashmap_base_entry *e;
744 void *data;
745 unsigned idx;
746
747 idx = hashmap_iterate_entry(h, i);
748 if (idx == IDX_NIL) {
749 if (value)
750 *value = NULL;
751 if (key)
752 *key = NULL;
753
754 return false;
755 }
756
757 e = bucket_at(h, idx);
758 data = entry_value(h, e);
759 if (value)
760 *value = data;
761 if (key)
762 *key = e->key;
763
764 return true;
765 }
766
767 bool set_iterate(Set *s, Iterator *i, void **value) {
768 return internal_hashmap_iterate(HASHMAP_BASE(s), i, value, NULL);
769 }
770
771 #define HASHMAP_FOREACH_IDX(idx, h, i) \
772 for ((i) = ITERATOR_FIRST, (idx) = hashmap_iterate_entry((h), &(i)); \
773 (idx != IDX_NIL); \
774 (idx) = hashmap_iterate_entry((h), &(i)))
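/* Iteration sketch for callers (illustrative; HASHMAP_FOREACH, Iterator and
 * hashmap_iterate() are declared in hashmap.h, and do_something() is a
 * placeholder):
 *
 *         Iterator i;
 *         void *v;
 *
 *         HASHMAP_FOREACH(v, m, i)
 *                 do_something(v);
 *
 * Removing the entry currently being visited is allowed (the iterators above
 * compensate for the resulting backward shift); adding entries or removing
 * other entries while iterating is not. */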
775
776 static void reset_direct_storage(HashmapBase *h) {
777 const struct hashmap_type_info *hi = &hashmap_type_info[h->type];
778 void *p;
779
780 assert(!h->has_indirect);
781
782 p = mempset(h->direct.storage, 0, hi->entry_size * hi->n_direct_buckets);
783 memset(p, DIB_RAW_INIT, sizeof(dib_raw_t) * hi->n_direct_buckets);
784 }
785
786 static struct HashmapBase *hashmap_base_new(const struct hash_ops *hash_ops, enum HashmapType type HASHMAP_DEBUG_PARAMS) {
787 HashmapBase *h;
788 const struct hashmap_type_info *hi = &hashmap_type_info[type];
789 bool use_pool;
790
791 use_pool = is_main_thread();
792
793 h = use_pool ? mempool_alloc0_tile(hi->mempool) : malloc0(hi->head_size);
794
795 if (!h)
796 return NULL;
797
798 h->type = type;
799 h->from_pool = use_pool;
800 h->hash_ops = hash_ops ? hash_ops : &trivial_hash_ops;
801
802 if (type == HASHMAP_TYPE_ORDERED) {
803 OrderedHashmap *lh = (OrderedHashmap*)h;
804 lh->iterate_list_head = lh->iterate_list_tail = IDX_NIL;
805 }
806
807 reset_direct_storage(h);
808
809 if (!shared_hash_key_initialized) {
810 random_bytes(shared_hash_key, sizeof(shared_hash_key));
811 shared_hash_key_initialized = true;
812 }
813
814 #ifdef ENABLE_DEBUG_HASHMAP
815 h->debug.func = func;
816 h->debug.file = file;
817 h->debug.line = line;
818 assert_se(pthread_mutex_lock(&hashmap_debug_list_mutex) == 0);
819 LIST_PREPEND(debug_list, hashmap_debug_list, &h->debug);
820 assert_se(pthread_mutex_unlock(&hashmap_debug_list_mutex) == 0);
821 #endif
822
823 return h;
824 }
825
826 Hashmap *internal_hashmap_new(const struct hash_ops *hash_ops HASHMAP_DEBUG_PARAMS) {
827 return (Hashmap*) hashmap_base_new(hash_ops, HASHMAP_TYPE_PLAIN HASHMAP_DEBUG_PASS_ARGS);
828 }
829
830 OrderedHashmap *internal_ordered_hashmap_new(const struct hash_ops *hash_ops HASHMAP_DEBUG_PARAMS) {
831 return (OrderedHashmap*) hashmap_base_new(hash_ops, HASHMAP_TYPE_ORDERED HASHMAP_DEBUG_PASS_ARGS);
832 }
833
834 Set *internal_set_new(const struct hash_ops *hash_ops HASHMAP_DEBUG_PARAMS) {
835 return (Set*) hashmap_base_new(hash_ops, HASHMAP_TYPE_SET HASHMAP_DEBUG_PASS_ARGS);
836 }
837
838 static int hashmap_base_ensure_allocated(HashmapBase **h, const struct hash_ops *hash_ops,
839 enum HashmapType type HASHMAP_DEBUG_PARAMS) {
840 HashmapBase *q;
841
842 assert(h);
843
844 if (*h)
845 return 0;
846
847 q = hashmap_base_new(hash_ops, type HASHMAP_DEBUG_PASS_ARGS);
848 if (!q)
849 return -ENOMEM;
850
851 *h = q;
852 return 0;
853 }
854
855 int internal_hashmap_ensure_allocated(Hashmap **h, const struct hash_ops *hash_ops HASHMAP_DEBUG_PARAMS) {
856 return hashmap_base_ensure_allocated((HashmapBase**)h, hash_ops, HASHMAP_TYPE_PLAIN HASHMAP_DEBUG_PASS_ARGS);
857 }
858
859 int internal_ordered_hashmap_ensure_allocated(OrderedHashmap **h, const struct hash_ops *hash_ops HASHMAP_DEBUG_PARAMS) {
860 return hashmap_base_ensure_allocated((HashmapBase**)h, hash_ops, HASHMAP_TYPE_ORDERED HASHMAP_DEBUG_PASS_ARGS);
861 }
862
863 int internal_set_ensure_allocated(Set **s, const struct hash_ops *hash_ops HASHMAP_DEBUG_PARAMS) {
864 return hashmap_base_ensure_allocated((HashmapBase**)s, hash_ops, HASHMAP_TYPE_SET HASHMAP_DEBUG_PASS_ARGS);
865 }
866
867 static void hashmap_free_no_clear(HashmapBase *h) {
868 assert(!h->has_indirect);
869 assert(!h->n_direct_entries);
870
871 #ifdef ENABLE_DEBUG_HASHMAP
872 assert_se(pthread_mutex_lock(&hashmap_debug_list_mutex) == 0);
873 LIST_REMOVE(debug_list, hashmap_debug_list, &h->debug);
874 assert_se(pthread_mutex_unlock(&hashmap_debug_list_mutex) == 0);
875 #endif
876
877 if (h->from_pool)
878 mempool_free_tile(hashmap_type_info[h->type].mempool, h);
879 else
880 free(h);
881 }
882
883 HashmapBase *internal_hashmap_free(HashmapBase *h) {
884
885 /* Free the hashmap, but nothing in it */
886
887 if (h) {
888 internal_hashmap_clear(h);
889 hashmap_free_no_clear(h);
890 }
891
892 return NULL;
893 }
894
895 HashmapBase *internal_hashmap_free_free(HashmapBase *h) {
896
897 /* Free the hashmap and all data objects in it, but not the
898 * keys */
899
900 if (h) {
901 internal_hashmap_clear_free(h);
902 hashmap_free_no_clear(h);
903 }
904
905 return NULL;
906 }
907
908 Hashmap *hashmap_free_free_free(Hashmap *h) {
909
910 /* Free the hashmap and all data and key objects in it */
911
912 if (h) {
913 hashmap_clear_free_free(h);
914 hashmap_free_no_clear(HASHMAP_BASE(h));
915 }
916
917 return NULL;
918 }
919
920 void internal_hashmap_clear(HashmapBase *h) {
921 if (!h)
922 return;
923
924 if (h->has_indirect) {
925 free(h->indirect.storage);
926 h->has_indirect = false;
927 }
928
929 h->n_direct_entries = 0;
930 reset_direct_storage(h);
931
932 if (h->type == HASHMAP_TYPE_ORDERED) {
933 OrderedHashmap *lh = (OrderedHashmap*) h;
934 lh->iterate_list_head = lh->iterate_list_tail = IDX_NIL;
935 }
936 }
937
938 void internal_hashmap_clear_free(HashmapBase *h) {
939 unsigned idx;
940
941 if (!h)
942 return;
943
944 for (idx = skip_free_buckets(h, 0); idx != IDX_NIL;
945 idx = skip_free_buckets(h, idx + 1))
946 free(entry_value(h, bucket_at(h, idx)));
947
948 internal_hashmap_clear(h);
949 }
950
951 void hashmap_clear_free_free(Hashmap *h) {
952 unsigned idx;
953
954 if (!h)
955 return;
956
957 for (idx = skip_free_buckets(HASHMAP_BASE(h), 0); idx != IDX_NIL;
958 idx = skip_free_buckets(HASHMAP_BASE(h), idx + 1)) {
959 struct plain_hashmap_entry *e = plain_bucket_at(h, idx);
960 free((void*)e->b.key);
961 free(e->value);
962 }
963
964 internal_hashmap_clear(HASHMAP_BASE(h));
965 }
966
967 static int resize_buckets(HashmapBase *h, unsigned entries_add);
968
969 /*
970 * Finds an empty bucket to put an entry into, starting the scan at 'idx'.
971 * Performs Robin Hood swaps as it goes. The entry to put must be placed
972 * by the caller into swap slot IDX_PUT.
973 * If used for in-place resizing, may leave a displaced entry in swap slot
974 * IDX_PUT. Caller must rehash it next.
975 * Returns: true if it left a displaced entry to rehash next in IDX_PUT,
976 * false otherwise.
977 */
978 static bool hashmap_put_robin_hood(HashmapBase *h, unsigned idx,
979 struct swap_entries *swap) {
980 dib_raw_t raw_dib, *dibs;
981 unsigned dib, distance;
982
983 #ifdef ENABLE_DEBUG_HASHMAP
984 h->debug.put_count++;
985 #endif
986
987 dibs = dib_raw_ptr(h);
988
989 for (distance = 0; ; distance++) {
990 raw_dib = dibs[idx];
991 if (raw_dib == DIB_RAW_FREE || raw_dib == DIB_RAW_REHASH) {
992 if (raw_dib == DIB_RAW_REHASH)
993 bucket_move_entry(h, swap, idx, IDX_TMP);
994
995 if (h->has_indirect && h->indirect.idx_lowest_entry > idx)
996 h->indirect.idx_lowest_entry = idx;
997
998 bucket_set_dib(h, idx, distance);
999 bucket_move_entry(h, swap, IDX_PUT, idx);
1000 if (raw_dib == DIB_RAW_REHASH) {
1001 bucket_move_entry(h, swap, IDX_TMP, IDX_PUT);
1002 return true;
1003 }
1004
1005 return false;
1006 }
1007
1008 dib = bucket_calculate_dib(h, idx, raw_dib);
1009
1010 if (dib < distance) {
1011 /* Found a wealthier entry. Go Robin Hood! */
1012 bucket_set_dib(h, idx, distance);
1013
1014 /* swap the entries */
1015 bucket_move_entry(h, swap, idx, IDX_TMP);
1016 bucket_move_entry(h, swap, IDX_PUT, idx);
1017 bucket_move_entry(h, swap, IDX_TMP, IDX_PUT);
1018
1019 distance = dib;
1020 }
1021
1022 idx = next_idx(h, idx);
1023 }
1024 }
1025
1026 /*
1027 * Puts an entry into a hashmap, boldly - no check whether key already exists.
1028 * The caller must place the entry (only its key and value, not link indexes)
1029 * in swap slot IDX_PUT.
1030 * Caller must ensure that the key does not exist yet in the hashmap and
1031 * that resize is not needed if !may_resize.
1032 * Returns: 1 if entry was put successfully.
1033 * -ENOMEM if may_resize==true and resize failed with -ENOMEM.
1034 * Cannot return -ENOMEM if !may_resize.
1035 */
1036 static int hashmap_base_put_boldly(HashmapBase *h, unsigned idx,
1037 struct swap_entries *swap, bool may_resize) {
1038 struct ordered_hashmap_entry *new_entry;
1039 int r;
1040
1041 assert(idx < n_buckets(h));
1042
1043 new_entry = bucket_at_swap(swap, IDX_PUT);
1044
1045 if (may_resize) {
1046 r = resize_buckets(h, 1);
1047 if (r < 0)
1048 return r;
1049 if (r > 0)
1050 idx = bucket_hash(h, new_entry->p.b.key);
1051 }
1052 assert(n_entries(h) < n_buckets(h));
1053
1054 if (h->type == HASHMAP_TYPE_ORDERED) {
1055 OrderedHashmap *lh = (OrderedHashmap*) h;
1056
1057 new_entry->iterate_next = IDX_NIL;
1058 new_entry->iterate_previous = lh->iterate_list_tail;
1059
1060 if (lh->iterate_list_tail != IDX_NIL) {
1061 struct ordered_hashmap_entry *old_tail;
1062
1063 old_tail = ordered_bucket_at(lh, lh->iterate_list_tail);
1064 assert(old_tail->iterate_next == IDX_NIL);
1065 old_tail->iterate_next = IDX_PUT;
1066 }
1067
1068 lh->iterate_list_tail = IDX_PUT;
1069 if (lh->iterate_list_head == IDX_NIL)
1070 lh->iterate_list_head = IDX_PUT;
1071 }
1072
1073 assert_se(hashmap_put_robin_hood(h, idx, swap) == false);
1074
1075 n_entries_inc(h);
1076 #ifdef ENABLE_DEBUG_HASHMAP
1077 h->debug.max_entries = MAX(h->debug.max_entries, n_entries(h));
1078 #endif
1079
1080 return 1;
1081 }
1082 #define hashmap_put_boldly(h, idx, swap, may_resize) \
1083 hashmap_base_put_boldly(HASHMAP_BASE(h), idx, swap, may_resize)
1084
1085 /*
1086 * Returns 0 if resize is not needed.
1087 * 1 if successfully resized.
1088 * -ENOMEM on allocation failure.
1089 */
1090 static int resize_buckets(HashmapBase *h, unsigned entries_add) {
1091 struct swap_entries swap;
1092 char *new_storage;
1093 dib_raw_t *old_dibs, *new_dibs;
1094 const struct hashmap_type_info *hi;
1095 unsigned idx, optimal_idx;
1096 unsigned old_n_buckets, new_n_buckets, n_rehashed, new_n_entries;
1097 uint8_t new_shift;
1098 bool rehash_next;
1099
1100 assert(h);
1101
1102 hi = &hashmap_type_info[h->type];
1103 new_n_entries = n_entries(h) + entries_add;
1104
1105 /* overflow? */
1106 if (_unlikely_(new_n_entries < entries_add))
1107 return -ENOMEM;
1108
1109 /* For direct storage we allow 100% load, because it's tiny. */
1110 if (!h->has_indirect && new_n_entries <= hi->n_direct_buckets)
1111 return 0;
1112
1113 /*
1114 * Load factor = n/m = 1 - (1/INV_KEEP_FREE).
1115 * From it follows: m = n + n/(INV_KEEP_FREE - 1)
1116 */
1117 new_n_buckets = new_n_entries + new_n_entries / (INV_KEEP_FREE - 1);
1118 /* overflow? */
1119 if (_unlikely_(new_n_buckets < new_n_entries))
1120 return -ENOMEM;
1121
1122 if (_unlikely_(new_n_buckets > UINT_MAX / (hi->entry_size + sizeof(dib_raw_t))))
1123 return -ENOMEM;
1124
1125 old_n_buckets = n_buckets(h);
1126
1127 if (_likely_(new_n_buckets <= old_n_buckets))
1128 return 0;
1129
1130 new_shift = log2u_round_up(MAX(
1131 new_n_buckets * (hi->entry_size + sizeof(dib_raw_t)),
1132 2 * sizeof(struct direct_storage)));
1133
1134 /* Realloc storage (buckets and DIB array). */
1135 new_storage = realloc(h->has_indirect ? h->indirect.storage : NULL,
1136 1U << new_shift);
1137 if (!new_storage)
1138 return -ENOMEM;
1139
1140 /* Must upgrade direct to indirect storage. */
1141 if (!h->has_indirect) {
1142 memcpy(new_storage, h->direct.storage,
1143 old_n_buckets * (hi->entry_size + sizeof(dib_raw_t)));
1144 h->indirect.n_entries = h->n_direct_entries;
1145 h->indirect.idx_lowest_entry = 0;
1146 h->n_direct_entries = 0;
1147 }
1148
1149 /* Get a new hash key. If we've just upgraded to indirect storage,
1150 * allow reusing a previously generated key. It's still a different key
1151 * from the shared one that we used for direct storage. */
1152 get_hash_key(h->indirect.hash_key, !h->has_indirect);
1153
1154 h->has_indirect = true;
1155 h->indirect.storage = new_storage;
1156 h->indirect.n_buckets = (1U << new_shift) /
1157 (hi->entry_size + sizeof(dib_raw_t));
1158
1159 old_dibs = (dib_raw_t*)(new_storage + hi->entry_size * old_n_buckets);
1160 new_dibs = dib_raw_ptr(h);
1161
1162 /*
1163 * Move the DIB array to the new place, replacing valid DIB values with
1164 * DIB_RAW_REHASH to indicate all of the used buckets need rehashing.
1165 * Note: Overlap is not possible, because we have at least doubled the
1166 * number of buckets and dib_raw_t is smaller than any entry type.
1167 */
1168 for (idx = 0; idx < old_n_buckets; idx++) {
1169 assert(old_dibs[idx] != DIB_RAW_REHASH);
1170 new_dibs[idx] = old_dibs[idx] == DIB_RAW_FREE ? DIB_RAW_FREE
1171 : DIB_RAW_REHASH;
1172 }
1173
1174 /* Zero the area of newly added entries (including the old DIB area) */
1175 memzero(bucket_at(h, old_n_buckets),
1176 (n_buckets(h) - old_n_buckets) * hi->entry_size);
1177
1178 /* The upper half of the new DIB array needs initialization */
1179 memset(&new_dibs[old_n_buckets], DIB_RAW_INIT,
1180 (n_buckets(h) - old_n_buckets) * sizeof(dib_raw_t));
1181
1182 /* Rehash entries that need it */
1183 n_rehashed = 0;
1184 for (idx = 0; idx < old_n_buckets; idx++) {
1185 if (new_dibs[idx] != DIB_RAW_REHASH)
1186 continue;
1187
1188 optimal_idx = bucket_hash(h, bucket_at(h, idx)->key);
1189
1190 /*
1191 * Not much to do if by luck the entry hashes to its current
1192 * location. Just set its DIB.
1193 */
1194 if (optimal_idx == idx) {
1195 new_dibs[idx] = 0;
1196 n_rehashed++;
1197 continue;
1198 }
1199
1200 new_dibs[idx] = DIB_RAW_FREE;
1201 bucket_move_entry(h, &swap, idx, IDX_PUT);
1202 /* bucket_move_entry does not clear the source */
1203 memzero(bucket_at(h, idx), hi->entry_size);
1204
1205 do {
1206 /*
1207 * Find the new bucket for the current entry. This may make
1208 * another entry homeless and load it into IDX_PUT.
1209 */
1210 rehash_next = hashmap_put_robin_hood(h, optimal_idx, &swap);
1211 n_rehashed++;
1212
1213 /* Did the current entry displace another one? */
1214 if (rehash_next)
1215 optimal_idx = bucket_hash(h, bucket_at_swap(&swap, IDX_PUT)->p.b.key);
1216 } while (rehash_next);
1217 }
1218
1219 assert(n_rehashed == n_entries(h));
1220
1221 return 1;
1222 }
1223
1224 /*
1225 * Finds an entry with a matching key
1226 * Returns: index of the found entry, or IDX_NIL if not found.
1227 */
1228 static unsigned base_bucket_scan(HashmapBase *h, unsigned idx, const void *key) {
1229 struct hashmap_base_entry *e;
1230 unsigned dib, distance;
1231 dib_raw_t *dibs = dib_raw_ptr(h);
1232
1233 assert(idx < n_buckets(h));
1234
1235 for (distance = 0; ; distance++) {
1236 if (dibs[idx] == DIB_RAW_FREE)
1237 return IDX_NIL;
1238
1239 dib = bucket_calculate_dib(h, idx, dibs[idx]);
1240
1241 if (dib < distance)
1242 return IDX_NIL;
1243 if (dib == distance) {
1244 e = bucket_at(h, idx);
1245 if (h->hash_ops->compare(e->key, key) == 0)
1246 return idx;
1247 }
1248
1249 idx = next_idx(h, idx);
1250 }
1251 }
1252 #define bucket_scan(h, idx, key) base_bucket_scan(HASHMAP_BASE(h), idx, key)
1253
1254 int hashmap_put(Hashmap *h, const void *key, void *value) {
1255 struct swap_entries swap;
1256 struct plain_hashmap_entry *e;
1257 unsigned hash, idx;
1258
1259 assert(h);
1260
1261 hash = bucket_hash(h, key);
1262 idx = bucket_scan(h, hash, key);
1263 if (idx != IDX_NIL) {
1264 e = plain_bucket_at(h, idx);
1265 if (e->value == value)
1266 return 0;
1267 return -EEXIST;
1268 }
1269
1270 e = &bucket_at_swap(&swap, IDX_PUT)->p;
1271 e->b.key = key;
1272 e->value = value;
1273 return hashmap_put_boldly(h, hash, &swap, true);
1274 }
1275
1276 int set_put(Set *s, const void *key) {
1277 struct swap_entries swap;
1278 struct hashmap_base_entry *e;
1279 unsigned hash, idx;
1280
1281 assert(s);
1282
1283 hash = bucket_hash(s, key);
1284 idx = bucket_scan(s, hash, key);
1285 if (idx != IDX_NIL)
1286 return 0;
1287
1288 e = &bucket_at_swap(&swap, IDX_PUT)->p.b;
1289 e->key = key;
1290 return hashmap_put_boldly(s, hash, &swap, true);
1291 }
1292
1293 int hashmap_replace(Hashmap *h, const void *key, void *value) {
1294 struct swap_entries swap;
1295 struct plain_hashmap_entry *e;
1296 unsigned hash, idx;
1297
1298 assert(h);
1299
1300 hash = bucket_hash(h, key);
1301 idx = bucket_scan(h, hash, key);
1302 if (idx != IDX_NIL) {
1303 e = plain_bucket_at(h, idx);
1304 #ifdef ENABLE_DEBUG_HASHMAP
1305 /* Although the key is equal, the key pointer may have changed,
1306 * and this would break our assumption for iterating. So count
1307 * this operation as incompatible with iteration. */
1308 if (e->b.key != key) {
1309 h->b.debug.put_count++;
1310 h->b.debug.rem_count++;
1311 h->b.debug.last_rem_idx = idx;
1312 }
1313 #endif
1314 e->b.key = key;
1315 e->value = value;
1316 return 0;
1317 }
1318
1319 e = &bucket_at_swap(&swap, IDX_PUT)->p;
1320 e->b.key = key;
1321 e->value = value;
1322 return hashmap_put_boldly(h, hash, &swap, true);
1323 }
1324
1325 int hashmap_update(Hashmap *h, const void *key, void *value) {
1326 struct plain_hashmap_entry *e;
1327 unsigned hash, idx;
1328
1329 assert(h);
1330
1331 hash = bucket_hash(h, key);
1332 idx = bucket_scan(h, hash, key);
1333 if (idx == IDX_NIL)
1334 return -ENOENT;
1335
1336 e = plain_bucket_at(h, idx);
1337 e->value = value;
1338 return 0;
1339 }
1340
1341 void *internal_hashmap_get(HashmapBase *h, const void *key) {
1342 struct hashmap_base_entry *e;
1343 unsigned hash, idx;
1344
1345 if (!h)
1346 return NULL;
1347
1348 hash = bucket_hash(h, key);
1349 idx = bucket_scan(h, hash, key);
1350 if (idx == IDX_NIL)
1351 return NULL;
1352
1353 e = bucket_at(h, idx);
1354 return entry_value(h, e);
1355 }
1356
1357 void *hashmap_get2(Hashmap *h, const void *key, void **key2) {
1358 struct plain_hashmap_entry *e;
1359 unsigned hash, idx;
1360
1361 if (!h)
1362 return NULL;
1363
1364 hash = bucket_hash(h, key);
1365 idx = bucket_scan(h, hash, key);
1366 if (idx == IDX_NIL)
1367 return NULL;
1368
1369 e = plain_bucket_at(h, idx);
1370 if (key2)
1371 *key2 = (void*) e->b.key;
1372
1373 return e->value;
1374 }
1375
1376 bool internal_hashmap_contains(HashmapBase *h, const void *key) {
1377 unsigned hash;
1378
1379 if (!h)
1380 return false;
1381
1382 hash = bucket_hash(h, key);
1383 return bucket_scan(h, hash, key) != IDX_NIL;
1384 }
1385
1386 void *internal_hashmap_remove(HashmapBase *h, const void *key) {
1387 struct hashmap_base_entry *e;
1388 unsigned hash, idx;
1389 void *data;
1390
1391 if (!h)
1392 return NULL;
1393
1394 hash = bucket_hash(h, key);
1395 idx = bucket_scan(h, hash, key);
1396 if (idx == IDX_NIL)
1397 return NULL;
1398
1399 e = bucket_at(h, idx);
1400 data = entry_value(h, e);
1401 remove_entry(h, idx);
1402
1403 return data;
1404 }
1405
1406 void *hashmap_remove2(Hashmap *h, const void *key, void **rkey) {
1407 struct plain_hashmap_entry *e;
1408 unsigned hash, idx;
1409 void *data;
1410
1411 if (!h) {
1412 if (rkey)
1413 *rkey = NULL;
1414 return NULL;
1415 }
1416
1417 hash = bucket_hash(h, key);
1418 idx = bucket_scan(h, hash, key);
1419 if (idx == IDX_NIL) {
1420 if (rkey)
1421 *rkey = NULL;
1422 return NULL;
1423 }
1424
1425 e = plain_bucket_at(h, idx);
1426 data = e->value;
1427 if (rkey)
1428 *rkey = (void*) e->b.key;
1429
1430 remove_entry(h, idx);
1431
1432 return data;
1433 }
1434
1435 int hashmap_remove_and_put(Hashmap *h, const void *old_key, const void *new_key, void *value) {
1436 struct swap_entries swap;
1437 struct plain_hashmap_entry *e;
1438 unsigned old_hash, new_hash, idx;
1439
1440 if (!h)
1441 return -ENOENT;
1442
1443 old_hash = bucket_hash(h, old_key);
1444 idx = bucket_scan(h, old_hash, old_key);
1445 if (idx == IDX_NIL)
1446 return -ENOENT;
1447
1448 new_hash = bucket_hash(h, new_key);
1449 if (bucket_scan(h, new_hash, new_key) != IDX_NIL)
1450 return -EEXIST;
1451
1452 remove_entry(h, idx);
1453
1454 e = &bucket_at_swap(&swap, IDX_PUT)->p;
1455 e->b.key = new_key;
1456 e->value = value;
1457 assert_se(hashmap_put_boldly(h, new_hash, &swap, false) == 1);
1458
1459 return 0;
1460 }
1461
1462 int set_remove_and_put(Set *s, const void *old_key, const void *new_key) {
1463 struct swap_entries swap;
1464 struct hashmap_base_entry *e;
1465 unsigned old_hash, new_hash, idx;
1466
1467 if (!s)
1468 return -ENOENT;
1469
1470 old_hash = bucket_hash(s, old_key);
1471 idx = bucket_scan(s, old_hash, old_key);
1472 if (idx == IDX_NIL)
1473 return -ENOENT;
1474
1475 new_hash = bucket_hash(s, new_key);
1476 if (bucket_scan(s, new_hash, new_key) != IDX_NIL)
1477 return -EEXIST;
1478
1479 remove_entry(s, idx);
1480
1481 e = &bucket_at_swap(&swap, IDX_PUT)->p.b;
1482 e->key = new_key;
1483 assert_se(hashmap_put_boldly(s, new_hash, &swap, false) == 1);
1484
1485 return 0;
1486 }
1487
1488 int hashmap_remove_and_replace(Hashmap *h, const void *old_key, const void *new_key, void *value) {
1489 struct swap_entries swap;
1490 struct plain_hashmap_entry *e;
1491 unsigned old_hash, new_hash, idx_old, idx_new;
1492
1493 if (!h)
1494 return -ENOENT;
1495
1496 old_hash = bucket_hash(h, old_key);
1497 idx_old = bucket_scan(h, old_hash, old_key);
1498 if (idx_old == IDX_NIL)
1499 return -ENOENT;
1500
1501 old_key = bucket_at(HASHMAP_BASE(h), idx_old)->key;
1502
1503 new_hash = bucket_hash(h, new_key);
1504 idx_new = bucket_scan(h, new_hash, new_key);
1505 if (idx_new != IDX_NIL)
1506 if (idx_old != idx_new) {
1507 remove_entry(h, idx_new);
1508 /* Compensate for a possible backward shift. */
1509 if (old_key != bucket_at(HASHMAP_BASE(h), idx_old)->key)
1510 idx_old = prev_idx(HASHMAP_BASE(h), idx_old);
1511 assert(old_key == bucket_at(HASHMAP_BASE(h), idx_old)->key);
1512 }
1513
1514 remove_entry(h, idx_old);
1515
1516 e = &bucket_at_swap(&swap, IDX_PUT)->p;
1517 e->b.key = new_key;
1518 e->value = value;
1519 assert_se(hashmap_put_boldly(h, new_hash, &swap, false) == 1);
1520
1521 return 0;
1522 }
1523
1524 void *hashmap_remove_value(Hashmap *h, const void *key, void *value) {
1525 struct plain_hashmap_entry *e;
1526 unsigned hash, idx;
1527
1528 if (!h)
1529 return NULL;
1530
1531 hash = bucket_hash(h, key);
1532 idx = bucket_scan(h, hash, key);
1533 if (idx == IDX_NIL)
1534 return NULL;
1535
1536 e = plain_bucket_at(h, idx);
1537 if (e->value != value)
1538 return NULL;
1539
1540 remove_entry(h, idx);
1541
1542 return value;
1543 }
1544
1545 static unsigned find_first_entry(HashmapBase *h) {
1546 Iterator i = ITERATOR_FIRST;
1547
1548 if (!h || !n_entries(h))
1549 return IDX_NIL;
1550
1551 return hashmap_iterate_entry(h, &i);
1552 }
1553
1554 void *internal_hashmap_first(HashmapBase *h) {
1555 unsigned idx;
1556
1557 idx = find_first_entry(h);
1558 if (idx == IDX_NIL)
1559 return NULL;
1560
1561 return entry_value(h, bucket_at(h, idx));
1562 }
1563
1564 void *internal_hashmap_first_key(HashmapBase *h) {
1565 struct hashmap_base_entry *e;
1566 unsigned idx;
1567
1568 idx = find_first_entry(h);
1569 if (idx == IDX_NIL)
1570 return NULL;
1571
1572 e = bucket_at(h, idx);
1573 return (void*) e->key;
1574 }
1575
1576 void *internal_hashmap_steal_first(HashmapBase *h) {
1577 struct hashmap_base_entry *e;
1578 void *data;
1579 unsigned idx;
1580
1581 idx = find_first_entry(h);
1582 if (idx == IDX_NIL)
1583 return NULL;
1584
1585 e = bucket_at(h, idx);
1586 data = entry_value(h, e);
1587 remove_entry(h, idx);
1588
1589 return data;
1590 }
1591
1592 void *internal_hashmap_steal_first_key(HashmapBase *h) {
1593 struct hashmap_base_entry *e;
1594 void *key;
1595 unsigned idx;
1596
1597 idx = find_first_entry(h);
1598 if (idx == IDX_NIL)
1599 return NULL;
1600
1601 e = bucket_at(h, idx);
1602 key = (void*) e->key;
1603 remove_entry(h, idx);
1604
1605 return key;
1606 }
1607
1608 unsigned internal_hashmap_size(HashmapBase *h) {
1609
1610 if (!h)
1611 return 0;
1612
1613 return n_entries(h);
1614 }
1615
1616 unsigned internal_hashmap_buckets(HashmapBase *h) {
1617
1618 if (!h)
1619 return 0;
1620
1621 return n_buckets(h);
1622 }
1623
1624 int internal_hashmap_merge(Hashmap *h, Hashmap *other) {
1625 Iterator i;
1626 unsigned idx;
1627
1628 assert(h);
1629
1630 HASHMAP_FOREACH_IDX(idx, HASHMAP_BASE(other), i) {
1631 struct plain_hashmap_entry *pe = plain_bucket_at(other, idx);
1632 int r;
1633
1634 r = hashmap_put(h, pe->b.key, pe->value);
1635 if (r < 0 && r != -EEXIST)
1636 return r;
1637 }
1638
1639 return 0;
1640 }
1641
1642 int set_merge(Set *s, Set *other) {
1643 Iterator i;
1644 unsigned idx;
1645
1646 assert(s);
1647
1648 HASHMAP_FOREACH_IDX(idx, HASHMAP_BASE(other), i) {
1649 struct set_entry *se = set_bucket_at(other, idx);
1650 int r;
1651
1652 r = set_put(s, se->b.key);
1653 if (r < 0)
1654 return r;
1655 }
1656
1657 return 0;
1658 }
1659
1660 int internal_hashmap_reserve(HashmapBase *h, unsigned entries_add) {
1661 int r;
1662
1663 assert(h);
1664
1665 r = resize_buckets(h, entries_add);
1666 if (r < 0)
1667 return r;
1668
1669 return 0;
1670 }
1671
1672 /*
1673 * The same as hashmap_merge(), but every new item from other is moved to h.
1674 * Keys already in h are skipped and stay in other.
1675 * Returns: 0 on success.
1676 * -ENOMEM on alloc failure, in which case no move has been done.
1677 */
1678 int internal_hashmap_move(HashmapBase *h, HashmapBase *other) {
1679 struct swap_entries swap;
1680 struct hashmap_base_entry *e, *n;
1681 Iterator i;
1682 unsigned idx;
1683 int r;
1684
1685 assert(h);
1686
1687 if (!other)
1688 return 0;
1689
1690 assert(other->type == h->type);
1691
1692 /*
1693 * This reserves buckets for the worst case, where none of other's
1694 * entries are yet present in h. This is preferable to risking
1695 * an allocation failure in the middle of the moving and having to
1696 * rollback or return a partial result.
1697 */
1698 r = resize_buckets(h, n_entries(other));
1699 if (r < 0)
1700 return r;
1701
1702 HASHMAP_FOREACH_IDX(idx, other, i) {
1703 unsigned h_hash;
1704
1705 e = bucket_at(other, idx);
1706 h_hash = bucket_hash(h, e->key);
1707 if (bucket_scan(h, h_hash, e->key) != IDX_NIL)
1708 continue;
1709
1710 n = &bucket_at_swap(&swap, IDX_PUT)->p.b;
1711 n->key = e->key;
1712 if (h->type != HASHMAP_TYPE_SET)
1713 ((struct plain_hashmap_entry*) n)->value =
1714 ((struct plain_hashmap_entry*) e)->value;
1715 assert_se(hashmap_put_boldly(h, h_hash, &swap, false) == 1);
1716
1717 remove_entry(other, idx);
1718 }
1719
1720 return 0;
1721 }
1722
1723 int internal_hashmap_move_one(HashmapBase *h, HashmapBase *other, const void *key) {
1724 struct swap_entries swap;
1725 unsigned h_hash, other_hash, idx;
1726 struct hashmap_base_entry *e, *n;
1727 int r;
1728
1729 assert(h);
1730
1731 h_hash = bucket_hash(h, key);
1732 if (bucket_scan(h, h_hash, key) != IDX_NIL)
1733 return -EEXIST;
1734
1735 if (!other)
1736 return -ENOENT;
1737
1738 assert(other->type == h->type);
1739
1740 other_hash = bucket_hash(other, key);
1741 idx = bucket_scan(other, other_hash, key);
1742 if (idx == IDX_NIL)
1743 return -ENOENT;
1744
1745 e = bucket_at(other, idx);
1746
1747 n = &bucket_at_swap(&swap, IDX_PUT)->p.b;
1748 n->key = e->key;
1749 if (h->type != HASHMAP_TYPE_SET)
1750 ((struct plain_hashmap_entry*) n)->value =
1751 ((struct plain_hashmap_entry*) e)->value;
1752 r = hashmap_put_boldly(h, h_hash, &swap, true);
1753 if (r < 0)
1754 return r;
1755
1756 remove_entry(other, idx);
1757 return 0;
1758 }
1759
1760 HashmapBase *internal_hashmap_copy(HashmapBase *h) {
1761 HashmapBase *copy;
1762 int r;
1763
1764 assert(h);
1765
1766 copy = hashmap_base_new(h->hash_ops, h->type HASHMAP_DEBUG_SRC_ARGS);
1767 if (!copy)
1768 return NULL;
1769
1770 switch (h->type) {
1771 case HASHMAP_TYPE_PLAIN:
1772 case HASHMAP_TYPE_ORDERED:
1773 r = hashmap_merge((Hashmap*)copy, (Hashmap*)h);
1774 break;
1775 case HASHMAP_TYPE_SET:
1776 r = set_merge((Set*)copy, (Set*)h);
1777 break;
1778 default:
1779 assert_not_reached("Unknown hashmap type");
1780 }
1781
1782 if (r < 0) {
1783 internal_hashmap_free(copy);
1784 return NULL;
1785 }
1786
1787 return copy;
1788 }
1789
1790 char **internal_hashmap_get_strv(HashmapBase *h) {
1791 char **sv;
1792 Iterator i;
1793 unsigned idx, n;
1794
1795 sv = new(char*, n_entries(h)+1);
1796 if (!sv)
1797 return NULL;
1798
1799 n = 0;
1800 HASHMAP_FOREACH_IDX(idx, h, i)
1801 sv[n++] = entry_value(h, bucket_at(h, idx));
1802 sv[n] = NULL;
1803
1804 return sv;
1805 }
1806
1807 void *ordered_hashmap_next(OrderedHashmap *h, const void *key) {
1808 struct ordered_hashmap_entry *e;
1809 unsigned hash, idx;
1810
1811 if (!h)
1812 return NULL;
1813
1814 hash = bucket_hash(h, key);
1815 idx = bucket_scan(h, hash, key);
1816 if (idx == IDX_NIL)
1817 return NULL;
1818
1819 e = ordered_bucket_at(h, idx);
1820 if (e->iterate_next == IDX_NIL)
1821 return NULL;
1822 return ordered_bucket_at(h, e->iterate_next)->p.value;
1823 }
1824
1825 int set_consume(Set *s, void *value) {
1826 int r;
1827
1828 r = set_put(s, value);
1829 if (r <= 0)
1830 free(value);
1831
1832 return r;
1833 }
1834
1835 int set_put_strdup(Set *s, const char *p) {
1836 char *c;
1837 int r;
1838
1839 assert(s);
1840 assert(p);
1841
1842 c = strdup(p);
1843 if (!c)
1844 return -ENOMEM;
1845
1846 r = set_consume(s, c);
1847 if (r == -EEXIST)
1848 return 0;
1849
1850 return r;
1851 }
1852
1853 int set_put_strdupv(Set *s, char **l) {
1854 int n = 0, r;
1855 char **i;
1856
1857 STRV_FOREACH(i, l) {
1858 r = set_put_strdup(s, *i);
1859 if (r < 0)
1860 return r;
1861
1862 n += r;
1863 }
1864
1865 return n;
1866 }