1 /* SPDX-License-Identifier: LGPL-2.1-or-later */
2 
3 #include <errno.h>
4 #include <fnmatch.h>
5 #include <pthread.h>
6 #include <stdint.h>
7 #include <stdlib.h>
8 
9 #include "alloc-util.h"
10 #include "fileio.h"
11 #include "hashmap.h"
12 #include "macro.h"
13 #include "memory-util.h"
14 #include "mempool.h"
15 #include "missing_syscall.h"
16 #include "process-util.h"
17 #include "random-util.h"
18 #include "set.h"
19 #include "siphash24.h"
20 #include "string-util.h"
21 #include "strv.h"
22 
23 #if ENABLE_DEBUG_HASHMAP
24 #include "list.h"
25 #endif
26 
27 /*
28  * Implementation of hashmaps.
29  * Addressing: open
30  *   - uses less RAM compared to closed addressing (chaining), because
31  *     our entries are small (especially in Sets, which tend to contain
32  *     the majority of entries in systemd).
33  * Collision resolution: Robin Hood
34  *   - tends to equalize displacement of entries from their optimal buckets.
35  * Probe sequence: linear
36  *   - though theoretically worse than random probing/uniform hashing/double
37  *     hashing, it is good for cache locality.
38  *
39  * References:
40  * Celis, P. 1986. Robin Hood Hashing.
41  * Ph.D. Dissertation. University of Waterloo, Waterloo, Ont., Canada.
42  * https://cs.uwaterloo.ca/research/tr/1986/CS-86-14.pdf
43  * - The results are derived for random probing. Suggests deletion with
44  *   tombstones and two mean-centered search methods. None of that works
45  *   well for linear probing.
46  *
47  * Janson, S. 2005. Individual displacements for linear probing hashing with different insertion policies.
48  * ACM Trans. Algorithms 1, 2 (October 2005), 177-213.
49  * DOI=10.1145/1103963.1103964 http://doi.acm.org/10.1145/1103963.1103964
50  * http://www.math.uu.se/~svante/papers/sj157.pdf
51  * - Applies to Robin Hood with linear probing. Contains remarks on
52  *   the unsuitability of mean-centered search with linear probing.
53  *
54  * Viola, A. 2005. Exact distribution of individual displacements in linear probing hashing.
55  * ACM Trans. Algorithms 1, 2 (October 2005), 214-242.
56  * DOI=10.1145/1103963.1103965 http://doi.acm.org/10.1145/1103963.1103965
57  * - Similar to Janson. Note that Viola writes about C_{m,n} (number of probes
58  *   in a successful search), and Janson writes about displacement. C = d + 1.
59  *
60  * Goossaert, E. 2013. Robin Hood hashing: backward shift deletion.
61  * http://codecapsule.com/2013/11/17/robin-hood-hashing-backward-shift-deletion/
62  * - Explanation of backward shift deletion with pictures.
63  *
64  * Khuong, P. 2013. The Other Robin Hood Hashing.
65  * http://www.pvk.ca/Blog/2013/11/26/the-other-robin-hood-hashing/
66  * - Short summary of random vs. linear probing, and tombstones vs. backward shift.
67  */
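/*
 * Illustrative sketch, not part of the implementation: the gist of Robin Hood
 * insertion with linear probing on a toy table of string keys. The names and the
 * fixed table size are hypothetical; the real code below additionally handles DIB
 * overflow, rehashing during in-place resize, and the ordered variant.
 *
 *     #define TOY_BUCKETS 8U
 *
 *     struct toy_entry {
 *             const char *key;   // NULL marks a free bucket
 *             unsigned dib;      // distance from the bucket the key hashes to
 *     };
 *
 *     // Assumes 'key' is not yet in the table and the table is not full.
 *     static void toy_put(struct toy_entry t[TOY_BUCKETS], const char *key, unsigned hash) {
 *             struct toy_entry e = { key, 0 };
 *
 *             for (unsigned idx = hash % TOY_BUCKETS;; idx = (idx + 1) % TOY_BUCKETS, e.dib++) {
 *                     if (!t[idx].key) {
 *                             t[idx] = e;                    // free bucket found, done
 *                             return;
 *                     }
 *                     if (t[idx].dib < e.dib) {
 *                             struct toy_entry tmp = t[idx]; // "rob the rich": the resident entry is
 *                             t[idx] = e;                    // closer to home than we are, so it yields
 *                             e = tmp;                       // its bucket and we keep probing with it
 *                     }
 *             }
 *     }
 */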
68 
69 /*
70  * XXX Ideas for improvement:
71  * For unordered hashmaps, randomize iteration order, similarly to Perl:
72  * http://blog.booking.com/hardening-perls-hash-function.html
73  */
74 
75 /* INV_KEEP_FREE = 1 / (1 - max_load_factor)
76  * e.g. 1 / (1 - 0.8) = 5 ... keep one fifth of the buckets free. */
77 #define INV_KEEP_FREE            5U
78 
79 /* Fields common to entries of all hashmap/set types */
80 struct hashmap_base_entry {
81         const void *key;
82 };
83 
84 /* Entry types for specific hashmap/set types
85  * hashmap_base_entry must be at the beginning of each entry struct. */
86 
87 struct plain_hashmap_entry {
88         struct hashmap_base_entry b;
89         void *value;
90 };
91 
92 struct ordered_hashmap_entry {
93         struct plain_hashmap_entry p;
94         unsigned iterate_next, iterate_previous;
95 };
96 
97 struct set_entry {
98         struct hashmap_base_entry b;
99 };
100 
101 /* In several functions it is advantageous to have the hash table extended
102  * virtually by a couple of additional buckets. We reserve special index values
103  * for these "swap" buckets. */
104 #define _IDX_SWAP_BEGIN     (UINT_MAX - 3)
105 #define IDX_PUT             (_IDX_SWAP_BEGIN + 0)
106 #define IDX_TMP             (_IDX_SWAP_BEGIN + 1)
107 #define _IDX_SWAP_END       (_IDX_SWAP_BEGIN + 2)
108 
109 #define IDX_FIRST           (UINT_MAX - 1) /* special index for freshly initialized iterators */
110 #define IDX_NIL             UINT_MAX       /* special index value meaning "none" or "end" */
111 
112 assert_cc(IDX_FIRST == _IDX_SWAP_END);
113 assert_cc(IDX_FIRST == _IDX_ITERATOR_FIRST);
114 
115 /* Storage space for the "swap" buckets.
116  * All entry types can fit into an ordered_hashmap_entry. */
117 struct swap_entries {
118         struct ordered_hashmap_entry e[_IDX_SWAP_END - _IDX_SWAP_BEGIN];
119 };
120 
121 /* Distance from Initial Bucket */
122 typedef uint8_t dib_raw_t;
123 #define DIB_RAW_OVERFLOW ((dib_raw_t)0xfdU)   /* indicates DIB value is greater than representable */
124 #define DIB_RAW_REHASH   ((dib_raw_t)0xfeU)   /* entry yet to be rehashed during in-place resize */
125 #define DIB_RAW_FREE     ((dib_raw_t)0xffU)   /* a free bucket */
126 #define DIB_RAW_INIT     ((char)DIB_RAW_FREE) /* a byte to memset a DIB store with when initializing */
127 
128 #define DIB_FREE UINT_MAX
129 
130 #if ENABLE_DEBUG_HASHMAP
131 struct hashmap_debug_info {
132         LIST_FIELDS(struct hashmap_debug_info, debug_list);
133         unsigned max_entries;  /* high watermark of n_entries */
134 
135         /* who allocated this hashmap */
136         int line;
137         const char *file;
138         const char *func;
139 
140         /* fields to detect modification while iterating */
141         unsigned put_count;    /* counts puts into the hashmap */
142         unsigned rem_count;    /* counts removals from hashmap */
143         unsigned last_rem_idx; /* remembers last removal index */
144 };
145 
146 /* Tracks all existing hashmaps. Get at it from gdb. See sd_dump_hashmaps.py */
147 static LIST_HEAD(struct hashmap_debug_info, hashmap_debug_list);
148 static pthread_mutex_t hashmap_debug_list_mutex = PTHREAD_MUTEX_INITIALIZER;
149 #endif
150 
151 enum HashmapType {
152         HASHMAP_TYPE_PLAIN,
153         HASHMAP_TYPE_ORDERED,
154         HASHMAP_TYPE_SET,
155         _HASHMAP_TYPE_MAX
156 };
157 
158 struct _packed_ indirect_storage {
159         void *storage;                     /* where buckets and DIBs are stored */
160         uint8_t  hash_key[HASH_KEY_SIZE];  /* hash key; changes during resize */
161 
162         unsigned n_entries;                /* number of stored entries */
163         unsigned n_buckets;                /* number of buckets */
164 
165         unsigned idx_lowest_entry;         /* Index below which all buckets are free.
166                                               Makes "while (hashmap_steal_first())" loops
167                                               O(n) instead of O(n^2) for unordered hashmaps. */
168         uint8_t  _pad[3];                  /* padding for the whole HashmapBase */
169         /* The bitfields in HashmapBase complete the alignment of the whole thing. */
170 };
171 
172 struct direct_storage {
173         /* This gives us 39 bytes on 64bit, or 35 bytes on 32bit.
174          * That's room for 4 set_entries + 4 DIB bytes + 3 unused bytes on 64bit,
175          *              or 7 set_entries + 7 DIB bytes + 0 unused bytes on 32bit. */
176         uint8_t storage[sizeof(struct indirect_storage)];
177 };
178 
179 #define DIRECT_BUCKETS(entry_t) \
180         (sizeof(struct direct_storage) / (sizeof(entry_t) + sizeof(dib_raw_t)))
181 
182 /* We should be able to store at least one entry directly. */
183 assert_cc(DIRECT_BUCKETS(struct ordered_hashmap_entry) >= 1);
184 
185 /* We have 3 bits for n_direct_entries. */
186 assert_cc(DIRECT_BUCKETS(struct set_entry) < (1 << 3));
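/* Worked example (assuming HASH_KEY_SIZE == 16 and 8-byte pointers): struct indirect_storage
 * packs to 8 + 16 + 4 + 4 + 4 + 3 = 39 bytes, so with 8-byte set_entries and 1-byte DIBs
 * DIRECT_BUCKETS(struct set_entry) = 39 / (8 + 1) = 4. With 4-byte pointers the same
 * calculation gives 35 / (4 + 1) = 7, matching the direct_storage comment above. */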
187 
188 /* Hashmaps with directly stored entries all use this shared hash key.
189  * It's no big deal if the key is guessed, because there can be only
190  * a handful of directly stored entries in a hashmap. When a hashmap
191  * outgrows direct storage, it gets its own key for indirect storage. */
192 static uint8_t shared_hash_key[HASH_KEY_SIZE];
193 
194 /* Fields that all hashmap/set types must have */
195 struct HashmapBase {
196         const struct hash_ops *hash_ops;  /* hash and compare ops to use */
197 
198         union _packed_ {
199                 struct indirect_storage indirect; /* if  has_indirect */
200                 struct direct_storage direct;     /* if !has_indirect */
201         };
202 
203         enum HashmapType type:2;     /* HASHMAP_TYPE_* */
204         bool has_indirect:1;         /* whether indirect storage is used */
205         unsigned n_direct_entries:3; /* Number of entries in direct storage.
206                                       * Only valid if !has_indirect. */
207         bool from_pool:1;            /* whether was allocated from mempool */
208         bool dirty:1;                /* whether dirtied since last iterated_cache_get() */
209         bool cached:1;               /* whether this hashmap is being cached */
210 
211 #if ENABLE_DEBUG_HASHMAP
212         struct hashmap_debug_info debug;
213 #endif
214 };
215 
216 /* Specific hash types
217  * HashmapBase must be at the beginning of each hashmap struct. */
218 
219 struct Hashmap {
220         struct HashmapBase b;
221 };
222 
223 struct OrderedHashmap {
224         struct HashmapBase b;
225         unsigned iterate_list_head, iterate_list_tail;
226 };
227 
228 struct Set {
229         struct HashmapBase b;
230 };
231 
232 typedef struct CacheMem {
233         const void **ptr;
234         size_t n_populated;
235         bool active:1;
236 } CacheMem;
237 
238 struct IteratedCache {
239         HashmapBase *hashmap;
240         CacheMem keys, values;
241 };
242 
243 DEFINE_MEMPOOL(hashmap_pool,         Hashmap,        8);
244 DEFINE_MEMPOOL(ordered_hashmap_pool, OrderedHashmap, 8);
245 /* No need for a separate Set pool */
246 assert_cc(sizeof(Hashmap) == sizeof(Set));
247 
248 struct hashmap_type_info {
249         size_t head_size;
250         size_t entry_size;
251         struct mempool *mempool;
252         unsigned n_direct_buckets;
253 };
254 
255 static _used_ const struct hashmap_type_info hashmap_type_info[_HASHMAP_TYPE_MAX] = {
256         [HASHMAP_TYPE_PLAIN] = {
257                 .head_size        = sizeof(Hashmap),
258                 .entry_size       = sizeof(struct plain_hashmap_entry),
259                 .mempool          = &hashmap_pool,
260                 .n_direct_buckets = DIRECT_BUCKETS(struct plain_hashmap_entry),
261         },
262         [HASHMAP_TYPE_ORDERED] = {
263                 .head_size        = sizeof(OrderedHashmap),
264                 .entry_size       = sizeof(struct ordered_hashmap_entry),
265                 .mempool          = &ordered_hashmap_pool,
266                 .n_direct_buckets = DIRECT_BUCKETS(struct ordered_hashmap_entry),
267         },
268         [HASHMAP_TYPE_SET] = {
269                 .head_size        = sizeof(Set),
270                 .entry_size       = sizeof(struct set_entry),
271                 .mempool          = &hashmap_pool,
272                 .n_direct_buckets = DIRECT_BUCKETS(struct set_entry),
273         },
274 };
275 
276 #if VALGRIND
277 _destructor_ static void cleanup_pools(void) {
278         _cleanup_free_ char *t = NULL;
279         int r;
280 
281         /* Be nice to valgrind */
282 
283         /* The pool is only allocated by the main thread, but the memory can
284          * be passed to other threads. Let's clean up if we are the main thread
285          * and no other threads are live. */
286         /* We build our own is_main_thread() here, which doesn't use C11
287          * TLS based caching of the result. That's because valgrind apparently
288          * doesn't like malloc() (which C11 TLS internally uses) to be called
289          * from a GCC destructor. */
290         if (getpid() != gettid())
291                 return;
292 
293         r = get_proc_field("/proc/self/status", "Threads", WHITESPACE, &t);
294         if (r < 0 || !streq(t, "1"))
295                 return;
296 
297         mempool_drop(&hashmap_pool);
298         mempool_drop(&ordered_hashmap_pool);
299 }
300 #endif
301 
302 static unsigned n_buckets(HashmapBase *h) {
303         return h->has_indirect ? h->indirect.n_buckets
304                                : hashmap_type_info[h->type].n_direct_buckets;
305 }
306 
307 static unsigned n_entries(HashmapBase *h) {
308         return h->has_indirect ? h->indirect.n_entries
309                                : h->n_direct_entries;
310 }
311 
312 static void n_entries_inc(HashmapBase *h) {
313         if (h->has_indirect)
314                 h->indirect.n_entries++;
315         else
316                 h->n_direct_entries++;
317 }
318 
319 static void n_entries_dec(HashmapBase *h) {
320         if (h->has_indirect)
321                 h->indirect.n_entries--;
322         else
323                 h->n_direct_entries--;
324 }
325 
326 static void* storage_ptr(HashmapBase *h) {
327         return h->has_indirect ? h->indirect.storage
328                                : h->direct.storage;
329 }
330 
331 static uint8_t* hash_key(HashmapBase *h) {
332         return h->has_indirect ? h->indirect.hash_key
333                                : shared_hash_key;
334 }
335 
336 static unsigned base_bucket_hash(HashmapBase *h, const void *p) {
337         struct siphash state;
338         uint64_t hash;
339 
340         siphash24_init(&state, hash_key(h));
341 
342         h->hash_ops->hash(p, &state);
343 
344         hash = siphash24_finalize(&state);
345 
346         return (unsigned) (hash % n_buckets(h));
347 }
348 #define bucket_hash(h, p) base_bucket_hash(HASHMAP_BASE(h), p)
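/* The hash_ops supplied by the user only feed data into the siphash state; the keying and
 * the final reduction modulo n_buckets happen here. A minimal sketch of custom hash_ops for
 * NUL-terminated string keys (hypothetical names; systemd already ships string_hash_ops):
 *
 *     static void example_string_hash(const void *p, struct siphash *state) {
 *             siphash24_compress(p, strlen(p) + 1, state);
 *     }
 *
 *     static int example_string_compare(const void *a, const void *b) {
 *             return strcmp(a, b);
 *     }
 *
 *     static const struct hash_ops example_string_hash_ops = {
 *             .hash = example_string_hash,
 *             .compare = example_string_compare,
 *     };
 */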
349 
350 static void base_set_dirty(HashmapBase *h) {
351         h->dirty = true;
352 }
353 #define hashmap_set_dirty(h) base_set_dirty(HASHMAP_BASE(h))
354 
355 static void get_hash_key(uint8_t hash_key[HASH_KEY_SIZE], bool reuse_is_ok) {
356         static uint8_t current[HASH_KEY_SIZE];
357         static bool current_initialized = false;
358 
359         /* Returns a hash function key to use. In order to keep things
360          * fast we will not generate a new key each time we allocate a
361          * new hash table. Instead, we'll just reuse the most recently
362          * generated one, except if we never generated one or when we
363          * are rehashing an entire hash table because it reached the
364          * maximum fill level. */
365 
366         if (!current_initialized || !reuse_is_ok) {
367                 random_bytes(current, sizeof(current));
368                 current_initialized = true;
369         }
370 
371         memcpy(hash_key, current, sizeof(current));
372 }
373 
374 static struct hashmap_base_entry* bucket_at(HashmapBase *h, unsigned idx) {
375         return (struct hashmap_base_entry*)
376                 ((uint8_t*) storage_ptr(h) + idx * hashmap_type_info[h->type].entry_size);
377 }
378 
379 static struct plain_hashmap_entry* plain_bucket_at(Hashmap *h, unsigned idx) {
380         return (struct plain_hashmap_entry*) bucket_at(HASHMAP_BASE(h), idx);
381 }
382 
383 static struct ordered_hashmap_entry* ordered_bucket_at(OrderedHashmap *h, unsigned idx) {
384         return (struct ordered_hashmap_entry*) bucket_at(HASHMAP_BASE(h), idx);
385 }
386 
387 static struct set_entry *set_bucket_at(Set *h, unsigned idx) {
388         return (struct set_entry*) bucket_at(HASHMAP_BASE(h), idx);
389 }
390 
391 static struct ordered_hashmap_entry* bucket_at_swap(struct swap_entries *swap, unsigned idx) {
392         return &swap->e[idx - _IDX_SWAP_BEGIN];
393 }
394 
395 /* Returns a pointer to the bucket at index idx.
396  * Understands real indexes and swap indexes, hence "_virtual". */
397 static struct hashmap_base_entry* bucket_at_virtual(HashmapBase *h, struct swap_entries *swap,
398                                                     unsigned idx) {
399         if (idx < _IDX_SWAP_BEGIN)
400                 return bucket_at(h, idx);
401 
402         if (idx < _IDX_SWAP_END)
403                 return &bucket_at_swap(swap, idx)->p.b;
404 
405         assert_not_reached();
406 }
407 
408 static dib_raw_t* dib_raw_ptr(HashmapBase *h) {
409         return (dib_raw_t*)
410                 ((uint8_t*) storage_ptr(h) + hashmap_type_info[h->type].entry_size * n_buckets(h));
411 }
412 
413 static unsigned bucket_distance(HashmapBase *h, unsigned idx, unsigned from) {
414         return idx >= from ? idx - from
415                            : n_buckets(h) + idx - from;
416 }
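/* e.g. with n_buckets(h) == 8, an entry whose optimal bucket is 6 but which ended up in
 * bucket 1 has wrapped around the end of the array: its distance is 8 + 1 - 6 = 3. */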
417 
418 static unsigned bucket_calculate_dib(HashmapBase *h, unsigned idx, dib_raw_t raw_dib) {
419         unsigned initial_bucket;
420 
421         if (raw_dib == DIB_RAW_FREE)
422                 return DIB_FREE;
423 
424         if (_likely_(raw_dib < DIB_RAW_OVERFLOW))
425                 return raw_dib;
426 
427         /*
428          * Having an overflow DIB value is very unlikely. The hash function
429          * would have to be bad. For example, in a table of size 2^24 filled
430          * to load factor 0.9 the maximum observed DIB is only about 60.
431          * In theory (assuming I used Maxima correctly), for an infinite size
432          * hash table with load factor 0.8 the probability of a given entry
433          * having DIB > 40 is 1.9e-8.
434          * This returns the correct DIB value by recomputing the hash value in
435          * the unlikely case. XXX Hitting this case could be a hint to rehash.
436          */
437         initial_bucket = bucket_hash(h, bucket_at(h, idx)->key);
438         return bucket_distance(h, idx, initial_bucket);
439 }
440 
441 static void bucket_set_dib(HashmapBase *h, unsigned idx, unsigned dib) {
442         dib_raw_ptr(h)[idx] = dib != DIB_FREE ? MIN(dib, DIB_RAW_OVERFLOW) : DIB_RAW_FREE;
443 }
444 
445 static unsigned skip_free_buckets(HashmapBase *h, unsigned idx) {
446         dib_raw_t *dibs;
447 
448         dibs = dib_raw_ptr(h);
449 
450         for ( ; idx < n_buckets(h); idx++)
451                 if (dibs[idx] != DIB_RAW_FREE)
452                         return idx;
453 
454         return IDX_NIL;
455 }
456 
457 static void bucket_mark_free(HashmapBase *h, unsigned idx) {
458         memzero(bucket_at(h, idx), hashmap_type_info[h->type].entry_size);
459         bucket_set_dib(h, idx, DIB_FREE);
460 }
461 
462 static void bucket_move_entry(HashmapBase *h, struct swap_entries *swap,
463                               unsigned from, unsigned to) {
464         struct hashmap_base_entry *e_from, *e_to;
465 
466         assert(from != to);
467 
468         e_from = bucket_at_virtual(h, swap, from);
469         e_to   = bucket_at_virtual(h, swap, to);
470 
471         memcpy(e_to, e_from, hashmap_type_info[h->type].entry_size);
472 
473         if (h->type == HASHMAP_TYPE_ORDERED) {
474                 OrderedHashmap *lh = (OrderedHashmap*) h;
475                 struct ordered_hashmap_entry *le, *le_to;
476 
477                 le_to = (struct ordered_hashmap_entry*) e_to;
478 
479                 if (le_to->iterate_next != IDX_NIL) {
480                         le = (struct ordered_hashmap_entry*)
481                              bucket_at_virtual(h, swap, le_to->iterate_next);
482                         le->iterate_previous = to;
483                 }
484 
485                 if (le_to->iterate_previous != IDX_NIL) {
486                         le = (struct ordered_hashmap_entry*)
487                              bucket_at_virtual(h, swap, le_to->iterate_previous);
488                         le->iterate_next = to;
489                 }
490 
491                 if (lh->iterate_list_head == from)
492                         lh->iterate_list_head = to;
493                 if (lh->iterate_list_tail == from)
494                         lh->iterate_list_tail = to;
495         }
496 }
497 
498 static unsigned next_idx(HashmapBase *h, unsigned idx) {
499         return (idx + 1U) % n_buckets(h);
500 }
501 
502 static unsigned prev_idx(HashmapBase *h, unsigned idx) {
503         return (n_buckets(h) + idx - 1U) % n_buckets(h);
504 }
505 
506 static void* entry_value(HashmapBase *h, struct hashmap_base_entry *e) {
507         switch (h->type) {
508 
509         case HASHMAP_TYPE_PLAIN:
510         case HASHMAP_TYPE_ORDERED:
511                 return ((struct plain_hashmap_entry*)e)->value;
512 
513         case HASHMAP_TYPE_SET:
514                 return (void*) e->key;
515 
516         default:
517                 assert_not_reached();
518         }
519 }
520 
521 static void base_remove_entry(HashmapBase *h, unsigned idx) {
522         unsigned left, right, prev, dib;
523         dib_raw_t raw_dib, *dibs;
524 
525         dibs = dib_raw_ptr(h);
526         assert(dibs[idx] != DIB_RAW_FREE);
527 
528 #if ENABLE_DEBUG_HASHMAP
529         h->debug.rem_count++;
530         h->debug.last_rem_idx = idx;
531 #endif
532 
533         left = idx;
534         /* Find the stop bucket ("right"). It is either free or has DIB == 0. */
535         for (right = next_idx(h, left); ; right = next_idx(h, right)) {
536                 raw_dib = dibs[right];
537                 if (IN_SET(raw_dib, 0, DIB_RAW_FREE))
538                         break;
539 
540                 /* The buckets are not supposed to be all occupied and with DIB > 0.
541                  * That would mean we could make everyone better off by shifting them
542                  * backward. This scenario is impossible. */
543                 assert(left != right);
544         }
545 
546         if (h->type == HASHMAP_TYPE_ORDERED) {
547                 OrderedHashmap *lh = (OrderedHashmap*) h;
548                 struct ordered_hashmap_entry *le = ordered_bucket_at(lh, idx);
549 
550                 if (le->iterate_next != IDX_NIL)
551                         ordered_bucket_at(lh, le->iterate_next)->iterate_previous = le->iterate_previous;
552                 else
553                         lh->iterate_list_tail = le->iterate_previous;
554 
555                 if (le->iterate_previous != IDX_NIL)
556                         ordered_bucket_at(lh, le->iterate_previous)->iterate_next = le->iterate_next;
557                 else
558                         lh->iterate_list_head = le->iterate_next;
559         }
560 
561         /* Now shift all buckets in the interval (left, right) one step backwards */
562         for (prev = left, left = next_idx(h, left); left != right;
563              prev = left, left = next_idx(h, left)) {
564                 dib = bucket_calculate_dib(h, left, dibs[left]);
565                 assert(dib != 0);
566                 bucket_move_entry(h, NULL, left, prev);
567                 bucket_set_dib(h, prev, dib - 1);
568         }
569 
570         bucket_mark_free(h, prev);
571         n_entries_dec(h);
572         base_set_dirty(h);
573 }
574 #define remove_entry(h, idx) base_remove_entry(HASHMAP_BASE(h), idx)
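/* Backward shift deletion, illustrated on a toy table (DIBs in parentheses): removing the
 * entry at bucket 2 from
 *         [0]=A(0)  [1]=B(0)  [2]=C(1)  [3]=D(1)  [4]=E(2)  [5]=free
 * finds its stop bucket at index 5 (free), shifts D and E one bucket to the left while
 * decrementing their DIBs, and frees bucket 4:
 *         [0]=A(0)  [1]=B(0)  [2]=D(0)  [3]=E(1)  [4]=free  [5]=free
 * No tombstones are left behind, so lookups never have to probe past a free bucket. */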
575 
576 static unsigned hashmap_iterate_in_insertion_order(OrderedHashmap *h, Iterator *i) {
577         struct ordered_hashmap_entry *e;
578         unsigned idx;
579 
580         assert(h);
581         assert(i);
582 
583         if (i->idx == IDX_NIL)
584                 goto at_end;
585 
586         if (i->idx == IDX_FIRST && h->iterate_list_head == IDX_NIL)
587                 goto at_end;
588 
589         if (i->idx == IDX_FIRST) {
590                 idx = h->iterate_list_head;
591                 e = ordered_bucket_at(h, idx);
592         } else {
593                 idx = i->idx;
594                 e = ordered_bucket_at(h, idx);
595                 /*
596                  * We allow removing the current entry while iterating, but removal may cause
597                  * a backward shift. The next entry may thus move one bucket to the left.
598                  * To detect when it happens, we remember the key pointer of the entry we were
599                  * going to iterate next. If it does not match, there was a backward shift.
600                  */
601                 if (e->p.b.key != i->next_key) {
602                         idx = prev_idx(HASHMAP_BASE(h), idx);
603                         e = ordered_bucket_at(h, idx);
604                 }
605                 assert(e->p.b.key == i->next_key);
606         }
607 
608 #if ENABLE_DEBUG_HASHMAP
609         i->prev_idx = idx;
610 #endif
611 
612         if (e->iterate_next != IDX_NIL) {
613                 struct ordered_hashmap_entry *n;
614                 i->idx = e->iterate_next;
615                 n = ordered_bucket_at(h, i->idx);
616                 i->next_key = n->p.b.key;
617         } else
618                 i->idx = IDX_NIL;
619 
620         return idx;
621 
622 at_end:
623         i->idx = IDX_NIL;
624         return IDX_NIL;
625 }
626 
627 static unsigned hashmap_iterate_in_internal_order(HashmapBase *h, Iterator *i) {
628         unsigned idx;
629 
630         assert(h);
631         assert(i);
632 
633         if (i->idx == IDX_NIL)
634                 goto at_end;
635 
636         if (i->idx == IDX_FIRST) {
637                 /* fast forward to the first occupied bucket */
638                 if (h->has_indirect) {
639                         i->idx = skip_free_buckets(h, h->indirect.idx_lowest_entry);
640                         h->indirect.idx_lowest_entry = i->idx;
641                 } else
642                         i->idx = skip_free_buckets(h, 0);
643 
644                 if (i->idx == IDX_NIL)
645                         goto at_end;
646         } else {
647                 struct hashmap_base_entry *e;
648 
649                 assert(i->idx > 0);
650 
651                 e = bucket_at(h, i->idx);
652                 /*
653                  * We allow removing the current entry while iterating, but removal may cause
654                  * a backward shift. The next entry may thus move one bucket to the left.
655                  * To detect when it happens, we remember the key pointer of the entry we were
656                  * going to iterate next. If it does not match, there was a backward shift.
657                  */
658                 if (e->key != i->next_key)
659                         e = bucket_at(h, --i->idx);
660 
661                 assert(e->key == i->next_key);
662         }
663 
664         idx = i->idx;
665 #if ENABLE_DEBUG_HASHMAP
666         i->prev_idx = idx;
667 #endif
668 
669         i->idx = skip_free_buckets(h, i->idx + 1);
670         if (i->idx != IDX_NIL)
671                 i->next_key = bucket_at(h, i->idx)->key;
672         else
673                 i->idx = IDX_NIL;
674 
675         return idx;
676 
677 at_end:
678         i->idx = IDX_NIL;
679         return IDX_NIL;
680 }
681 
682 static unsigned hashmap_iterate_entry(HashmapBase *h, Iterator *i) {
683         if (!h) {
684                 i->idx = IDX_NIL;
685                 return IDX_NIL;
686         }
687 
688 #if ENABLE_DEBUG_HASHMAP
689         if (i->idx == IDX_FIRST) {
690                 i->put_count = h->debug.put_count;
691                 i->rem_count = h->debug.rem_count;
692         } else {
693                 /* While iterating, must not add any new entries */
694                 assert(i->put_count == h->debug.put_count);
695                 /* ... or remove entries other than the current one */
696                 assert(i->rem_count == h->debug.rem_count ||
697                        (i->rem_count == h->debug.rem_count - 1 &&
698                         i->prev_idx == h->debug.last_rem_idx));
699                 /* Reset our removals counter */
700                 i->rem_count = h->debug.rem_count;
701         }
702 #endif
703 
704         return h->type == HASHMAP_TYPE_ORDERED ? hashmap_iterate_in_insertion_order((OrderedHashmap*) h, i)
705                                                : hashmap_iterate_in_internal_order(h, i);
706 }
707 
708 bool _hashmap_iterate(HashmapBase *h, Iterator *i, void **value, const void **key) {
709         struct hashmap_base_entry *e;
710         void *data;
711         unsigned idx;
712 
713         idx = hashmap_iterate_entry(h, i);
714         if (idx == IDX_NIL) {
715                 if (value)
716                         *value = NULL;
717                 if (key)
718                         *key = NULL;
719 
720                 return false;
721         }
722 
723         e = bucket_at(h, idx);
724         data = entry_value(h, e);
725         if (value)
726                 *value = data;
727         if (key)
728                 *key = e->key;
729 
730         return true;
731 }
732 
733 #define HASHMAP_FOREACH_IDX(idx, h, i) \
734         for ((i) = ITERATOR_FIRST, (idx) = hashmap_iterate_entry((h), &(i)); \
735              (idx != IDX_NIL); \
736              (idx) = hashmap_iterate_entry((h), &(i)))
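/* Typical consumer-side iteration goes through the public wrappers in hashmap.h rather than
 * through _hashmap_iterate() directly. A rough usage sketch (error handling omitted):
 *
 *     Iterator i = ITERATOR_FIRST;
 *     void *value;
 *     const void *key;
 *
 *     while (hashmap_iterate(h, &i, &value, &key))
 *             printf("%s -> %p\n", (const char*) key, value);
 *
 * While iterating, no entries may be added, and only the entry most recently returned may be
 * removed; the debug build asserts this via the put_count/rem_count bookkeeping above. */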
737 
738 IteratedCache* _hashmap_iterated_cache_new(HashmapBase *h) {
739         IteratedCache *cache;
740 
741         assert(h);
742         assert(!h->cached);
743 
744         if (h->cached)
745                 return NULL;
746 
747         cache = new0(IteratedCache, 1);
748         if (!cache)
749                 return NULL;
750 
751         cache->hashmap = h;
752         h->cached = true;
753 
754         return cache;
755 }
756 
757 static void reset_direct_storage(HashmapBase *h) {
758         const struct hashmap_type_info *hi = &hashmap_type_info[h->type];
759         void *p;
760 
761         assert(!h->has_indirect);
762 
763         p = mempset(h->direct.storage, 0, hi->entry_size * hi->n_direct_buckets);
764         memset(p, DIB_RAW_INIT, sizeof(dib_raw_t) * hi->n_direct_buckets);
765 }
766 
767 static void shared_hash_key_initialize(void) {
768         random_bytes(shared_hash_key, sizeof(shared_hash_key));
769 }
770 
771 static struct HashmapBase* hashmap_base_new(const struct hash_ops *hash_ops, enum HashmapType type  HASHMAP_DEBUG_PARAMS) {
772         HashmapBase *h;
773         const struct hashmap_type_info *hi = &hashmap_type_info[type];
774         bool up;
775 
776         up = mempool_enabled();
777 
778         h = up ? mempool_alloc0_tile(hi->mempool) : malloc0(hi->head_size);
779         if (!h)
780                 return NULL;
781 
782         h->type = type;
783         h->from_pool = up;
784         h->hash_ops = hash_ops ?: &trivial_hash_ops;
785 
786         if (type == HASHMAP_TYPE_ORDERED) {
787                 OrderedHashmap *lh = (OrderedHashmap*)h;
788                 lh->iterate_list_head = lh->iterate_list_tail = IDX_NIL;
789         }
790 
791         reset_direct_storage(h);
792 
793         static pthread_once_t once = PTHREAD_ONCE_INIT;
794         assert_se(pthread_once(&once, shared_hash_key_initialize) == 0);
795 
796 #if ENABLE_DEBUG_HASHMAP
797         h->debug.func = func;
798         h->debug.file = file;
799         h->debug.line = line;
800         assert_se(pthread_mutex_lock(&hashmap_debug_list_mutex) == 0);
801         LIST_PREPEND(debug_list, hashmap_debug_list, &h->debug);
802         assert_se(pthread_mutex_unlock(&hashmap_debug_list_mutex) == 0);
803 #endif
804 
805         return h;
806 }
807 
808 Hashmap *_hashmap_new(const struct hash_ops *hash_ops  HASHMAP_DEBUG_PARAMS) {
809         return (Hashmap*)        hashmap_base_new(hash_ops, HASHMAP_TYPE_PLAIN  HASHMAP_DEBUG_PASS_ARGS);
810 }
811 
812 OrderedHashmap *_ordered_hashmap_new(const struct hash_ops *hash_ops  HASHMAP_DEBUG_PARAMS) {
813         return (OrderedHashmap*) hashmap_base_new(hash_ops, HASHMAP_TYPE_ORDERED  HASHMAP_DEBUG_PASS_ARGS);
814 }
815 
816 Set *_set_new(const struct hash_ops *hash_ops  HASHMAP_DEBUG_PARAMS) {
817         return (Set*)            hashmap_base_new(hash_ops, HASHMAP_TYPE_SET  HASHMAP_DEBUG_PASS_ARGS);
818 }
819 
820 static int hashmap_base_ensure_allocated(HashmapBase **h, const struct hash_ops *hash_ops,
821                                          enum HashmapType type  HASHMAP_DEBUG_PARAMS) {
822         HashmapBase *q;
823 
824         assert(h);
825 
826         if (*h)
827                 return 0;
828 
829         q = hashmap_base_new(hash_ops, type  HASHMAP_DEBUG_PASS_ARGS);
830         if (!q)
831                 return -ENOMEM;
832 
833         *h = q;
834         return 1;
835 }
836 
837 int _hashmap_ensure_allocated(Hashmap **h, const struct hash_ops *hash_ops  HASHMAP_DEBUG_PARAMS) {
838         return hashmap_base_ensure_allocated((HashmapBase**)h, hash_ops, HASHMAP_TYPE_PLAIN  HASHMAP_DEBUG_PASS_ARGS);
839 }
840 
841 int _ordered_hashmap_ensure_allocated(OrderedHashmap **h, const struct hash_ops *hash_ops  HASHMAP_DEBUG_PARAMS) {
842         return hashmap_base_ensure_allocated((HashmapBase**)h, hash_ops, HASHMAP_TYPE_ORDERED  HASHMAP_DEBUG_PASS_ARGS);
843 }
844 
845 int _set_ensure_allocated(Set **s, const struct hash_ops *hash_ops  HASHMAP_DEBUG_PARAMS) {
846         return hashmap_base_ensure_allocated((HashmapBase**)s, hash_ops, HASHMAP_TYPE_SET  HASHMAP_DEBUG_PASS_ARGS);
847 }
848 
849 int _hashmap_ensure_put(Hashmap **h, const struct hash_ops *hash_ops, const void *key, void *value  HASHMAP_DEBUG_PARAMS) {
850         int r;
851 
852         r = _hashmap_ensure_allocated(h, hash_ops  HASHMAP_DEBUG_PASS_ARGS);
853         if (r < 0)
854                 return r;
855 
856         return hashmap_put(*h, key, value);
857 }
858 
859 int _ordered_hashmap_ensure_put(OrderedHashmap **h, const struct hash_ops *hash_ops, const void *key, void *value  HASHMAP_DEBUG_PARAMS) {
860         int r;
861 
862         r = _ordered_hashmap_ensure_allocated(h, hash_ops  HASHMAP_DEBUG_PASS_ARGS);
863         if (r < 0)
864                 return r;
865 
866         return ordered_hashmap_put(*h, key, value);
867 }
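/* Callers normally use the hashmap_ensure_put()/ordered_hashmap_ensure_put() macros from
 * hashmap.h, which pass the debug location automatically. A rough sketch (string_hash_ops is
 * one of the predefined hash_ops sets; the variable names are made up):
 *
 *     Hashmap *cache = NULL;
 *     int r;
 *
 *     r = hashmap_ensure_put(&cache, &string_hash_ops, "somekey", somevalue);
 *     if (r < 0)
 *             return r;   // -ENOMEM on allocation failure, -EEXIST if the key already maps
 *                         // to a different value
 */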
868 
869 static void hashmap_free_no_clear(HashmapBase *h) {
870         assert(!h->has_indirect);
871         assert(h->n_direct_entries == 0);
872 
873 #if ENABLE_DEBUG_HASHMAP
874         assert_se(pthread_mutex_lock(&hashmap_debug_list_mutex) == 0);
875         LIST_REMOVE(debug_list, hashmap_debug_list, &h->debug);
876         assert_se(pthread_mutex_unlock(&hashmap_debug_list_mutex) == 0);
877 #endif
878 
879         if (h->from_pool) {
880                 /* Ensure that the object didn't get migrated between threads. */
881                 assert_se(is_main_thread());
882                 mempool_free_tile(hashmap_type_info[h->type].mempool, h);
883         } else
884                 free(h);
885 }
886 
887 HashmapBase* _hashmap_free(HashmapBase *h, free_func_t default_free_key, free_func_t default_free_value) {
888         if (h) {
889                 _hashmap_clear(h, default_free_key, default_free_value);
890                 hashmap_free_no_clear(h);
891         }
892 
893         return NULL;
894 }
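/* The public entry points in hashmap.h are thin wrappers over this: plain hashmap_free()
 * passes NULL for both destructors, while the variants that also free keys and/or values
 * (or hash_ops with free_key/free_value set) fill them in. A rough usage sketch:
 *
 *     Hashmap *h = hashmap_new(&string_hash_ops);
 *     ...
 *     h = hashmap_free(h);   // clears and frees the table, returns NULL for easy reassignment
 */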
895 
896 void _hashmap_clear(HashmapBase *h, free_func_t default_free_key, free_func_t default_free_value) {
897         free_func_t free_key, free_value;
898         if (!h)
899                 return;
900 
901         free_key = h->hash_ops->free_key ?: default_free_key;
902         free_value = h->hash_ops->free_value ?: default_free_value;
903 
904         if (free_key || free_value) {
905 
906                 /* If destructor calls are defined, let's destroy things defensively: let's take the item out of the
907                  * hash table, and only then call the destructor functions. If these destructors then try to unregister
908                  * themselves from our hash table a second time, the entry is already gone. */
909 
910                 while (_hashmap_size(h) > 0) {
911                         void *k = NULL;
912                         void *v;
913 
914                         v = _hashmap_first_key_and_value(h, true, &k);
915 
916                         if (free_key)
917                                 free_key(k);
918 
919                         if (free_value)
920                                 free_value(v);
921                 }
922         }
923 
924         if (h->has_indirect) {
925                 free(h->indirect.storage);
926                 h->has_indirect = false;
927         }
928 
929         h->n_direct_entries = 0;
930         reset_direct_storage(h);
931 
932         if (h->type == HASHMAP_TYPE_ORDERED) {
933                 OrderedHashmap *lh = (OrderedHashmap*) h;
934                 lh->iterate_list_head = lh->iterate_list_tail = IDX_NIL;
935         }
936 
937         base_set_dirty(h);
938 }
939 
940 static int resize_buckets(HashmapBase *h, unsigned entries_add);
941 
942 /*
943  * Finds an empty bucket to put an entry into, starting the scan at 'idx'.
944  * Performs Robin Hood swaps as it goes. The entry to put must be placed
945  * by the caller into swap slot IDX_PUT.
946  * If used for in-place resizing, may leave a displaced entry in swap slot
947  * IDX_PUT. Caller must rehash it next.
948  * Returns: true if it left a displaced entry to rehash next in IDX_PUT,
949  *          false otherwise.
950  */
951 static bool hashmap_put_robin_hood(HashmapBase *h, unsigned idx,
952                                    struct swap_entries *swap) {
953         dib_raw_t raw_dib, *dibs;
954         unsigned dib, distance;
955 
956 #if ENABLE_DEBUG_HASHMAP
957         h->debug.put_count++;
958 #endif
959 
960         dibs = dib_raw_ptr(h);
961 
962         for (distance = 0; ; distance++) {
963                 raw_dib = dibs[idx];
964                 if (IN_SET(raw_dib, DIB_RAW_FREE, DIB_RAW_REHASH)) {
965                         if (raw_dib == DIB_RAW_REHASH)
966                                 bucket_move_entry(h, swap, idx, IDX_TMP);
967 
968                         if (h->has_indirect && h->indirect.idx_lowest_entry > idx)
969                                 h->indirect.idx_lowest_entry = idx;
970 
971                         bucket_set_dib(h, idx, distance);
972                         bucket_move_entry(h, swap, IDX_PUT, idx);
973                         if (raw_dib == DIB_RAW_REHASH) {
974                                 bucket_move_entry(h, swap, IDX_TMP, IDX_PUT);
975                                 return true;
976                         }
977 
978                         return false;
979                 }
980 
981                 dib = bucket_calculate_dib(h, idx, raw_dib);
982 
983                 if (dib < distance) {
984                         /* Found a wealthier entry. Go Robin Hood! */
985                         bucket_set_dib(h, idx, distance);
986 
987                         /* swap the entries */
988                         bucket_move_entry(h, swap, idx, IDX_TMP);
989                         bucket_move_entry(h, swap, IDX_PUT, idx);
990                         bucket_move_entry(h, swap, IDX_TMP, IDX_PUT);
991 
992                         distance = dib;
993                 }
994 
995                 idx = next_idx(h, idx);
996         }
997 }
998 
999 /*
1000  * Puts an entry into a hashmap, boldly - no check whether key already exists.
1001  * The caller must place the entry (only its key and value, not link indexes)
1002  * in swap slot IDX_PUT.
1003  * Caller must ensure: the key does not exist yet in the hashmap, and
1004  *                     that a resize is not needed if !may_resize.
1005  * Returns: 1 if entry was put successfully.
1006  *          -ENOMEM if may_resize==true and resize failed with -ENOMEM.
1007  *          Cannot return -ENOMEM if !may_resize.
1008  */
1009 static int hashmap_base_put_boldly(HashmapBase *h, unsigned idx,
1010                                    struct swap_entries *swap, bool may_resize) {
1011         struct ordered_hashmap_entry *new_entry;
1012         int r;
1013 
1014         assert(idx < n_buckets(h));
1015 
1016         new_entry = bucket_at_swap(swap, IDX_PUT);
1017 
1018         if (may_resize) {
1019                 r = resize_buckets(h, 1);
1020                 if (r < 0)
1021                         return r;
1022                 if (r > 0)
1023                         idx = bucket_hash(h, new_entry->p.b.key);
1024         }
1025         assert(n_entries(h) < n_buckets(h));
1026 
1027         if (h->type == HASHMAP_TYPE_ORDERED) {
1028                 OrderedHashmap *lh = (OrderedHashmap*) h;
1029 
1030                 new_entry->iterate_next = IDX_NIL;
1031                 new_entry->iterate_previous = lh->iterate_list_tail;
1032 
1033                 if (lh->iterate_list_tail != IDX_NIL) {
1034                         struct ordered_hashmap_entry *old_tail;
1035 
1036                         old_tail = ordered_bucket_at(lh, lh->iterate_list_tail);
1037                         assert(old_tail->iterate_next == IDX_NIL);
1038                         old_tail->iterate_next = IDX_PUT;
1039                 }
1040 
1041                 lh->iterate_list_tail = IDX_PUT;
1042                 if (lh->iterate_list_head == IDX_NIL)
1043                         lh->iterate_list_head = IDX_PUT;
1044         }
1045 
1046         assert_se(hashmap_put_robin_hood(h, idx, swap) == false);
1047 
1048         n_entries_inc(h);
1049 #if ENABLE_DEBUG_HASHMAP
1050         h->debug.max_entries = MAX(h->debug.max_entries, n_entries(h));
1051 #endif
1052 
1053         base_set_dirty(h);
1054 
1055         return 1;
1056 }
1057 #define hashmap_put_boldly(h, idx, swap, may_resize) \
1058         hashmap_base_put_boldly(HASHMAP_BASE(h), idx, swap, may_resize)
1059 
1060 /*
1061  * Returns 0 if resize is not needed.
1062  *         1 if successfully resized.
1063  *         -ENOMEM on allocation failure.
1064  */
1065 static int resize_buckets(HashmapBase *h, unsigned entries_add) {
1066         struct swap_entries swap;
1067         void *new_storage;
1068         dib_raw_t *old_dibs, *new_dibs;
1069         const struct hashmap_type_info *hi;
1070         unsigned idx, optimal_idx;
1071         unsigned old_n_buckets, new_n_buckets, n_rehashed, new_n_entries;
1072         uint8_t new_shift;
1073         bool rehash_next;
1074 
1075         assert(h);
1076 
1077         hi = &hashmap_type_info[h->type];
1078         new_n_entries = n_entries(h) + entries_add;
1079 
1080         /* overflow? */
1081         if (_unlikely_(new_n_entries < entries_add))
1082                 return -ENOMEM;
1083 
1084         /* For direct storage we allow 100% load, because it's tiny. */
1085         if (!h->has_indirect && new_n_entries <= hi->n_direct_buckets)
1086                 return 0;
1087 
1088         /*
1089          * Load factor = n/m = 1 - (1/INV_KEEP_FREE).
1090          * From it follows: m = n + n/(INV_KEEP_FREE - 1)
1091          */
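        /* e.g. with INV_KEEP_FREE == 5, 100 entries lead to 100 + 100/4 = 125 buckets,
         * i.e. a maximum load factor of 0.8. */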
1092         new_n_buckets = new_n_entries + new_n_entries / (INV_KEEP_FREE - 1);
1093         /* overflow? */
1094         if (_unlikely_(new_n_buckets < new_n_entries))
1095                 return -ENOMEM;
1096 
1097         if (_unlikely_(new_n_buckets > UINT_MAX / (hi->entry_size + sizeof(dib_raw_t))))
1098                 return -ENOMEM;
1099 
1100         old_n_buckets = n_buckets(h);
1101 
1102         if (_likely_(new_n_buckets <= old_n_buckets))
1103                 return 0;
1104 
1105         new_shift = log2u_round_up(MAX(
1106                         new_n_buckets * (hi->entry_size + sizeof(dib_raw_t)),
1107                         2 * sizeof(struct direct_storage)));
1108 
1109         /* Realloc storage (buckets and DIB array). */
1110         new_storage = realloc(h->has_indirect ? h->indirect.storage : NULL,
1111                               1U << new_shift);
1112         if (!new_storage)
1113                 return -ENOMEM;
1114 
1115         /* Must upgrade direct to indirect storage. */
1116         if (!h->has_indirect) {
1117                 memcpy(new_storage, h->direct.storage,
1118                        old_n_buckets * (hi->entry_size + sizeof(dib_raw_t)));
1119                 h->indirect.n_entries = h->n_direct_entries;
1120                 h->indirect.idx_lowest_entry = 0;
1121                 h->n_direct_entries = 0;
1122         }
1123 
1124         /* Get a new hash key. If we've just upgraded to indirect storage,
1125          * allow reusing a previously generated key. It's still a different key
1126          * from the shared one that we used for direct storage. */
1127         get_hash_key(h->indirect.hash_key, !h->has_indirect);
1128 
1129         h->has_indirect = true;
1130         h->indirect.storage = new_storage;
1131         h->indirect.n_buckets = (1U << new_shift) /
1132                                 (hi->entry_size + sizeof(dib_raw_t));
1133 
1134         old_dibs = (dib_raw_t*)((uint8_t*) new_storage + hi->entry_size * old_n_buckets);
1135         new_dibs = dib_raw_ptr(h);
1136 
1137         /*
1138          * Move the DIB array to the new place, replacing valid DIB values with
1139          * DIB_RAW_REHASH to indicate all of the used buckets need rehashing.
1140          * Note: Overlap is not possible, because we have at least doubled the
1141          * number of buckets and dib_raw_t is smaller than any entry type.
1142          */
1143         for (idx = 0; idx < old_n_buckets; idx++) {
1144                 assert(old_dibs[idx] != DIB_RAW_REHASH);
1145                 new_dibs[idx] = old_dibs[idx] == DIB_RAW_FREE ? DIB_RAW_FREE
1146                                                               : DIB_RAW_REHASH;
1147         }
1148 
1149         /* Zero the area of newly added entries (including the old DIB area) */
1150         memzero(bucket_at(h, old_n_buckets),
1151                (n_buckets(h) - old_n_buckets) * hi->entry_size);
1152 
1153         /* The upper half of the new DIB array needs initialization */
1154         memset(&new_dibs[old_n_buckets], DIB_RAW_INIT,
1155                (n_buckets(h) - old_n_buckets) * sizeof(dib_raw_t));
1156 
1157         /* Rehash entries that need it */
1158         n_rehashed = 0;
1159         for (idx = 0; idx < old_n_buckets; idx++) {
1160                 if (new_dibs[idx] != DIB_RAW_REHASH)
1161                         continue;
1162 
1163                 optimal_idx = bucket_hash(h, bucket_at(h, idx)->key);
1164 
1165                 /*
1166                  * Not much to do if by luck the entry hashes to its current
1167                  * location. Just set its DIB.
1168                  */
1169                 if (optimal_idx == idx) {
1170                         new_dibs[idx] = 0;
1171                         n_rehashed++;
1172                         continue;
1173                 }
1174 
1175                 new_dibs[idx] = DIB_RAW_FREE;
1176                 bucket_move_entry(h, &swap, idx, IDX_PUT);
1177                 /* bucket_move_entry does not clear the source */
1178                 memzero(bucket_at(h, idx), hi->entry_size);
1179 
1180                 do {
1181                         /*
1182                          * Find the new bucket for the current entry. This may make
1183                          * another entry homeless and load it into IDX_PUT.
1184                          */
1185                         rehash_next = hashmap_put_robin_hood(h, optimal_idx, &swap);
1186                         n_rehashed++;
1187 
1188                         /* Did the current entry displace another one? */
1189                         if (rehash_next)
1190                                 optimal_idx = bucket_hash(h, bucket_at_swap(&swap, IDX_PUT)->p.b.key);
1191                 } while (rehash_next);
1192         }
1193 
1194         assert(n_rehashed == n_entries(h));
1195 
1196         return 1;
1197 }
1198 
1199 /*
1200  * Finds an entry with a matching key
1201  * Returns: index of the found entry, or IDX_NIL if not found.
1202  */
1203 static unsigned base_bucket_scan(HashmapBase *h, unsigned idx, const void *key) {
1204         struct hashmap_base_entry *e;
1205         unsigned dib, distance;
1206         dib_raw_t *dibs = dib_raw_ptr(h);
1207 
1208         assert(idx < n_buckets(h));
1209 
1210         for (distance = 0; ; distance++) {
1211                 if (dibs[idx] == DIB_RAW_FREE)
1212                         return IDX_NIL;
1213 
1214                 dib = bucket_calculate_dib(h, idx, dibs[idx]);
1215 
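                /* Robin Hood invariant: had the key been inserted, it would have displaced any
                 * entry that sits closer to its own optimal bucket than we currently are to
                 * ours. Meeting such an entry proves the key is absent, so stop early. */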
1216                 if (dib < distance)
1217                         return IDX_NIL;
1218                 if (dib == distance) {
1219                         e = bucket_at(h, idx);
1220                         if (h->hash_ops->compare(e->key, key) == 0)
1221                                 return idx;
1222                 }
1223 
1224                 idx = next_idx(h, idx);
1225         }
1226 }
1227 #define bucket_scan(h, idx, key) base_bucket_scan(HASHMAP_BASE(h), idx, key)
1228 
1229 int hashmap_put(Hashmap *h, const void *key, void *value) {
1230         struct swap_entries swap;
1231         struct plain_hashmap_entry *e;
1232         unsigned hash, idx;
1233 
1234         assert(h);
1235 
1236         hash = bucket_hash(h, key);
1237         idx = bucket_scan(h, hash, key);
1238         if (idx != IDX_NIL) {
1239                 e = plain_bucket_at(h, idx);
1240                 if (e->value == value)
1241                         return 0;
1242                 return -EEXIST;
1243         }
1244 
1245         e = &bucket_at_swap(&swap, IDX_PUT)->p;
1246         e->b.key = key;
1247         e->value = value;
1248         return hashmap_put_boldly(h, hash, &swap, true);
1249 }
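/* Return value summary for hashmap_put(): 1 if a new entry was created, 0 if the key is
 * already mapped to the very same value pointer, -EEXIST if the key is present with a
 * different value, -ENOMEM if growing the table failed. A rough usage sketch (the variable
 * names are made up):
 *
 *     r = hashmap_put(h, device->path, device);
 *     if (r == -EEXIST)
 *             log_debug("Device already registered, ignoring.");
 *     else if (r < 0)
 *             return r;
 */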
1250 
1251 int set_put(Set *s, const void *key) {
1252         struct swap_entries swap;
1253         struct hashmap_base_entry *e;
1254         unsigned hash, idx;
1255 
1256         assert(s);
1257 
1258         hash = bucket_hash(s, key);
1259         idx = bucket_scan(s, hash, key);
1260         if (idx != IDX_NIL)
1261                 return 0;
1262 
1263         e = &bucket_at_swap(&swap, IDX_PUT)->p.b;
1264         e->key = key;
1265         return hashmap_put_boldly(s, hash, &swap, true);
1266 }
1267 
1268 int _set_ensure_put(Set **s, const struct hash_ops *hash_ops, const void *key  HASHMAP_DEBUG_PARAMS) {
1269         int r;
1270 
1271         r = _set_ensure_allocated(s, hash_ops  HASHMAP_DEBUG_PASS_ARGS);
1272         if (r < 0)
1273                 return r;
1274 
1275         return set_put(*s, key);
1276 }
1277 
1278 int _set_ensure_consume(Set **s, const struct hash_ops *hash_ops, void *key  HASHMAP_DEBUG_PARAMS) {
1279         int r;
1280 
1281         r = _set_ensure_put(s, hash_ops, key  HASHMAP_DEBUG_PASS_ARGS);
1282         if (r <= 0) {
1283                 if (hash_ops && hash_ops->free_key)
1284                         hash_ops->free_key(key);
1285                 else
1286                         free(key);
1287         }
1288 
1289         return r;
1290 }
1291 
1292 int hashmap_replace(Hashmap *h, const void *key, void *value) {
1293         struct swap_entries swap;
1294         struct plain_hashmap_entry *e;
1295         unsigned hash, idx;
1296 
1297         assert(h);
1298 
1299         hash = bucket_hash(h, key);
1300         idx = bucket_scan(h, hash, key);
1301         if (idx != IDX_NIL) {
1302                 e = plain_bucket_at(h, idx);
1303 #if ENABLE_DEBUG_HASHMAP
1304                 /* Although the key is equal, the key pointer may have changed,
1305                  * and this would break our assumption for iterating. So count
1306                  * this operation as incompatible with iteration. */
1307                 if (e->b.key != key) {
1308                         h->b.debug.put_count++;
1309                         h->b.debug.rem_count++;
1310                         h->b.debug.last_rem_idx = idx;
1311                 }
1312 #endif
1313                 e->b.key = key;
1314                 e->value = value;
1315                 hashmap_set_dirty(h);
1316 
1317                 return 0;
1318         }
1319 
1320         e = &bucket_at_swap(&swap, IDX_PUT)->p;
1321         e->b.key = key;
1322         e->value = value;
1323         return hashmap_put_boldly(h, hash, &swap, true);
1324 }
1325 
1326 int hashmap_update(Hashmap *h, const void *key, void *value) {
1327         struct plain_hashmap_entry *e;
1328         unsigned hash, idx;
1329 
1330         assert(h);
1331 
1332         hash = bucket_hash(h, key);
1333         idx = bucket_scan(h, hash, key);
1334         if (idx == IDX_NIL)
1335                 return -ENOENT;
1336 
1337         e = plain_bucket_at(h, idx);
1338         e->value = value;
1339         hashmap_set_dirty(h);
1340 
1341         return 0;
1342 }
1343 
1344 void* _hashmap_get(HashmapBase *h, const void *key) {
1345         struct hashmap_base_entry *e;
1346         unsigned hash, idx;
1347 
1348         if (!h)
1349                 return NULL;
1350 
1351         hash = bucket_hash(h, key);
1352         idx = bucket_scan(h, hash, key);
1353         if (idx == IDX_NIL)
1354                 return NULL;
1355 
1356         e = bucket_at(h, idx);
1357         return entry_value(h, e);
1358 }
1359 
1360 void* hashmap_get2(Hashmap *h, const void *key, void **key2) {
1361         struct plain_hashmap_entry *e;
1362         unsigned hash, idx;
1363 
1364         if (!h)
1365                 return NULL;
1366 
1367         hash = bucket_hash(h, key);
1368         idx = bucket_scan(h, hash, key);
1369         if (idx == IDX_NIL)
1370                 return NULL;
1371 
1372         e = plain_bucket_at(h, idx);
1373         if (key2)
1374                 *key2 = (void*) e->b.key;
1375 
1376         return e->value;
1377 }
1378 
1379 bool _hashmap_contains(HashmapBase *h, const void *key) {
1380         unsigned hash;
1381 
1382         if (!h)
1383                 return false;
1384 
1385         hash = bucket_hash(h, key);
1386         return bucket_scan(h, hash, key) != IDX_NIL;
1387 }
1388 
_hashmap_remove(HashmapBase * h,const void * key)1389 void* _hashmap_remove(HashmapBase *h, const void *key) {
1390         struct hashmap_base_entry *e;
1391         unsigned hash, idx;
1392         void *data;
1393 
1394         if (!h)
1395                 return NULL;
1396 
1397         hash = bucket_hash(h, key);
1398         idx = bucket_scan(h, hash, key);
1399         if (idx == IDX_NIL)
1400                 return NULL;
1401 
1402         e = bucket_at(h, idx);
1403         data = entry_value(h, e);
1404         remove_entry(h, idx);
1405 
1406         return data;
1407 }
1408 
hashmap_remove2(Hashmap * h,const void * key,void ** rkey)1409 void* hashmap_remove2(Hashmap *h, const void *key, void **rkey) {
1410         struct plain_hashmap_entry *e;
1411         unsigned hash, idx;
1412         void *data;
1413 
1414         if (!h) {
1415                 if (rkey)
1416                         *rkey = NULL;
1417                 return NULL;
1418         }
1419 
1420         hash = bucket_hash(h, key);
1421         idx = bucket_scan(h, hash, key);
1422         if (idx == IDX_NIL) {
1423                 if (rkey)
1424                         *rkey = NULL;
1425                 return NULL;
1426         }
1427 
1428         e = plain_bucket_at(h, idx);
1429         data = e->value;
1430         if (rkey)
1431                 *rkey = (void*) e->b.key;
1432 
1433         remove_entry(h, idx);
1434 
1435         return data;
1436 }
1437 
hashmap_remove_and_put(Hashmap * h,const void * old_key,const void * new_key,void * value)1438 int hashmap_remove_and_put(Hashmap *h, const void *old_key, const void *new_key, void *value) {
1439         struct swap_entries swap;
1440         struct plain_hashmap_entry *e;
1441         unsigned old_hash, new_hash, idx;
1442 
1443         if (!h)
1444                 return -ENOENT;
1445 
1446         old_hash = bucket_hash(h, old_key);
1447         idx = bucket_scan(h, old_hash, old_key);
1448         if (idx == IDX_NIL)
1449                 return -ENOENT;
1450 
1451         new_hash = bucket_hash(h, new_key);
1452         if (bucket_scan(h, new_hash, new_key) != IDX_NIL)
1453                 return -EEXIST;
1454 
1455         remove_entry(h, idx);
1456 
1457         e = &bucket_at_swap(&swap, IDX_PUT)->p;
1458         e->b.key = new_key;
1459         e->value = value;
1460         assert_se(hashmap_put_boldly(h, new_hash, &swap, false) == 1);
1461 
1462         return 0;
1463 }
1464 
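/* Example (illustrative sketch): re-keying an entry with hashmap_remove_and_put() above,
 * assuming string keys and a hypothetical 'value'. The map is left unchanged on failure:
 * -ENOENT if the old key is absent, -EEXIST if the new key is already taken.
 *
 *         r = hashmap_remove_and_put(h, "old-name", "new-name", value);
 *         if (r < 0)
 *                 return r;
 */
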
int set_remove_and_put(Set *s, const void *old_key, const void *new_key) {
        struct swap_entries swap;
        struct hashmap_base_entry *e;
        unsigned old_hash, new_hash, idx;

        if (!s)
                return -ENOENT;

        old_hash = bucket_hash(s, old_key);
        idx = bucket_scan(s, old_hash, old_key);
        if (idx == IDX_NIL)
                return -ENOENT;

        new_hash = bucket_hash(s, new_key);
        if (bucket_scan(s, new_hash, new_key) != IDX_NIL)
                return -EEXIST;

        remove_entry(s, idx);

        e = &bucket_at_swap(&swap, IDX_PUT)->p.b;
        e->key = new_key;
        assert_se(hashmap_put_boldly(s, new_hash, &swap, false) == 1);

        return 0;
}

int hashmap_remove_and_replace(Hashmap *h, const void *old_key, const void *new_key, void *value) {
        struct swap_entries swap;
        struct plain_hashmap_entry *e;
        unsigned old_hash, new_hash, idx_old, idx_new;

        if (!h)
                return -ENOENT;

        old_hash = bucket_hash(h, old_key);
        idx_old = bucket_scan(h, old_hash, old_key);
        if (idx_old == IDX_NIL)
                return -ENOENT;

        old_key = bucket_at(HASHMAP_BASE(h), idx_old)->key;

        new_hash = bucket_hash(h, new_key);
        idx_new = bucket_scan(h, new_hash, new_key);
        if (idx_new != IDX_NIL)
                if (idx_old != idx_new) {
                        remove_entry(h, idx_new);
                        /* Compensate for a possible backward shift: if the removed entry preceded
                         * the old entry in its probe chain, the backward shift deletion has moved
                         * the old entry one bucket back. Detect that via the saved key pointer
                         * and follow it. */
                        if (old_key != bucket_at(HASHMAP_BASE(h), idx_old)->key)
                                idx_old = prev_idx(HASHMAP_BASE(h), idx_old);
                        assert(old_key == bucket_at(HASHMAP_BASE(h), idx_old)->key);
                }

        remove_entry(h, idx_old);

        e = &bucket_at_swap(&swap, IDX_PUT)->p;
        e->b.key = new_key;
        e->value = value;
        assert_se(hashmap_put_boldly(h, new_hash, &swap, false) == 1);

        return 0;
}

void* _hashmap_remove_value(HashmapBase *h, const void *key, void *value) {
        struct hashmap_base_entry *e;
        unsigned hash, idx;

        if (!h)
                return NULL;

        hash = bucket_hash(h, key);
        idx = bucket_scan(h, hash, key);
        if (idx == IDX_NIL)
                return NULL;

        e = bucket_at(h, idx);
        if (entry_value(h, e) != value)
                return NULL;

        remove_entry(h, idx);

        return value;
}

static unsigned find_first_entry(HashmapBase *h) {
        Iterator i = ITERATOR_FIRST;

        if (!h || !n_entries(h))
                return IDX_NIL;

        return hashmap_iterate_entry(h, &i);
}

void* _hashmap_first_key_and_value(HashmapBase *h, bool remove, void **ret_key) {
        struct hashmap_base_entry *e;
        void *key, *data;
        unsigned idx;

        idx = find_first_entry(h);
        if (idx == IDX_NIL) {
                if (ret_key)
                        *ret_key = NULL;
                return NULL;
        }

        e = bucket_at(h, idx);
        key = (void*) e->key;
        data = entry_value(h, e);

        if (remove)
                remove_entry(h, idx);

        if (ret_key)
                *ret_key = key;

        return data;
}

unsigned _hashmap_size(HashmapBase *h) {
        if (!h)
                return 0;

        return n_entries(h);
}

unsigned _hashmap_buckets(HashmapBase *h) {
        if (!h)
                return 0;

        return n_buckets(h);
}

int _hashmap_merge(Hashmap *h, Hashmap *other) {
        Iterator i;
        unsigned idx;

        assert(h);

        HASHMAP_FOREACH_IDX(idx, HASHMAP_BASE(other), i) {
                struct plain_hashmap_entry *pe = plain_bucket_at(other, idx);
                int r;

                r = hashmap_put(h, pe->b.key, pe->value);
                if (r < 0 && r != -EEXIST)
                        return r;
        }

        return 0;
}

int set_merge(Set *s, Set *other) {
        Iterator i;
        unsigned idx;

        assert(s);

        HASHMAP_FOREACH_IDX(idx, HASHMAP_BASE(other), i) {
                struct set_entry *se = set_bucket_at(other, idx);
                int r;

                r = set_put(s, se->b.key);
                if (r < 0)
                        return r;
        }

        return 0;
}

int _hashmap_reserve(HashmapBase *h, unsigned entries_add) {
        int r;

        assert(h);

        r = resize_buckets(h, entries_add);
        if (r < 0)
                return r;

        return 0;
}

/*
 * The same as hashmap_merge(), but every new item from other is moved to h.
 * Keys already in h are skipped and stay in other.
 * Returns: 0 on success.
 *          -ENOMEM on alloc failure, in which case no move has been done.
 */
int _hashmap_move(HashmapBase *h, HashmapBase *other) {
        struct swap_entries swap;
        struct hashmap_base_entry *e, *n;
        Iterator i;
        unsigned idx;
        int r;

        assert(h);

        if (!other)
                return 0;

        assert(other->type == h->type);

        /*
         * This reserves buckets for the worst case, where none of other's
         * entries are yet present in h. This is preferable to risking
         * an allocation failure in the middle of the moving and having to
         * roll back or return a partial result.
         */
        r = resize_buckets(h, n_entries(other));
        if (r < 0)
                return r;

        HASHMAP_FOREACH_IDX(idx, other, i) {
                unsigned h_hash;

                e = bucket_at(other, idx);
                h_hash = bucket_hash(h, e->key);
                if (bucket_scan(h, h_hash, e->key) != IDX_NIL)
                        continue;

                n = &bucket_at_swap(&swap, IDX_PUT)->p.b;
                n->key = e->key;
                if (h->type != HASHMAP_TYPE_SET)
                        ((struct plain_hashmap_entry*) n)->value =
                                ((struct plain_hashmap_entry*) e)->value;
                assert_se(hashmap_put_boldly(h, h_hash, &swap, false) == 1);

                remove_entry(other, idx);
        }

        return 0;
}

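/* Example (illustrative sketch): bulk move with the hashmap_move() wrapper assumed to be
 * declared in hashmap.h. Entries whose keys already exist in the destination are skipped and
 * remain in the source, so the caller can inspect the leftovers afterwards.
 *
 *         r = hashmap_move(dest, src);
 *         if (r < 0)
 *                 return r;                  // -ENOMEM, nothing has been moved
 *         n_conflicts = hashmap_size(src);   // hypothetical bookkeeping of skipped entries
 */
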
int _hashmap_move_one(HashmapBase *h, HashmapBase *other, const void *key) {
        struct swap_entries swap;
        unsigned h_hash, other_hash, idx;
        struct hashmap_base_entry *e, *n;
        int r;

        assert(h);

        h_hash = bucket_hash(h, key);
        if (bucket_scan(h, h_hash, key) != IDX_NIL)
                return -EEXIST;

        if (!other)
                return -ENOENT;

        assert(other->type == h->type);

        other_hash = bucket_hash(other, key);
        idx = bucket_scan(other, other_hash, key);
        if (idx == IDX_NIL)
                return -ENOENT;

        e = bucket_at(other, idx);

        n = &bucket_at_swap(&swap, IDX_PUT)->p.b;
        n->key = e->key;
        if (h->type != HASHMAP_TYPE_SET)
                ((struct plain_hashmap_entry*) n)->value =
                        ((struct plain_hashmap_entry*) e)->value;
        r = hashmap_put_boldly(h, h_hash, &swap, true);
        if (r < 0)
                return r;

        remove_entry(other, idx);
        return 0;
}

HashmapBase* _hashmap_copy(HashmapBase *h  HASHMAP_DEBUG_PARAMS) {
        HashmapBase *copy;
        int r;

        assert(h);

        copy = hashmap_base_new(h->hash_ops, h->type  HASHMAP_DEBUG_PASS_ARGS);
        if (!copy)
                return NULL;

        switch (h->type) {
        case HASHMAP_TYPE_PLAIN:
        case HASHMAP_TYPE_ORDERED:
                r = hashmap_merge((Hashmap*)copy, (Hashmap*)h);
                break;
        case HASHMAP_TYPE_SET:
                r = set_merge((Set*)copy, (Set*)h);
                break;
        default:
                assert_not_reached();
        }

        if (r < 0)
                return _hashmap_free(copy, false, false);

        return copy;
}

char** _hashmap_get_strv(HashmapBase *h) {
        char **sv;
        Iterator i;
        unsigned idx, n;

        if (!h)
                return new0(char*, 1);

        sv = new(char*, n_entries(h)+1);
        if (!sv)
                return NULL;

        n = 0;
        HASHMAP_FOREACH_IDX(idx, h, i)
                sv[n++] = entry_value(h, bucket_at(h, idx));
        sv[n] = NULL;

        return sv;
}

void* ordered_hashmap_next(OrderedHashmap *h, const void *key) {
        struct ordered_hashmap_entry *e;
        unsigned hash, idx;

        if (!h)
                return NULL;

        hash = bucket_hash(h, key);
        idx = bucket_scan(h, hash, key);
        if (idx == IDX_NIL)
                return NULL;

        e = ordered_bucket_at(h, idx);
        if (e->iterate_next == IDX_NIL)
                return NULL;
        return ordered_bucket_at(h, e->iterate_next)->p.value;
}

int set_consume(Set *s, void *value) {
        int r;

        assert(s);
        assert(value);

        r = set_put(s, value);
        if (r <= 0)
                free(value);

        return r;
}

int _hashmap_put_strdup_full(Hashmap **h, const struct hash_ops *hash_ops, const char *k, const char *v  HASHMAP_DEBUG_PARAMS) {
        int r;

        r = _hashmap_ensure_allocated(h, hash_ops  HASHMAP_DEBUG_PASS_ARGS);
        if (r < 0)
                return r;

        _cleanup_free_ char *kdup = NULL, *vdup = NULL;

        kdup = strdup(k);
        if (!kdup)
                return -ENOMEM;

        if (v) {
                vdup = strdup(v);
                if (!vdup)
                        return -ENOMEM;
        }

        r = hashmap_put(*h, kdup, vdup);
        if (r < 0) {
                if (r == -EEXIST && streq_ptr(v, hashmap_get(*h, kdup)))
                        return 0;
                return r;
        }

        /* A return of 0 with non-NULL vdup would mean vdup is already stored in the hashmap,
         * which cannot happen for a freshly allocated string. */
        assert(vdup == NULL || r > 0);
        if (r > 0)
                kdup = vdup = NULL;

        return r;
}

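/* Example (illustrative sketch): storing copies of both strings via the hashmap_put_strdup()
 * wrapper assumed to be declared in hashmap.h; the caller keeps ownership of its own buffers.
 * Re-inserting an identical key/value pair returns 0, while the same key with a different value
 * fails with -EEXIST (see the streq_ptr() check above).
 *
 *         r = hashmap_put_strdup(&env, "PATH", "/usr/bin");   // 'env' is a hypothetical Hashmap*
 *         if (r < 0)
 *                 return r;
 */
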
int _set_put_strdup_full(Set **s, const struct hash_ops *hash_ops, const char *p  HASHMAP_DEBUG_PARAMS) {
        char *c;
        int r;

        assert(s);
        assert(p);

        r = _set_ensure_allocated(s, hash_ops  HASHMAP_DEBUG_PASS_ARGS);
        if (r < 0)
                return r;

        if (set_contains(*s, (char*) p))
                return 0;

        c = strdup(p);
        if (!c)
                return -ENOMEM;

        return set_consume(*s, c);
}

int _set_put_strdupv_full(Set **s, const struct hash_ops *hash_ops, char **l  HASHMAP_DEBUG_PARAMS) {
        int n = 0, r;

        assert(s);

        STRV_FOREACH(i, l) {
                r = _set_put_strdup_full(s, hash_ops, *i  HASHMAP_DEBUG_PASS_ARGS);
                if (r < 0)
                        return r;

                n += r;
        }

        return n;
}

int set_put_strsplit(Set *s, const char *v, const char *separators, ExtractFlags flags) {
        const char *p = v;
        int r;

        assert(s);
        assert(v);

        for (;;) {
                char *word;

                r = extract_first_word(&p, &word, separators, flags);
                if (r <= 0)
                        return r;

                r = set_consume(s, word);
                if (r < 0)
                        return r;
        }
}

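/* Example (illustrative sketch): filling a set from a separated string with set_put_strsplit()
 * above, assuming 's' was allocated with hash_ops that free the keys and that WHITESPACE is the
 * separator macro from string-util.h.
 *
 *         r = set_put_strsplit(s, "eth0 eth1  lo", WHITESPACE, 0);   // stores "eth0", "eth1", "lo"
 *         if (r < 0)
 *                 return r;
 */
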
/* expand the cachemem if needed, return true if newly (re)activated. */
static int cachemem_maintain(CacheMem *mem, size_t size) {
        assert(mem);

        if (!GREEDY_REALLOC(mem->ptr, size)) {
                if (size > 0)
                        return -ENOMEM;
        }

        if (!mem->active) {
                mem->active = true;
                return true;
        }

        return false;
}

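/* Return flat arrays of the hashmap's keys and/or values. The arrays are rebuilt only when the
 * corresponding cache has just been (re)activated or the underlying hashmap was modified (its
 * 'dirty' flag is set) since the last call; passing NULL for res_keys or res_values deactivates
 * that part of the cache. */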
int iterated_cache_get(IteratedCache *cache, const void ***res_keys, const void ***res_values, unsigned *res_n_entries) {
        bool sync_keys = false, sync_values = false;
        size_t size;
        int r;

        assert(cache);
        assert(cache->hashmap);

        size = n_entries(cache->hashmap);

        if (res_keys) {
                r = cachemem_maintain(&cache->keys, size);
                if (r < 0)
                        return r;

                sync_keys = r;
        } else
                cache->keys.active = false;

        if (res_values) {
                r = cachemem_maintain(&cache->values, size);
                if (r < 0)
                        return r;

                sync_values = r;
        } else
                cache->values.active = false;

        if (cache->hashmap->dirty) {
                if (cache->keys.active)
                        sync_keys = true;
                if (cache->values.active)
                        sync_values = true;

                cache->hashmap->dirty = false;
        }

        if (sync_keys || sync_values) {
                unsigned i, idx;
                Iterator iter;

                i = 0;
                HASHMAP_FOREACH_IDX(idx, cache->hashmap, iter) {
                        struct hashmap_base_entry *e;

                        e = bucket_at(cache->hashmap, idx);

                        if (sync_keys)
                                cache->keys.ptr[i] = e->key;
                        if (sync_values)
                                cache->values.ptr[i] = entry_value(cache->hashmap, e);
                        i++;
                }
        }

        if (res_keys)
                *res_keys = cache->keys.ptr;
        if (res_values)
                *res_values = cache->values.ptr;
        if (res_n_entries)
                *res_n_entries = size;

        return 0;
}

IteratedCache* iterated_cache_free(IteratedCache *cache) {
        if (cache) {
                free(cache->keys.ptr);
                free(cache->values.ptr);
        }

        return mfree(cache);
}

int set_strjoin(Set *s, const char *separator, bool wrap_with_separator, char **ret) {
        _cleanup_free_ char *str = NULL;
        size_t separator_len, len = 0;
        const char *value;
        bool first;

        assert(ret);

        if (set_isempty(s)) {
                *ret = NULL;
                return 0;
        }

        separator_len = strlen_ptr(separator);

        if (separator_len == 0)
                wrap_with_separator = false;

        first = !wrap_with_separator;

        SET_FOREACH(value, s) {
                size_t l = strlen_ptr(value);

                if (l == 0)
                        continue;

                if (!GREEDY_REALLOC(str, len + l + (first ? 0 : separator_len) + (wrap_with_separator ? separator_len : 0) + 1))
                        return -ENOMEM;

                if (separator_len > 0 && !first) {
                        memcpy(str + len, separator, separator_len);
                        len += separator_len;
                }

                memcpy(str + len, value, l);
                len += l;
                first = false;
        }

        if (wrap_with_separator) {
                memcpy(str + len, separator, separator_len);
                len += separator_len;
        }

        str[len] = '\0';

        *ret = TAKE_PTR(str);
        return 0;
}

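/* Example (illustrative sketch): joining a set of strings with set_strjoin() above. Iteration
 * order is unspecified, an empty set yields *ret == NULL, and with wrap_with_separator the
 * result additionally starts and ends with the separator.
 *
 *         _cleanup_free_ char *joined = NULL;
 *         r = set_strjoin(s, ",", false, &joined);   // e.g. "b,a,c" for a set of "a", "b", "c"
 *         if (r < 0)
 *                 return r;
 */
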
bool set_equal(Set *a, Set *b) {
        void *p;

        /* Checks whether each entry of 'a' is also in 'b' and vice versa, i.e. the two sets contain the same
         * entries */

        if (a == b)
                return true;

        if (set_isempty(a) && set_isempty(b))
                return true;

        if (set_size(a) != set_size(b)) /* Cheap check that hopefully catches a lot of inequality cases
                                         * already */
                return false;

        SET_FOREACH(p, a)
                if (!set_contains(b, p))
                        return false;

        /* If we have the same hashops, then we don't need to check things backwards given we compared the
         * size and that all of a is in b. */
        if (a->b.hash_ops == b->b.hash_ops)
                return true;

        SET_FOREACH(p, b)
                if (!set_contains(a, p))
                        return false;

        return true;
}

static bool set_fnmatch_one(Set *patterns, const char *needle) {
        const char *p;

        assert(needle);

        SET_FOREACH(p, patterns)
                if (fnmatch(p, needle, 0) == 0)
                        return true;

        return false;
}

bool set_fnmatch(Set *include_patterns, Set *exclude_patterns, const char *needle) {
        assert(needle);

        if (set_fnmatch_one(exclude_patterns, needle))
                return false;

        if (set_isempty(include_patterns))
                return true;

        return set_fnmatch_one(include_patterns, needle);
}

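/* Example (illustrative sketch): include/exclude filtering with set_fnmatch() above, where both
 * arguments are hypothetical sets of glob patterns. Exclude patterns always win; an empty (or
 * NULL) include set matches everything that is not excluded.
 *
 *         if (set_fnmatch(include_patterns, exclude_patterns, "eth0"))
 *                 ... ;   // "eth0" passed the filter
 */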