| |
1 /* |
| |
2 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS HEADER. |
| |
3 * |
| |
4 * Copyright 2021 Mike Becker, Olaf Wintermann All rights reserved. |
| |
5 * |
| |
6 * Redistribution and use in source and binary forms, with or without |
| |
7 * modification, are permitted provided that the following conditions are met: |
| |
8 * |
| |
9 * 1. Redistributions of source code must retain the above copyright |
| |
10 * notice, this list of conditions and the following disclaimer. |
| |
11 * |
| |
12 * 2. Redistributions in binary form must reproduce the above copyright |
| |
13 * notice, this list of conditions and the following disclaimer in the |
| |
14 * documentation and/or other materials provided with the distribution. |
| |
15 * |
| |
16 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" |
| |
17 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE |
| |
18 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE |
| |
19 * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE |
| |
20 * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR |
| |
21 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF |
| |
22 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS |
| |
23 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN |
| |
24 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) |
| |
25 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE |
| |
26 * POSSIBILITY OF SUCH DAMAGE. |
| |
27 */ |
| |
28 |
| |
29 #include "cx/hash_map.h" |
| |
30 #include "cx/utils.h" |
| |
31 |
| |
32 #include <string.h> |
| |
33 #include <assert.h> |
| |
34 |
| |
35 struct cx_hash_map_element_s { |
| |
36 /** A pointer to the next element in the current bucket. */ |
| |
37 struct cx_hash_map_element_s *next; |
| |
38 |
| |
39 /** The corresponding key. */ |
| |
40 CxHashKey key; |
| |
41 |
| |
42 /** The value data. */ |
| |
43 char data[]; |
| |
44 }; |
| |
45 |
| |
46 static void cx_hash_map_clear(struct cx_map_s *map) { |
| |
47 struct cx_hash_map_s *hash_map = (struct cx_hash_map_s *) map; |
| |
48 cx_for_n(i, hash_map->bucket_count) { |
| |
49 struct cx_hash_map_element_s *elem = hash_map->buckets[i]; |
| |
50 if (elem != NULL) { |
| |
51 do { |
| |
52 struct cx_hash_map_element_s *next = elem->next; |
| |
53 // invoke the destructor |
| |
54 cx_invoke_destructor(map, elem->data); |
| |
55 // free the key data |
| |
56 cxFree(map->collection.allocator, (void *) elem->key.data); |
| |
57 // free the node |
| |
58 cxFree(map->collection.allocator, elem); |
| |
59 // proceed |
| |
60 elem = next; |
| |
61 } while (elem != NULL); |
| |
62 |
| |
63 // do not leave a dangling pointer |
| |
64 hash_map->buckets[i] = NULL; |
| |
65 } |
| |
66 } |
| |
67 map->collection.size = 0; |
| |
68 } |
| |
69 |
| |
70 static void cx_hash_map_destructor(struct cx_map_s *map) { |
| |
71 struct cx_hash_map_s *hash_map = (struct cx_hash_map_s *) map; |
| |
72 |
| |
73 // free the buckets |
| |
74 cx_hash_map_clear(map); |
| |
75 cxFree(map->collection.allocator, hash_map->buckets); |
| |
76 |
| |
77 // free the map structure |
| |
78 cxFree(map->collection.allocator, map); |
| |
79 } |
| |
80 |
| |
81 static int cx_hash_map_put( |
| |
82 CxMap *map, |
| |
83 CxHashKey key, |
| |
84 void *value |
| |
85 ) { |
| |
86 struct cx_hash_map_s *hash_map = (struct cx_hash_map_s *) map; |
| |
87 CxAllocator const *allocator = map->collection.allocator; |
| |
88 |
| |
89 unsigned hash = key.hash; |
| |
90 if (hash == 0) { |
| |
91 cx_hash_murmur(&key); |
| |
92 hash = key.hash; |
| |
93 } |
| |
94 |
| |
95 size_t slot = hash % hash_map->bucket_count; |
| |
96 struct cx_hash_map_element_s *elm = hash_map->buckets[slot]; |
| |
97 struct cx_hash_map_element_s *prev = NULL; |
| |
98 |
| |
99 while (elm != NULL && elm->key.hash < hash) { |
| |
100 prev = elm; |
| |
101 elm = elm->next; |
| |
102 } |
| |
103 |
| |
104 if (elm != NULL && elm->key.hash == hash && elm->key.len == key.len && |
| |
105 memcmp(elm->key.data, key.data, key.len) == 0) { |
| |
106 // overwrite existing element |
| |
107 if (map->collection.store_pointer) { |
| |
108 memcpy(elm->data, &value, sizeof(void *)); |
| |
109 } else { |
| |
110 memcpy(elm->data, value, map->collection.elem_size); |
| |
111 } |
| |
112 } else { |
| |
113 // allocate new element |
| |
114 struct cx_hash_map_element_s *e = cxMalloc( |
| |
115 allocator, |
| |
116 sizeof(struct cx_hash_map_element_s) + map->collection.elem_size |
| |
117 ); |
| |
118 if (e == NULL) { |
| |
119 return -1; |
| |
120 } |
| |
121 |
| |
122 // write the value |
| |
123 if (map->collection.store_pointer) { |
| |
124 memcpy(e->data, &value, sizeof(void *)); |
| |
125 } else { |
| |
126 memcpy(e->data, value, map->collection.elem_size); |
| |
127 } |
| |
128 |
| |
129 // copy the key |
| |
130 void *kd = cxMalloc(allocator, key.len); |
| |
131 if (kd == NULL) { |
| |
132 return -1; |
| |
133 } |
| |
134 memcpy(kd, key.data, key.len); |
| |
135 e->key.data = kd; |
| |
136 e->key.len = key.len; |
| |
137 e->key.hash = hash; |
| |
138 |
| |
139 // insert the element into the linked list |
| |
140 if (prev == NULL) { |
| |
141 hash_map->buckets[slot] = e; |
| |
142 } else { |
| |
143 prev->next = e; |
| |
144 } |
| |
145 e->next = elm; |
| |
146 |
| |
147 // increase the size |
| |
148 map->collection.size++; |
| |
149 } |
| |
150 |
| |
151 return 0; |
| |
152 } |
| |
153 |
| |
154 static void cx_hash_map_unlink( |
| |
155 struct cx_hash_map_s *hash_map, |
| |
156 size_t slot, |
| |
157 struct cx_hash_map_element_s *prev, |
| |
158 struct cx_hash_map_element_s *elm |
| |
159 ) { |
| |
160 // unlink |
| |
161 if (prev == NULL) { |
| |
162 hash_map->buckets[slot] = elm->next; |
| |
163 } else { |
| |
164 prev->next = elm->next; |
| |
165 } |
| |
166 // free element |
| |
167 cxFree(hash_map->base.collection.allocator, (void *) elm->key.data); |
| |
168 cxFree(hash_map->base.collection.allocator, elm); |
| |
169 // decrease size |
| |
170 hash_map->base.collection.size--; |
| |
171 } |
| |
172 |
| |
173 /** |
| |
174 * Helper function to avoid code duplication. |
| |
175 * |
| |
176 * @param map the map |
| |
177 * @param key the key to look up |
| |
178 * @param remove flag indicating whether the looked up entry shall be removed |
| |
179 * @param destroy flag indicating whether the destructor shall be invoked |
| |
180 * @return a pointer to the value corresponding to the key or \c NULL |
| |
181 */ |
| |
182 static void *cx_hash_map_get_remove( |
| |
183 CxMap *map, |
| |
184 CxHashKey key, |
| |
185 bool remove, |
| |
186 bool destroy |
| |
187 ) { |
| |
188 struct cx_hash_map_s *hash_map = (struct cx_hash_map_s *) map; |
| |
189 |
| |
190 unsigned hash = key.hash; |
| |
191 if (hash == 0) { |
| |
192 cx_hash_murmur(&key); |
| |
193 hash = key.hash; |
| |
194 } |
| |
195 |
| |
196 size_t slot = hash % hash_map->bucket_count; |
| |
197 struct cx_hash_map_element_s *elm = hash_map->buckets[slot]; |
| |
198 struct cx_hash_map_element_s *prev = NULL; |
| |
199 while (elm && elm->key.hash <= hash) { |
| |
200 if (elm->key.hash == hash && elm->key.len == key.len) { |
| |
201 if (memcmp(elm->key.data, key.data, key.len) == 0) { |
| |
202 void *data = NULL; |
| |
203 if (destroy) { |
| |
204 cx_invoke_destructor(map, elm->data); |
| |
205 } else { |
| |
206 if (map->collection.store_pointer) { |
| |
207 data = *(void **) elm->data; |
| |
208 } else { |
| |
209 data = elm->data; |
| |
210 } |
| |
211 } |
| |
212 if (remove) { |
| |
213 cx_hash_map_unlink(hash_map, slot, prev, elm); |
| |
214 } |
| |
215 return data; |
| |
216 } |
| |
217 } |
| |
218 prev = elm; |
| |
219 elm = prev->next; |
| |
220 } |
| |
221 |
| |
222 return NULL; |
| |
223 } |
| |
224 |
| |
225 static void *cx_hash_map_get( |
| |
226 CxMap const *map, |
| |
227 CxHashKey key |
| |
228 ) { |
| |
229 // we can safely cast, because we know the map stays untouched |
| |
230 return cx_hash_map_get_remove((CxMap *) map, key, false, false); |
| |
231 } |
| |
232 |
| |
233 static void *cx_hash_map_remove( |
| |
234 CxMap *map, |
| |
235 CxHashKey key, |
| |
236 bool destroy |
| |
237 ) { |
| |
238 return cx_hash_map_get_remove(map, key, true, destroy); |
| |
239 } |
| |
240 |
| |
241 static void *cx_hash_map_iter_current_entry(void const *it) { |
| |
242 struct cx_iterator_s const *iter = it; |
| |
243 // struct has to have a compatible signature |
| |
244 return (struct cx_map_entry_s *) &(iter->kv_data); |
| |
245 } |
| |
246 |
| |
247 static void *cx_hash_map_iter_current_key(void const *it) { |
| |
248 struct cx_iterator_s const *iter = it; |
| |
249 struct cx_hash_map_element_s *elm = iter->elem_handle; |
| |
250 return &elm->key; |
| |
251 } |
| |
252 |
| |
253 static void *cx_hash_map_iter_current_value(void const *it) { |
| |
254 struct cx_iterator_s const *iter = it; |
| |
255 struct cx_hash_map_s const *map = iter->src_handle.c; |
| |
256 struct cx_hash_map_element_s *elm = iter->elem_handle; |
| |
257 if (map->base.collection.store_pointer) { |
| |
258 return *(void **) elm->data; |
| |
259 } else { |
| |
260 return elm->data; |
| |
261 } |
| |
262 } |
| |
263 |
| |
264 static bool cx_hash_map_iter_valid(void const *it) { |
| |
265 struct cx_iterator_s const *iter = it; |
| |
266 return iter->elem_handle != NULL; |
| |
267 } |
| |
268 |
| |
269 static void cx_hash_map_iter_next(void *it) { |
| |
270 struct cx_iterator_s *iter = it; |
| |
271 struct cx_hash_map_element_s *elm = iter->elem_handle; |
| |
272 struct cx_hash_map_s *map = iter->src_handle.m; |
| |
273 |
| |
274 // remove current element, if asked |
| |
275 if (iter->base.remove) { |
| |
276 |
| |
277 // clear the flag |
| |
278 iter->base.remove = false; |
| |
279 |
| |
280 // determine the next element |
| |
281 struct cx_hash_map_element_s *next = elm->next; |
| |
282 |
| |
283 // search the previous element |
| |
284 struct cx_hash_map_element_s *prev = NULL; |
| |
285 if (map->buckets[iter->slot] != elm) { |
| |
286 prev = map->buckets[iter->slot]; |
| |
287 while (prev->next != elm) { |
| |
288 prev = prev->next; |
| |
289 } |
| |
290 } |
| |
291 |
| |
292 // destroy |
| |
293 cx_invoke_destructor((struct cx_map_s *) map, elm->data); |
| |
294 |
| |
295 // unlink |
| |
296 cx_hash_map_unlink(map, iter->slot, prev, elm); |
| |
297 |
| |
298 // advance |
| |
299 elm = next; |
| |
300 } else { |
| |
301 // just advance |
| |
302 elm = elm->next; |
| |
303 iter->index++; |
| |
304 } |
| |
305 |
| |
306 // search the next bucket, if required |
| |
307 while (elm == NULL && ++iter->slot < map->bucket_count) { |
| |
308 elm = map->buckets[iter->slot]; |
| |
309 } |
| |
310 |
| |
311 // fill the struct with the next element |
| |
312 iter->elem_handle = elm; |
| |
313 if (elm == NULL) { |
| |
314 iter->kv_data.key = NULL; |
| |
315 iter->kv_data.value = NULL; |
| |
316 } else { |
| |
317 iter->kv_data.key = &elm->key; |
| |
318 if (map->base.collection.store_pointer) { |
| |
319 iter->kv_data.value = *(void **) elm->data; |
| |
320 } else { |
| |
321 iter->kv_data.value = elm->data; |
| |
322 } |
| |
323 } |
| |
324 } |
| |
325 |
| |
326 static CxIterator cx_hash_map_iterator( |
| |
327 CxMap const *map, |
| |
328 enum cx_map_iterator_type type |
| |
329 ) { |
| |
330 CxIterator iter; |
| |
331 |
| |
332 iter.src_handle.c = map; |
| |
333 iter.elem_count = map->collection.size; |
| |
334 |
| |
335 switch (type) { |
| |
336 case CX_MAP_ITERATOR_PAIRS: |
| |
337 iter.elem_size = sizeof(CxMapEntry); |
| |
338 iter.base.current = cx_hash_map_iter_current_entry; |
| |
339 break; |
| |
340 case CX_MAP_ITERATOR_KEYS: |
| |
341 iter.elem_size = sizeof(CxHashKey); |
| |
342 iter.base.current = cx_hash_map_iter_current_key; |
| |
343 break; |
| |
344 case CX_MAP_ITERATOR_VALUES: |
| |
345 iter.elem_size = map->collection.elem_size; |
| |
346 iter.base.current = cx_hash_map_iter_current_value; |
| |
347 break; |
| |
348 default: |
| |
349 assert(false); |
| |
350 } |
| |
351 |
| |
352 iter.base.valid = cx_hash_map_iter_valid; |
| |
353 iter.base.next = cx_hash_map_iter_next; |
| |
354 iter.base.remove = false; |
| |
355 iter.base.mutating = false; |
| |
356 |
| |
357 iter.slot = 0; |
| |
358 iter.index = 0; |
| |
359 |
| |
360 if (map->collection.size > 0) { |
| |
361 struct cx_hash_map_s *hash_map = (struct cx_hash_map_s *) map; |
| |
362 struct cx_hash_map_element_s *elm = hash_map->buckets[0]; |
| |
363 while (elm == NULL) { |
| |
364 elm = hash_map->buckets[++iter.slot]; |
| |
365 } |
| |
366 iter.elem_handle = elm; |
| |
367 iter.kv_data.key = &elm->key; |
| |
368 if (map->collection.store_pointer) { |
| |
369 iter.kv_data.value = *(void **) elm->data; |
| |
370 } else { |
| |
371 iter.kv_data.value = elm->data; |
| |
372 } |
| |
373 } else { |
| |
374 iter.elem_handle = NULL; |
| |
375 iter.kv_data.key = NULL; |
| |
376 iter.kv_data.value = NULL; |
| |
377 } |
| |
378 |
| |
379 return iter; |
| |
380 } |
| |
381 |
| |
382 static cx_map_class cx_hash_map_class = { |
| |
383 cx_hash_map_destructor, |
| |
384 cx_hash_map_clear, |
| |
385 cx_hash_map_put, |
| |
386 cx_hash_map_get, |
| |
387 cx_hash_map_remove, |
| |
388 cx_hash_map_iterator, |
| |
389 }; |
| |
390 |
| |
391 CxMap *cxHashMapCreate( |
| |
392 CxAllocator const *allocator, |
| |
393 size_t itemsize, |
| |
394 size_t buckets |
| |
395 ) { |
| |
396 if (buckets == 0) { |
| |
397 // implementation defined default |
| |
398 buckets = 16; |
| |
399 } |
| |
400 |
| |
401 struct cx_hash_map_s *map = cxCalloc(allocator, 1, |
| |
402 sizeof(struct cx_hash_map_s)); |
| |
403 if (map == NULL) return NULL; |
| |
404 |
| |
405 // initialize hash map members |
| |
406 map->bucket_count = buckets; |
| |
407 map->buckets = cxCalloc(allocator, buckets, |
| |
408 sizeof(struct cx_hash_map_element_s *)); |
| |
409 if (map->buckets == NULL) { |
| |
410 cxFree(allocator, map); |
| |
411 return NULL; |
| |
412 } |
| |
413 |
| |
414 // initialize base members |
| |
415 map->base.cl = &cx_hash_map_class; |
| |
416 map->base.collection.allocator = allocator; |
| |
417 |
| |
418 if (itemsize > 0) { |
| |
419 map->base.collection.store_pointer = false; |
| |
420 map->base.collection.elem_size = itemsize; |
| |
421 } else { |
| |
422 map->base.collection.store_pointer = true; |
| |
423 map->base.collection.elem_size = sizeof(void *); |
| |
424 } |
| |
425 |
| |
426 return (CxMap *) map; |
| |
427 } |
| |
428 |
| |
429 int cxMapRehash(CxMap *map) { |
| |
430 struct cx_hash_map_s *hash_map = (struct cx_hash_map_s *) map; |
| |
431 if (map->collection.size > ((hash_map->bucket_count * 3) >> 2)) { |
| |
432 |
| |
433 size_t new_bucket_count = (map->collection.size * 5) >> 1; |
| |
434 struct cx_hash_map_element_s **new_buckets = cxCalloc( |
| |
435 map->collection.allocator, |
| |
436 new_bucket_count, sizeof(struct cx_hash_map_element_s *) |
| |
437 ); |
| |
438 |
| |
439 if (new_buckets == NULL) { |
| |
440 return 1; |
| |
441 } |
| |
442 |
| |
443 // iterate through the elements and assign them to their new slots |
| |
444 cx_for_n(slot, hash_map->bucket_count) { |
| |
445 struct cx_hash_map_element_s *elm = hash_map->buckets[slot]; |
| |
446 while (elm != NULL) { |
| |
447 struct cx_hash_map_element_s *next = elm->next; |
| |
448 size_t new_slot = elm->key.hash % new_bucket_count; |
| |
449 |
| |
450 // find position where to insert |
| |
451 struct cx_hash_map_element_s *bucket_next = new_buckets[new_slot]; |
| |
452 struct cx_hash_map_element_s *bucket_prev = NULL; |
| |
453 while (bucket_next != NULL && |
| |
454 bucket_next->key.hash < elm->key.hash) { |
| |
455 bucket_prev = bucket_next; |
| |
456 bucket_next = bucket_next->next; |
| |
457 } |
| |
458 |
| |
459 // insert |
| |
460 if (bucket_prev == NULL) { |
| |
461 elm->next = new_buckets[new_slot]; |
| |
462 new_buckets[new_slot] = elm; |
| |
463 } else { |
| |
464 bucket_prev->next = elm; |
| |
465 elm->next = bucket_next; |
| |
466 } |
| |
467 |
| |
468 // advance |
| |
469 elm = next; |
| |
470 } |
| |
471 } |
| |
472 |
| |
473 // assign result to the map |
| |
474 hash_map->bucket_count = new_bucket_count; |
| |
475 cxFree(map->collection.allocator, hash_map->buckets); |
| |
476 hash_map->buckets = new_buckets; |
| |
477 } |
| |
478 return 0; |
| |
479 } |