1 | /**************************************************************************/ |
2 | /* oa_hash_map.h */ |
3 | /**************************************************************************/ |
4 | /* This file is part of: */ |
5 | /* GODOT ENGINE */ |
6 | /* https://godotengine.org */ |
7 | /**************************************************************************/ |
8 | /* Copyright (c) 2014-present Godot Engine contributors (see AUTHORS.md). */ |
9 | /* Copyright (c) 2007-2014 Juan Linietsky, Ariel Manzur. */ |
10 | /* */ |
11 | /* Permission is hereby granted, free of charge, to any person obtaining */ |
12 | /* a copy of this software and associated documentation files (the */ |
13 | /* "Software"), to deal in the Software without restriction, including */ |
14 | /* without limitation the rights to use, copy, modify, merge, publish, */ |
15 | /* distribute, sublicense, and/or sell copies of the Software, and to */ |
16 | /* permit persons to whom the Software is furnished to do so, subject to */ |
17 | /* the following conditions: */ |
18 | /* */ |
19 | /* The above copyright notice and this permission notice shall be */ |
20 | /* included in all copies or substantial portions of the Software. */ |
21 | /* */ |
22 | /* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, */ |
23 | /* EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF */ |
24 | /* MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. */ |
25 | /* IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY */ |
26 | /* CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, */ |
27 | /* TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE */ |
28 | /* SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE. */ |
29 | /**************************************************************************/ |
30 | |
31 | #ifndef OA_HASH_MAP_H |
32 | #define OA_HASH_MAP_H |
33 | |
34 | #include "core/math/math_funcs.h" |
35 | #include "core/os/memory.h" |
36 | #include "core/templates/hashfuncs.h" |
37 | |
38 | /** |
39 | * A HashMap implementation that uses open addressing with Robin Hood hashing. |
40 | * Robin Hood hashing swaps out entries that have a smaller probing distance |
41 | * than the to-be-inserted entry, that evens out the average probing distance |
42 | * and enables faster lookups. Backward shift deletion is employed to further |
43 | * improve the performance and to avoid infinite loops in rare cases. |
44 | * |
45 | * The entries are stored inplace, so huge keys or values might fill cache lines |
46 | * a lot faster. |
47 | * |
48 | * Only used keys and values are constructed. For free positions there's space |
49 | * in the arrays for each, but that memory is kept uninitialized. |
50 | * |
51 | * The assignment operator copy the pairs from one map to the other. |
52 | */ |
53 | template <class TKey, class TValue, |
54 | class Hasher = HashMapHasherDefault, |
55 | class Comparator = HashMapComparatorDefault<TKey>> |
56 | class OAHashMap { |
57 | private: |
58 | TValue *values = nullptr; |
59 | TKey *keys = nullptr; |
60 | uint32_t *hashes = nullptr; |
61 | |
62 | uint32_t capacity = 0; |
63 | |
64 | uint32_t num_elements = 0; |
65 | |
66 | static const uint32_t EMPTY_HASH = 0; |
67 | |
68 | _FORCE_INLINE_ uint32_t _hash(const TKey &p_key) const { |
69 | uint32_t hash = Hasher::hash(p_key); |
70 | |
71 | if (hash == EMPTY_HASH) { |
72 | hash = EMPTY_HASH + 1; |
73 | } |
74 | |
75 | return hash; |
76 | } |
77 | |
78 | _FORCE_INLINE_ uint32_t _get_probe_length(uint32_t p_pos, uint32_t p_hash) const { |
79 | uint32_t original_pos = p_hash % capacity; |
80 | return (p_pos - original_pos + capacity) % capacity; |
81 | } |
82 | |
83 | _FORCE_INLINE_ void _construct(uint32_t p_pos, uint32_t p_hash, const TKey &p_key, const TValue &p_value) { |
84 | memnew_placement(&keys[p_pos], TKey(p_key)); |
85 | memnew_placement(&values[p_pos], TValue(p_value)); |
86 | hashes[p_pos] = p_hash; |
87 | |
88 | num_elements++; |
89 | } |
90 | |
91 | bool _lookup_pos(const TKey &p_key, uint32_t &r_pos) const { |
92 | uint32_t hash = _hash(p_key); |
93 | uint32_t pos = hash % capacity; |
94 | uint32_t distance = 0; |
95 | |
96 | while (true) { |
97 | if (hashes[pos] == EMPTY_HASH) { |
98 | return false; |
99 | } |
100 | |
101 | if (distance > _get_probe_length(pos, hashes[pos])) { |
102 | return false; |
103 | } |
104 | |
105 | if (hashes[pos] == hash && Comparator::compare(keys[pos], p_key)) { |
106 | r_pos = pos; |
107 | return true; |
108 | } |
109 | |
110 | pos = (pos + 1) % capacity; |
111 | distance++; |
112 | } |
113 | } |
114 | |
115 | void _insert_with_hash(uint32_t p_hash, const TKey &p_key, const TValue &p_value) { |
116 | uint32_t hash = p_hash; |
117 | uint32_t distance = 0; |
118 | uint32_t pos = hash % capacity; |
119 | |
120 | TKey key = p_key; |
121 | TValue value = p_value; |
122 | |
123 | while (true) { |
124 | if (hashes[pos] == EMPTY_HASH) { |
125 | _construct(pos, hash, key, value); |
126 | |
127 | return; |
128 | } |
129 | |
130 | // not an empty slot, let's check the probing length of the existing one |
131 | uint32_t existing_probe_len = _get_probe_length(pos, hashes[pos]); |
132 | if (existing_probe_len < distance) { |
133 | SWAP(hash, hashes[pos]); |
134 | SWAP(key, keys[pos]); |
135 | SWAP(value, values[pos]); |
136 | distance = existing_probe_len; |
137 | } |
138 | |
139 | pos = (pos + 1) % capacity; |
140 | distance++; |
141 | } |
142 | } |
143 | |
144 | void _resize_and_rehash(uint32_t p_new_capacity) { |
145 | uint32_t old_capacity = capacity; |
146 | |
147 | // Capacity can't be 0. |
148 | capacity = MAX(1u, p_new_capacity); |
149 | |
150 | TKey *old_keys = keys; |
151 | TValue *old_values = values; |
152 | uint32_t *old_hashes = hashes; |
153 | |
154 | num_elements = 0; |
155 | keys = static_cast<TKey *>(Memory::alloc_static(sizeof(TKey) * capacity)); |
156 | values = static_cast<TValue *>(Memory::alloc_static(sizeof(TValue) * capacity)); |
157 | hashes = static_cast<uint32_t *>(Memory::alloc_static(sizeof(uint32_t) * capacity)); |
158 | |
159 | for (uint32_t i = 0; i < capacity; i++) { |
160 | hashes[i] = 0; |
161 | } |
162 | |
163 | if (old_capacity == 0) { |
164 | // Nothing to do. |
165 | return; |
166 | } |
167 | |
168 | for (uint32_t i = 0; i < old_capacity; i++) { |
169 | if (old_hashes[i] == EMPTY_HASH) { |
170 | continue; |
171 | } |
172 | |
173 | _insert_with_hash(old_hashes[i], old_keys[i], old_values[i]); |
174 | |
175 | old_keys[i].~TKey(); |
176 | old_values[i].~TValue(); |
177 | } |
178 | |
179 | Memory::free_static(old_keys); |
180 | Memory::free_static(old_values); |
181 | Memory::free_static(old_hashes); |
182 | } |
183 | |
184 | void _resize_and_rehash() { |
185 | _resize_and_rehash(capacity * 2); |
186 | } |
187 | |
188 | public: |
189 | _FORCE_INLINE_ uint32_t get_capacity() const { return capacity; } |
190 | _FORCE_INLINE_ uint32_t get_num_elements() const { return num_elements; } |
191 | |
192 | bool is_empty() const { |
193 | return num_elements == 0; |
194 | } |
195 | |
196 | void clear() { |
197 | for (uint32_t i = 0; i < capacity; i++) { |
198 | if (hashes[i] == EMPTY_HASH) { |
199 | continue; |
200 | } |
201 | |
202 | hashes[i] = EMPTY_HASH; |
203 | values[i].~TValue(); |
204 | keys[i].~TKey(); |
205 | } |
206 | |
207 | num_elements = 0; |
208 | } |
209 | |
210 | void insert(const TKey &p_key, const TValue &p_value) { |
211 | if (num_elements + 1 > 0.9 * capacity) { |
212 | _resize_and_rehash(); |
213 | } |
214 | |
215 | uint32_t hash = _hash(p_key); |
216 | |
217 | _insert_with_hash(hash, p_key, p_value); |
218 | } |
219 | |
220 | void set(const TKey &p_key, const TValue &p_data) { |
221 | uint32_t pos = 0; |
222 | bool exists = _lookup_pos(p_key, pos); |
223 | |
224 | if (exists) { |
225 | values[pos] = p_data; |
226 | } else { |
227 | insert(p_key, p_data); |
228 | } |
229 | } |
230 | |
231 | /** |
232 | * returns true if the value was found, false otherwise. |
233 | * |
234 | * if r_data is not nullptr then the value will be written to the object |
235 | * it points to. |
236 | */ |
237 | bool lookup(const TKey &p_key, TValue &r_data) const { |
238 | uint32_t pos = 0; |
239 | bool exists = _lookup_pos(p_key, pos); |
240 | |
241 | if (exists) { |
242 | r_data = values[pos]; |
243 | return true; |
244 | } |
245 | |
246 | return false; |
247 | } |
248 | |
249 | const TValue *lookup_ptr(const TKey &p_key) const { |
250 | uint32_t pos = 0; |
251 | bool exists = _lookup_pos(p_key, pos); |
252 | |
253 | if (exists) { |
254 | return &values[pos]; |
255 | } |
256 | return nullptr; |
257 | } |
258 | |
259 | TValue *lookup_ptr(const TKey &p_key) { |
260 | uint32_t pos = 0; |
261 | bool exists = _lookup_pos(p_key, pos); |
262 | |
263 | if (exists) { |
264 | return &values[pos]; |
265 | } |
266 | return nullptr; |
267 | } |
268 | |
269 | _FORCE_INLINE_ bool has(const TKey &p_key) const { |
270 | uint32_t _pos = 0; |
271 | return _lookup_pos(p_key, _pos); |
272 | } |
273 | |
274 | void remove(const TKey &p_key) { |
275 | uint32_t pos = 0; |
276 | bool exists = _lookup_pos(p_key, pos); |
277 | |
278 | if (!exists) { |
279 | return; |
280 | } |
281 | |
282 | uint32_t next_pos = (pos + 1) % capacity; |
283 | while (hashes[next_pos] != EMPTY_HASH && |
284 | _get_probe_length(next_pos, hashes[next_pos]) != 0) { |
285 | SWAP(hashes[next_pos], hashes[pos]); |
286 | SWAP(keys[next_pos], keys[pos]); |
287 | SWAP(values[next_pos], values[pos]); |
288 | pos = next_pos; |
289 | next_pos = (pos + 1) % capacity; |
290 | } |
291 | |
292 | hashes[pos] = EMPTY_HASH; |
293 | values[pos].~TValue(); |
294 | keys[pos].~TKey(); |
295 | |
296 | num_elements--; |
297 | } |
298 | |
299 | /** |
300 | * reserves space for a number of elements, useful to avoid many resizes and rehashes |
301 | * if adding a known (possibly large) number of elements at once, must be larger than old |
302 | * capacity. |
303 | **/ |
304 | void reserve(uint32_t p_new_capacity) { |
305 | ERR_FAIL_COND(p_new_capacity < capacity); |
306 | _resize_and_rehash(p_new_capacity); |
307 | } |
308 | |
309 | struct Iterator { |
310 | bool valid; |
311 | |
312 | const TKey *key; |
313 | TValue *value = nullptr; |
314 | |
315 | private: |
316 | uint32_t pos; |
317 | friend class OAHashMap; |
318 | }; |
319 | |
320 | Iterator iter() const { |
321 | Iterator it; |
322 | |
323 | it.valid = true; |
324 | it.pos = 0; |
325 | |
326 | return next_iter(it); |
327 | } |
328 | |
329 | Iterator next_iter(const Iterator &p_iter) const { |
330 | if (!p_iter.valid) { |
331 | return p_iter; |
332 | } |
333 | |
334 | Iterator it; |
335 | it.valid = false; |
336 | it.pos = p_iter.pos; |
337 | it.key = nullptr; |
338 | it.value = nullptr; |
339 | |
340 | for (uint32_t i = it.pos; i < capacity; i++) { |
341 | it.pos = i + 1; |
342 | |
343 | if (hashes[i] == EMPTY_HASH) { |
344 | continue; |
345 | } |
346 | |
347 | it.valid = true; |
348 | it.key = &keys[i]; |
349 | it.value = &values[i]; |
350 | return it; |
351 | } |
352 | |
353 | return it; |
354 | } |
355 | |
356 | OAHashMap(const OAHashMap &p_other) { |
357 | (*this) = p_other; |
358 | } |
359 | |
360 | void operator=(const OAHashMap &p_other) { |
361 | if (capacity != 0) { |
362 | clear(); |
363 | } |
364 | |
365 | _resize_and_rehash(p_other.capacity); |
366 | |
367 | for (Iterator it = p_other.iter(); it.valid; it = p_other.next_iter(it)) { |
368 | set(*it.key, *it.value); |
369 | } |
370 | } |
371 | |
372 | OAHashMap(uint32_t p_initial_capacity = 64) { |
373 | // Capacity can't be 0. |
374 | capacity = MAX(1u, p_initial_capacity); |
375 | |
376 | keys = static_cast<TKey *>(Memory::alloc_static(sizeof(TKey) * capacity)); |
377 | values = static_cast<TValue *>(Memory::alloc_static(sizeof(TValue) * capacity)); |
378 | hashes = static_cast<uint32_t *>(Memory::alloc_static(sizeof(uint32_t) * capacity)); |
379 | |
380 | for (uint32_t i = 0; i < capacity; i++) { |
381 | hashes[i] = EMPTY_HASH; |
382 | } |
383 | } |
384 | |
385 | ~OAHashMap() { |
386 | for (uint32_t i = 0; i < capacity; i++) { |
387 | if (hashes[i] == EMPTY_HASH) { |
388 | continue; |
389 | } |
390 | |
391 | values[i].~TValue(); |
392 | keys[i].~TKey(); |
393 | } |
394 | |
395 | Memory::free_static(keys); |
396 | Memory::free_static(values); |
397 | Memory::free_static(hashes); |
398 | } |
399 | }; |
400 | |
401 | #endif // OA_HASH_MAP_H |
402 | |