ckh.c source code [Aerospike/modules/jemalloc/src/ckh.c]

/*
 *******************************************************************************
 * Implementation of (2^1+,2) cuckoo hashing, where 2^1+ indicates that each
 * hash bucket contains 2^n cells, for n >= 1, and 2 indicates that two hash
 * functions are employed.  The original cuckoo hashing algorithm was described
 * in:
 *
 *   Pagh, R., F.F. Rodler (2004) Cuckoo Hashing.  Journal of Algorithms
 *     51(2):122-144.
 *
 * Generalization of cuckoo hashing was discussed in:
 *
 *   Erlingsson, U., M. Manasse, F. McSherry (2006) A cool and practical
 *     alternative to traditional hash tables.  In Proceedings of the 7th
 *     Workshop on Distributed Data and Structures (WDAS'06), Santa Clara, CA,
 *     January 2006.
 *
 * This implementation uses precisely two hash functions because that is the
 * fewest that can work, and supporting multiple hashes is an implementation
 * burden.  Here is a reproduction of Figure 1 from Erlingsson et al. (2006)
 * that shows approximate expected maximum load factors for various
 * configurations:
 *
 *           |         #cells/bucket         |
 *   #hashes |   1   |   2   |   4   |   8   |
 *   --------+-------+-------+-------+-------+
 *         1 | 0.006 | 0.006 | 0.03  | 0.12  |
 *         2 | 0.49  | 0.86  |>0.93< |>0.96< |
 *         3 | 0.91  | 0.97  | 0.98  | 0.999 |
 *         4 | 0.97  | 0.99  | 0.999 |       |
 *
 * The number of cells per bucket is chosen such that a bucket fits in one cache
 * line.  So, on 32- and 64-bit systems, we use (8,2) and (4,2) cuckoo hashing,
 * respectively.
 *
 ******************************************************************************/
37	#define JEMALLOC_CKH_C_
38	#include "jemalloc/internal/jemalloc_internal.h"
39
40	/****************************************************************************/
41	/ Function prototypes for non-inline static functions. /
42
43	static bool ckh_grow(tsdn_t tsdn, ckh_t ckh);
44	static void ckh_shrink(tsdn_t tsdn, ckh_t ckh);
45
46	/****************************************************************************/
47
48	/*
49	* Search bucket for key and return the cell number if found; SIZE_T_MAX
50	* otherwise.
51	*/
52	JEMALLOC_INLINE_C size_t
53	ckh_bucket_search(ckh_t ckh, size_t bucket, const* void *key)
54	{
55	ckhc_t *cell;
56	unsigned i;
57
58	for (i = `0`; i < (ZU(`1`) << LG_CKH_BUCKET_CELLS); i++) {
59	cell = &ckh->tab[(bucket << LG_CKH_BUCKET_CELLS) + i];
60	if (cell->key != NULL && ckh->keycomp(key, cell->key))
61	return ((bucket << LG_CKH_BUCKET_CELLS) + i);
62	}
63
64	return (SIZE_T_MAX);
65	}
66
67	/*
68	* Search table for key and return cell number if found; SIZE_T_MAX otherwise.
69	*/
70	JEMALLOC_INLINE_C size_t
71	ckh_isearch(ckh_t ckh, const* void *key)
72	{
73	size_t hashes[`2`], bucket, cell;
74
75	assert(ckh != NULL);
76
77	ckh->hash(key, hashes);
78
79	/ Search primary bucket. /
80	bucket = hashes[`0`] & ((ZU(`1`) << ckh->lg_curbuckets) - `1`);
81	cell = ckh_bucket_search(ckh, bucket, key);
82	if (cell != SIZE_T_MAX)
83	return (cell);
84
85	/ Search secondary bucket. /
86	bucket = hashes[`1`] & ((ZU(`1`) << ckh->lg_curbuckets) - `1`);
87	cell = ckh_bucket_search(ckh, bucket, key);
88	return (cell);
89	}
90
91	JEMALLOC_INLINE_C bool
92	ckh_try_bucket_insert(ckh_t ckh, size_t bucket, const* void *key,
93	const void *data)
94	{
95	ckhc_t *cell;
96	unsigned offset, i;
97
98	/*
99	* Cycle through the cells in the bucket, starting at a random position.
100	* The randomness avoids worst-case search overhead as buckets fill up.
101	*/
102	offset = (unsigned)prng_lg_range(&ckh->prng_state, LG_CKH_BUCKET_CELLS);
103	for (i = `0`; i < (ZU(`1`) << LG_CKH_BUCKET_CELLS); i++) {
104	cell = &ckh->tab[(bucket << LG_CKH_BUCKET_CELLS) +
105	((i + offset) & ((ZU(`1`) << LG_CKH_BUCKET_CELLS) - `1`))];
106	if (cell->key == NULL) {
107	cell->key = key;
108	cell->data = data;
109	ckh->count++;
110	return (false);
111	}
112	}
113
114	return (true);
115	}
116
117	/*
118	* No space is available in bucket. Randomly evict an item, then try to find an
119	* alternate location for that item. Iteratively repeat this
120	* eviction/relocation procedure until either success or detection of an
121	* eviction/relocation bucket cycle.
122	*/
123	JEMALLOC_INLINE_C bool
124	ckh_evict_reloc_insert(ckh_t ckh, size_t argbucket, void* const **argkey,
125	void const **argdata)
126	{
127	const void key, data, tkey, tdata;
128	ckhc_t *cell;
129	size_t hashes[`2`], bucket, tbucket;
130	unsigned i;
131
132	bucket = argbucket;
133	key = *argkey;
134	data = *argdata;
135	while (true) {
136	/*
137	* Choose a random item within the bucket to evict. This is
138	* critical to correct function, because without (eventually)
139	* evicting all items within a bucket during iteration, it
140	* would be possible to get stuck in an infinite loop if there
141	* were an item for which both hashes indicated the same
142	* bucket.
143	*/
144	i = (unsigned)prng_lg_range(&ckh->prng_state,
145	LG_CKH_BUCKET_CELLS);
146	cell = &ckh->tab[(bucket << LG_CKH_BUCKET_CELLS) + i];
147	assert(cell->key != NULL);
148
149	/ Swap cell->{key,data} and {key,data} (evict). /
150	tkey = cell->key; tdata = cell->data;
151	cell->key = key; cell->data = data;
152	key = tkey; data = tdata;
153
154	#ifdef CKH_COUNT
155	ckh->nrelocs++;
156	#endif
157
158	/ Find the alternate bucket for the evicted item. /
159	ckh->hash(key, hashes);
160	tbucket = hashes[`1`] & ((ZU(`1`) << ckh->lg_curbuckets) - `1`);
161	if (tbucket == bucket) {
162	tbucket = hashes[`0`] & ((ZU(`1`) << ckh->lg_curbuckets)
163	- `1`);
164	/*
165	* It may be that (tbucket == bucket) still, if the
166	* item's hashes both indicate this bucket. However,
167	* we are guaranteed to eventually escape this bucket
168	* during iteration, assuming pseudo-random item
169	* selection (true randomness would make infinite
170	* looping a remote possibility). The reason we can
171	* never get trapped forever is that there are two
172	* cases:
173	*
174	* 1) This bucket == argbucket, so we will quickly
175	* detect an eviction cycle and terminate.
176	* 2) An item was evicted to this bucket from another,
177	* which means that at least one item in this bucket
178	* has hashes that indicate distinct buckets.
179	*/
180	}
181	/ Check for a cycle. /
182	if (tbucket == argbucket) {
183	*argkey = key;
184	*argdata = data;
185	return (true);
186	}
187
188	bucket = tbucket;
189	if (!ckh_try_bucket_insert(ckh, bucket, key, data))
190	return (false);
191	}
192	}
193
194	JEMALLOC_INLINE_C bool
195	ckh_try_insert(ckh_t ckh, void* const*argkey, void* const**argdata)
196	{
197	size_t hashes[`2`], bucket;
198	const void key = argkey;
199	const void data = argdata;
200
201	ckh->hash(key, hashes);
202
203	/ Try to insert in primary bucket. /
204	bucket = hashes[`0`] & ((ZU(`1`) << ckh->lg_curbuckets) - `1`);
205	if (!ckh_try_bucket_insert(ckh, bucket, key, data))
206	return (false);
207
208	/ Try to insert in secondary bucket. /
209	bucket = hashes[`1`] & ((ZU(`1`) << ckh->lg_curbuckets) - `1`);
210	if (!ckh_try_bucket_insert(ckh, bucket, key, data))
211	return (false);
212
213	/*
214	* Try to find a place for this item via iterative eviction/relocation.
215	*/
216	return (ckh_evict_reloc_insert(ckh, bucket, argkey, argdata));
217	}
218
219	/*
220	* Try to rebuild the hash table from scratch by inserting all items from the
221	* old table into the new.
222	*/
223	JEMALLOC_INLINE_C bool
224	ckh_rebuild(ckh_t ckh, ckhc_t aTab)
225	{
226	size_t count, i, nins;
227	const void key, data;
228
229	count = ckh->count;
230	ckh->count = `0`;
231	for (i = nins = `0`; nins < count; i++) {
232	if (aTab[i].key != NULL) {
233	key = aTab[i].key;
234	data = aTab[i].data;
235	if (ckh_try_insert(ckh, &key, &data)) {
236	ckh->count = count;
237	return (true);
238	}
239	nins++;
240	}
241	}
242
243	return (false);
244	}
245
246	static bool
247	ckh_grow(tsdn_t tsdn, ckh_t ckh)
248	{
249	bool ret;
250	ckhc_t tab, ttab;
251	unsigned lg_prevbuckets, lg_curcells;
252
253	#ifdef CKH_COUNT
254	ckh->ngrows++;
255	#endif
256
257	/*
258	* It is possible (though unlikely, given well behaved hashes) that the
259	* table will have to be doubled more than once in order to create a
260	* usable table.
261	*/
262	lg_prevbuckets = ckh->lg_curbuckets;
263	lg_curcells = ckh->lg_curbuckets + LG_CKH_BUCKET_CELLS;
264	while (true) {
265	size_t usize;
266
267	lg_curcells++;
268	usize = sa2u(sizeof(ckhc_t) << lg_curcells, CACHELINE);
269	if (unlikely(usize == `0` \|\| usize > HUGE_MAXCLASS)) {
270	ret = true;
271	goto label_return;
272	}
273	tab = (ckhc_t *)ipallocztm(tsdn, usize, CACHELINE, true, NULL,
274	true, arena_ichoose(tsdn, NULL));
275	if (tab == NULL) {
276	ret = true;
277	goto label_return;
278	}
279	/ Swap in new table. /
280	ttab = ckh->tab;
281	ckh->tab = tab;
282	tab = ttab;
283	ckh->lg_curbuckets = lg_curcells - LG_CKH_BUCKET_CELLS;
284
285	if (!ckh_rebuild(ckh, tab)) {
286	idalloctm(tsdn, tab, NULL, true, true);
287	break;
288	}
289
290	/ Rebuilding failed, so back out partially rebuilt table. /
291	idalloctm(tsdn, ckh->tab, NULL, true, true);
292	ckh->tab = tab;
293	ckh->lg_curbuckets = lg_prevbuckets;
294	}
295
296	ret = false;
297	label_return:
298	return (ret);
299	}
300
301	static void
302	ckh_shrink(tsdn_t tsdn, ckh_t ckh)
303	{
304	ckhc_t tab, ttab;
305	size_t usize;
306	unsigned lg_prevbuckets, lg_curcells;
307
308	/*
309	* It is possible (though unlikely, given well behaved hashes) that the
310	* table rebuild will fail.
311	*/
312	lg_prevbuckets = ckh->lg_curbuckets;
313	lg_curcells = ckh->lg_curbuckets + LG_CKH_BUCKET_CELLS - `1`;
314	usize = sa2u(sizeof(ckhc_t) << lg_curcells, CACHELINE);
315	if (unlikely(usize == `0` \|\| usize > HUGE_MAXCLASS))
316	return;
317	tab = (ckhc_t *)ipallocztm(tsdn, usize, CACHELINE, true, NULL, true,
318	arena_ichoose(tsdn, NULL));
319	if (tab == NULL) {
320	/*
321	* An OOM error isn't worth propagating, since it doesn't
322	* prevent this or future operations from proceeding.
323	*/
324	return;
325	}
326	/ Swap in new table. /
327	ttab = ckh->tab;
328	ckh->tab = tab;
329	tab = ttab;
330	ckh->lg_curbuckets = lg_curcells - LG_CKH_BUCKET_CELLS;
331
332	if (!ckh_rebuild(ckh, tab)) {
333	idalloctm(tsdn, tab, NULL, true, true);
334	#ifdef CKH_COUNT
335	ckh->nshrinks++;
336	#endif
337	return;
338	}
339
340	/ Rebuilding failed, so back out partially rebuilt table. /
341	idalloctm(tsdn, ckh->tab, NULL, true, true);
342	ckh->tab = tab;
343	ckh->lg_curbuckets = lg_prevbuckets;
344	#ifdef CKH_COUNT
345	ckh->nshrinkfails++;
346	#endif
347	}
348
349	bool
350	ckh_new(tsdn_t tsdn, ckh_t ckh, size_t minitems, ckh_hash_t *hash,
351	ckh_keycomp_t *keycomp)
352	{
353	bool ret;
354	size_t mincells, usize;
355	unsigned lg_mincells;
356
357	assert(minitems > `0`);
358	assert(hash != NULL);
359	assert(keycomp != NULL);
360
361	#ifdef CKH_COUNT
362	ckh->ngrows = `0`;
363	ckh->nshrinks = `0`;
364	ckh->nshrinkfails = `0`;
365	ckh->ninserts = `0`;
366	ckh->nrelocs = `0`;
367	#endif
368	ckh->prng_state = `42`; / Value doesn't really matter. /
369	ckh->count = `0`;
370
371	/*
372	* Find the minimum power of 2 that is large enough to fit minitems
373	* entries. We are using (2+,2) cuckoo hashing, which has an expected
374	* maximum load factor of at least ~0.86, so 0.75 is a conservative load
375	* factor that will typically allow mincells items to fit without ever
376	* growing the table.
377	*/
378	assert(LG_CKH_BUCKET_CELLS > `0`);
379	mincells = ((minitems + (`3` - (minitems % `3`))) / `3`) << `2`;
380	for (lg_mincells = LG_CKH_BUCKET_CELLS;
381	(ZU(`1`) << lg_mincells) < mincells;
382	lg_mincells++)
383	; / Do nothing. /
384	ckh->lg_minbuckets = lg_mincells - LG_CKH_BUCKET_CELLS;
385	ckh->lg_curbuckets = lg_mincells - LG_CKH_BUCKET_CELLS;
386	ckh->hash = hash;
387	ckh->keycomp = keycomp;
388
389	usize = sa2u(sizeof(ckhc_t) << lg_mincells, CACHELINE);
390	if (unlikely(usize == `0` \|\| usize > HUGE_MAXCLASS)) {
391	ret = true;
392	goto label_return;
393	}
394	ckh->tab = (ckhc_t *)ipallocztm(tsdn, usize, CACHELINE, true, NULL,
395	true, arena_ichoose(tsdn, NULL));
396	if (ckh->tab == NULL) {
397	ret = true;
398	goto label_return;
399	}
400
401	ret = false;
402	label_return:
403	return (ret);
404	}
405
406	void
407	ckh_delete(tsdn_t tsdn, ckh_t ckh)
408	{
409
410	assert(ckh != NULL);
411
412	#ifdef CKH_VERBOSE
413	malloc_printf(
414	"%s(%p): ngrows: %"FMTu64", nshrinks: %"FMTu64","
415	" nshrinkfails: %"FMTu64", ninserts: %"FMTu64","
416	" nrelocs: %"FMTu64"\n", __func__, ckh,
417	(unsigned long long)ckh->ngrows,
418	(unsigned long long)ckh->nshrinks,
419	(unsigned long long)ckh->nshrinkfails,
420	(unsigned long long)ckh->ninserts,
421	(unsigned long long)ckh->nrelocs);
422	#endif
423
424	idalloctm(tsdn, ckh->tab, NULL, true, true);
425	if (config_debug)
426	memset(ckh, JEMALLOC_FREE_JUNK, sizeof(ckh_t));
427	}
428
429	size_t
430	ckh_count(ckh_t *ckh)
431	{
432
433	assert(ckh != NULL);
434
435	return (ckh->count);
436	}
437
438	bool
439	ckh_iter(ckh_t ckh, size_t tabind, void *key, void* **data)
440	{
441	size_t i, ncells;
442
443	for (i = *tabind, ncells = (ZU(`1`) << (ckh->lg_curbuckets +
444	LG_CKH_BUCKET_CELLS)); i < ncells; i++) {
445	if (ckh->tab[i].key != NULL) {
446	if (key != NULL)
447	key = (void* *)ckh->tab[i].key;
448	if (data != NULL)
449	data = (void* *)ckh->tab[i].data;
450	*tabind = i + `1`;
451	return (false);
452	}
453	}
454
455	return (true);
456	}
457
458	bool
459	ckh_insert(tsdn_t tsdn, ckh_t ckh, const void key, const* void *data)
460	{
461	bool ret;
462
463	assert(ckh != NULL);
464	assert(ckh_search(ckh, key, NULL, NULL));
465
466	#ifdef CKH_COUNT
467	ckh->ninserts++;
468	#endif
469
470	while (ckh_try_insert(ckh, &key, &data)) {
471	if (ckh_grow(tsdn, ckh)) {
472	ret = true;
473	goto label_return;
474	}
475	}
476
477	ret = false;
478	label_return:
479	return (ret);
480	}
481
482	bool
483	ckh_remove(tsdn_t tsdn, ckh_t ckh, const void searchkey, void* **key,
484	void **data)
485	{
486	size_t cell;
487
488	assert(ckh != NULL);
489
490	cell = ckh_isearch(ckh, searchkey);
491	if (cell != SIZE_T_MAX) {
492	if (key != NULL)
493	key = (void* *)ckh->tab[cell].key;
494	if (data != NULL)
495	data = (void* *)ckh->tab[cell].data;
496	ckh->tab[cell].key = NULL;
497	ckh->tab[cell].data = NULL; / Not necessary. /
498
499	ckh->count--;
500	/ Try to halve the table if it is less than 1/4 full. /
501	if (ckh->count < (ZU(`1`) << (ckh->lg_curbuckets
502	+ LG_CKH_BUCKET_CELLS - `2`)) && ckh->lg_curbuckets
503	> ckh->lg_minbuckets) {
504	/ Ignore error due to OOM. /
505	ckh_shrink(tsdn, ckh);
506	}
507
508	return (false);
509	}
510
511	return (true);
512	}
513
514	bool
515	ckh_search(ckh_t ckh, const* void searchkey, void* *key, void* **data)
516	{
517	size_t cell;
518
519	assert(ckh != NULL);
520
521	cell = ckh_isearch(ckh, searchkey);
522	if (cell != SIZE_T_MAX) {
523	if (key != NULL)
524	key = (void* *)ckh->tab[cell].key;
525	if (data != NULL)
526	data = (void* *)ckh->tab[cell].data;
527	return (false);
528	}
529
530	return (true);
531	}
532
/*
 * Hash callback for NUL-terminated string keys: hashes strlen(key) bytes of
 * the string with a fixed seed and writes the two results to r_hash.
 */
void
ckh_string_hash(const void *key, size_t r_hash[2])
{

	hash(key, strlen((const char *)key), 0x94122f33U, r_hash);
}
539
/*
 * Key comparison callback for NUL-terminated string keys.  Returns true if the
 * two strings compare equal with strcmp(), false otherwise.  Neither argument
 * may be NULL (asserted).
 */
bool
ckh_string_keycomp(const void *k1, const void *k2)
{

	assert(k1 != NULL);
	assert(k2 != NULL);

	/* Keep the const qualifier; the strings are only read. */
	return (strcmp((const char *)k1, (const char *)k2) == 0);
}
549
/*
 * Hash callback for keys that are compared by pointer value: hashes the bytes
 * of the pointer itself (not what it points to) with a fixed seed and writes
 * the two results to r_hash.
 */
void
ckh_pointer_hash(const void *key, size_t r_hash[2])
{
	/* Reinterpret the pointer as an integer of the same size. */
	union {
		const void	*v;
		size_t		i;
	} u;

	assert(sizeof(u.v) == sizeof(u.i));
	u.v = key;
	hash(&u.i, sizeof(u.i), 0xd983396eU, r_hash);
}
562
/*
 * Key comparison callback for keys that are compared by pointer value.
 * Returns true if k1 and k2 are the same address, false otherwise.
 */
bool
ckh_pointer_keycomp(const void *k1, const void *k2)
{

	return (k1 == k2);
}
569

Browse the source code of Aerospike/modules/jemalloc/src/ckh.c