/*
 * Copyright (c) 2018, 2019, Oracle and/or its affiliates. All rights reserved.
 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
 *
 * This code is free software; you can redistribute it and/or modify it
 * under the terms of the GNU General Public License version 2 only, as
 * published by the Free Software Foundation.
 *
 * This code is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
 * version 2 for more details (a copy is included in the LICENSE file that
 * accompanied this code).
 *
 * You should have received a copy of the GNU General Public License version
 * 2 along with this work; if not, write to the Free Software Foundation,
 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
 *
 * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
 * or visit www.oracle.com if you need additional information or have any
 * questions.
 *
 */

#ifndef SHARE_UTILITIES_CONCURRENTHASHTABLE_HPP
#define SHARE_UTILITIES_CONCURRENTHASHTABLE_HPP

#include "memory/allocation.hpp"
#include "utilities/globalCounter.hpp"
#include "utilities/globalDefinitions.hpp"
#include "utilities/tableStatistics.hpp"

// A mostly concurrent hash-table where the read-side is wait-free, inserts are
// CAS and deletes mutually exclude each other on a per-bucket basis. VALUE is
// the type kept inside each Node and CONFIG contains the hash and allocation
// methods. A CALLBACK_FUNC and a LOOKUP_FUNC need to be provided for get and
// insert.
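//
// As an illustrative sketch only (MyValue, MyConfig and MyLookup are
// hypothetical names, not part of this interface), a table is typically
// declared and queried like this:
//
//   typedef ConcurrentHashTable<MyValue, MyConfig, mtInternal> MyTable;
//
//   // In this sketch the LOOKUP_FUNC provides the hash and an equality check
//   // for the probed key:
//   class MyLookup : public StackObj {
//     uintx _hash;
//     const MyValue& _key;
//    public:
//     MyLookup(uintx hash, const MyValue& key) : _hash(hash), _key(key) {}
//     uintx get_hash() const { return _hash; }
//     bool equals(const MyValue* value, bool* is_dead) { return *value == _key; }
//   };
//
// See BaseConfig near the end of this class for what CONFIG must provide, and
// the usage sketches next to get/insert/remove below.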

class Thread;
class Mutex;

template <typename VALUE, typename CONFIG, MEMFLAGS F>
class ConcurrentHashTable : public CHeapObj<F> {
 private:
  // This is the internal node structure.
  // Only constructed with placement new from memory allocated with MEMFLAGS of
  // the InternalTable or user-defined memory.
  class Node {
   private:
    Node * volatile _next;
    VALUE _value;
   public:
    Node(const VALUE& value, Node* next = NULL)
      : _next(next), _value(value) {
      assert((((uintptr_t)this) & ((uintptr_t)0x3)) == 0,
             "Must be 4 byte aligned.");
    }

    Node* next() const;
    void set_next(Node* node) { _next = node; }
    Node* const volatile * next_ptr() { return &_next; }

    VALUE* value() { return &_value; }

    // Creates a node.
    static Node* create_node(const VALUE& value, Node* next = NULL) {
      return new (CONFIG::allocate_node(sizeof(Node), value)) Node(value, next);
    }
    // Destroys a node.
    static void destroy_node(Node* node) {
      CONFIG::free_node((void*)node, node->_value);
    }

    void print_on(outputStream* st) const {};
    void print_value_on(outputStream* st) const {};
  };

  // Only constructed with placement new from an array allocated with MEMFLAGS
  // of InternalTable.
  class Bucket {
   private:

    // The embedded state in the two low bits of the first pointer is a
    // spinlock with 3 states: unlocked, locked and redirect. You must never
    // busy-spin on trylock() or call lock() without holding _resize_lock;
    // that would deadlock. Redirect can only be installed by the owner and is
    // the final state of a bucket.
    // The only two valid flows are:
    //   unlocked -> locked -> unlocked
    //   unlocked -> locked -> redirect
    // The locked state only applies to an updater.
    // Readers only check for redirect.
    Node * volatile _first;

    static const uintptr_t STATE_LOCK_BIT     = 0x1;
    static const uintptr_t STATE_REDIRECT_BIT = 0x2;
    static const uintptr_t STATE_MASK         = 0x3;
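
    // A worked example of the encoding (illustrative only): for a bucket that
    // an updater has locked and whose chain starts at Node* n, the stored word
    // is set_state(n, STATE_LOCK_BIT), i.e. (Node*)((uintptr_t)n | 0x1);
    // clear_state() recovers n and get_state() returns the embedded bits.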

    // Get the first pointer unmasked.
    Node* first_raw() const;

    // Methods to manipulate the embedded state.
    static bool is_state(Node* node, uintptr_t bits) {
      return (bits & (uintptr_t)node) == bits;
    }

    static Node* set_state(Node* n, uintptr_t bits) {
      return (Node*)(bits | (uintptr_t)n);
    }

    static uintptr_t get_state(Node* node) {
      return (((uintptr_t)node) & STATE_MASK);
    }

    static Node* clear_state(Node* node) {
      return (Node*)(((uintptr_t)node) & (~(STATE_MASK)));
    }

    static Node* clear_set_state(Node* node, Node* state) {
      return (Node*)(((uintptr_t)clear_state(node)) ^ get_state(state));
    }

   public:
    // A bucket is only one pointer with the embedded state.
    Bucket() : _first(NULL) {};

    // Get the first pointer unmasked.
    Node* first() const;

    // Get a pointer to the const first pointer. Do not dereference this
    // pointer; the pointer pointed to _may_ contain an embedded state. Such
    // a pointer should only be used as input to release_assign_node_ptr.
    Node* const volatile * first_ptr() { return &_first; }

    // This is the only place where a pointer to a Node pointer that
    // potentially is _first should be changed. Otherwise we would destroy the
    // embedded state. We only give out pointers to const Node pointers to
    // avoid accidental assignment, thus here we must cast the const part
    // away. The method is not static due to an assert.
    void release_assign_node_ptr(Node* const volatile * dst, Node* node) const;

    // Assigns the next pointer of this bucket's last Node to the given Node.
    void release_assign_last_node_next(Node* node);

    // Setting the first pointer must be done with CAS.
    bool cas_first(Node *node, Node* expect);

    // Returns true if this bucket is redirecting to a new table.
    // Redirect is a terminal state and will never change.
    bool have_redirect() const;

    // Returns true if this bucket is locked for updates.
    bool is_locked() const;

    // Returns true if the lock was acquired.
    bool trylock();

    // The bucket might be invalid due to a concurrent resize. The lock()
    // method does not respect that and can deadlock if the caller does not
    // hold _resize_lock.
    void lock();

    // Unlocks this bucket.
    void unlock();

    // Installs redirect in this bucket.
    // Prior to doing so you must have successfully locked this bucket.
    void redirect();
  };

  // The backing storage table holding the buckets and its size and mask-bits.
  // The table is always a power of two in size, for two reasons:
  // - A resize can only change the size to half or double
  //   (any power of two would also be possible).
  // - The bucket index is computed by masking the hash.
  class InternalTable : public CHeapObj<F> {
   private:
    Bucket* _buckets;        // Bucket array.
   public:
    const size_t _log2_size; // Size in log2.
    const size_t _size;      // Size, 2^_log2_size.

    // The mask used on the hash for selecting a bucket.
    // The masked value is guaranteed to be inside the buckets array.
    const size_t _hash_mask;

    // Create a backing table.
    InternalTable(size_t log2_size);
    ~InternalTable();

    Bucket* get_buckets() { return _buckets; }
    Bucket* get_bucket(size_t idx) { return &_buckets[idx]; }
  };
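
  // For example (numbers are illustrative only), an InternalTable created
  // with log2_size = 13 has _size = 8192 buckets and _hash_mask = 0x1FFF,
  // so a bucket index is simply computed as hash & _hash_mask.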

  // Used as a default functor when no functor is supplied for some methods.
  struct NoOp {
    void operator()(VALUE*) {}
    const VALUE& operator()() {}
    void operator()(bool, VALUE*) {}
  } noOp;

  // For materializing a supplied value.
  class LazyValueRetrieve {
   private:
    const VALUE& _val;
   public:
    LazyValueRetrieve(const VALUE& val) : _val(val) {}
    const VALUE& operator()() { return _val; }
  };

  InternalTable* _table;      // Active table.
  InternalTable* _new_table;  // Table we are resizing to.

  // Default sizes.
  static const size_t DEFAULT_MAX_SIZE_LOG2 = 21;
  static const size_t DEFAULT_START_SIZE_LOG2 = 13;
  static const size_t DEFAULT_GROW_HINT = 4; // Chain length.

  const size_t _log2_size_limit;  // The biggest size.
  const size_t _log2_start_size;  // Start size.
  const size_t _grow_hint;        // Number of linked items.

  volatile bool _size_limit_reached;

  // We serialize resizes and other bulk operations that do not support
  // concurrent resizing with this lock.
  Mutex* _resize_lock;
  // Since we need to drop the mutex for safepoints, but must stop other
  // threads from taking the lock after a safepoint, this field holds the
  // actual lock state. After acquiring the mutex you must check if it is
  // already locked. If so, you must drop the mutex until the real lock holder
  // grabs the mutex.
  volatile Thread* _resize_lock_owner;

  // Returns true if locking the mutex/state succeeded.
  bool try_resize_lock(Thread* locker);
  // Returns when both the mutex and the state are properly locked.
  void lock_resize_lock(Thread* locker);
  // Unlocks the mutex and the state.
  void unlock_resize_lock(Thread* locker);

  // This method sets the _invisible_epoch and does a write_synchronize.
  // Subsequent calls check the state of _invisible_epoch and determine if the
  // write_synchronize can be avoided. If not, it sets the _invisible_epoch
  // again and does a write_synchronize.
  void write_synchonize_on_visible_epoch(Thread* thread);
  // To be able to avoid write_synchronize in resize and other bulk operations,
  // this field keeps track of whether a version of the hash-table has ever
  // been seen. We use the working thread pointer as a tag for debugging. The
  // _invisible_epoch can only be used by the owner of _resize_lock.
  volatile Thread* _invisible_epoch;

  // Scoped critical section, which also handles the invisible epochs.
  // An invisible epoch/version does not need a write_synchronize().
  class ScopedCS: public StackObj {
   protected:
    Thread* _thread;
    ConcurrentHashTable<VALUE, CONFIG, F>* _cht;
    GlobalCounter::CSContext _cs_context;
   public:
    ScopedCS(Thread* thread, ConcurrentHashTable<VALUE, CONFIG, F>* cht);
    ~ScopedCS();
  };


  // Max number of deletes in one bucket chain during a bulk delete.
  static const size_t BULK_DELETE_LIMIT = 256;

  // Simple getters and setters for the internal table.
  InternalTable* get_table() const;
  InternalTable* get_new_table() const;
  InternalTable* set_table_from_new();

  // Destroys all nodes.
  void free_nodes();

  // Mask away the high bits of the hash.
  static size_t bucket_idx_hash(InternalTable* table, const uintx hash) {
    return ((size_t)hash) & table->_hash_mask;
  }

  // Returns the bucket for the hash in the given internal table.
  Bucket* get_bucket_in(InternalTable* table, const uintx hash) const {
    size_t bucket_index = bucket_idx_hash(table, hash);
    return table->get_bucket(bucket_index);
  }

  // Returns the correct bucket for reading and handles resizing.
  Bucket* get_bucket(const uintx hash) const;

  // Returns the correct bucket for updates and handles resizing.
  Bucket* get_bucket_locked(Thread* thread, const uintx hash);

  // Finds a node.
  template <typename LOOKUP_FUNC>
  Node* get_node(const Bucket* const bucket, LOOKUP_FUNC& lookup_f,
                 bool* have_dead, size_t* loops = NULL) const;

  // Methods for shrinking.
  bool internal_shrink_prolog(Thread* thread, size_t log2_size);
  void internal_shrink_epilog(Thread* thread);
  void internal_shrink_range(Thread* thread, size_t start, size_t stop);
  bool internal_shrink(Thread* thread, size_t size_limit_log2);

  // Methods for growing.
  bool unzip_bucket(Thread* thread, InternalTable* old_table,
                    InternalTable* new_table, size_t even_index,
                    size_t odd_index);
  bool internal_grow_prolog(Thread* thread, size_t log2_size);
  void internal_grow_epilog(Thread* thread);
  void internal_grow_range(Thread* thread, size_t start, size_t stop);
  bool internal_grow(Thread* thread, size_t log2_size);

  // Gets a value.
  template <typename LOOKUP_FUNC>
  VALUE* internal_get(Thread* thread, LOOKUP_FUNC& lookup_f,
                      bool* grow_hint = NULL);

  // Plain insert.
  template <typename LOOKUP_FUNC>
  bool internal_insert(Thread* thread, LOOKUP_FUNC& lookup_f, const VALUE& value,
                       bool* grow_hint, bool* clean_hint);

  // Returns true if an item matching LOOKUP_FUNC is removed.
  // Calls DELETE_FUNC before destroying the node.
  template <typename LOOKUP_FUNC, typename DELETE_FUNC>
  bool internal_remove(Thread* thread, LOOKUP_FUNC& lookup_f,
                       DELETE_FUNC& delete_f);

  // Visits nodes with FUNC.
  template <typename FUNC>
  static bool visit_nodes(Bucket* bucket, FUNC& visitor_f);

  // During shrink/grow we cannot guarantee that we only visit nodes once, with
  // the current algorithm. To keep it simple, the caller will have locked
  // _resize_lock.
  template <typename FUNC>
  void do_scan_locked(Thread* thread, FUNC& scan_f);

  // Check for dead items in a bucket.
  template <typename EVALUATE_FUNC>
  size_t delete_check_nodes(Bucket* bucket, EVALUATE_FUNC& eval_f,
                            size_t num_del, Node** ndel);

  // Check for dead items in this table. During shrink/grow we cannot guarantee
  // that we only visit nodes once. To keep it simple, the caller will have
  // locked _resize_lock.
  template <typename EVALUATE_FUNC, typename DELETE_FUNC>
  void do_bulk_delete_locked(Thread* thread, EVALUATE_FUNC& eval_f,
                             DELETE_FUNC& del_f) {
    do_bulk_delete_locked_for(thread, 0, _table->_size, eval_f, del_f);
  }

  // To have prefetching for a VALUE that is a pointer during
  // do_bulk_delete_locked, we have these helper classes: one for the
  // non-pointer case without prefetch and one for the pointer case with
  // prefetch.
  template <bool b, typename EVALUATE_FUNC>
  struct HaveDeletables {
    static bool have_deletable(Bucket* bucket, EVALUATE_FUNC& eval_f,
                               Bucket* prefetch_bucket);
  };
  template<typename EVALUATE_FUNC>
  struct HaveDeletables<true, EVALUATE_FUNC> {
    static bool have_deletable(Bucket* bucket, EVALUATE_FUNC& eval_f,
                               Bucket* prefetch_bucket);
  };

  // Check for dead items in this table within a range. During shrink/grow we
  // cannot guarantee that we only visit nodes once. To keep it simple, the
  // caller will have locked _resize_lock.
  template <typename EVALUATE_FUNC, typename DELETE_FUNC>
  void do_bulk_delete_locked_for(Thread* thread, size_t start_idx,
                                 size_t stop_idx, EVALUATE_FUNC& eval_f,
                                 DELETE_FUNC& del_f, bool is_mt = false);

  // Method to delete one item.
  template <typename LOOKUP_FUNC>
  void delete_in_bucket(Thread* thread, Bucket* bucket, LOOKUP_FUNC& lookup_f);

 public:
  ConcurrentHashTable(size_t log2size = DEFAULT_START_SIZE_LOG2,
                      size_t log2size_limit = DEFAULT_MAX_SIZE_LOG2,
                      size_t grow_hint = DEFAULT_GROW_HINT);

  ~ConcurrentHashTable();

  TableRateStatistics _stats_rate;

  size_t get_size_log2(Thread* thread);
  size_t get_node_size() const { return sizeof(Node); }
  bool is_max_size_reached() { return _size_limit_reached; }

  // This means no paused bucket resize operation is going to resume
  // on this table.
  bool is_safepoint_safe() { return _resize_lock_owner == NULL; }

  // Re-size operations.
  bool shrink(Thread* thread, size_t size_limit_log2 = 0);
  bool grow(Thread* thread, size_t size_limit_log2 = 0);

  // All callbacks for get are under critical sections. Other callbacks may be
  // under critical sections or may have locked parts of the table. Calling any
  // methods on the table during a callback is not supported. Only
  // MultiGetHandle supports multiple gets.

  // get() returns true if an item matching LOOKUP_FUNC is found, and
  // FOUND_FUNC is called on it (see the usage sketch after remove() below).
  template <typename LOOKUP_FUNC, typename FOUND_FUNC>
  bool get(Thread* thread, LOOKUP_FUNC& lookup_f, FOUND_FUNC& foundf,
           bool* grow_hint = NULL);

  // Returns true if the item was inserted; duplicates are found with
  // LOOKUP_FUNC.
  template <typename LOOKUP_FUNC>
  bool insert(Thread* thread, LOOKUP_FUNC& lookup_f, const VALUE& value,
              bool* grow_hint = NULL, bool* clean_hint = NULL) {
    return internal_insert(thread, lookup_f, value, grow_hint, clean_hint);
  }

  // This does a fast unsafe insert and can thus only be used when there is no
  // risk of duplicates and no other thread uses this table.
  bool unsafe_insert(const VALUE& value);

  // Returns true if an item matching LOOKUP_FUNC was deleted;
  // prior to destruction DELETE_FUNC is called.
  template <typename LOOKUP_FUNC, typename DELETE_FUNC>
  bool remove(Thread* thread, LOOKUP_FUNC& lookup_f, DELETE_FUNC& del_f) {
    return internal_remove(thread, lookup_f, del_f);
  }

  // Same without DELETE_FUNC.
  template <typename LOOKUP_FUNC>
  bool remove(Thread* thread, LOOKUP_FUNC& lookup_f) {
    return internal_remove(thread, lookup_f, noOp);
  }
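
  // A usage sketch for get/insert/remove above (illustrative only; MyValue,
  // MyLookup and CopyOut are hypothetical, with MyLookup as sketched at the
  // top of this file, and cht being a MyTable* created elsewhere):
  //
  //   struct CopyOut {
  //     MyValue _found;
  //     void operator()(MyValue* v) { _found = *v; }  // Runs inside the CS.
  //   } copy_out;
  //
  //   MyLookup lookup(hash, key);
  //   cht->insert(thread, lookup, key);     // True if no duplicate was found.
  //   cht->get(thread, lookup, copy_out);   // True if found; copy_out ran.
  //   cht->remove(thread, lookup);          // True if found and deleted.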

  // Visits all items with SCAN_FUNC if the resize lock can be taken (to avoid
  // concurrent resizes); otherwise returns false without scanning.
  template <typename SCAN_FUNC>
  bool try_scan(Thread* thread, SCAN_FUNC& scan_f);

  // Visits all items with SCAN_FUNC when the resize lock is obtained.
  template <typename SCAN_FUNC>
  void do_scan(Thread* thread, SCAN_FUNC& scan_f);

  // Visits all items with SCAN_FUNC without any protection.
  // It will assume there is no other thread accessing this
  // table during the safepoint. Must be called by the VM thread.
  template <typename SCAN_FUNC>
  void do_safepoint_scan(SCAN_FUNC& scan_f);
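
  // Illustrative sketch of a SCAN_FUNC (names hypothetical): an object
  // callable as bool operator()(VALUE*), returning true to continue the scan.
  //
  //   struct CountScan {
  //     size_t _count;
  //     CountScan() : _count(0) {}
  //     bool operator()(MyValue* v) { _count++; return true; }
  //   } counter;
  //
  //   if (cht->try_scan(thread, counter)) {
  //     // counter._count holds the number of items visited.
  //   }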

  // Destroys items matching EVALUATE_FUNC if the resize lock is obtained;
  // otherwise returns false. DELETE_FUNC is called before an item is destroyed.
  template <typename EVALUATE_FUNC, typename DELETE_FUNC>
  bool try_bulk_delete(Thread* thread, EVALUATE_FUNC& eval_f,
                       DELETE_FUNC& del_f);

  // Destroys items matching EVALUATE_FUNC when the resize lock has been
  // successfully obtained. DELETE_FUNC is called before an item is destroyed.
  template <typename EVALUATE_FUNC, typename DELETE_FUNC>
  void bulk_delete(Thread* thread, EVALUATE_FUNC& eval_f, DELETE_FUNC& del_f);
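
  // Illustrative sketch (names and the is_dead()/release() members are
  // hypothetical): EVALUATE_FUNC is callable as bool operator()(VALUE*) and
  // selects the items to delete; DELETE_FUNC, void operator()(VALUE*), runs on
  // each selected item before its node is freed.
  //
  //   struct IsDead {
  //     bool operator()(MyValue* v) { return v->is_dead(); }
  //   } is_dead;
  //   struct Release {
  //     void operator()(MyValue* v) { v->release(); }
  //   } release;
  //
  //   cht->bulk_delete(thread, is_dead, release);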

  // Calculates statistics. Item sizes are calculated with VALUE_SIZE_FUNC.
  template <typename VALUE_SIZE_FUNC>
  TableStatistics statistics_calculate(Thread* thread, VALUE_SIZE_FUNC& vs_f);

  // Gets statistics if available; if not, returns the old ones. Item sizes are
  // calculated with VALUE_SIZE_FUNC.
  template <typename VALUE_SIZE_FUNC>
  TableStatistics statistics_get(Thread* thread, VALUE_SIZE_FUNC& vs_f, TableStatistics old);

  // Writes statistics to the outputStream. Item sizes are calculated with
  // VALUE_SIZE_FUNC.
  template <typename VALUE_SIZE_FUNC>
  void statistics_to(Thread* thread, VALUE_SIZE_FUNC& vs_f, outputStream* st,
                     const char* table_name);

  // Moves all nodes from this table to to_cht.
  bool try_move_nodes_to(Thread* thread, ConcurrentHashTable<VALUE, CONFIG, F>* to_cht);

  // This is a Curiously Recurring Template Pattern (CRTP) interface for the
  // specialization.
  struct BaseConfig {
   public:
    // Called when the hash table needs the hash for a VALUE.
    static uintx get_hash(const VALUE& value, bool* dead) {
      return CONFIG::get_hash(value, dead);
    }
    // Default node allocation.
    static void* allocate_node(size_t size, const VALUE& value);
    // Default node reclamation.
    static void free_node(void* memory, const VALUE& value);
  };
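
  // An illustrative sketch of a CONFIG (MyValue, MyConfig and my_hash are
  // hypothetical). The CONFIG typically derives from BaseConfig, inheriting
  // the default node allocation/reclamation, and must provide get_hash():
  //
  //   class MyConfig
  //     : public ConcurrentHashTable<MyValue, MyConfig, mtInternal>::BaseConfig {
  //    public:
  //     static uintx get_hash(const MyValue& value, bool* is_dead) {
  //       *is_dead = false;        // No items die concurrently in this sketch.
  //       return my_hash(value);
  //     }
  //   };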

  // Scoped multi getter.
  class MultiGetHandle : private ScopedCS {
   public:
    MultiGetHandle(Thread* thread, ConcurrentHashTable<VALUE, CONFIG, F>* cht)
      : ScopedCS(thread, cht) {}
    // In the MultiGetHandle scope you can look up items matching LOOKUP_FUNC.
    // The VALUEs are safe as long as you never save the VALUEs outside the
    // scope, e.g. after ~MultiGetHandle().
    template <typename LOOKUP_FUNC>
    VALUE* get(LOOKUP_FUNC& lookup_f, bool* grow_hint = NULL);
  };
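
  // Illustrative sketch (MyTable, MyLookup and cht as above): inside the
  // handle's scope several gets can be done and the returned pointers remain
  // safe.
  //
  //   {
  //     MyTable::MultiGetHandle mgh(thread, cht);
  //     MyValue* a = mgh.get(lookup_a);
  //     MyValue* b = mgh.get(lookup_b);
  //     // Use a and b only here; do not keep them past this scope.
  //   }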

 private:
  class BucketsOperation;

 public:
  class BulkDeleteTask;
  class GrowTask;
};

#endif // SHARE_UTILITIES_CONCURRENTHASHTABLE_HPP