/*
 * Copyright (c) 2001, 2019, Oracle and/or its affiliates. All rights reserved.
 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
 *
 * This code is free software; you can redistribute it and/or modify it
 * under the terms of the GNU General Public License version 2 only, as
 * published by the Free Software Foundation.
 *
 * This code is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
 * version 2 for more details (a copy is included in the LICENSE file that
 * accompanied this code).
 *
 * You should have received a copy of the GNU General Public License version
 * 2 along with this work; if not, write to the Free Software Foundation,
 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
 *
 * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
 * or visit www.oracle.com if you need additional information or have any
 * questions.
 *
 */

#ifndef SHARE_GC_SHARED_PTRQUEUE_HPP
#define SHARE_GC_SHARED_PTRQUEUE_HPP

#include "memory/padded.hpp"
#include "utilities/align.hpp"
#include "utilities/debug.hpp"
#include "utilities/lockFreeStack.hpp"
#include "utilities/sizes.hpp"

class Mutex;
class Monitor;

// There are various techniques that require threads to be able to log
// addresses. For example, a generational write barrier might log
// the addresses of modified old-generation objects. This type supports
// this operation.
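//
// Purely as an illustration (not part of this interface), such a logging
// step in a hypothetical post-write barrier might look roughly like this,
// where "queue" names some PtrQueue owned by the current thread:
//
//   void example_post_write_barrier(PtrQueue& queue, void* modified_location) {
//     // Record the address for later processing by the collector.
//     // enqueue() is a no-op while the queue is inactive.
//     queue.enqueue(modified_location);
//   }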

class BufferNode;
class PtrQueueSet;
class PtrQueue {
  friend class VMStructs;

  // Noncopyable - not defined.
  PtrQueue(const PtrQueue&);
  PtrQueue& operator=(const PtrQueue&);

  // The ptr queue set to which this queue belongs.
  PtrQueueSet* const _qset;

  // Whether updates should be logged.
  bool _active;

  // The (byte) index at which an object was last enqueued. Starts at
  // capacity_in_bytes (indicating an empty buffer) and goes towards zero.
  // Value is always pointer-size aligned.
  size_t _index;

  // Size of the current buffer, in bytes.
  // Value is always pointer-size aligned.
  size_t _capacity_in_bytes;

  static const size_t _element_size = sizeof(void*);

  // Get the capacity, in bytes. The capacity must have been set.
  size_t capacity_in_bytes() const {
    assert(_capacity_in_bytes > 0, "capacity not set");
    return _capacity_in_bytes;
  }

  static size_t byte_index_to_index(size_t ind) {
    assert(is_aligned(ind, _element_size), "precondition");
    return ind / _element_size;
  }

  static size_t index_to_byte_index(size_t ind) {
    return ind * _element_size;
  }

protected:
  // The buffer.
  void** _buf;

  size_t index() const {
    return byte_index_to_index(_index);
  }

  void set_index(size_t new_index) {
    size_t byte_index = index_to_byte_index(new_index);
    assert(byte_index <= capacity_in_bytes(), "precondition");
    _index = byte_index;
  }

  size_t capacity() const {
    return byte_index_to_index(capacity_in_bytes());
  }

  PtrQueueSet* qset() const { return _qset; }

  // Process queue entries and release resources.
  void flush_impl();

  // Process (some of) the buffer and leave it in place for further use,
  // or enqueue the buffer and allocate a new one.
  virtual void handle_completed_buffer() = 0;

  void allocate_buffer();

  // Enqueue the current buffer in the qset and allocate a new buffer.
  void enqueue_completed_buffer();

  // Initialize this queue to contain a null buffer, and be part of the
  // given PtrQueueSet.
  PtrQueue(PtrQueueSet* qset, bool active = false);

  // Requires queue flushed.
  ~PtrQueue();

public:

  // Forcibly set empty.
  void reset() {
    if (_buf != NULL) {
      _index = capacity_in_bytes();
    }
  }

  void enqueue(volatile void* ptr) {
    enqueue((void*)(ptr));
  }

  // Enqueues the given "obj".
  void enqueue(void* ptr) {
    if (!_active) return;
    else enqueue_known_active(ptr);
  }

  void handle_zero_index();

  void enqueue_known_active(void* ptr);

  // Return the size of the in-use region.
  size_t size() const {
    size_t result = 0;
    if (_buf != NULL) {
      assert(_index <= capacity_in_bytes(), "Invariant");
      result = byte_index_to_index(capacity_in_bytes() - _index);
    }
    return result;
  }

  bool is_empty() const {
    return _buf == NULL || capacity_in_bytes() == _index;
  }

  // Set the "active" property of the queue to "b". An enqueue to an
  // inactive thread is a no-op. Setting a queue to inactive resets its
  // log to the empty state.
  void set_active(bool b) {
    _active = b;
    if (!b && _buf != NULL) {
      reset();
    } else if (b && _buf != NULL) {
      assert(index() == capacity(),
             "invariant: queues are empty when activated.");
    }
  }

  bool is_active() const { return _active; }

  // To support compiler.

protected:
  template<typename Derived>
  static ByteSize byte_offset_of_index() {
    return byte_offset_of(Derived, _index);
  }

  static ByteSize byte_width_of_index() { return in_ByteSize(sizeof(size_t)); }

  template<typename Derived>
  static ByteSize byte_offset_of_buf() {
    return byte_offset_of(Derived, _buf);
  }

  static ByteSize byte_width_of_buf() { return in_ByteSize(_element_size); }

  template<typename Derived>
  static ByteSize byte_offset_of_active() {
    return byte_offset_of(Derived, _active);
  }

  static ByteSize byte_width_of_active() { return in_ByteSize(sizeof(bool)); }

};
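
// A minimal sketch (illustrative only, not part of this header) of how a
// concrete queue type might specialize PtrQueue. The class name and the
// policy in handle_completed_buffer() are hypothetical; a real subclass may
// instead filter or process entries in place before deciding to enqueue.
//
//   class ExampleQueue : public PtrQueue {
//   protected:
//     // Called when the current buffer is full: hand it to the shared
//     // PtrQueueSet and start a fresh buffer.
//     virtual void handle_completed_buffer() {
//       enqueue_completed_buffer();
//     }
//   public:
//     ExampleQueue(PtrQueueSet* qset) : PtrQueue(qset, true /* active */) { }
//   };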

class BufferNode {
  size_t _index;
  BufferNode* volatile _next;
  void* _buffer[1]; // Pseudo flexible array member.

  BufferNode() : _index(0), _next(NULL) { }
  ~BufferNode() { }

  static size_t buffer_offset() {
    return offset_of(BufferNode, _buffer);
  }

  static BufferNode* volatile* next_ptr(BufferNode& bn) { return &bn._next; }

AIX_ONLY(public:)               // xlC 12 on AIX doesn't implement C++ DR45.
  // Allocate a new BufferNode with the "buffer" having size elements.
  static BufferNode* allocate(size_t size);

  // Free a BufferNode.
  static void deallocate(BufferNode* node);

public:
  typedef LockFreeStack<BufferNode, &next_ptr> Stack;

  BufferNode* next() const { return _next; }
  void set_next(BufferNode* n) { _next = n; }
  size_t index() const { return _index; }
  void set_index(size_t i) { _index = i; }

  // Return the BufferNode containing the buffer, after setting its index.
  static BufferNode* make_node_from_buffer(void** buffer, size_t index) {
    BufferNode* node =
      reinterpret_cast<BufferNode*>(
        reinterpret_cast<char*>(buffer) - buffer_offset());
    node->set_index(index);
    return node;
  }

  // Return the buffer for node.
  static void** make_buffer_from_node(BufferNode *node) {
    // &_buffer[0] might lead to index out of bounds warnings.
    return reinterpret_cast<void**>(
      reinterpret_cast<char*>(node) + buffer_offset());
  }

  class Allocator;              // Free-list based allocator.
  class TestSupport;            // Unit test support.
};
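
// Illustrative only: the buffer array is embedded in the node at
// buffer_offset(), so converting between a node and its buffer is plain
// pointer arithmetic, and the two conversions invert each other. A sketch,
// assuming "node" was obtained from BufferNode::allocate() or an Allocator:
//
//   void example_round_trip(BufferNode* node) {
//     void** buf = BufferNode::make_buffer_from_node(node);
//     BufferNode* same = BufferNode::make_node_from_buffer(buf, node->index());
//     assert(same == node, "conversions must invert each other");
//   }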

// Allocation is based on a lock-free free list of nodes, linked through
// BufferNode::_next (see BufferNode::Stack). To solve the ABA problem,
// popping a node from the free list is performed within a GlobalCounter
// critical section, and pushing nodes onto the free list is done after
// a GlobalCounter synchronization associated with the nodes to be pushed.
// This is documented behavior so that other parts of the node life-cycle
// can depend on and make use of it too.
class BufferNode::Allocator {
  friend class TestSupport;

  // Since we don't expect many instances, and measured >15% speedup
  // on stress gtest, padding seems like a good tradeoff here.
#define DECLARE_PADDED_MEMBER(Id, Type, Name) \
  Type Name; DEFINE_PAD_MINUS_SIZE(Id, DEFAULT_CACHE_LINE_SIZE, sizeof(Type))

  const size_t _buffer_size;
  char _name[DEFAULT_CACHE_LINE_SIZE - sizeof(size_t)]; // Use name as padding.
  DECLARE_PADDED_MEMBER(1, Stack, _pending_list);
  DECLARE_PADDED_MEMBER(2, Stack, _free_list);
  DECLARE_PADDED_MEMBER(3, volatile size_t, _pending_count);
  DECLARE_PADDED_MEMBER(4, volatile size_t, _free_count);
  DECLARE_PADDED_MEMBER(5, volatile bool, _transfer_lock);

#undef DECLARE_PADDED_MEMBER

  void delete_list(BufferNode* list);
  bool try_transfer_pending();

public:
  Allocator(const char* name, size_t buffer_size);
  ~Allocator();

  const char* name() const { return _name; }
  size_t buffer_size() const { return _buffer_size; }
  size_t free_count() const;
  BufferNode* allocate();
  void release(BufferNode* node);

  // Deallocate some of the available buffers. remove_goal is the target
  // number to remove. Returns the number actually deallocated, which may
  // be less than the goal if there were fewer available.
  size_t reduce_free_list(size_t remove_goal);
};
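
// A minimal usage sketch (illustrative only). An allocator is typically a
// long-lived object shared by all queues of one kind; the name string and
// buffer size below are made up for the example.
//
//   BufferNode::Allocator allocator("Example Buffer Allocator", 256);
//
//   void example_use() {
//     BufferNode* node = allocator.allocate();  // reuses a free-list node if any
//     void** buf = BufferNode::make_buffer_from_node(node);
//     // ... fill buf with up to allocator.buffer_size() entries ...
//     allocator.release(node);                  // return node to the free list
//   }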

// A PtrQueueSet represents resources common to a set of pointer queues.
// In particular, the individual queues allocate buffers from this shared
// set, and return completed buffers to the set.
class PtrQueueSet {
  BufferNode::Allocator* _allocator;

  Monitor* _cbl_mon;  // Protects the fields below.
  BufferNode* _completed_buffers_head;
  BufferNode* _completed_buffers_tail;
  volatile size_t _n_completed_buffers;

  size_t _process_completed_buffers_threshold;
  volatile bool _process_completed_buffers;

  // If true, notify_all on _cbl_mon when the threshold is reached.
  bool _notify_when_complete;

  void assert_completed_buffers_list_len_correct_locked() NOT_DEBUG_RETURN;

protected:
  bool _all_active;

  // Create an empty ptr queue set.
  PtrQueueSet(bool notify_when_complete = false);
  ~PtrQueueSet();

  // Because of init-order concerns, we can't pass these as constructor
  // arguments.
  void initialize(Monitor* cbl_mon, BufferNode::Allocator* allocator);

  // For (unlocked!) iteration over the completed buffers.
  BufferNode* completed_buffers_head() const { return _completed_buffers_head; }

  // Deallocate all of the completed buffers.
  void abandon_completed_buffers();

public:

  // Return the buffer for a BufferNode of size buffer_size().
  void** allocate_buffer();

  // Return an empty buffer to the free list. The node is required
  // to have been allocated with a size of buffer_size().
  void deallocate_buffer(BufferNode* node);

  // A completed buffer is a buffer the mutator is finished with, and
  // is ready to be processed by the collector. It need not be full.

  // Adds node to the completed buffer list.
  void enqueue_completed_buffer(BufferNode* node);

  // If the number of completed buffers is > stop_at, then remove and
  // return a completed buffer from the list. Otherwise, return NULL.
  BufferNode* get_completed_buffer(size_t stop_at = 0);

  bool process_completed_buffers() { return _process_completed_buffers; }
  void set_process_completed_buffers(bool x) { _process_completed_buffers = x; }

  bool is_active() { return _all_active; }

  size_t buffer_size() const {
    return _allocator->buffer_size();
  }

  // Get/Set the number of completed buffers that triggers log processing.
  // Log processing should be done when the number of buffers exceeds the
  // threshold.
  void set_process_completed_buffers_threshold(size_t sz) {
    _process_completed_buffers_threshold = sz;
  }
  size_t process_completed_buffers_threshold() const {
    return _process_completed_buffers_threshold;
  }
  static const size_t ProcessCompletedBuffersThresholdNever = ~size_t(0);

  size_t completed_buffers_num() const { return _n_completed_buffers; }

  void merge_bufferlists(PtrQueueSet* src);

  // Notify the consumer if the number of buffers crossed the threshold.
  void notify_if_necessary();
};
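
// A minimal sketch (illustrative only) of a consumer draining completed
// buffers from a PtrQueueSet. Entries from node->index() up to buffer_size()
// are the ones the mutator filled (the index counts down from capacity as
// entries are added); the processing step is a placeholder.
//
//   void example_drain(PtrQueueSet* qset) {
//     BufferNode* node;
//     while ((node = qset->get_completed_buffer()) != NULL) {
//       void** buf = BufferNode::make_buffer_from_node(node);
//       for (size_t i = node->index(); i < qset->buffer_size(); ++i) {
//         // ... process buf[i] ...
//       }
//       qset->deallocate_buffer(node);  // return the now-empty buffer
//     }
//   }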

#endif // SHARE_GC_SHARED_PTRQUEUE_HPP