/*
 * Copyright (c) 2007, 2018, Oracle and/or its affiliates. All rights reserved.
 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
 *
 * This code is free software; you can redistribute it and/or modify it
 * under the terms of the GNU General Public License version 2 only, as
 * published by the Free Software Foundation.
 *
 * This code is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
 * version 2 for more details (a copy is included in the LICENSE file that
 * accompanied this code).
 *
 * You should have received a copy of the GNU General Public License version
 * 2 along with this work; if not, write to the Free Software Foundation,
 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
 *
 * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
 * or visit www.oracle.com if you need additional information or have any
 * questions.
 *
 */

#include "precompiled.hpp"
#include "gc/cms/cmsCardTable.hpp"
#include "gc/cms/cmsHeap.hpp"
#include "gc/shared/cardTableBarrierSet.hpp"
#include "gc/shared/cardTableRS.hpp"
#include "gc/shared/collectedHeap.hpp"
#include "gc/shared/space.inline.hpp"
#include "memory/allocation.inline.hpp"
#include "memory/virtualspace.hpp"
#include "oops/oop.inline.hpp"
#include "runtime/java.hpp"
#include "runtime/mutexLocker.hpp"
#include "runtime/orderAccess.hpp"
#include "runtime/vmThread.hpp"

CMSCardTable::CMSCardTable(MemRegion whole_heap) :
    CardTableRS(whole_heap, CMSPrecleaningEnabled /* scanned_concurrently */) {
}

// Returns the number of chunks necessary to cover "mr".
size_t CMSCardTable::chunks_to_cover(MemRegion mr) {
  return (size_t)(addr_to_chunk_index(mr.last()) -
                  addr_to_chunk_index(mr.start()) + 1);
}

// Returns the index of the chunk in a stride which
// covers the given address.
uintptr_t CMSCardTable::addr_to_chunk_index(const void* addr) {
  uintptr_t card = (uintptr_t) byte_for(addr);
  return card / ParGCCardsPerStrideChunk;
}
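
// Illustrative example (a sketch, assuming the typical 512-byte card
// size and the default ParGCCardsPerStrideChunk of 256; both are
// configurable): a chunk then corresponds to 256 cards, i.e.
// 256 * 512 = 128K of heap. Note that addr_to_chunk_index() divides
// the card's *address in the card table* by ParGCCardsPerStrideChunk,
// so chunk boundaries are aligned in the card table's address space,
// not relative to the heap base. For a MemRegion mr spanning 1M of
// heap, chunks_to_cover(mr) is then 8 or 9, depending on how mr
// happens to align with chunk boundaries.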

void CMSCardTable::
non_clean_card_iterate_parallel_work(Space* sp, MemRegion mr,
                                     OopsInGenClosure* cl,
                                     CardTableRS* ct,
                                     uint n_threads) {
  assert(n_threads > 0, "expected n_threads > 0");
  assert(n_threads <= ParallelGCThreads,
         "n_threads: %u > ParallelGCThreads: %u", n_threads, ParallelGCThreads);

  // Make sure the LNC array is valid for the space.
  CardValue** lowest_non_clean;
  uintptr_t   lowest_non_clean_base_chunk_index;
  size_t      lowest_non_clean_chunk_size;
  get_LNC_array_for_space(sp, lowest_non_clean,
                          lowest_non_clean_base_chunk_index,
                          lowest_non_clean_chunk_size);

  uint n_strides = n_threads * ParGCStridesPerThread;
  SequentialSubTasksDone* pst = sp->par_seq_tasks();
  // Sets the condition for completion of the subtask (how many threads
  // need to finish in order to be done).
  pst->set_n_threads(n_threads);
  pst->set_n_tasks(n_strides);
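
  // Illustrative example (assuming the default ParGCStridesPerThread
  // of 2): with n_threads == 4 we get n_strides == 8, and the chunks
  // of the card table are dealt out round-robin, so stride s owns
  // every chunk whose index is congruent to s modulo 8. Each thread
  // keeps claiming whole strides below until all 8 are taken.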

  uint stride = 0;
  while (pst->try_claim_task(/* reference */ stride)) {
    process_stride(sp, mr, stride, n_strides,
                   cl, ct,
                   lowest_non_clean,
                   lowest_non_clean_base_chunk_index,
                   lowest_non_clean_chunk_size);
  }
  if (pst->all_tasks_completed()) {
    // Clear lowest_non_clean array for next time.
    uintptr_t first_chunk_index = addr_to_chunk_index(mr.start());
    uintptr_t last_chunk_index  = addr_to_chunk_index(mr.last());
    for (uintptr_t ch = first_chunk_index; ch <= last_chunk_index; ch++) {
      intptr_t ind = ch - lowest_non_clean_base_chunk_index;
      assert(0 <= ind && ind < (intptr_t)lowest_non_clean_chunk_size,
             "Bounds error");
      lowest_non_clean[ind] = NULL;
    }
  }
}

void
CMSCardTable::
process_stride(Space* sp,
               MemRegion used,
               jint stride, int n_strides,
               OopsInGenClosure* cl,
               CardTableRS* ct,
               CardValue** lowest_non_clean,
               uintptr_t lowest_non_clean_base_chunk_index,
               size_t    lowest_non_clean_chunk_size) {
  // We process the chunks of a stride from lower to higher addresses;
  // going from higher to lower instead wouldn't help much, because of
  // the strided parallelism pattern used here.

  // Find the first card address of the first chunk in the stride that is
  // at least "bottom" of the used region.
  CardValue* start_card = byte_for(used.start());
  CardValue* end_card   = byte_after(used.last());
  uintptr_t start_chunk = addr_to_chunk_index(used.start());
  uintptr_t start_chunk_stride_num = start_chunk % n_strides;
  CardValue* chunk_card_start;

  if ((uintptr_t)stride >= start_chunk_stride_num) {
    chunk_card_start = (start_card +
                        (stride - start_chunk_stride_num) * ParGCCardsPerStrideChunk);
  } else {
    // Go ahead to the next chunk group boundary, then to the requested stride.
    chunk_card_start = (start_card +
                        (n_strides - start_chunk_stride_num + stride) * ParGCCardsPerStrideChunk);
  }
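
  // Worked example of the arithmetic above (illustrative values):
  // with n_strides == 8 and start_chunk_stride_num == 3,
  //   stride 5 starts at start_card + (5 - 3) * ParGCCardsPerStrideChunk,
  //     two chunks past the start (chunk index == 5 mod 8), while
  //   stride 1 wraps: start_card + (8 - 3 + 1) * ParGCCardsPerStrideChunk,
  //     six chunks past the start (3 + 6 == 9 == 1 mod 8).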

  while (chunk_card_start < end_card) {
    // Even though we go from lower to higher addresses below, the
    // strided parallelism can interleave the actual processing of the
    // dirty pages in various ways. For a specific chunk within this
    // stride, we take care to avoid double scanning or missing a card
    // by suitably initializing the "min_done" field in process_chunk_boundaries()
    // below, together with the dirty region extension accomplished in
    // DirtyCardToOopClosure::do_MemRegion().
    CardValue* chunk_card_end = chunk_card_start + ParGCCardsPerStrideChunk;
    // Invariant: chunk_mr should be fully contained within the "used" region.
    MemRegion chunk_mr = MemRegion(addr_for(chunk_card_start),
                                   chunk_card_end >= end_card ?
                                     used.end() : addr_for(chunk_card_end));
    assert(chunk_mr.word_size() > 0, "[chunk_card_start > used_end)");
    assert(used.contains(chunk_mr), "chunk_mr should be subset of used");

    // This function is used by the parallel card table iteration.
    const bool parallel = true;

    DirtyCardToOopClosure* dcto_cl = sp->new_dcto_cl(cl, precision(),
                                                     cl->gen_boundary(),
                                                     parallel);
    ClearNoncleanCardWrapper clear_cl(dcto_cl, ct, parallel);

    // Process the chunk.
    process_chunk_boundaries(sp,
                             dcto_cl,
                             chunk_mr,
                             used,
                             lowest_non_clean,
                             lowest_non_clean_base_chunk_index,
                             lowest_non_clean_chunk_size);

    // We want the LNC array updates above in process_chunk_boundaries
    // to be visible before any of the card table value changes as a
    // result of the dirty card iteration below.
    OrderAccess::storestore();

    // We want to clear the cards: clear_cl here does the work of finding
    // contiguous dirty ranges of cards to process and clear.
    clear_cl.do_MemRegion(chunk_mr);

    // Find the next chunk of the stride.
    chunk_card_start += ParGCCardsPerStrideChunk * n_strides;
  }
}

void
CMSCardTable::
process_chunk_boundaries(Space* sp,
                         DirtyCardToOopClosure* dcto_cl,
                         MemRegion chunk_mr,
                         MemRegion used,
                         CardValue** lowest_non_clean,
                         uintptr_t lowest_non_clean_base_chunk_index,
                         size_t    lowest_non_clean_chunk_size)
{
  // We must worry about non-array objects that cross chunk boundaries,
  // because such objects are both precisely and imprecisely marked:
  // .. if the head of such an object is dirty, the entire object
  //    needs to be scanned, under the interpretation that this
  //    was an imprecise mark
  // .. if the head of such an object is not dirty, we can assume
  //    precise marking and it's efficient to scan just the dirty
  //    cards.
  // In either case, each scanned reference must be scanned precisely
  // once so as to avoid cloning of a young referent. For efficiency,
  // our closures depend on this property and do not protect against
  // double scans.
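
  // Pictorially (an illustrative sketch, not to scale):
  //
  //                 chunk boundary
  //                       |
  //   ... ----------------+---------------- ...
  //            [ head.....|.....tail ]   <- non-array object straddling it
  //
  //   head card dirty -> treat as an imprecise mark: scan the whole
  //                      object, including the part in the next chunk;
  //   head card clean -> marks were precise: scan only the object's
  //                      dirty cards.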

  uintptr_t start_chunk_index = addr_to_chunk_index(chunk_mr.start());
  assert(start_chunk_index >= lowest_non_clean_base_chunk_index, "Bounds error.");
  uintptr_t cur_chunk_index = start_chunk_index - lowest_non_clean_base_chunk_index;

  // First, set "our" lowest_non_clean entry, which would be
  // used by the thread scanning an adjoining left chunk with
  // a non-array object straddling the mutual boundary.
  // Find the object that spans our boundary, if one exists.
  // first_block is the block possibly straddling our left boundary.
  HeapWord* first_block = sp->block_start(chunk_mr.start());
  assert((chunk_mr.start() != used.start()) || (first_block == chunk_mr.start()),
         "First chunk should always have a co-initial block");
  // Does the block straddle the chunk's left boundary, and is it
  // a non-array object?
  if (first_block < chunk_mr.start()        // first block straddles left bdry
      && sp->block_is_obj(first_block)      // first block is an object
      && !(oop(first_block)->is_objArray()  // first block is not an array (arrays are precisely dirtied)
           || oop(first_block)->is_typeArray())) {
    // Find our least non-clean card, so that a left neighbor
    // does not scan an object straddling the mutual boundary
    // too far to the right, and attempt to scan a portion of
    // that object twice.
    CardValue* first_dirty_card = NULL;
    CardValue* last_card_of_first_obj =
        byte_for(first_block + sp->block_size(first_block) - 1);
    CardValue* first_card_of_cur_chunk = byte_for(chunk_mr.start());
    CardValue* last_card_of_cur_chunk  = byte_for(chunk_mr.last());
    CardValue* last_card_to_check = MIN2(last_card_of_cur_chunk, last_card_of_first_obj);
    // Note that this does not need to go beyond our last card
    // if our first object completely straddles this chunk.
    for (CardValue* cur = first_card_of_cur_chunk;
         cur <= last_card_to_check; cur++) {
      CardValue val = *cur;
      if (card_will_be_scanned(val)) {
        first_dirty_card = cur;
        break;
      } else {
        assert(!card_may_have_been_dirty(val), "Error");
      }
    }
    if (first_dirty_card != NULL) {
      assert(cur_chunk_index < lowest_non_clean_chunk_size, "Bounds error.");
      assert(lowest_non_clean[cur_chunk_index] == NULL,
             "Write exactly once : value should be stable hereafter for this round");
      lowest_non_clean[cur_chunk_index] = first_dirty_card;
    }
  } else {
    // In this case we can help our neighbor by just asking them
    // to stop at our first card (even though it may not be dirty).
    assert(lowest_non_clean[cur_chunk_index] == NULL, "Write once : value should be stable hereafter");
    CardValue* first_card_of_cur_chunk = byte_for(chunk_mr.start());
    lowest_non_clean[cur_chunk_index] = first_card_of_cur_chunk;
  }
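
  // To summarize (not asserted in code): lowest_non_clean[cur_chunk_index]
  // now holds either the first card of this chunk (no non-array object
  // straddles our left boundary), the leftmost card of the straddling
  // object that will actually be scanned, or NULL if the straddling
  // object has no scannable card in this chunk. The thread processing
  // the chunk to our left reads this entry (via the LNC array, below)
  // to cap its own max_to_do.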

  // Next, set our own max_to_do, the exclusive upper bound on how far
  // we will scan past the right end of our chunk.
  HeapWord* max_to_do = NULL;
  if (chunk_mr.end() < used.end()) {
    // This is not the last chunk in the used region.
    // What is our last block? We check the first block of
    // the next (right) chunk rather than strictly check our last block
    // because it's potentially more efficient to do so.
    HeapWord* const last_block = sp->block_start(chunk_mr.end());
    assert(last_block <= chunk_mr.end(), "In case this property changes.");
    if ((last_block == chunk_mr.end())     // our last block does not straddle boundary
        || !sp->block_is_obj(last_block)   // last_block isn't an object
        || oop(last_block)->is_objArray()  // last_block is an array (precisely marked)
        || oop(last_block)->is_typeArray()) {
      max_to_do = chunk_mr.end();
    } else {
      assert(last_block < chunk_mr.end(), "Tautology");
      // It is a non-array object that straddles the right boundary of this chunk.
      // last_obj_card is the card corresponding to the start of the last object
      // in the chunk. Note that the last object may not start in
      // the chunk.
      CardValue* const last_obj_card = byte_for(last_block);
      const CardValue val = *last_obj_card;
      if (!card_will_be_scanned(val)) {
        assert(!card_may_have_been_dirty(val), "Error");
        // The card containing the head is not dirty. Any marks on
        // subsequent cards still in this chunk must have been made
        // precisely; we can cap processing at the end of our chunk.
        max_to_do = chunk_mr.end();
      } else {
        // The last object must be considered dirty, and extends onto the
        // following chunk. Look for a dirty card in that chunk that will
        // bound our processing.
        CardValue* limit_card = NULL;
        const size_t last_block_size = sp->block_size(last_block);
        CardValue* const last_card_of_last_obj =
            byte_for(last_block + last_block_size - 1);
        CardValue* const first_card_of_next_chunk = byte_for(chunk_mr.end());
        // This search potentially goes a long distance looking
        // for the next card that will be scanned, terminating
        // at the end of the last_block, if no earlier dirty card
        // is found.
        assert(byte_for(chunk_mr.end()) - byte_for(chunk_mr.start()) == ParGCCardsPerStrideChunk,
               "last card of next chunk may be wrong");
        for (CardValue* cur = first_card_of_next_chunk;
             cur <= last_card_of_last_obj; cur++) {
          const CardValue val = *cur;
          if (card_will_be_scanned(val)) {
            limit_card = cur;
            break;
          } else {
            assert(!card_may_have_been_dirty(val), "Error: card can't be skipped");
          }
        }
        if (limit_card != NULL) {
          max_to_do = addr_for(limit_card);
          assert(limit_card != NULL && max_to_do != NULL, "Error");
        } else {
          // The following is a pessimistic value, because it's possible
          // that a dirty card on a subsequent chunk has been cleared by
          // the time we get to look at it; we'll correct for that further below,
          // using the LNC array which records the least non-clean card
          // before cards were cleared in a particular chunk.
          limit_card = last_card_of_last_obj;
          max_to_do  = last_block + last_block_size;
          assert(limit_card != NULL && max_to_do != NULL, "Error");
        }
        assert(0 < cur_chunk_index + 1 && cur_chunk_index + 1 < lowest_non_clean_chunk_size,
               "Bounds error.");
        // It is possible that a dirty card for the last object may have been
        // cleared before we had a chance to examine it. In that case, the value
        // will have been logged in the LNC for that chunk.
        // We need to examine as many chunks to the right as this object
        // covers. However, we need to bound this checking to the largest
        // entry in the LNC array: this is because the heap may expand
        // after the LNC array has been created but before we reach this point,
        // and the last block in our chunk may have been expanded to include
        // the expansion delta (and possibly subsequently allocated from, so
        // it wouldn't be sufficient to check whether that last block was
        // or was not an object at this point).
        uintptr_t last_chunk_index_to_check = addr_to_chunk_index(last_block + last_block_size - 1)
                                              - lowest_non_clean_base_chunk_index;
        const uintptr_t last_chunk_index    = addr_to_chunk_index(used.last())
                                              - lowest_non_clean_base_chunk_index;
        if (last_chunk_index_to_check > last_chunk_index) {
          assert(last_block + last_block_size > used.end(),
                 "Inconsistency detected: last_block [" PTR_FORMAT "," PTR_FORMAT "]"
                 " does not exceed used.end() = " PTR_FORMAT ","
                 " yet last_chunk_index_to_check " INTPTR_FORMAT
                 " exceeds last_chunk_index " INTPTR_FORMAT,
                 p2i(last_block), p2i(last_block + last_block_size),
                 p2i(used.end()),
                 last_chunk_index_to_check, last_chunk_index);
          assert(sp->used_region().end() > used.end(),
                 "Expansion did not happen: "
                 "[" PTR_FORMAT "," PTR_FORMAT ") -> [" PTR_FORMAT "," PTR_FORMAT ")",
                 p2i(sp->used_region().start()), p2i(sp->used_region().end()),
                 p2i(used.start()), p2i(used.end()));
          last_chunk_index_to_check = last_chunk_index;
        }
        for (uintptr_t lnc_index = cur_chunk_index + 1;
             lnc_index <= last_chunk_index_to_check;
             lnc_index++) {
          CardValue* lnc_card = lowest_non_clean[lnc_index];
          if (lnc_card != NULL) {
            // We can stop at the first non-NULL entry we find.
            if (lnc_card <= limit_card) {
              limit_card = lnc_card;
              max_to_do = addr_for(limit_card);
              assert(limit_card != NULL && max_to_do != NULL, "Error");
            }
            // In any case, we break now.
            break;
          } // else continue to look for a non-NULL entry if any
        }
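
        // Illustrative scenario for the loop above: suppose the straddling
        // object extends into chunk c+1, and the thread owning c+1 recorded
        // card X in lowest_non_clean[c+1] before that card was cleared.
        // Even though *X may now read clean, capping limit_card at X (and
        // max_to_do at addr_for(X)) makes us stop exactly where our right
        // neighbor takes over the straddling object, so no portion of it
        // is scanned twice. (The chunk index c and card X are illustrative
        // names, not variables in this code.)
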
        assert(limit_card != NULL && max_to_do != NULL, "Error");
      }
      assert(max_to_do != NULL, "OOPS 1!");
    }
    assert(max_to_do != NULL, "OOPS 2!");
  } else {
    max_to_do = used.end();
  }
  assert(max_to_do != NULL, "OOPS 3!");
  // Now we can set the closure we're using so it doesn't go beyond
  // max_to_do.
  dcto_cl->set_min_done(max_to_do);
#ifndef PRODUCT
  dcto_cl->set_last_bottom(max_to_do);
#endif
}

void
CMSCardTable::
get_LNC_array_for_space(Space* sp,
                        CardValue**& lowest_non_clean,
                        uintptr_t& lowest_non_clean_base_chunk_index,
                        size_t& lowest_non_clean_chunk_size) {

  int i = find_covering_region_containing(sp->bottom());
  MemRegion covered = _covered[i];
  size_t n_chunks = chunks_to_cover(covered);

  // Only the first thread to obtain the lock will resize the
  // LNC array for the covered region. Any later expansion can't affect
  // the used_at_save_marks region.
  // (I observed a bug in which the first thread to execute this would
  // resize, and then it would cause "expand_and_allocate" that would
  // increase the number of chunks in the covered region. Then a second
  // thread would come and execute this, see that the size didn't match,
  // and free and allocate again. So the first thread would be using a
  // freed "_lowest_non_clean" array.)

  // Do a dirty read here. If we pass the conditional then take the rare
  // event lock and do the read again in case some other thread had already
  // succeeded and done the resize.
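
  // In distilled form, what follows is classic double-checked locking
  // with acquire/release (a sketch of the code below, not additional
  // logic; "flag" stands for _last_LNC_resizing_collection[i]):
  //
  //   if (load_acquire(&flag) != cur_collection) {   // optimistic racy read
  //     MutexLocker x(ParGCRareEvent_lock);
  //     if (load_acquire(&flag) != cur_collection) { // re-check under the lock
  //       ... free/allocate and initialize the LNC array ...
  //       release_store(&flag, cur_collection);      // publish after init
  //     }
  //   }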
  int cur_collection = CMSHeap::heap()->total_collections();
  // Updated _last_LNC_resizing_collection[i] must not be visible before
  // _lowest_non_clean and friends are visible. Therefore use acquire/release
  // to guarantee this on non-TSO architectures.
  if (OrderAccess::load_acquire(&_last_LNC_resizing_collection[i]) != cur_collection) {
    MutexLocker x(ParGCRareEvent_lock);
    // This load_acquire is here for clarity only. The MutexLocker already fences.
    if (OrderAccess::load_acquire(&_last_LNC_resizing_collection[i]) != cur_collection) {
      if (_lowest_non_clean[i] == NULL ||
          n_chunks != _lowest_non_clean_chunk_size[i]) {

        // Should we delete the old?
        if (_lowest_non_clean[i] != NULL) {
          assert(n_chunks != _lowest_non_clean_chunk_size[i],
                 "logical consequence");
          FREE_C_HEAP_ARRAY(CardPtr, _lowest_non_clean[i]);
          _lowest_non_clean[i] = NULL;
        }
        // Now allocate a new one if necessary.
        if (_lowest_non_clean[i] == NULL) {
          _lowest_non_clean[i]                  = NEW_C_HEAP_ARRAY(CardPtr, n_chunks, mtGC);
          _lowest_non_clean_chunk_size[i]       = n_chunks;
          _lowest_non_clean_base_chunk_index[i] = addr_to_chunk_index(covered.start());
          for (int j = 0; j < (int)n_chunks; j++) {
            _lowest_non_clean[i][j] = NULL;
          }
        }
      }
      // Make sure this gets visible only after _lowest_non_clean* was initialized.
      OrderAccess::release_store(&_last_LNC_resizing_collection[i], cur_collection);
    }
  }
  // In any case, now do the initialization.
  lowest_non_clean                  = _lowest_non_clean[i];
  lowest_non_clean_base_chunk_index = _lowest_non_clean_base_chunk_index[i];
  lowest_non_clean_chunk_size      = _lowest_non_clean_chunk_size[i];
}

#ifdef ASSERT
void CMSCardTable::verify_used_region_at_save_marks(Space* sp) const {
  MemRegion ur    = sp->used_region();
  MemRegion urasm = sp->used_region_at_save_marks();

  if (!ur.contains(urasm)) {
    log_warning(gc)("CMS+ParNew: Did you forget to call save_marks()? "
                    "[" PTR_FORMAT ", " PTR_FORMAT ") is not contained in "
                    "[" PTR_FORMAT ", " PTR_FORMAT ")",
                    p2i(urasm.start()), p2i(urasm.end()), p2i(ur.start()), p2i(ur.end()));
    MemRegion ur2    = sp->used_region();
    MemRegion urasm2 = sp->used_region_at_save_marks();
    if (!ur.equals(ur2)) {
      log_warning(gc)("CMS+ParNew: Flickering used_region()!!");
    }
    if (!urasm.equals(urasm2)) {
      log_warning(gc)("CMS+ParNew: Flickering used_region_at_save_marks()!!");
    }
    ShouldNotReachHere();
  }
}
#endif // ASSERT