src/share/vm/gc_implementation/g1/concurrentMark.cpp

Wed, 10 Sep 2014 13:01:13 -0700

author
jcoomes
date
Wed, 10 Sep 2014 13:01:13 -0700
changeset 7159
e5668dcf12e9
parent 7100
edb5f3b38aab
child 7195
c02ec279b062
permissions
-rw-r--r--

8057818: collect allocation context statistics at gc pauses
Reviewed-by: mikael, jmasa

ysr@777 1 /*
drchase@6680 2 * Copyright (c) 2001, 2014, Oracle and/or its affiliates. All rights reserved.
ysr@777 3 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
ysr@777 4 *
ysr@777 5 * This code is free software; you can redistribute it and/or modify it
ysr@777 6 * under the terms of the GNU General Public License version 2 only, as
ysr@777 7 * published by the Free Software Foundation.
ysr@777 8 *
ysr@777 9 * This code is distributed in the hope that it will be useful, but WITHOUT
ysr@777 10 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
ysr@777 11 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
ysr@777 12 * version 2 for more details (a copy is included in the LICENSE file that
ysr@777 13 * accompanied this code).
ysr@777 14 *
ysr@777 15 * You should have received a copy of the GNU General Public License version
ysr@777 16 * 2 along with this work; if not, write to the Free Software Foundation,
ysr@777 17 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
ysr@777 18 *
trims@1907 19 * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
trims@1907 20 * or visit www.oracle.com if you need additional information or have any
trims@1907 21 * questions.
ysr@777 22 *
ysr@777 23 */
ysr@777 24
stefank@2314 25 #include "precompiled.hpp"
stefank@2314 26 #include "classfile/symbolTable.hpp"
stefank@6992 27 #include "code/codeCache.hpp"
tonyp@2968 28 #include "gc_implementation/g1/concurrentMark.inline.hpp"
stefank@2314 29 #include "gc_implementation/g1/concurrentMarkThread.inline.hpp"
stefank@2314 30 #include "gc_implementation/g1/g1CollectedHeap.inline.hpp"
stefank@2314 31 #include "gc_implementation/g1/g1CollectorPolicy.hpp"
tonyp@3114 32 #include "gc_implementation/g1/g1ErgoVerbose.hpp"
brutisso@3710 33 #include "gc_implementation/g1/g1Log.hpp"
tonyp@2968 34 #include "gc_implementation/g1/g1OopClosures.inline.hpp"
stefank@2314 35 #include "gc_implementation/g1/g1RemSet.hpp"
tonyp@3416 36 #include "gc_implementation/g1/heapRegion.inline.hpp"
tschatzl@7091 37 #include "gc_implementation/g1/heapRegionManager.inline.hpp"
stefank@2314 38 #include "gc_implementation/g1/heapRegionRemSet.hpp"
tschatzl@7051 39 #include "gc_implementation/g1/heapRegionSet.inline.hpp"
kamg@2445 40 #include "gc_implementation/shared/vmGCOperations.hpp"
sla@5237 41 #include "gc_implementation/shared/gcTimer.hpp"
sla@5237 42 #include "gc_implementation/shared/gcTrace.hpp"
sla@5237 43 #include "gc_implementation/shared/gcTraceTime.hpp"
stefank@6992 44 #include "memory/allocation.hpp"
stefank@2314 45 #include "memory/genOopClosures.inline.hpp"
stefank@2314 46 #include "memory/referencePolicy.hpp"
stefank@2314 47 #include "memory/resourceArea.hpp"
stefank@2314 48 #include "oops/oop.inline.hpp"
stefank@2314 49 #include "runtime/handles.inline.hpp"
stefank@2314 50 #include "runtime/java.hpp"
goetz@6912 51 #include "runtime/prefetch.inline.hpp"
zgu@3900 52 #include "services/memTracker.hpp"
ysr@777 53
brutisso@3455 54 // Concurrent marking bit map wrapper
ysr@777 55
johnc@4333 56 CMBitMapRO::CMBitMapRO(int shifter) :
johnc@4333 57 _bm(),
ysr@777 58 _shifter(shifter) {
johnc@4333 59 _bmStartWord = 0;
johnc@4333 60 _bmWordSize = 0;
ysr@777 61 }
ysr@777 62
stefank@6992 63 HeapWord* CMBitMapRO::getNextMarkedWordAddress(const HeapWord* addr,
stefank@6992 64 const HeapWord* limit) const {
ysr@777 65 // First we must round addr *up* to a possible object boundary.
ysr@777 66 addr = (HeapWord*)align_size_up((intptr_t)addr,
ysr@777 67 HeapWordSize << _shifter);
ysr@777 68 size_t addrOffset = heapWordToOffset(addr);
tonyp@2973 69 if (limit == NULL) {
tonyp@2973 70 limit = _bmStartWord + _bmWordSize;
tonyp@2973 71 }
ysr@777 72 size_t limitOffset = heapWordToOffset(limit);
ysr@777 73 size_t nextOffset = _bm.get_next_one_offset(addrOffset, limitOffset);
ysr@777 74 HeapWord* nextAddr = offsetToHeapWord(nextOffset);
ysr@777 75 assert(nextAddr >= addr, "get_next_one postcondition");
ysr@777 76 assert(nextAddr == limit || isMarked(nextAddr),
ysr@777 77 "get_next_one postcondition");
ysr@777 78 return nextAddr;
ysr@777 79 }
ysr@777 80
stefank@6992 81 HeapWord* CMBitMapRO::getNextUnmarkedWordAddress(const HeapWord* addr,
stefank@6992 82 const HeapWord* limit) const {
ysr@777 83 size_t addrOffset = heapWordToOffset(addr);
tonyp@2973 84 if (limit == NULL) {
tonyp@2973 85 limit = _bmStartWord + _bmWordSize;
tonyp@2973 86 }
ysr@777 87 size_t limitOffset = heapWordToOffset(limit);
ysr@777 88 size_t nextOffset = _bm.get_next_zero_offset(addrOffset, limitOffset);
ysr@777 89 HeapWord* nextAddr = offsetToHeapWord(nextOffset);
ysr@777 90 assert(nextAddr >= addr, "get_next_one postcondition");
ysr@777 91 assert(nextAddr == limit || !isMarked(nextAddr),
ysr@777 92 "get_next_one postcondition");
ysr@777 93 return nextAddr;
ysr@777 94 }
ysr@777 95
ysr@777 96 int CMBitMapRO::heapWordDiffToOffsetDiff(size_t diff) const {
ysr@777 97 assert((diff & ((1 << _shifter) - 1)) == 0, "argument check");
ysr@777 98 return (int) (diff >> _shifter);
ysr@777 99 }
ysr@777 100
ysr@777 101 #ifndef PRODUCT
tschatzl@7051 102 bool CMBitMapRO::covers(MemRegion heap_rs) const {
ysr@777 103 // assert(_bm.map() == _virtual_space.low(), "map inconsistency");
brutisso@4061 104 assert(((size_t)_bm.size() * ((size_t)1 << _shifter)) == _bmWordSize,
ysr@777 105 "size inconsistency");
tschatzl@7051 106 return _bmStartWord == (HeapWord*)(heap_rs.start()) &&
tschatzl@7051 107 _bmWordSize == heap_rs.word_size();
ysr@777 108 }
ysr@777 109 #endif
ysr@777 110
stefank@4904 111 void CMBitMapRO::print_on_error(outputStream* st, const char* prefix) const {
stefank@4904 112 _bm.print_on_error(st, prefix);
stefank@4904 113 }
stefank@4904 114
tschatzl@7051 115 size_t CMBitMap::compute_size(size_t heap_size) {
tschatzl@7051 116 return heap_size / mark_distance();
tschatzl@7051 117 }
tschatzl@7051 118
tschatzl@7051 119 size_t CMBitMap::mark_distance() {
tschatzl@7051 120 return MinObjAlignmentInBytes * BitsPerByte;
tschatzl@7051 121 }
tschatzl@7051 122
tschatzl@7051 123 void CMBitMap::initialize(MemRegion heap, G1RegionToSpaceMapper* storage) {
tschatzl@7051 124 _bmStartWord = heap.start();
tschatzl@7051 125 _bmWordSize = heap.word_size();
tschatzl@7051 126
tschatzl@7051 127 _bm.set_map((BitMap::bm_word_t*) storage->reserved().start());
tschatzl@7051 128 _bm.set_size(_bmWordSize >> _shifter);
tschatzl@7051 129
tschatzl@7051 130 storage->set_mapping_changed_listener(&_listener);
tschatzl@7051 131 }
tschatzl@7051 132
tschatzl@7051 133 void CMBitMapMappingChangedListener::on_commit(uint start_region, size_t num_regions) {
tschatzl@7051 134 // We need to clear the bitmap on commit, removing any existing information.
tschatzl@7051 135 MemRegion mr(G1CollectedHeap::heap()->bottom_addr_for_region(start_region), num_regions * HeapRegion::GrainWords);
tschatzl@7051 136 _bm->clearRange(mr);
tschatzl@7051 137 }
tschatzl@7051 138
tschatzl@7051 139 // Closure used for clearing the given mark bitmap.
tschatzl@7051 140 class ClearBitmapHRClosure : public HeapRegionClosure {
tschatzl@7051 141 private:
tschatzl@7051 142 ConcurrentMark* _cm;
tschatzl@7051 143 CMBitMap* _bitmap;
tschatzl@7051 144 bool _may_yield; // The closure may yield during iteration. If yielded, abort the iteration.
tschatzl@7051 145 public:
tschatzl@7051 146 ClearBitmapHRClosure(ConcurrentMark* cm, CMBitMap* bitmap, bool may_yield) : HeapRegionClosure(), _cm(cm), _bitmap(bitmap), _may_yield(may_yield) {
tschatzl@7051 147 assert(!may_yield || cm != NULL, "CM must be non-NULL if this closure is expected to yield.");
tschatzl@7051 148 }
tschatzl@7051 149
tschatzl@7051 150 virtual bool doHeapRegion(HeapRegion* r) {
tschatzl@7051 151 size_t const chunk_size_in_words = M / HeapWordSize;
tschatzl@7051 152
tschatzl@7051 153 HeapWord* cur = r->bottom();
tschatzl@7051 154 HeapWord* const end = r->end();
tschatzl@7051 155
tschatzl@7051 156 while (cur < end) {
tschatzl@7051 157 MemRegion mr(cur, MIN2(cur + chunk_size_in_words, end));
tschatzl@7051 158 _bitmap->clearRange(mr);
tschatzl@7051 159
tschatzl@7051 160 cur += chunk_size_in_words;
tschatzl@7051 161
tschatzl@7051 162 // Abort iteration if after yielding the marking has been aborted.
tschatzl@7051 163 if (_may_yield && _cm->do_yield_check() && _cm->has_aborted()) {
tschatzl@7051 164 return true;
tschatzl@7051 165 }
tschatzl@7051 166 // Repeat the asserts from before the start of the closure. We will do them
tschatzl@7051 167 // as asserts here to minimize their overhead on the product. However, we
tschatzl@7051 168 // will have them as guarantees at the beginning / end of the bitmap
tschatzl@7051 169 // clearing to get some checking in the product.
tschatzl@7051 170 assert(!_may_yield || _cm->cmThread()->during_cycle(), "invariant");
tschatzl@7051 171 assert(!_may_yield || !G1CollectedHeap::heap()->mark_in_progress(), "invariant");
tschatzl@7051 172 }
tschatzl@7051 173
johnc@4333 174 return false;
johnc@4333 175 }
tschatzl@7051 176 };
johnc@4333 177
ysr@777 178 void CMBitMap::clearAll() {
tschatzl@7051 179 ClearBitmapHRClosure cl(NULL, this, false /* may_yield */);
tschatzl@7051 180 G1CollectedHeap::heap()->heap_region_iterate(&cl);
tschatzl@7051 181 guarantee(cl.complete(), "Must have completed iteration.");
ysr@777 182 return;
ysr@777 183 }
ysr@777 184
ysr@777 185 void CMBitMap::markRange(MemRegion mr) {
ysr@777 186 mr.intersection(MemRegion(_bmStartWord, _bmWordSize));
ysr@777 187 assert(!mr.is_empty(), "unexpected empty region");
ysr@777 188 assert((offsetToHeapWord(heapWordToOffset(mr.end())) ==
ysr@777 189 ((HeapWord *) mr.end())),
ysr@777 190 "markRange memory region end is not card aligned");
ysr@777 191 // convert address range into offset range
ysr@777 192 _bm.at_put_range(heapWordToOffset(mr.start()),
ysr@777 193 heapWordToOffset(mr.end()), true);
ysr@777 194 }
ysr@777 195
ysr@777 196 void CMBitMap::clearRange(MemRegion mr) {
ysr@777 197 mr.intersection(MemRegion(_bmStartWord, _bmWordSize));
ysr@777 198 assert(!mr.is_empty(), "unexpected empty region");
ysr@777 199 // convert address range into offset range
ysr@777 200 _bm.at_put_range(heapWordToOffset(mr.start()),
ysr@777 201 heapWordToOffset(mr.end()), false);
ysr@777 202 }
ysr@777 203
ysr@777 204 MemRegion CMBitMap::getAndClearMarkedRegion(HeapWord* addr,
ysr@777 205 HeapWord* end_addr) {
ysr@777 206 HeapWord* start = getNextMarkedWordAddress(addr);
ysr@777 207 start = MIN2(start, end_addr);
ysr@777 208 HeapWord* end = getNextUnmarkedWordAddress(start);
ysr@777 209 end = MIN2(end, end_addr);
ysr@777 210 assert(start <= end, "Consistency check");
ysr@777 211 MemRegion mr(start, end);
ysr@777 212 if (!mr.is_empty()) {
ysr@777 213 clearRange(mr);
ysr@777 214 }
ysr@777 215 return mr;
ysr@777 216 }
ysr@777 217
ysr@777 218 CMMarkStack::CMMarkStack(ConcurrentMark* cm) :
ysr@777 219 _base(NULL), _cm(cm)
ysr@777 220 #ifdef ASSERT
ysr@777 221 , _drain_in_progress(false)
ysr@777 222 , _drain_in_progress_yields(false)
ysr@777 223 #endif
ysr@777 224 {}
ysr@777 225
johnc@4333 226 bool CMMarkStack::allocate(size_t capacity) {
johnc@4333 227 // allocate a stack of the requisite depth
johnc@4333 228 ReservedSpace rs(ReservedSpace::allocation_align_size_up(capacity * sizeof(oop)));
johnc@4333 229 if (!rs.is_reserved()) {
johnc@4333 230 warning("ConcurrentMark MarkStack allocation failure");
johnc@4333 231 return false;
tonyp@2973 232 }
johnc@4333 233 MemTracker::record_virtual_memory_type((address)rs.base(), mtGC);
johnc@4333 234 if (!_virtual_space.initialize(rs, rs.size())) {
johnc@4333 235 warning("ConcurrentMark MarkStack backing store failure");
johnc@4333 236 // Release the virtual memory reserved for the marking stack
johnc@4333 237 rs.release();
johnc@4333 238 return false;
johnc@4333 239 }
johnc@4333 240 assert(_virtual_space.committed_size() == rs.size(),
johnc@4333 241 "Didn't reserve backing store for all of ConcurrentMark stack?");
johnc@4333 242 _base = (oop*) _virtual_space.low();
johnc@4333 243 setEmpty();
johnc@4333 244 _capacity = (jint) capacity;
tonyp@3416 245 _saved_index = -1;
johnc@4386 246 _should_expand = false;
ysr@777 247 NOT_PRODUCT(_max_depth = 0);
johnc@4333 248 return true;
johnc@4333 249 }
johnc@4333 250
johnc@4333 251 void CMMarkStack::expand() {
johnc@4333 252 // Called, during remark, if we've overflown the marking stack during marking.
johnc@4333 253 assert(isEmpty(), "stack should been emptied while handling overflow");
johnc@4333 254 assert(_capacity <= (jint) MarkStackSizeMax, "stack bigger than permitted");
johnc@4333 255 // Clear expansion flag
johnc@4333 256 _should_expand = false;
johnc@4333 257 if (_capacity == (jint) MarkStackSizeMax) {
johnc@4333 258 if (PrintGCDetails && Verbose) {
johnc@4333 259 gclog_or_tty->print_cr(" (benign) Can't expand marking stack capacity, at max size limit");
johnc@4333 260 }
johnc@4333 261 return;
johnc@4333 262 }
johnc@4333 263 // Double capacity if possible
johnc@4333 264 jint new_capacity = MIN2(_capacity*2, (jint) MarkStackSizeMax);
johnc@4333 265 // Do not give up existing stack until we have managed to
johnc@4333 266 // get the double capacity that we desired.
johnc@4333 267 ReservedSpace rs(ReservedSpace::allocation_align_size_up(new_capacity *
johnc@4333 268 sizeof(oop)));
johnc@4333 269 if (rs.is_reserved()) {
johnc@4333 270 // Release the backing store associated with old stack
johnc@4333 271 _virtual_space.release();
johnc@4333 272 // Reinitialize virtual space for new stack
johnc@4333 273 if (!_virtual_space.initialize(rs, rs.size())) {
johnc@4333 274 fatal("Not enough swap for expanded marking stack capacity");
johnc@4333 275 }
johnc@4333 276 _base = (oop*)(_virtual_space.low());
johnc@4333 277 _index = 0;
johnc@4333 278 _capacity = new_capacity;
johnc@4333 279 } else {
johnc@4333 280 if (PrintGCDetails && Verbose) {
johnc@4333 281 // Failed to double capacity, continue;
johnc@4333 282 gclog_or_tty->print(" (benign) Failed to expand marking stack capacity from "
johnc@4333 283 SIZE_FORMAT"K to " SIZE_FORMAT"K",
johnc@4333 284 _capacity / K, new_capacity / K);
johnc@4333 285 }
johnc@4333 286 }
johnc@4333 287 }
johnc@4333 288
johnc@4333 289 void CMMarkStack::set_should_expand() {
johnc@4333 290 // If we're resetting the marking state because of an
johnc@4333 291 // marking stack overflow, record that we should, if
johnc@4333 292 // possible, expand the stack.
johnc@4333 293 _should_expand = _cm->has_overflown();
ysr@777 294 }
ysr@777 295
ysr@777 296 CMMarkStack::~CMMarkStack() {
tonyp@2973 297 if (_base != NULL) {
johnc@4333 298 _base = NULL;
johnc@4333 299 _virtual_space.release();
tonyp@2973 300 }
ysr@777 301 }
ysr@777 302
ysr@777 303 void CMMarkStack::par_push(oop ptr) {
ysr@777 304 while (true) {
ysr@777 305 if (isFull()) {
ysr@777 306 _overflow = true;
ysr@777 307 return;
ysr@777 308 }
ysr@777 309 // Otherwise...
ysr@777 310 jint index = _index;
ysr@777 311 jint next_index = index+1;
ysr@777 312 jint res = Atomic::cmpxchg(next_index, &_index, index);
ysr@777 313 if (res == index) {
ysr@777 314 _base[index] = ptr;
ysr@777 315 // Note that we don't maintain this atomically. We could, but it
ysr@777 316 // doesn't seem necessary.
ysr@777 317 NOT_PRODUCT(_max_depth = MAX2(_max_depth, next_index));
ysr@777 318 return;
ysr@777 319 }
ysr@777 320 // Otherwise, we need to try again.
ysr@777 321 }
ysr@777 322 }
ysr@777 323
ysr@777 324 void CMMarkStack::par_adjoin_arr(oop* ptr_arr, int n) {
ysr@777 325 while (true) {
ysr@777 326 if (isFull()) {
ysr@777 327 _overflow = true;
ysr@777 328 return;
ysr@777 329 }
ysr@777 330 // Otherwise...
ysr@777 331 jint index = _index;
ysr@777 332 jint next_index = index + n;
ysr@777 333 if (next_index > _capacity) {
ysr@777 334 _overflow = true;
ysr@777 335 return;
ysr@777 336 }
ysr@777 337 jint res = Atomic::cmpxchg(next_index, &_index, index);
ysr@777 338 if (res == index) {
ysr@777 339 for (int i = 0; i < n; i++) {
johnc@4333 340 int ind = index + i;
ysr@777 341 assert(ind < _capacity, "By overflow test above.");
ysr@777 342 _base[ind] = ptr_arr[i];
ysr@777 343 }
ysr@777 344 NOT_PRODUCT(_max_depth = MAX2(_max_depth, next_index));
ysr@777 345 return;
ysr@777 346 }
ysr@777 347 // Otherwise, we need to try again.
ysr@777 348 }
ysr@777 349 }
ysr@777 350
ysr@777 351 void CMMarkStack::par_push_arr(oop* ptr_arr, int n) {
ysr@777 352 MutexLockerEx x(ParGCRareEvent_lock, Mutex::_no_safepoint_check_flag);
ysr@777 353 jint start = _index;
ysr@777 354 jint next_index = start + n;
ysr@777 355 if (next_index > _capacity) {
ysr@777 356 _overflow = true;
ysr@777 357 return;
ysr@777 358 }
ysr@777 359 // Otherwise.
ysr@777 360 _index = next_index;
ysr@777 361 for (int i = 0; i < n; i++) {
ysr@777 362 int ind = start + i;
tonyp@1458 363 assert(ind < _capacity, "By overflow test above.");
ysr@777 364 _base[ind] = ptr_arr[i];
ysr@777 365 }
johnc@4333 366 NOT_PRODUCT(_max_depth = MAX2(_max_depth, next_index));
ysr@777 367 }
ysr@777 368
ysr@777 369 bool CMMarkStack::par_pop_arr(oop* ptr_arr, int max, int* n) {
ysr@777 370 MutexLockerEx x(ParGCRareEvent_lock, Mutex::_no_safepoint_check_flag);
ysr@777 371 jint index = _index;
ysr@777 372 if (index == 0) {
ysr@777 373 *n = 0;
ysr@777 374 return false;
ysr@777 375 } else {
ysr@777 376 int k = MIN2(max, index);
johnc@4333 377 jint new_ind = index - k;
ysr@777 378 for (int j = 0; j < k; j++) {
ysr@777 379 ptr_arr[j] = _base[new_ind + j];
ysr@777 380 }
ysr@777 381 _index = new_ind;
ysr@777 382 *n = k;
ysr@777 383 return true;
ysr@777 384 }
ysr@777 385 }
ysr@777 386
ysr@777 387 template<class OopClosureClass>
ysr@777 388 bool CMMarkStack::drain(OopClosureClass* cl, CMBitMap* bm, bool yield_after) {
ysr@777 389 assert(!_drain_in_progress || !_drain_in_progress_yields || yield_after
ysr@777 390 || SafepointSynchronize::is_at_safepoint(),
ysr@777 391 "Drain recursion must be yield-safe.");
ysr@777 392 bool res = true;
ysr@777 393 debug_only(_drain_in_progress = true);
ysr@777 394 debug_only(_drain_in_progress_yields = yield_after);
ysr@777 395 while (!isEmpty()) {
ysr@777 396 oop newOop = pop();
ysr@777 397 assert(G1CollectedHeap::heap()->is_in_reserved(newOop), "Bad pop");
ysr@777 398 assert(newOop->is_oop(), "Expected an oop");
ysr@777 399 assert(bm == NULL || bm->isMarked((HeapWord*)newOop),
ysr@777 400 "only grey objects on this stack");
ysr@777 401 newOop->oop_iterate(cl);
ysr@777 402 if (yield_after && _cm->do_yield_check()) {
tonyp@2973 403 res = false;
tonyp@2973 404 break;
ysr@777 405 }
ysr@777 406 }
ysr@777 407 debug_only(_drain_in_progress = false);
ysr@777 408 return res;
ysr@777 409 }
ysr@777 410
tonyp@3416 411 void CMMarkStack::note_start_of_gc() {
tonyp@3416 412 assert(_saved_index == -1,
tonyp@3416 413 "note_start_of_gc()/end_of_gc() bracketed incorrectly");
tonyp@3416 414 _saved_index = _index;
tonyp@3416 415 }
tonyp@3416 416
tonyp@3416 417 void CMMarkStack::note_end_of_gc() {
tonyp@3416 418 // This is intentionally a guarantee, instead of an assert. If we
tonyp@3416 419 // accidentally add something to the mark stack during GC, it
tonyp@3416 420 // will be a correctness issue so it's better if we crash. we'll
tonyp@3416 421 // only check this once per GC anyway, so it won't be a performance
tonyp@3416 422 // issue in any way.
tonyp@3416 423 guarantee(_saved_index == _index,
tonyp@3416 424 err_msg("saved index: %d index: %d", _saved_index, _index));
tonyp@3416 425 _saved_index = -1;
tonyp@3416 426 }
tonyp@3416 427
ysr@777 428 void CMMarkStack::oops_do(OopClosure* f) {
tonyp@3416 429 assert(_saved_index == _index,
tonyp@3416 430 err_msg("saved index: %d index: %d", _saved_index, _index));
tonyp@3416 431 for (int i = 0; i < _index; i += 1) {
ysr@777 432 f->do_oop(&_base[i]);
ysr@777 433 }
ysr@777 434 }
ysr@777 435
tonyp@3464 436 CMRootRegions::CMRootRegions() :
tonyp@3464 437 _young_list(NULL), _cm(NULL), _scan_in_progress(false),
tonyp@3464 438 _should_abort(false), _next_survivor(NULL) { }
tonyp@3464 439
tonyp@3464 440 void CMRootRegions::init(G1CollectedHeap* g1h, ConcurrentMark* cm) {
tonyp@3464 441 _young_list = g1h->young_list();
tonyp@3464 442 _cm = cm;
tonyp@3464 443 }
tonyp@3464 444
tonyp@3464 445 void CMRootRegions::prepare_for_scan() {
tonyp@3464 446 assert(!scan_in_progress(), "pre-condition");
tonyp@3464 447
tonyp@3464 448 // Currently, only survivors can be root regions.
tonyp@3464 449 assert(_next_survivor == NULL, "pre-condition");
tonyp@3464 450 _next_survivor = _young_list->first_survivor_region();
tonyp@3464 451 _scan_in_progress = (_next_survivor != NULL);
tonyp@3464 452 _should_abort = false;
tonyp@3464 453 }
tonyp@3464 454
tonyp@3464 455 HeapRegion* CMRootRegions::claim_next() {
tonyp@3464 456 if (_should_abort) {
tonyp@3464 457 // If someone has set the should_abort flag, we return NULL to
tonyp@3464 458 // force the caller to bail out of their loop.
tonyp@3464 459 return NULL;
tonyp@3464 460 }
tonyp@3464 461
tonyp@3464 462 // Currently, only survivors can be root regions.
tonyp@3464 463 HeapRegion* res = _next_survivor;
tonyp@3464 464 if (res != NULL) {
tonyp@3464 465 MutexLockerEx x(RootRegionScan_lock, Mutex::_no_safepoint_check_flag);
tonyp@3464 466 // Read it again in case it changed while we were waiting for the lock.
tonyp@3464 467 res = _next_survivor;
tonyp@3464 468 if (res != NULL) {
tonyp@3464 469 if (res == _young_list->last_survivor_region()) {
tonyp@3464 470 // We just claimed the last survivor so store NULL to indicate
tonyp@3464 471 // that we're done.
tonyp@3464 472 _next_survivor = NULL;
tonyp@3464 473 } else {
tonyp@3464 474 _next_survivor = res->get_next_young_region();
tonyp@3464 475 }
tonyp@3464 476 } else {
tonyp@3464 477 // Someone else claimed the last survivor while we were trying
tonyp@3464 478 // to take the lock so nothing else to do.
tonyp@3464 479 }
tonyp@3464 480 }
tonyp@3464 481 assert(res == NULL || res->is_survivor(), "post-condition");
tonyp@3464 482
tonyp@3464 483 return res;
tonyp@3464 484 }
tonyp@3464 485
tonyp@3464 486 void CMRootRegions::scan_finished() {
tonyp@3464 487 assert(scan_in_progress(), "pre-condition");
tonyp@3464 488
tonyp@3464 489 // Currently, only survivors can be root regions.
tonyp@3464 490 if (!_should_abort) {
tonyp@3464 491 assert(_next_survivor == NULL, "we should have claimed all survivors");
tonyp@3464 492 }
tonyp@3464 493 _next_survivor = NULL;
tonyp@3464 494
tonyp@3464 495 {
tonyp@3464 496 MutexLockerEx x(RootRegionScan_lock, Mutex::_no_safepoint_check_flag);
tonyp@3464 497 _scan_in_progress = false;
tonyp@3464 498 RootRegionScan_lock->notify_all();
tonyp@3464 499 }
tonyp@3464 500 }
tonyp@3464 501
tonyp@3464 502 bool CMRootRegions::wait_until_scan_finished() {
tonyp@3464 503 if (!scan_in_progress()) return false;
tonyp@3464 504
tonyp@3464 505 {
tonyp@3464 506 MutexLockerEx x(RootRegionScan_lock, Mutex::_no_safepoint_check_flag);
tonyp@3464 507 while (scan_in_progress()) {
tonyp@3464 508 RootRegionScan_lock->wait(Mutex::_no_safepoint_check_flag);
tonyp@3464 509 }
tonyp@3464 510 }
tonyp@3464 511 return true;
tonyp@3464 512 }
tonyp@3464 513
ysr@777 514 #ifdef _MSC_VER // the use of 'this' below gets a warning, make it go away
ysr@777 515 #pragma warning( disable:4355 ) // 'this' : used in base member initializer list
ysr@777 516 #endif // _MSC_VER
ysr@777 517
jmasa@3357 518 uint ConcurrentMark::scale_parallel_threads(uint n_par_threads) {
jmasa@3357 519 return MAX2((n_par_threads + 2) / 4, 1U);
jmasa@3294 520 }
jmasa@3294 521
tschatzl@7051 522 ConcurrentMark::ConcurrentMark(G1CollectedHeap* g1h, G1RegionToSpaceMapper* prev_bitmap_storage, G1RegionToSpaceMapper* next_bitmap_storage) :
johnc@4333 523 _g1h(g1h),
tschatzl@7051 524 _markBitMap1(),
tschatzl@7051 525 _markBitMap2(),
ysr@777 526 _parallel_marking_threads(0),
jmasa@3294 527 _max_parallel_marking_threads(0),
ysr@777 528 _sleep_factor(0.0),
ysr@777 529 _marking_task_overhead(1.0),
ysr@777 530 _cleanup_sleep_factor(0.0),
ysr@777 531 _cleanup_task_overhead(1.0),
tonyp@2472 532 _cleanup_list("Cleanup List"),
johnc@4333 533 _region_bm((BitMap::idx_t)(g1h->max_regions()), false /* in_resource_area*/),
tschatzl@7051 534 _card_bm((g1h->reserved_region().byte_size() + CardTableModRefBS::card_size - 1) >>
johnc@4333 535 CardTableModRefBS::card_shift,
johnc@4333 536 false /* in_resource_area*/),
johnc@3463 537
ysr@777 538 _prevMarkBitMap(&_markBitMap1),
ysr@777 539 _nextMarkBitMap(&_markBitMap2),
ysr@777 540
ysr@777 541 _markStack(this),
ysr@777 542 // _finger set in set_non_marking_state
ysr@777 543
johnc@4173 544 _max_worker_id(MAX2((uint)ParallelGCThreads, 1U)),
ysr@777 545 // _active_tasks set in set_non_marking_state
ysr@777 546 // _tasks set inside the constructor
johnc@4173 547 _task_queues(new CMTaskQueueSet((int) _max_worker_id)),
johnc@4173 548 _terminator(ParallelTaskTerminator((int) _max_worker_id, _task_queues)),
ysr@777 549
ysr@777 550 _has_overflown(false),
ysr@777 551 _concurrent(false),
tonyp@1054 552 _has_aborted(false),
brutisso@6904 553 _aborted_gc_id(GCId::undefined()),
tonyp@1054 554 _restart_for_overflow(false),
tonyp@1054 555 _concurrent_marking_in_progress(false),
ysr@777 556
ysr@777 557 // _verbose_level set below
ysr@777 558
ysr@777 559 _init_times(),
ysr@777 560 _remark_times(), _remark_mark_times(), _remark_weak_ref_times(),
ysr@777 561 _cleanup_times(),
ysr@777 562 _total_counting_time(0.0),
ysr@777 563 _total_rs_scrub_time(0.0),
johnc@3463 564
johnc@3463 565 _parallel_workers(NULL),
johnc@3463 566
johnc@3463 567 _count_card_bitmaps(NULL),
johnc@4333 568 _count_marked_bytes(NULL),
johnc@4333 569 _completed_initialization(false) {
tonyp@2973 570 CMVerboseLevel verbose_level = (CMVerboseLevel) G1MarkingVerboseLevel;
tonyp@2973 571 if (verbose_level < no_verbose) {
ysr@777 572 verbose_level = no_verbose;
tonyp@2973 573 }
tonyp@2973 574 if (verbose_level > high_verbose) {
ysr@777 575 verbose_level = high_verbose;
tonyp@2973 576 }
ysr@777 577 _verbose_level = verbose_level;
ysr@777 578
tonyp@2973 579 if (verbose_low()) {
ysr@777 580 gclog_or_tty->print_cr("[global] init, heap start = "PTR_FORMAT", "
drchase@6680 581 "heap end = " INTPTR_FORMAT, p2i(_heap_start), p2i(_heap_end));
tonyp@2973 582 }
ysr@777 583
tschatzl@7051 584 _markBitMap1.initialize(g1h->reserved_region(), prev_bitmap_storage);
tschatzl@7051 585 _markBitMap2.initialize(g1h->reserved_region(), next_bitmap_storage);
ysr@777 586
ysr@777 587 // Create & start a ConcurrentMark thread.
ysr@1280 588 _cmThread = new ConcurrentMarkThread(this);
ysr@1280 589 assert(cmThread() != NULL, "CM Thread should have been created");
ysr@1280 590 assert(cmThread()->cm() != NULL, "CM Thread should refer to this cm");
ehelin@6168 591 if (_cmThread->osthread() == NULL) {
ehelin@6168 592 vm_shutdown_during_initialization("Could not create ConcurrentMarkThread");
ehelin@6168 593 }
ysr@1280 594
ysr@777 595 assert(CGC_lock != NULL, "Where's the CGC_lock?");
tschatzl@7051 596 assert(_markBitMap1.covers(g1h->reserved_region()), "_markBitMap1 inconsistency");
tschatzl@7051 597 assert(_markBitMap2.covers(g1h->reserved_region()), "_markBitMap2 inconsistency");
ysr@777 598
ysr@777 599 SATBMarkQueueSet& satb_qs = JavaThread::satb_mark_queue_set();
tonyp@1717 600 satb_qs.set_buffer_size(G1SATBBufferSize);
ysr@777 601
tonyp@3464 602 _root_regions.init(_g1h, this);
tonyp@3464 603
jmasa@1719 604 if (ConcGCThreads > ParallelGCThreads) {
drchase@6680 605 warning("Can't have more ConcGCThreads (" UINTX_FORMAT ") "
drchase@6680 606 "than ParallelGCThreads (" UINTX_FORMAT ").",
johnc@4333 607 ConcGCThreads, ParallelGCThreads);
johnc@4333 608 return;
ysr@777 609 }
ysr@777 610 if (ParallelGCThreads == 0) {
ysr@777 611 // if we are not running with any parallel GC threads we will not
ysr@777 612 // spawn any marking threads either
jmasa@3294 613 _parallel_marking_threads = 0;
jmasa@3294 614 _max_parallel_marking_threads = 0;
jmasa@3294 615 _sleep_factor = 0.0;
jmasa@3294 616 _marking_task_overhead = 1.0;
ysr@777 617 } else {
johnc@4547 618 if (!FLAG_IS_DEFAULT(ConcGCThreads) && ConcGCThreads > 0) {
johnc@4547 619 // Note: ConcGCThreads has precedence over G1MarkingOverheadPercent
ysr@777 620 // if both are set
ysr@777 621 _sleep_factor = 0.0;
ysr@777 622 _marking_task_overhead = 1.0;
johnc@1186 623 } else if (G1MarkingOverheadPercent > 0) {
johnc@4547 624 // We will calculate the number of parallel marking threads based
johnc@4547 625 // on a target overhead with respect to the soft real-time goal
johnc@1186 626 double marking_overhead = (double) G1MarkingOverheadPercent / 100.0;
ysr@777 627 double overall_cm_overhead =
johnc@1186 628 (double) MaxGCPauseMillis * marking_overhead /
johnc@1186 629 (double) GCPauseIntervalMillis;
ysr@777 630 double cpu_ratio = 1.0 / (double) os::processor_count();
ysr@777 631 double marking_thread_num = ceil(overall_cm_overhead / cpu_ratio);
ysr@777 632 double marking_task_overhead =
ysr@777 633 overall_cm_overhead / marking_thread_num *
ysr@777 634 (double) os::processor_count();
ysr@777 635 double sleep_factor =
ysr@777 636 (1.0 - marking_task_overhead) / marking_task_overhead;
ysr@777 637
johnc@4547 638 FLAG_SET_ERGO(uintx, ConcGCThreads, (uint) marking_thread_num);
ysr@777 639 _sleep_factor = sleep_factor;
ysr@777 640 _marking_task_overhead = marking_task_overhead;
ysr@777 641 } else {
johnc@4547 642 // Calculate the number of parallel marking threads by scaling
johnc@4547 643 // the number of parallel GC threads.
johnc@4547 644 uint marking_thread_num = scale_parallel_threads((uint) ParallelGCThreads);
johnc@4547 645 FLAG_SET_ERGO(uintx, ConcGCThreads, marking_thread_num);
ysr@777 646 _sleep_factor = 0.0;
ysr@777 647 _marking_task_overhead = 1.0;
ysr@777 648 }
ysr@777 649
johnc@4547 650 assert(ConcGCThreads > 0, "Should have been set");
johnc@4547 651 _parallel_marking_threads = (uint) ConcGCThreads;
johnc@4547 652 _max_parallel_marking_threads = _parallel_marking_threads;
johnc@4547 653
tonyp@2973 654 if (parallel_marking_threads() > 1) {
ysr@777 655 _cleanup_task_overhead = 1.0;
tonyp@2973 656 } else {
ysr@777 657 _cleanup_task_overhead = marking_task_overhead();
tonyp@2973 658 }
ysr@777 659 _cleanup_sleep_factor =
ysr@777 660 (1.0 - cleanup_task_overhead()) / cleanup_task_overhead();
ysr@777 661
ysr@777 662 #if 0
ysr@777 663 gclog_or_tty->print_cr("Marking Threads %d", parallel_marking_threads());
ysr@777 664 gclog_or_tty->print_cr("CM Marking Task Overhead %1.4lf", marking_task_overhead());
ysr@777 665 gclog_or_tty->print_cr("CM Sleep Factor %1.4lf", sleep_factor());
ysr@777 666 gclog_or_tty->print_cr("CL Marking Task Overhead %1.4lf", cleanup_task_overhead());
ysr@777 667 gclog_or_tty->print_cr("CL Sleep Factor %1.4lf", cleanup_sleep_factor());
ysr@777 668 #endif
ysr@777 669
tonyp@1458 670 guarantee(parallel_marking_threads() > 0, "peace of mind");
jmasa@2188 671 _parallel_workers = new FlexibleWorkGang("G1 Parallel Marking Threads",
jmasa@3357 672 _max_parallel_marking_threads, false, true);
jmasa@2188 673 if (_parallel_workers == NULL) {
ysr@777 674 vm_exit_during_initialization("Failed necessary allocation.");
jmasa@2188 675 } else {
jmasa@2188 676 _parallel_workers->initialize_workers();
jmasa@2188 677 }
ysr@777 678 }
ysr@777 679
johnc@4333 680 if (FLAG_IS_DEFAULT(MarkStackSize)) {
johnc@4333 681 uintx mark_stack_size =
johnc@4333 682 MIN2(MarkStackSizeMax,
johnc@4333 683 MAX2(MarkStackSize, (uintx) (parallel_marking_threads() * TASKQUEUE_SIZE)));
johnc@4333 684 // Verify that the calculated value for MarkStackSize is in range.
johnc@4333 685 // It would be nice to use the private utility routine from Arguments.
johnc@4333 686 if (!(mark_stack_size >= 1 && mark_stack_size <= MarkStackSizeMax)) {
johnc@4333 687 warning("Invalid value calculated for MarkStackSize (" UINTX_FORMAT "): "
johnc@4333 688 "must be between " UINTX_FORMAT " and " UINTX_FORMAT,
drchase@6680 689 mark_stack_size, (uintx) 1, MarkStackSizeMax);
johnc@4333 690 return;
johnc@4333 691 }
johnc@4333 692 FLAG_SET_ERGO(uintx, MarkStackSize, mark_stack_size);
johnc@4333 693 } else {
johnc@4333 694 // Verify MarkStackSize is in range.
johnc@4333 695 if (FLAG_IS_CMDLINE(MarkStackSize)) {
johnc@4333 696 if (FLAG_IS_DEFAULT(MarkStackSizeMax)) {
johnc@4333 697 if (!(MarkStackSize >= 1 && MarkStackSize <= MarkStackSizeMax)) {
johnc@4333 698 warning("Invalid value specified for MarkStackSize (" UINTX_FORMAT "): "
johnc@4333 699 "must be between " UINTX_FORMAT " and " UINTX_FORMAT,
drchase@6680 700 MarkStackSize, (uintx) 1, MarkStackSizeMax);
johnc@4333 701 return;
johnc@4333 702 }
johnc@4333 703 } else if (FLAG_IS_CMDLINE(MarkStackSizeMax)) {
johnc@4333 704 if (!(MarkStackSize >= 1 && MarkStackSize <= MarkStackSizeMax)) {
johnc@4333 705 warning("Invalid value specified for MarkStackSize (" UINTX_FORMAT ")"
johnc@4333 706 " or for MarkStackSizeMax (" UINTX_FORMAT ")",
johnc@4333 707 MarkStackSize, MarkStackSizeMax);
johnc@4333 708 return;
johnc@4333 709 }
johnc@4333 710 }
johnc@4333 711 }
johnc@4333 712 }
johnc@4333 713
johnc@4333 714 if (!_markStack.allocate(MarkStackSize)) {
johnc@4333 715 warning("Failed to allocate CM marking stack");
johnc@4333 716 return;
johnc@4333 717 }
johnc@4333 718
johnc@4333 719 _tasks = NEW_C_HEAP_ARRAY(CMTask*, _max_worker_id, mtGC);
johnc@4333 720 _accum_task_vtime = NEW_C_HEAP_ARRAY(double, _max_worker_id, mtGC);
johnc@4333 721
johnc@4333 722 _count_card_bitmaps = NEW_C_HEAP_ARRAY(BitMap, _max_worker_id, mtGC);
johnc@4333 723 _count_marked_bytes = NEW_C_HEAP_ARRAY(size_t*, _max_worker_id, mtGC);
johnc@4333 724
johnc@4333 725 BitMap::idx_t card_bm_size = _card_bm.size();
johnc@4333 726
johnc@4333 727 // so that the assertion in MarkingTaskQueue::task_queue doesn't fail
johnc@4333 728 _active_tasks = _max_worker_id;
johnc@4333 729
johnc@4333 730 size_t max_regions = (size_t) _g1h->max_regions();
johnc@4333 731 for (uint i = 0; i < _max_worker_id; ++i) {
johnc@4333 732 CMTaskQueue* task_queue = new CMTaskQueue();
johnc@4333 733 task_queue->initialize();
johnc@4333 734 _task_queues->register_queue(i, task_queue);
johnc@4333 735
johnc@4333 736 _count_card_bitmaps[i] = BitMap(card_bm_size, false);
johnc@4333 737 _count_marked_bytes[i] = NEW_C_HEAP_ARRAY(size_t, max_regions, mtGC);
johnc@4333 738
johnc@4333 739 _tasks[i] = new CMTask(i, this,
johnc@4333 740 _count_marked_bytes[i],
johnc@4333 741 &_count_card_bitmaps[i],
johnc@4333 742 task_queue, _task_queues);
johnc@4333 743
johnc@4333 744 _accum_task_vtime[i] = 0.0;
johnc@4333 745 }
johnc@4333 746
johnc@4333 747 // Calculate the card number for the bottom of the heap. Used
johnc@4333 748 // in biasing indexes into the accounting card bitmaps.
johnc@4333 749 _heap_bottom_card_num =
johnc@4333 750 intptr_t(uintptr_t(_g1h->reserved_region().start()) >>
johnc@4333 751 CardTableModRefBS::card_shift);
johnc@4333 752
johnc@4333 753 // Clear all the liveness counting data
johnc@4333 754 clear_all_count_data();
johnc@4333 755
ysr@777 756 // so that the call below can read a sensible value
tschatzl@7051 757 _heap_start = g1h->reserved_region().start();
ysr@777 758 set_non_marking_state();
johnc@4333 759 _completed_initialization = true;
ysr@777 760 }
ysr@777 761
ysr@777 762 void ConcurrentMark::reset() {
ysr@777 763 // Starting values for these two. This should be called in a STW
tschatzl@7051 764 // phase.
tschatzl@7051 765 MemRegion reserved = _g1h->g1_reserved();
tschatzl@7051 766 _heap_start = reserved.start();
tschatzl@7051 767 _heap_end = reserved.end();
ysr@777 768
tonyp@1458 769 // Separated the asserts so that we know which one fires.
tonyp@1458 770 assert(_heap_start != NULL, "heap bounds should look ok");
tonyp@1458 771 assert(_heap_end != NULL, "heap bounds should look ok");
tonyp@1458 772 assert(_heap_start < _heap_end, "heap bounds should look ok");
ysr@777 773
johnc@4386 774 // Reset all the marking data structures and any necessary flags
johnc@4386 775 reset_marking_state();
ysr@777 776
tonyp@2973 777 if (verbose_low()) {
ysr@777 778 gclog_or_tty->print_cr("[global] resetting");
tonyp@2973 779 }
ysr@777 780
ysr@777 781 // We do reset all of them, since different phases will use
ysr@777 782 // different number of active threads. So, it's easiest to have all
ysr@777 783 // of them ready.
johnc@4173 784 for (uint i = 0; i < _max_worker_id; ++i) {
ysr@777 785 _tasks[i]->reset(_nextMarkBitMap);
johnc@2190 786 }
ysr@777 787
ysr@777 788 // we need this to make sure that the flag is on during the evac
ysr@777 789 // pause with initial mark piggy-backed
ysr@777 790 set_concurrent_marking_in_progress();
ysr@777 791 }
ysr@777 792
johnc@4386 793
johnc@4386 794 void ConcurrentMark::reset_marking_state(bool clear_overflow) {
johnc@4386 795 _markStack.set_should_expand();
johnc@4386 796 _markStack.setEmpty(); // Also clears the _markStack overflow flag
johnc@4386 797 if (clear_overflow) {
johnc@4386 798 clear_has_overflown();
johnc@4386 799 } else {
johnc@4386 800 assert(has_overflown(), "pre-condition");
johnc@4386 801 }
johnc@4386 802 _finger = _heap_start;
johnc@4386 803
johnc@4386 804 for (uint i = 0; i < _max_worker_id; ++i) {
johnc@4386 805 CMTaskQueue* queue = _task_queues->queue(i);
johnc@4386 806 queue->set_empty();
johnc@4386 807 }
johnc@4386 808 }
johnc@4386 809
johnc@4788 810 void ConcurrentMark::set_concurrency(uint active_tasks) {
johnc@4173 811 assert(active_tasks <= _max_worker_id, "we should not have more");
ysr@777 812
ysr@777 813 _active_tasks = active_tasks;
ysr@777 814 // Need to update the three data structures below according to the
ysr@777 815 // number of active threads for this phase.
ysr@777 816 _terminator = ParallelTaskTerminator((int) active_tasks, _task_queues);
ysr@777 817 _first_overflow_barrier_sync.set_n_workers((int) active_tasks);
ysr@777 818 _second_overflow_barrier_sync.set_n_workers((int) active_tasks);
johnc@4788 819 }
johnc@4788 820
johnc@4788 821 void ConcurrentMark::set_concurrency_and_phase(uint active_tasks, bool concurrent) {
johnc@4788 822 set_concurrency(active_tasks);
ysr@777 823
ysr@777 824 _concurrent = concurrent;
ysr@777 825 // We propagate this to all tasks, not just the active ones.
johnc@4173 826 for (uint i = 0; i < _max_worker_id; ++i)
ysr@777 827 _tasks[i]->set_concurrent(concurrent);
ysr@777 828
ysr@777 829 if (concurrent) {
ysr@777 830 set_concurrent_marking_in_progress();
ysr@777 831 } else {
ysr@777 832 // We currently assume that the concurrent flag has been set to
ysr@777 833 // false before we start remark. At this point we should also be
ysr@777 834 // in a STW phase.
tonyp@1458 835 assert(!concurrent_marking_in_progress(), "invariant");
pliden@6693 836 assert(out_of_regions(),
johnc@4788 837 err_msg("only way to get here: _finger: "PTR_FORMAT", _heap_end: "PTR_FORMAT,
drchase@6680 838 p2i(_finger), p2i(_heap_end)));
ysr@777 839 }
ysr@777 840 }
ysr@777 841
ysr@777 842 void ConcurrentMark::set_non_marking_state() {
ysr@777 843 // We set the global marking state to some default values when we're
ysr@777 844 // not doing marking.
johnc@4386 845 reset_marking_state();
ysr@777 846 _active_tasks = 0;
ysr@777 847 clear_concurrent_marking_in_progress();
ysr@777 848 }
ysr@777 849
ysr@777 850 ConcurrentMark::~ConcurrentMark() {
stefank@3364 851 // The ConcurrentMark instance is never freed.
stefank@3364 852 ShouldNotReachHere();
ysr@777 853 }
ysr@777 854
ysr@777 855 void ConcurrentMark::clearNextBitmap() {
tonyp@1794 856 G1CollectedHeap* g1h = G1CollectedHeap::heap();
tonyp@1794 857
tonyp@1794 858 // Make sure that the concurrent mark thread looks to still be in
tonyp@1794 859 // the current cycle.
tonyp@1794 860 guarantee(cmThread()->during_cycle(), "invariant");
tonyp@1794 861
tonyp@1794 862 // We are finishing up the current cycle by clearing the next
tonyp@1794 863 // marking bitmap and getting it ready for the next cycle. During
tonyp@1794 864 // this time no other cycle can start. So, let's make sure that this
tonyp@1794 865 // is the case.
tonyp@1794 866 guarantee(!g1h->mark_in_progress(), "invariant");
tonyp@1794 867
tschatzl@7051 868 ClearBitmapHRClosure cl(this, _nextMarkBitMap, true /* may_yield */);
tschatzl@7051 869 g1h->heap_region_iterate(&cl);
tschatzl@7051 870
tschatzl@7051 871 // Clear the liveness counting data. If the marking has been aborted, the abort()
tschatzl@7051 872 // call already did that.
tschatzl@7051 873 if (cl.complete()) {
tschatzl@7051 874 clear_all_count_data();
tonyp@1794 875 }
tonyp@1794 876
tonyp@1794 877 // Repeat the asserts from above.
tonyp@1794 878 guarantee(cmThread()->during_cycle(), "invariant");
tonyp@1794 879 guarantee(!g1h->mark_in_progress(), "invariant");
ysr@777 880 }
ysr@777 881
tschatzl@7051 882 class CheckBitmapClearHRClosure : public HeapRegionClosure {
tschatzl@7051 883 CMBitMap* _bitmap;
tschatzl@7051 884 bool _error;
tschatzl@7051 885 public:
tschatzl@7051 886 CheckBitmapClearHRClosure(CMBitMap* bitmap) : _bitmap(bitmap) {
tschatzl@7051 887 }
tschatzl@7051 888
tschatzl@7051 889 virtual bool doHeapRegion(HeapRegion* r) {
tschatzl@7100 890 // This closure can be called concurrently to the mutator, so we must make sure
tschatzl@7100 891 // that the result of the getNextMarkedWordAddress() call is compared to the
tschatzl@7100 892 // value passed to it as limit to detect any found bits.
tschatzl@7100 893 // We can use the region's orig_end() for the limit and the comparison value
tschatzl@7100 894 // as it always contains the "real" end of the region that never changes and
tschatzl@7100 895 // has no side effects.
tschatzl@7100 896 // Due to the latter, there can also be no problem with the compiler generating
tschatzl@7100 897 // reloads of the orig_end() call.
tschatzl@7100 898 HeapWord* end = r->orig_end();
tschatzl@7100 899 return _bitmap->getNextMarkedWordAddress(r->bottom(), end) != end;
tschatzl@7051 900 }
tschatzl@7051 901 };
tschatzl@7051 902
tschatzl@7016 903 bool ConcurrentMark::nextMarkBitmapIsClear() {
tschatzl@7051 904 CheckBitmapClearHRClosure cl(_nextMarkBitMap);
tschatzl@7051 905 _g1h->heap_region_iterate(&cl);
tschatzl@7051 906 return cl.complete();
tschatzl@7016 907 }
tschatzl@7016 908
ysr@777 909 class NoteStartOfMarkHRClosure: public HeapRegionClosure {
ysr@777 910 public:
ysr@777 911 bool doHeapRegion(HeapRegion* r) {
ysr@777 912 if (!r->continuesHumongous()) {
tonyp@3416 913 r->note_start_of_marking();
ysr@777 914 }
ysr@777 915 return false;
ysr@777 916 }
ysr@777 917 };
ysr@777 918
ysr@777 919 void ConcurrentMark::checkpointRootsInitialPre() {
ysr@777 920 G1CollectedHeap* g1h = G1CollectedHeap::heap();
ysr@777 921 G1CollectorPolicy* g1p = g1h->g1_policy();
ysr@777 922
ysr@777 923 _has_aborted = false;
ysr@777 924
jcoomes@1902 925 #ifndef PRODUCT
tonyp@1479 926 if (G1PrintReachableAtInitialMark) {
tonyp@1823 927 print_reachable("at-cycle-start",
johnc@2969 928 VerifyOption_G1UsePrevMarking, true /* all */);
tonyp@1479 929 }
jcoomes@1902 930 #endif
ysr@777 931
ysr@777 932 // Initialise marking structures. This has to be done in a STW phase.
ysr@777 933 reset();
tonyp@3416 934
tonyp@3416 935 // For each region note start of marking.
tonyp@3416 936 NoteStartOfMarkHRClosure startcl;
tonyp@3416 937 g1h->heap_region_iterate(&startcl);
ysr@777 938 }
ysr@777 939
ysr@777 940
ysr@777 941 void ConcurrentMark::checkpointRootsInitialPost() {
ysr@777 942 G1CollectedHeap* g1h = G1CollectedHeap::heap();
ysr@777 943
tonyp@2848 944 // If we force an overflow during remark, the remark operation will
tonyp@2848 945 // actually abort and we'll restart concurrent marking. If we always
tonyp@2848 946 // force an oveflow during remark we'll never actually complete the
tonyp@2848 947 // marking phase. So, we initilize this here, at the start of the
tonyp@2848 948 // cycle, so that at the remaining overflow number will decrease at
tonyp@2848 949 // every remark and we'll eventually not need to cause one.
tonyp@2848 950 force_overflow_stw()->init();
tonyp@2848 951
johnc@3175 952 // Start Concurrent Marking weak-reference discovery.
johnc@3175 953 ReferenceProcessor* rp = g1h->ref_processor_cm();
johnc@3175 954 // enable ("weak") refs discovery
johnc@3175 955 rp->enable_discovery(true /*verify_disabled*/, true /*verify_no_refs*/);
ysr@892 956 rp->setup_policy(false); // snapshot the soft ref policy to be used in this cycle
ysr@777 957
ysr@777 958 SATBMarkQueueSet& satb_mq_set = JavaThread::satb_mark_queue_set();
tonyp@1752 959 // This is the start of the marking cycle, we're expected all
tonyp@1752 960 // threads to have SATB queues with active set to false.
tonyp@1752 961 satb_mq_set.set_active_all_threads(true, /* new active value */
tonyp@1752 962 false /* expected_active */);
ysr@777 963
tonyp@3464 964 _root_regions.prepare_for_scan();
tonyp@3464 965
ysr@777 966 // update_g1_committed() will be called at the end of an evac pause
ysr@777 967 // when marking is on. So, it's also called at the end of the
ysr@777 968 // initial-mark pause to update the heap end, if the heap expands
ysr@777 969 // during it. No need to call it here.
ysr@777 970 }
ysr@777 971
ysr@777 972 /*
tonyp@2848 973 * Notice that in the next two methods, we actually leave the STS
tonyp@2848 974 * during the barrier sync and join it immediately afterwards. If we
tonyp@2848 975 * do not do this, the following deadlock can occur: one thread could
tonyp@2848 976 * be in the barrier sync code, waiting for the other thread to also
tonyp@2848 977 * sync up, whereas another one could be trying to yield, while also
tonyp@2848 978 * waiting for the other threads to sync up too.
tonyp@2848 979 *
tonyp@2848 980 * Note, however, that this code is also used during remark and in
tonyp@2848 981 * this case we should not attempt to leave / enter the STS, otherwise
tonyp@2848 982 * we'll either hit an asseert (debug / fastdebug) or deadlock
tonyp@2848 983 * (product). So we should only leave / enter the STS if we are
tonyp@2848 984 * operating concurrently.
tonyp@2848 985 *
tonyp@2848 986 * Because the thread that does the sync barrier has left the STS, it
tonyp@2848 987 * is possible to be suspended for a Full GC or an evacuation pause
tonyp@2848 988 * could occur. This is actually safe, since the entering the sync
tonyp@2848 989 * barrier is one of the last things do_marking_step() does, and it
tonyp@2848 990 * doesn't manipulate any data structures afterwards.
tonyp@2848 991 */
ysr@777 992
johnc@4173 993 void ConcurrentMark::enter_first_sync_barrier(uint worker_id) {
tonyp@2973 994 if (verbose_low()) {
johnc@4173 995 gclog_or_tty->print_cr("[%u] entering first barrier", worker_id);
tonyp@2973 996 }
ysr@777 997
tonyp@2848 998 if (concurrent()) {
pliden@6906 999 SuspendibleThreadSet::leave();
tonyp@2848 1000 }
pliden@6692 1001
pliden@6692 1002 bool barrier_aborted = !_first_overflow_barrier_sync.enter();
pliden@6692 1003
tonyp@2848 1004 if (concurrent()) {
pliden@6906 1005 SuspendibleThreadSet::join();
tonyp@2848 1006 }
ysr@777 1007 // at this point everyone should have synced up and not be doing any
ysr@777 1008 // more work
ysr@777 1009
tonyp@2973 1010 if (verbose_low()) {
pliden@6692 1011 if (barrier_aborted) {
pliden@6692 1012 gclog_or_tty->print_cr("[%u] aborted first barrier", worker_id);
pliden@6692 1013 } else {
pliden@6692 1014 gclog_or_tty->print_cr("[%u] leaving first barrier", worker_id);
pliden@6692 1015 }
pliden@6692 1016 }
pliden@6692 1017
pliden@6692 1018 if (barrier_aborted) {
pliden@6692 1019 // If the barrier aborted we ignore the overflow condition and
pliden@6692 1020 // just abort the whole marking phase as quickly as possible.
pliden@6692 1021 return;
tonyp@2973 1022 }
ysr@777 1023
johnc@4788 1024 // If we're executing the concurrent phase of marking, reset the marking
johnc@4788 1025 // state; otherwise the marking state is reset after reference processing,
johnc@4788 1026 // during the remark pause.
johnc@4788 1027 // If we reset here as a result of an overflow during the remark we will
johnc@4788 1028 // see assertion failures from any subsequent set_concurrency_and_phase()
johnc@4788 1029 // calls.
johnc@4788 1030 if (concurrent()) {
johnc@4788 1031 // let the task associated with with worker 0 do this
johnc@4788 1032 if (worker_id == 0) {
johnc@4788 1033 // task 0 is responsible for clearing the global data structures
johnc@4788 1034 // We should be here because of an overflow. During STW we should
johnc@4788 1035 // not clear the overflow flag since we rely on it being true when
johnc@4788 1036 // we exit this method to abort the pause and restart concurent
johnc@4788 1037 // marking.
johnc@4788 1038 reset_marking_state(true /* clear_overflow */);
johnc@4788 1039 force_overflow()->update();
johnc@4788 1040
johnc@4788 1041 if (G1Log::fine()) {
brutisso@6904 1042 gclog_or_tty->gclog_stamp(concurrent_gc_id());
johnc@4788 1043 gclog_or_tty->print_cr("[GC concurrent-mark-reset-for-overflow]");
johnc@4788 1044 }
ysr@777 1045 }
ysr@777 1046 }
ysr@777 1047
ysr@777 1048 // after this, each task should reset its own data structures then
ysr@777 1049 // then go into the second barrier
ysr@777 1050 }
ysr@777 1051
johnc@4173 1052 void ConcurrentMark::enter_second_sync_barrier(uint worker_id) {
tonyp@2973 1053 if (verbose_low()) {
johnc@4173 1054 gclog_or_tty->print_cr("[%u] entering second barrier", worker_id);
tonyp@2973 1055 }
ysr@777 1056
tonyp@2848 1057 if (concurrent()) {
pliden@6906 1058 SuspendibleThreadSet::leave();
tonyp@2848 1059 }
pliden@6692 1060
pliden@6692 1061 bool barrier_aborted = !_second_overflow_barrier_sync.enter();
pliden@6692 1062
tonyp@2848 1063 if (concurrent()) {
pliden@6906 1064 SuspendibleThreadSet::join();
tonyp@2848 1065 }
johnc@4788 1066 // at this point everything should be re-initialized and ready to go
ysr@777 1067
tonyp@2973 1068 if (verbose_low()) {
pliden@6692 1069 if (barrier_aborted) {
pliden@6692 1070 gclog_or_tty->print_cr("[%u] aborted second barrier", worker_id);
pliden@6692 1071 } else {
pliden@6692 1072 gclog_or_tty->print_cr("[%u] leaving second barrier", worker_id);
pliden@6692 1073 }
tonyp@2973 1074 }
ysr@777 1075 }
ysr@777 1076
tonyp@2848 1077 #ifndef PRODUCT
tonyp@2848 1078 void ForceOverflowSettings::init() {
tonyp@2848 1079 _num_remaining = G1ConcMarkForceOverflow;
tonyp@2848 1080 _force = false;
tonyp@2848 1081 update();
tonyp@2848 1082 }
tonyp@2848 1083
tonyp@2848 1084 void ForceOverflowSettings::update() {
tonyp@2848 1085 if (_num_remaining > 0) {
tonyp@2848 1086 _num_remaining -= 1;
tonyp@2848 1087 _force = true;
tonyp@2848 1088 } else {
tonyp@2848 1089 _force = false;
tonyp@2848 1090 }
tonyp@2848 1091 }
tonyp@2848 1092
tonyp@2848 1093 bool ForceOverflowSettings::should_force() {
tonyp@2848 1094 if (_force) {
tonyp@2848 1095 _force = false;
tonyp@2848 1096 return true;
tonyp@2848 1097 } else {
tonyp@2848 1098 return false;
tonyp@2848 1099 }
tonyp@2848 1100 }
tonyp@2848 1101 #endif // !PRODUCT
tonyp@2848 1102
ysr@777 1103 class CMConcurrentMarkingTask: public AbstractGangTask {
ysr@777 1104 private:
ysr@777 1105 ConcurrentMark* _cm;
ysr@777 1106 ConcurrentMarkThread* _cmt;
ysr@777 1107
ysr@777 1108 public:
jmasa@3357 1109 void work(uint worker_id) {
tonyp@1458 1110 assert(Thread::current()->is_ConcurrentGC_thread(),
tonyp@1458 1111 "this should only be done by a conc GC thread");
johnc@2316 1112 ResourceMark rm;
ysr@777 1113
ysr@777 1114 double start_vtime = os::elapsedVTime();
ysr@777 1115
pliden@6906 1116 SuspendibleThreadSet::join();
ysr@777 1117
jmasa@3357 1118 assert(worker_id < _cm->active_tasks(), "invariant");
jmasa@3357 1119 CMTask* the_task = _cm->task(worker_id);
ysr@777 1120 the_task->record_start_time();
ysr@777 1121 if (!_cm->has_aborted()) {
ysr@777 1122 do {
ysr@777 1123 double start_vtime_sec = os::elapsedVTime();
johnc@2494 1124 double mark_step_duration_ms = G1ConcMarkStepDurationMillis;
johnc@2494 1125
johnc@2494 1126 the_task->do_marking_step(mark_step_duration_ms,
johnc@4787 1127 true /* do_termination */,
johnc@4787 1128 false /* is_serial*/);
johnc@2494 1129
ysr@777 1130 double end_vtime_sec = os::elapsedVTime();
ysr@777 1131 double elapsed_vtime_sec = end_vtime_sec - start_vtime_sec;
ysr@777 1132 _cm->clear_has_overflown();
ysr@777 1133
tschatzl@7094 1134 _cm->do_yield_check(worker_id);
ysr@777 1135
ysr@777 1136 jlong sleep_time_ms;
ysr@777 1137 if (!_cm->has_aborted() && the_task->has_aborted()) {
ysr@777 1138 sleep_time_ms =
ysr@777 1139 (jlong) (elapsed_vtime_sec * _cm->sleep_factor() * 1000.0);
pliden@6906 1140 SuspendibleThreadSet::leave();
ysr@777 1141 os::sleep(Thread::current(), sleep_time_ms, false);
pliden@6906 1142 SuspendibleThreadSet::join();
ysr@777 1143 }
ysr@777 1144 } while (!_cm->has_aborted() && the_task->has_aborted());
ysr@777 1145 }
ysr@777 1146 the_task->record_end_time();
tonyp@1458 1147 guarantee(!the_task->has_aborted() || _cm->has_aborted(), "invariant");
ysr@777 1148
pliden@6906 1149 SuspendibleThreadSet::leave();
ysr@777 1150
ysr@777 1151 double end_vtime = os::elapsedVTime();
jmasa@3357 1152 _cm->update_accum_task_vtime(worker_id, end_vtime - start_vtime);
ysr@777 1153 }
ysr@777 1154
ysr@777 1155 CMConcurrentMarkingTask(ConcurrentMark* cm,
ysr@777 1156 ConcurrentMarkThread* cmt) :
ysr@777 1157 AbstractGangTask("Concurrent Mark"), _cm(cm), _cmt(cmt) { }
ysr@777 1158
ysr@777 1159 ~CMConcurrentMarkingTask() { }
ysr@777 1160 };
ysr@777 1161
jmasa@3294 1162 // Calculates the number of active workers for a concurrent
jmasa@3294 1163 // phase.
jmasa@3357 1164 uint ConcurrentMark::calc_parallel_marking_threads() {
johnc@3338 1165 if (G1CollectedHeap::use_parallel_gc_threads()) {
jmasa@3357 1166 uint n_conc_workers = 0;
jmasa@3294 1167 if (!UseDynamicNumberOfGCThreads ||
jmasa@3294 1168 (!FLAG_IS_DEFAULT(ConcGCThreads) &&
jmasa@3294 1169 !ForceDynamicNumberOfGCThreads)) {
jmasa@3294 1170 n_conc_workers = max_parallel_marking_threads();
jmasa@3294 1171 } else {
jmasa@3294 1172 n_conc_workers =
jmasa@3294 1173 AdaptiveSizePolicy::calc_default_active_workers(
jmasa@3294 1174 max_parallel_marking_threads(),
jmasa@3294 1175 1, /* Minimum workers */
jmasa@3294 1176 parallel_marking_threads(),
jmasa@3294 1177 Threads::number_of_non_daemon_threads());
jmasa@3294 1178 // Don't scale down "n_conc_workers" by scale_parallel_threads() because
jmasa@3294 1179 // that scaling has already gone into "_max_parallel_marking_threads".
jmasa@3294 1180 }
johnc@3338 1181 assert(n_conc_workers > 0, "Always need at least 1");
johnc@3338 1182 return n_conc_workers;
jmasa@3294 1183 }
johnc@3338 1184 // If we are not running with any parallel GC threads we will not
johnc@3338 1185 // have spawned any marking threads either. Hence the number of
johnc@3338 1186 // concurrent workers should be 0.
johnc@3338 1187 return 0;
jmasa@3294 1188 }
jmasa@3294 1189
tonyp@3464 1190 void ConcurrentMark::scanRootRegion(HeapRegion* hr, uint worker_id) {
tonyp@3464 1191 // Currently, only survivors can be root regions.
tonyp@3464 1192 assert(hr->next_top_at_mark_start() == hr->bottom(), "invariant");
tonyp@3464 1193 G1RootRegionScanClosure cl(_g1h, this, worker_id);
tonyp@3464 1194
tonyp@3464 1195 const uintx interval = PrefetchScanIntervalInBytes;
tonyp@3464 1196 HeapWord* curr = hr->bottom();
tonyp@3464 1197 const HeapWord* end = hr->top();
tonyp@3464 1198 while (curr < end) {
tonyp@3464 1199 Prefetch::read(curr, interval);
tonyp@3464 1200 oop obj = oop(curr);
tonyp@3464 1201 int size = obj->oop_iterate(&cl);
tonyp@3464 1202 assert(size == obj->size(), "sanity");
tonyp@3464 1203 curr += size;
tonyp@3464 1204 }
tonyp@3464 1205 }
tonyp@3464 1206
tonyp@3464 1207 class CMRootRegionScanTask : public AbstractGangTask {
tonyp@3464 1208 private:
tonyp@3464 1209 ConcurrentMark* _cm;
tonyp@3464 1210
tonyp@3464 1211 public:
tonyp@3464 1212 CMRootRegionScanTask(ConcurrentMark* cm) :
tonyp@3464 1213 AbstractGangTask("Root Region Scan"), _cm(cm) { }
tonyp@3464 1214
tonyp@3464 1215 void work(uint worker_id) {
tonyp@3464 1216 assert(Thread::current()->is_ConcurrentGC_thread(),
tonyp@3464 1217 "this should only be done by a conc GC thread");
tonyp@3464 1218
tonyp@3464 1219 CMRootRegions* root_regions = _cm->root_regions();
tonyp@3464 1220 HeapRegion* hr = root_regions->claim_next();
tonyp@3464 1221 while (hr != NULL) {
tonyp@3464 1222 _cm->scanRootRegion(hr, worker_id);
tonyp@3464 1223 hr = root_regions->claim_next();
tonyp@3464 1224 }
tonyp@3464 1225 }
tonyp@3464 1226 };
tonyp@3464 1227
tonyp@3464 1228 void ConcurrentMark::scanRootRegions() {
stefank@6992 1229 // Start of concurrent marking.
stefank@6992 1230 ClassLoaderDataGraph::clear_claimed_marks();
stefank@6992 1231
tonyp@3464 1232 // scan_in_progress() will have been set to true only if there was
tonyp@3464 1233 // at least one root region to scan. So, if it's false, we
tonyp@3464 1234 // should not attempt to do any further work.
tonyp@3464 1235 if (root_regions()->scan_in_progress()) {
tonyp@3464 1236 _parallel_marking_threads = calc_parallel_marking_threads();
tonyp@3464 1237 assert(parallel_marking_threads() <= max_parallel_marking_threads(),
tonyp@3464 1238 "Maximum number of marking threads exceeded");
tonyp@3464 1239 uint active_workers = MAX2(1U, parallel_marking_threads());
tonyp@3464 1240
tonyp@3464 1241 CMRootRegionScanTask task(this);
johnc@4549 1242 if (use_parallel_marking_threads()) {
tonyp@3464 1243 _parallel_workers->set_active_workers((int) active_workers);
tonyp@3464 1244 _parallel_workers->run_task(&task);
tonyp@3464 1245 } else {
tonyp@3464 1246 task.work(0);
tonyp@3464 1247 }
tonyp@3464 1248
tonyp@3464 1249 // It's possible that has_aborted() is true here without actually
tonyp@3464 1250 // aborting the survivor scan earlier. This is OK as it's
tonyp@3464 1251 // mainly used for sanity checking.
tonyp@3464 1252 root_regions()->scan_finished();
tonyp@3464 1253 }
tonyp@3464 1254 }
tonyp@3464 1255
ysr@777 1256 void ConcurrentMark::markFromRoots() {
ysr@777 1257 // we might be tempted to assert that:
ysr@777 1258 // assert(asynch == !SafepointSynchronize::is_at_safepoint(),
ysr@777 1259 // "inconsistent argument?");
ysr@777 1260 // However that wouldn't be right, because it's possible that
ysr@777 1261 // a safepoint is indeed in progress as a younger generation
ysr@777 1262 // stop-the-world GC happens even as we mark in this generation.
ysr@777 1263
ysr@777 1264 _restart_for_overflow = false;
tonyp@2848 1265 force_overflow_conc()->init();
jmasa@3294 1266
jmasa@3294 1267 // _g1h has _n_par_threads
jmasa@3294 1268 _parallel_marking_threads = calc_parallel_marking_threads();
jmasa@3294 1269 assert(parallel_marking_threads() <= max_parallel_marking_threads(),
jmasa@3294 1270 "Maximum number of marking threads exceeded");
johnc@3338 1271
jmasa@3357 1272 uint active_workers = MAX2(1U, parallel_marking_threads());
johnc@3338 1273
johnc@4788 1274 // Parallel task terminator is set in "set_concurrency_and_phase()"
johnc@4788 1275 set_concurrency_and_phase(active_workers, true /* concurrent */);
ysr@777 1276
ysr@777 1277 CMConcurrentMarkingTask markingTask(this, cmThread());
johnc@4549 1278 if (use_parallel_marking_threads()) {
johnc@3338 1279 _parallel_workers->set_active_workers((int)active_workers);
stefank@6992 1280 // Don't set _n_par_threads because it affects MT in process_roots()
johnc@3338 1281 // and the decisions on that MT processing is made elsewhere.
johnc@3338 1282 assert(_parallel_workers->active_workers() > 0, "Should have been set");
ysr@777 1283 _parallel_workers->run_task(&markingTask);
tonyp@2973 1284 } else {
ysr@777 1285 markingTask.work(0);
tonyp@2973 1286 }
ysr@777 1287 print_stats();
ysr@777 1288 }
ysr@777 1289
ysr@777 1290 void ConcurrentMark::checkpointRootsFinal(bool clear_all_soft_refs) {
ysr@777 1291 // world is stopped at this checkpoint
ysr@777 1292 assert(SafepointSynchronize::is_at_safepoint(),
ysr@777 1293 "world should be stopped");
johnc@3175 1294
ysr@777 1295 G1CollectedHeap* g1h = G1CollectedHeap::heap();
ysr@777 1296
ysr@777 1297 // If a full collection has happened, we shouldn't do this.
ysr@777 1298 if (has_aborted()) {
ysr@777 1299 g1h->set_marking_complete(); // So bitmap clearing isn't confused
ysr@777 1300 return;
ysr@777 1301 }
ysr@777 1302
kamg@2445 1303 SvcGCMarker sgcm(SvcGCMarker::OTHER);
kamg@2445 1304
ysr@1280 1305 if (VerifyDuringGC) {
ysr@1280 1306 HandleMark hm; // handle scope
ysr@1280 1307 Universe::heap()->prepare_for_verify();
stefank@5018 1308 Universe::verify(VerifyOption_G1UsePrevMarking,
stefank@5018 1309 " VerifyDuringGC:(before)");
ysr@1280 1310 }
brutisso@7005 1311 g1h->check_bitmaps("Remark Start");
ysr@1280 1312
ysr@777 1313 G1CollectorPolicy* g1p = g1h->g1_policy();
ysr@777 1314 g1p->record_concurrent_mark_remark_start();
ysr@777 1315
ysr@777 1316 double start = os::elapsedTime();
ysr@777 1317
ysr@777 1318 checkpointRootsFinalWork();
ysr@777 1319
ysr@777 1320 double mark_work_end = os::elapsedTime();
ysr@777 1321
ysr@777 1322 weakRefsWork(clear_all_soft_refs);
ysr@777 1323
ysr@777 1324 if (has_overflown()) {
ysr@777 1325 // Oops. We overflowed. Restart concurrent marking.
ysr@777 1326 _restart_for_overflow = true;
johnc@4789 1327 if (G1TraceMarkStackOverflow) {
johnc@4789 1328 gclog_or_tty->print_cr("\nRemark led to restart for overflow.");
johnc@4789 1329 }
johnc@4789 1330
johnc@4789 1331 // Verify the heap w.r.t. the previous marking bitmap.
johnc@4789 1332 if (VerifyDuringGC) {
johnc@4789 1333 HandleMark hm; // handle scope
johnc@4789 1334 Universe::heap()->prepare_for_verify();
stefank@5018 1335 Universe::verify(VerifyOption_G1UsePrevMarking,
stefank@5018 1336 " VerifyDuringGC:(overflow)");
johnc@4789 1337 }
johnc@4789 1338
johnc@4386 1339 // Clear the marking state because we will be restarting
johnc@4386 1340 // marking due to overflowing the global mark stack.
johnc@4386 1341 reset_marking_state();
ysr@777 1342 } else {
johnc@3463 1343 // Aggregate the per-task counting data that we have accumulated
johnc@3463 1344 // while marking.
johnc@3463 1345 aggregate_count_data();
johnc@3463 1346
tonyp@2469 1347 SATBMarkQueueSet& satb_mq_set = JavaThread::satb_mark_queue_set();
ysr@777 1348 // We're done with marking.
tonyp@1752 1349 // This is the end of the marking cycle, we're expected all
tonyp@1752 1350 // threads to have SATB queues with active set to true.
tonyp@2469 1351 satb_mq_set.set_active_all_threads(false, /* new active value */
tonyp@2469 1352 true /* expected_active */);
tonyp@1246 1353
tonyp@1246 1354 if (VerifyDuringGC) {
ysr@1280 1355 HandleMark hm; // handle scope
ysr@1280 1356 Universe::heap()->prepare_for_verify();
stefank@5018 1357 Universe::verify(VerifyOption_G1UseNextMarking,
stefank@5018 1358 " VerifyDuringGC:(after)");
tonyp@1246 1359 }
brutisso@7005 1360 g1h->check_bitmaps("Remark End");
johnc@2494 1361 assert(!restart_for_overflow(), "sanity");
johnc@4386 1362 // Completely reset the marking state since marking completed
johnc@4386 1363 set_non_marking_state();
johnc@2494 1364 }
johnc@2494 1365
johnc@4333 1366 // Expand the marking stack, if we have to and if we can.
johnc@4333 1367 if (_markStack.should_expand()) {
johnc@4333 1368 _markStack.expand();
johnc@4333 1369 }
johnc@4333 1370
ysr@777 1371 // Statistics
ysr@777 1372 double now = os::elapsedTime();
ysr@777 1373 _remark_mark_times.add((mark_work_end - start) * 1000.0);
ysr@777 1374 _remark_weak_ref_times.add((now - mark_work_end) * 1000.0);
ysr@777 1375 _remark_times.add((now - start) * 1000.0);
ysr@777 1376
ysr@777 1377 g1p->record_concurrent_mark_remark_end();
sla@5237 1378
sla@5237 1379 G1CMIsAliveClosure is_alive(g1h);
sla@5237 1380 g1h->gc_tracer_cm()->report_object_count_after_gc(&is_alive);
ysr@777 1381 }
ysr@777 1382
johnc@3731 1383 // Base class of the closures that finalize and verify the
johnc@3731 1384 // liveness counting data.
johnc@3731 1385 class CMCountDataClosureBase: public HeapRegionClosure {
johnc@3731 1386 protected:
johnc@4123 1387 G1CollectedHeap* _g1h;
ysr@777 1388 ConcurrentMark* _cm;
johnc@4123 1389 CardTableModRefBS* _ct_bs;
johnc@4123 1390
johnc@3463 1391 BitMap* _region_bm;
johnc@3463 1392 BitMap* _card_bm;
johnc@3463 1393
johnc@4123 1394 // Takes a region that's not empty (i.e., it has at least one
tonyp@1264 1395 // live object in it and sets its corresponding bit on the region
tonyp@1264 1396 // bitmap to 1. If the region is "starts humongous" it will also set
tonyp@1264 1397 // to 1 the bits on the region bitmap that correspond to its
tonyp@1264 1398 // associated "continues humongous" regions.
tonyp@1264 1399 void set_bit_for_region(HeapRegion* hr) {
tonyp@1264 1400 assert(!hr->continuesHumongous(), "should have filtered those out");
tonyp@1264 1401
tschatzl@7091 1402 BitMap::idx_t index = (BitMap::idx_t) hr->hrm_index();
tonyp@1264 1403 if (!hr->startsHumongous()) {
tonyp@1264 1404 // Normal (non-humongous) case: just set the bit.
tonyp@3713 1405 _region_bm->par_at_put(index, true);
tonyp@1264 1406 } else {
tonyp@1264 1407 // Starts humongous case: calculate how many regions are part of
johnc@3463 1408 // this humongous region and then set the bit range.
tonyp@3957 1409 BitMap::idx_t end_index = (BitMap::idx_t) hr->last_hc_index();
tonyp@3713 1410 _region_bm->par_at_put_range(index, end_index, true);
tonyp@1264 1411 }
tonyp@1264 1412 }
tonyp@1264 1413
johnc@3731 1414 public:
johnc@4123 1415 CMCountDataClosureBase(G1CollectedHeap* g1h,
johnc@3731 1416 BitMap* region_bm, BitMap* card_bm):
johnc@4123 1417 _g1h(g1h), _cm(g1h->concurrent_mark()),
johnc@4123 1418 _ct_bs((CardTableModRefBS*) (g1h->barrier_set())),
johnc@4123 1419 _region_bm(region_bm), _card_bm(card_bm) { }
johnc@3731 1420 };
johnc@3731 1421
johnc@3731 1422 // Closure that calculates the # live objects per region. Used
johnc@3731 1423 // for verification purposes during the cleanup pause.
johnc@3731 1424 class CalcLiveObjectsClosure: public CMCountDataClosureBase {
johnc@3731 1425 CMBitMapRO* _bm;
johnc@3731 1426 size_t _region_marked_bytes;
johnc@3731 1427
johnc@3731 1428 public:
johnc@4123 1429 CalcLiveObjectsClosure(CMBitMapRO *bm, G1CollectedHeap* g1h,
johnc@3731 1430 BitMap* region_bm, BitMap* card_bm) :
johnc@4123 1431 CMCountDataClosureBase(g1h, region_bm, card_bm),
johnc@3731 1432 _bm(bm), _region_marked_bytes(0) { }
johnc@3731 1433
ysr@777 1434 bool doHeapRegion(HeapRegion* hr) {
ysr@777 1435
iveresov@1074 1436 if (hr->continuesHumongous()) {
tonyp@1264 1437 // We will ignore these here and process them when their
tonyp@1264 1438 // associated "starts humongous" region is processed (see
tonyp@1264 1439 // set_bit_for_heap_region()). Note that we cannot rely on their
tonyp@1264 1440 // associated "starts humongous" region to have their bit set to
tonyp@1264 1441 // 1 since, due to the region chunking in the parallel region
tonyp@1264 1442 // iteration, a "continues humongous" region might be visited
tonyp@1264 1443 // before its associated "starts humongous".
iveresov@1074 1444 return false;
iveresov@1074 1445 }
ysr@777 1446
johnc@4123 1447 HeapWord* ntams = hr->next_top_at_mark_start();
johnc@4123 1448 HeapWord* start = hr->bottom();
johnc@4123 1449
johnc@4123 1450 assert(start <= hr->end() && start <= ntams && ntams <= hr->end(),
johnc@3463 1451 err_msg("Preconditions not met - "
johnc@4123 1452 "start: "PTR_FORMAT", ntams: "PTR_FORMAT", end: "PTR_FORMAT,
drchase@6680 1453 p2i(start), p2i(ntams), p2i(hr->end())));
johnc@3463 1454
ysr@777 1455 // Find the first marked object at or after "start".
johnc@4123 1456 start = _bm->getNextMarkedWordAddress(start, ntams);
johnc@3463 1457
ysr@777 1458 size_t marked_bytes = 0;
ysr@777 1459
johnc@4123 1460 while (start < ntams) {
ysr@777 1461 oop obj = oop(start);
ysr@777 1462 int obj_sz = obj->size();
johnc@4123 1463 HeapWord* obj_end = start + obj_sz;
johnc@3731 1464
johnc@3731 1465 BitMap::idx_t start_idx = _cm->card_bitmap_index_for(start);
johnc@4123 1466 BitMap::idx_t end_idx = _cm->card_bitmap_index_for(obj_end);
johnc@4123 1467
johnc@4123 1468 // Note: if we're looking at the last region in heap - obj_end
johnc@4123 1469 // could be actually just beyond the end of the heap; end_idx
johnc@4123 1470 // will then correspond to a (non-existent) card that is also
johnc@4123 1471 // just beyond the heap.
johnc@4123 1472 if (_g1h->is_in_g1_reserved(obj_end) && !_ct_bs->is_card_aligned(obj_end)) {
johnc@4123 1473 // end of object is not card aligned - increment to cover
johnc@4123 1474 // all the cards spanned by the object
johnc@4123 1475 end_idx += 1;
johnc@4123 1476 }
johnc@4123 1477
johnc@4123 1478 // Set the bits in the card BM for the cards spanned by this object.
johnc@4123 1479 _cm->set_card_bitmap_range(_card_bm, start_idx, end_idx, true /* is_par */);
johnc@3731 1480
johnc@3731 1481 // Add the size of this object to the number of marked bytes.
apetrusenko@1465 1482 marked_bytes += (size_t)obj_sz * HeapWordSize;
johnc@3463 1483
ysr@777 1484 // Find the next marked object after this one.
johnc@4123 1485 start = _bm->getNextMarkedWordAddress(obj_end, ntams);
tonyp@2973 1486 }
johnc@3463 1487
johnc@3463 1488 // Mark the allocated-since-marking portion...
johnc@3463 1489 HeapWord* top = hr->top();
johnc@4123 1490 if (ntams < top) {
johnc@4123 1491 BitMap::idx_t start_idx = _cm->card_bitmap_index_for(ntams);
johnc@4123 1492 BitMap::idx_t end_idx = _cm->card_bitmap_index_for(top);
johnc@4123 1493
johnc@4123 1494 // Note: if we're looking at the last region in heap - top
johnc@4123 1495 // could be actually just beyond the end of the heap; end_idx
johnc@4123 1496 // will then correspond to a (non-existent) card that is also
johnc@4123 1497 // just beyond the heap.
johnc@4123 1498 if (_g1h->is_in_g1_reserved(top) && !_ct_bs->is_card_aligned(top)) {
johnc@4123 1499 // end of object is not card aligned - increment to cover
johnc@4123 1500 // all the cards spanned by the object
johnc@4123 1501 end_idx += 1;
johnc@4123 1502 }
johnc@4123 1503 _cm->set_card_bitmap_range(_card_bm, start_idx, end_idx, true /* is_par */);
johnc@3463 1504
johnc@3463 1505 // This definitely means the region has live objects.
johnc@3463 1506 set_bit_for_region(hr);
ysr@777 1507 }
ysr@777 1508
ysr@777 1509 // Update the live region bitmap.
ysr@777 1510 if (marked_bytes > 0) {
tonyp@1264 1511 set_bit_for_region(hr);
ysr@777 1512 }
johnc@3463 1513
johnc@3463 1514 // Set the marked bytes for the current region so that
johnc@3463 1515 // it can be queried by a calling verificiation routine
johnc@3463 1516 _region_marked_bytes = marked_bytes;
johnc@3463 1517
johnc@3463 1518 return false;
johnc@3463 1519 }
johnc@3463 1520
johnc@3463 1521 size_t region_marked_bytes() const { return _region_marked_bytes; }
johnc@3463 1522 };
johnc@3463 1523
johnc@3463 1524 // Heap region closure used for verifying the counting data
johnc@3463 1525 // that was accumulated concurrently and aggregated during
johnc@3463 1526 // the remark pause. This closure is applied to the heap
johnc@3463 1527 // regions during the STW cleanup pause.
johnc@3463 1528
johnc@3463 1529 class VerifyLiveObjectDataHRClosure: public HeapRegionClosure {
johnc@4123 1530 G1CollectedHeap* _g1h;
johnc@3463 1531 ConcurrentMark* _cm;
johnc@3463 1532 CalcLiveObjectsClosure _calc_cl;
johnc@3463 1533 BitMap* _region_bm; // Region BM to be verified
johnc@3463 1534 BitMap* _card_bm; // Card BM to be verified
johnc@3463 1535 bool _verbose; // verbose output?
johnc@3463 1536
johnc@3463 1537 BitMap* _exp_region_bm; // Expected Region BM values
johnc@3463 1538 BitMap* _exp_card_bm; // Expected card BM values
johnc@3463 1539
johnc@3463 1540 int _failures;
johnc@3463 1541
johnc@3463 1542 public:
johnc@4123 1543 VerifyLiveObjectDataHRClosure(G1CollectedHeap* g1h,
johnc@3463 1544 BitMap* region_bm,
johnc@3463 1545 BitMap* card_bm,
johnc@3463 1546 BitMap* exp_region_bm,
johnc@3463 1547 BitMap* exp_card_bm,
johnc@3463 1548 bool verbose) :
johnc@4123 1549 _g1h(g1h), _cm(g1h->concurrent_mark()),
johnc@4123 1550 _calc_cl(_cm->nextMarkBitMap(), g1h, exp_region_bm, exp_card_bm),
johnc@3463 1551 _region_bm(region_bm), _card_bm(card_bm), _verbose(verbose),
johnc@3463 1552 _exp_region_bm(exp_region_bm), _exp_card_bm(exp_card_bm),
johnc@3463 1553 _failures(0) { }
johnc@3463 1554
johnc@3463 1555 int failures() const { return _failures; }
johnc@3463 1556
johnc@3463 1557 bool doHeapRegion(HeapRegion* hr) {
johnc@3463 1558 if (hr->continuesHumongous()) {
johnc@3463 1559 // We will ignore these here and process them when their
johnc@3463 1560 // associated "starts humongous" region is processed (see
johnc@3463 1561 // set_bit_for_heap_region()). Note that we cannot rely on their
johnc@3463 1562 // associated "starts humongous" region to have their bit set to
johnc@3463 1563 // 1 since, due to the region chunking in the parallel region
johnc@3463 1564 // iteration, a "continues humongous" region might be visited
johnc@3463 1565 // before its associated "starts humongous".
johnc@3463 1566 return false;
johnc@3463 1567 }
johnc@3463 1568
johnc@3463 1569 int failures = 0;
johnc@3463 1570
johnc@3463 1571 // Call the CalcLiveObjectsClosure to walk the marking bitmap for
johnc@3463 1572 // this region and set the corresponding bits in the expected region
johnc@3463 1573 // and card bitmaps.
johnc@3463 1574 bool res = _calc_cl.doHeapRegion(hr);
johnc@3463 1575 assert(res == false, "should be continuing");
johnc@3463 1576
johnc@3463 1577 MutexLockerEx x((_verbose ? ParGCRareEvent_lock : NULL),
johnc@3463 1578 Mutex::_no_safepoint_check_flag);
johnc@3463 1579
johnc@3463 1580 // Verify the marked bytes for this region.
johnc@3463 1581 size_t exp_marked_bytes = _calc_cl.region_marked_bytes();
johnc@3463 1582 size_t act_marked_bytes = hr->next_marked_bytes();
johnc@3463 1583
johnc@3463 1584 // We're not OK if expected marked bytes > actual marked bytes. It means
johnc@3463 1585 // we have missed accounting some objects during the actual marking.
johnc@3463 1586 if (exp_marked_bytes > act_marked_bytes) {
johnc@3463 1587 if (_verbose) {
tonyp@3713 1588 gclog_or_tty->print_cr("Region %u: marked bytes mismatch: "
johnc@3463 1589 "expected: " SIZE_FORMAT ", actual: " SIZE_FORMAT,
tschatzl@7091 1590 hr->hrm_index(), exp_marked_bytes, act_marked_bytes);
johnc@3463 1591 }
johnc@3463 1592 failures += 1;
johnc@3463 1593 }
johnc@3463 1594
johnc@3463 1595 // Verify the bit, for this region, in the actual and expected
johnc@3463 1596 // (which was just calculated) region bit maps.
johnc@3463 1597 // We're not OK if the bit in the calculated expected region
johnc@3463 1598 // bitmap is set and the bit in the actual region bitmap is not.
tschatzl@7091 1599 BitMap::idx_t index = (BitMap::idx_t) hr->hrm_index();
johnc@3463 1600
johnc@3463 1601 bool expected = _exp_region_bm->at(index);
johnc@3463 1602 bool actual = _region_bm->at(index);
johnc@3463 1603 if (expected && !actual) {
johnc@3463 1604 if (_verbose) {
tonyp@3713 1605 gclog_or_tty->print_cr("Region %u: region bitmap mismatch: "
tonyp@3713 1606 "expected: %s, actual: %s",
tschatzl@7091 1607 hr->hrm_index(),
tonyp@3713 1608 BOOL_TO_STR(expected), BOOL_TO_STR(actual));
johnc@3463 1609 }
johnc@3463 1610 failures += 1;
johnc@3463 1611 }
johnc@3463 1612
johnc@3463 1613 // Verify that the card bit maps for the cards spanned by the current
johnc@3463 1614 // region match. We have an error if we have a set bit in the expected
johnc@3463 1615 // bit map and the corresponding bit in the actual bitmap is not set.
johnc@3463 1616
johnc@3463 1617 BitMap::idx_t start_idx = _cm->card_bitmap_index_for(hr->bottom());
johnc@3463 1618 BitMap::idx_t end_idx = _cm->card_bitmap_index_for(hr->top());
johnc@3463 1619
johnc@3463 1620 for (BitMap::idx_t i = start_idx; i < end_idx; i+=1) {
johnc@3463 1621 expected = _exp_card_bm->at(i);
johnc@3463 1622 actual = _card_bm->at(i);
johnc@3463 1623
johnc@3463 1624 if (expected && !actual) {
johnc@3463 1625 if (_verbose) {
tonyp@3713 1626 gclog_or_tty->print_cr("Region %u: card bitmap mismatch at " SIZE_FORMAT ": "
tonyp@3713 1627 "expected: %s, actual: %s",
tschatzl@7091 1628 hr->hrm_index(), i,
tonyp@3713 1629 BOOL_TO_STR(expected), BOOL_TO_STR(actual));
ysr@777 1630 }
johnc@3463 1631 failures += 1;
ysr@777 1632 }
ysr@777 1633 }
ysr@777 1634
johnc@3463 1635 if (failures > 0 && _verbose) {
johnc@3463 1636 gclog_or_tty->print_cr("Region " HR_FORMAT ", ntams: " PTR_FORMAT ", "
johnc@3463 1637 "marked_bytes: calc/actual " SIZE_FORMAT "/" SIZE_FORMAT,
drchase@6680 1638 HR_FORMAT_PARAMS(hr), p2i(hr->next_top_at_mark_start()),
johnc@3463 1639 _calc_cl.region_marked_bytes(), hr->next_marked_bytes());
johnc@3463 1640 }
johnc@3463 1641
johnc@3463 1642 _failures += failures;
johnc@3463 1643
johnc@3463 1644 // We could stop iteration over the heap when we
johnc@3731 1645 // find the first violating region by returning true.
ysr@777 1646 return false;
ysr@777 1647 }
ysr@777 1648 };
ysr@777 1649
johnc@3463 1650 class G1ParVerifyFinalCountTask: public AbstractGangTask {
johnc@3463 1651 protected:
johnc@3463 1652 G1CollectedHeap* _g1h;
johnc@3463 1653 ConcurrentMark* _cm;
johnc@3463 1654 BitMap* _actual_region_bm;
johnc@3463 1655 BitMap* _actual_card_bm;
johnc@3463 1656
johnc@3463 1657 uint _n_workers;
johnc@3463 1658
johnc@3463 1659 BitMap* _expected_region_bm;
johnc@3463 1660 BitMap* _expected_card_bm;
johnc@3463 1661
johnc@3463 1662 int _failures;
johnc@3463 1663 bool _verbose;
johnc@3463 1664
johnc@3463 1665 public:
johnc@3463 1666 G1ParVerifyFinalCountTask(G1CollectedHeap* g1h,
johnc@3463 1667 BitMap* region_bm, BitMap* card_bm,
johnc@3463 1668 BitMap* expected_region_bm, BitMap* expected_card_bm)
johnc@3463 1669 : AbstractGangTask("G1 verify final counting"),
johnc@3463 1670 _g1h(g1h), _cm(_g1h->concurrent_mark()),
johnc@3463 1671 _actual_region_bm(region_bm), _actual_card_bm(card_bm),
johnc@3463 1672 _expected_region_bm(expected_region_bm), _expected_card_bm(expected_card_bm),
johnc@3463 1673 _failures(0), _verbose(false),
johnc@3463 1674 _n_workers(0) {
johnc@3463 1675 assert(VerifyDuringGC, "don't call this otherwise");
johnc@3463 1676
johnc@3463 1677 // Use the value already set as the number of active threads
johnc@3463 1678 // in the call to run_task().
johnc@3463 1679 if (G1CollectedHeap::use_parallel_gc_threads()) {
johnc@3463 1680 assert( _g1h->workers()->active_workers() > 0,
johnc@3463 1681 "Should have been previously set");
johnc@3463 1682 _n_workers = _g1h->workers()->active_workers();
johnc@3463 1683 } else {
johnc@3463 1684 _n_workers = 1;
johnc@3463 1685 }
johnc@3463 1686
johnc@3463 1687 assert(_expected_card_bm->size() == _actual_card_bm->size(), "sanity");
johnc@3463 1688 assert(_expected_region_bm->size() == _actual_region_bm->size(), "sanity");
johnc@3463 1689
johnc@3463 1690 _verbose = _cm->verbose_medium();
johnc@3463 1691 }
johnc@3463 1692
johnc@3463 1693 void work(uint worker_id) {
johnc@3463 1694 assert(worker_id < _n_workers, "invariant");
johnc@3463 1695
johnc@4123 1696 VerifyLiveObjectDataHRClosure verify_cl(_g1h,
johnc@3463 1697 _actual_region_bm, _actual_card_bm,
johnc@3463 1698 _expected_region_bm,
johnc@3463 1699 _expected_card_bm,
johnc@3463 1700 _verbose);
johnc@3463 1701
johnc@3463 1702 if (G1CollectedHeap::use_parallel_gc_threads()) {
johnc@3463 1703 _g1h->heap_region_par_iterate_chunked(&verify_cl,
johnc@3463 1704 worker_id,
johnc@3463 1705 _n_workers,
johnc@3463 1706 HeapRegion::VerifyCountClaimValue);
johnc@3463 1707 } else {
johnc@3463 1708 _g1h->heap_region_iterate(&verify_cl);
johnc@3463 1709 }
johnc@3463 1710
johnc@3463 1711 Atomic::add(verify_cl.failures(), &_failures);
johnc@3463 1712 }
johnc@3463 1713
johnc@3463 1714 int failures() const { return _failures; }
johnc@3463 1715 };
johnc@3463 1716
johnc@3731 1717 // Closure that finalizes the liveness counting data.
johnc@3731 1718 // Used during the cleanup pause.
johnc@3731 1719 // Sets the bits corresponding to the interval [NTAMS, top]
johnc@3731 1720 // (which contains the implicitly live objects) in the
johnc@3731 1721 // card liveness bitmap. Also sets the bit for each region,
johnc@3731 1722 // containing live data, in the region liveness bitmap.
johnc@3731 1723
johnc@3731 1724 class FinalCountDataUpdateClosure: public CMCountDataClosureBase {
johnc@3463 1725 public:
johnc@4123 1726 FinalCountDataUpdateClosure(G1CollectedHeap* g1h,
johnc@3463 1727 BitMap* region_bm,
johnc@3463 1728 BitMap* card_bm) :
johnc@4123 1729 CMCountDataClosureBase(g1h, region_bm, card_bm) { }
johnc@3463 1730
johnc@3463 1731 bool doHeapRegion(HeapRegion* hr) {
johnc@3463 1732
johnc@3463 1733 if (hr->continuesHumongous()) {
johnc@3463 1734 // We will ignore these here and process them when their
johnc@3463 1735 // associated "starts humongous" region is processed (see
johnc@3463 1736 // set_bit_for_heap_region()). Note that we cannot rely on their
johnc@3463 1737 // associated "starts humongous" region to have their bit set to
johnc@3463 1738 // 1 since, due to the region chunking in the parallel region
johnc@3463 1739 // iteration, a "continues humongous" region might be visited
johnc@3463 1740 // before its associated "starts humongous".
johnc@3463 1741 return false;
johnc@3463 1742 }
johnc@3463 1743
johnc@3463 1744 HeapWord* ntams = hr->next_top_at_mark_start();
johnc@3463 1745 HeapWord* top = hr->top();
johnc@3463 1746
johnc@3731 1747 assert(hr->bottom() <= ntams && ntams <= hr->end(), "Preconditions.");
johnc@3463 1748
johnc@3463 1749 // Mark the allocated-since-marking portion...
johnc@3463 1750 if (ntams < top) {
johnc@3463 1751 // This definitely means the region has live objects.
johnc@3463 1752 set_bit_for_region(hr);
johnc@4123 1753
johnc@4123 1754 // Now set the bits in the card bitmap for [ntams, top)
johnc@4123 1755 BitMap::idx_t start_idx = _cm->card_bitmap_index_for(ntams);
johnc@4123 1756 BitMap::idx_t end_idx = _cm->card_bitmap_index_for(top);
johnc@4123 1757
johnc@4123 1758 // Note: if we're looking at the last region in heap - top
johnc@4123 1759 // could be actually just beyond the end of the heap; end_idx
johnc@4123 1760 // will then correspond to a (non-existent) card that is also
johnc@4123 1761 // just beyond the heap.
johnc@4123 1762 if (_g1h->is_in_g1_reserved(top) && !_ct_bs->is_card_aligned(top)) {
johnc@4123 1763 // end of object is not card aligned - increment to cover
johnc@4123 1764 // all the cards spanned by the object
johnc@4123 1765 end_idx += 1;
johnc@4123 1766 }
johnc@4123 1767
johnc@4123 1768 assert(end_idx <= _card_bm->size(),
johnc@4123 1769 err_msg("oob: end_idx= "SIZE_FORMAT", bitmap size= "SIZE_FORMAT,
johnc@4123 1770 end_idx, _card_bm->size()));
johnc@4123 1771 assert(start_idx < _card_bm->size(),
johnc@4123 1772 err_msg("oob: start_idx= "SIZE_FORMAT", bitmap size= "SIZE_FORMAT,
johnc@4123 1773 start_idx, _card_bm->size()));
johnc@4123 1774
johnc@4123 1775 _cm->set_card_bitmap_range(_card_bm, start_idx, end_idx, true /* is_par */);
coleenp@4037 1776 }
johnc@3463 1777
johnc@3463 1778 // Set the bit for the region if it contains live data
johnc@3463 1779 if (hr->next_marked_bytes() > 0) {
johnc@3463 1780 set_bit_for_region(hr);
johnc@3463 1781 }
johnc@3463 1782
johnc@3463 1783 return false;
johnc@3463 1784 }
johnc@3463 1785 };
ysr@777 1786
ysr@777 1787 class G1ParFinalCountTask: public AbstractGangTask {
ysr@777 1788 protected:
ysr@777 1789 G1CollectedHeap* _g1h;
johnc@3463 1790 ConcurrentMark* _cm;
johnc@3463 1791 BitMap* _actual_region_bm;
johnc@3463 1792 BitMap* _actual_card_bm;
johnc@3463 1793
jmasa@3357 1794 uint _n_workers;
johnc@3463 1795
ysr@777 1796 public:
johnc@3463 1797 G1ParFinalCountTask(G1CollectedHeap* g1h, BitMap* region_bm, BitMap* card_bm)
johnc@3463 1798 : AbstractGangTask("G1 final counting"),
johnc@3463 1799 _g1h(g1h), _cm(_g1h->concurrent_mark()),
johnc@3463 1800 _actual_region_bm(region_bm), _actual_card_bm(card_bm),
johnc@3463 1801 _n_workers(0) {
jmasa@3294 1802 // Use the value already set as the number of active threads
tonyp@3714 1803 // in the call to run_task().
jmasa@3294 1804 if (G1CollectedHeap::use_parallel_gc_threads()) {
jmasa@3294 1805 assert( _g1h->workers()->active_workers() > 0,
jmasa@3294 1806 "Should have been previously set");
jmasa@3294 1807 _n_workers = _g1h->workers()->active_workers();
tonyp@2973 1808 } else {
ysr@777 1809 _n_workers = 1;
tonyp@2973 1810 }
ysr@777 1811 }
ysr@777 1812
jmasa@3357 1813 void work(uint worker_id) {
johnc@3463 1814 assert(worker_id < _n_workers, "invariant");
johnc@3463 1815
johnc@4123 1816 FinalCountDataUpdateClosure final_update_cl(_g1h,
johnc@3463 1817 _actual_region_bm,
johnc@3463 1818 _actual_card_bm);
johnc@3463 1819
jmasa@2188 1820 if (G1CollectedHeap::use_parallel_gc_threads()) {
johnc@3463 1821 _g1h->heap_region_par_iterate_chunked(&final_update_cl,
johnc@3463 1822 worker_id,
johnc@3463 1823 _n_workers,
tonyp@790 1824 HeapRegion::FinalCountClaimValue);
ysr@777 1825 } else {
johnc@3463 1826 _g1h->heap_region_iterate(&final_update_cl);
ysr@777 1827 }
ysr@777 1828 }
ysr@777 1829 };
ysr@777 1830
ysr@777 1831 class G1ParNoteEndTask;
ysr@777 1832
ysr@777 1833 class G1NoteEndOfConcMarkClosure : public HeapRegionClosure {
ysr@777 1834 G1CollectedHeap* _g1;
ysr@777 1835 size_t _max_live_bytes;
tonyp@3713 1836 uint _regions_claimed;
ysr@777 1837 size_t _freed_bytes;
tonyp@2493 1838 FreeRegionList* _local_cleanup_list;
brutisso@6385 1839 HeapRegionSetCount _old_regions_removed;
brutisso@6385 1840 HeapRegionSetCount _humongous_regions_removed;
tonyp@2493 1841 HRRSCleanupTask* _hrrs_cleanup_task;
ysr@777 1842 double _claimed_region_time;
ysr@777 1843 double _max_region_time;
ysr@777 1844
ysr@777 1845 public:
ysr@777 1846 G1NoteEndOfConcMarkClosure(G1CollectedHeap* g1,
tonyp@2493 1847 FreeRegionList* local_cleanup_list,
johnc@3292 1848 HRRSCleanupTask* hrrs_cleanup_task) :
vkempik@6552 1849 _g1(g1),
johnc@3292 1850 _max_live_bytes(0), _regions_claimed(0),
johnc@3292 1851 _freed_bytes(0),
johnc@3292 1852 _claimed_region_time(0.0), _max_region_time(0.0),
johnc@3292 1853 _local_cleanup_list(local_cleanup_list),
brutisso@6385 1854 _old_regions_removed(),
brutisso@6385 1855 _humongous_regions_removed(),
johnc@3292 1856 _hrrs_cleanup_task(hrrs_cleanup_task) { }
johnc@3292 1857
ysr@777 1858 size_t freed_bytes() { return _freed_bytes; }
brutisso@6385 1859 const HeapRegionSetCount& old_regions_removed() { return _old_regions_removed; }
brutisso@6385 1860 const HeapRegionSetCount& humongous_regions_removed() { return _humongous_regions_removed; }
ysr@777 1861
johnc@3292 1862 bool doHeapRegion(HeapRegion *hr) {
tonyp@3957 1863 if (hr->continuesHumongous()) {
tonyp@3957 1864 return false;
tonyp@3957 1865 }
johnc@3292 1866 // We use a claim value of zero here because all regions
johnc@3292 1867 // were claimed with value 1 in the FinalCount task.
tonyp@3957 1868 _g1->reset_gc_time_stamps(hr);
tonyp@3957 1869 double start = os::elapsedTime();
tonyp@3957 1870 _regions_claimed++;
tonyp@3957 1871 hr->note_end_of_marking();
tonyp@3957 1872 _max_live_bytes += hr->max_live_bytes();
brutisso@6385 1873
brutisso@6385 1874 if (hr->used() > 0 && hr->max_live_bytes() == 0 && !hr->is_young()) {
brutisso@6385 1875 _freed_bytes += hr->used();
brutisso@6385 1876 hr->set_containing_set(NULL);
brutisso@6385 1877 if (hr->isHumongous()) {
brutisso@6385 1878 assert(hr->startsHumongous(), "we should only see starts humongous");
brutisso@6385 1879 _humongous_regions_removed.increment(1u, hr->capacity());
brutisso@6385 1880 _g1->free_humongous_region(hr, _local_cleanup_list, true);
brutisso@6385 1881 } else {
brutisso@6385 1882 _old_regions_removed.increment(1u, hr->capacity());
brutisso@6385 1883 _g1->free_region(hr, _local_cleanup_list, true);
brutisso@6385 1884 }
brutisso@6385 1885 } else {
brutisso@6385 1886 hr->rem_set()->do_cleanup_work(_hrrs_cleanup_task);
brutisso@6385 1887 }
brutisso@6385 1888
tonyp@3957 1889 double region_time = (os::elapsedTime() - start);
tonyp@3957 1890 _claimed_region_time += region_time;
tonyp@3957 1891 if (region_time > _max_region_time) {
tonyp@3957 1892 _max_region_time = region_time;
johnc@3292 1893 }
johnc@3292 1894 return false;
johnc@3292 1895 }
ysr@777 1896
ysr@777 1897 size_t max_live_bytes() { return _max_live_bytes; }
tonyp@3713 1898 uint regions_claimed() { return _regions_claimed; }
ysr@777 1899 double claimed_region_time_sec() { return _claimed_region_time; }
ysr@777 1900 double max_region_time_sec() { return _max_region_time; }
ysr@777 1901 };
ysr@777 1902
ysr@777 1903 class G1ParNoteEndTask: public AbstractGangTask {
ysr@777 1904 friend class G1NoteEndOfConcMarkClosure;
tonyp@2472 1905
ysr@777 1906 protected:
ysr@777 1907 G1CollectedHeap* _g1h;
ysr@777 1908 size_t _max_live_bytes;
ysr@777 1909 size_t _freed_bytes;
tonyp@2472 1910 FreeRegionList* _cleanup_list;
tonyp@2472 1911
ysr@777 1912 public:
ysr@777 1913 G1ParNoteEndTask(G1CollectedHeap* g1h,
tonyp@2472 1914 FreeRegionList* cleanup_list) :
ysr@777 1915 AbstractGangTask("G1 note end"), _g1h(g1h),
tonyp@2472 1916 _max_live_bytes(0), _freed_bytes(0), _cleanup_list(cleanup_list) { }
ysr@777 1917
jmasa@3357 1918 void work(uint worker_id) {
ysr@777 1919 double start = os::elapsedTime();
tonyp@2493 1920 FreeRegionList local_cleanup_list("Local Cleanup List");
tonyp@2493 1921 HRRSCleanupTask hrrs_cleanup_task;
vkempik@6552 1922 G1NoteEndOfConcMarkClosure g1_note_end(_g1h, &local_cleanup_list,
tonyp@2493 1923 &hrrs_cleanup_task);
jmasa@2188 1924 if (G1CollectedHeap::use_parallel_gc_threads()) {
jmasa@3357 1925 _g1h->heap_region_par_iterate_chunked(&g1_note_end, worker_id,
jmasa@3294 1926 _g1h->workers()->active_workers(),
tonyp@790 1927 HeapRegion::NoteEndClaimValue);
ysr@777 1928 } else {
ysr@777 1929 _g1h->heap_region_iterate(&g1_note_end);
ysr@777 1930 }
ysr@777 1931 assert(g1_note_end.complete(), "Shouldn't have yielded!");
ysr@777 1932
tonyp@2472 1933 // Now update the lists
brutisso@6385 1934 _g1h->remove_from_old_sets(g1_note_end.old_regions_removed(), g1_note_end.humongous_regions_removed());
ysr@777 1935 {
ysr@777 1936 MutexLockerEx x(ParGCRareEvent_lock, Mutex::_no_safepoint_check_flag);
brutisso@6385 1937 _g1h->decrement_summary_bytes(g1_note_end.freed_bytes());
ysr@777 1938 _max_live_bytes += g1_note_end.max_live_bytes();
ysr@777 1939 _freed_bytes += g1_note_end.freed_bytes();
tonyp@2472 1940
tonyp@2975 1941 // If we iterate over the global cleanup list at the end of
tonyp@2975 1942 // cleanup to do this printing we will not guarantee to only
tonyp@2975 1943 // generate output for the newly-reclaimed regions (the list
tonyp@2975 1944 // might not be empty at the beginning of cleanup; we might
tonyp@2975 1945 // still be working on its previous contents). So we do the
tonyp@2975 1946 // printing here, before we append the new regions to the global
tonyp@2975 1947 // cleanup list.
tonyp@2975 1948
tonyp@2975 1949 G1HRPrinter* hr_printer = _g1h->hr_printer();
tonyp@2975 1950 if (hr_printer->is_active()) {
brutisso@6385 1951 FreeRegionListIterator iter(&local_cleanup_list);
tonyp@2975 1952 while (iter.more_available()) {
tonyp@2975 1953 HeapRegion* hr = iter.get_next();
tonyp@2975 1954 hr_printer->cleanup(hr);
tonyp@2975 1955 }
tonyp@2975 1956 }
tonyp@2975 1957
jwilhelm@6422 1958 _cleanup_list->add_ordered(&local_cleanup_list);
tonyp@2493 1959 assert(local_cleanup_list.is_empty(), "post-condition");
tonyp@2493 1960
tonyp@2493 1961 HeapRegionRemSet::finish_cleanup_task(&hrrs_cleanup_task);
ysr@777 1962 }
ysr@777 1963 }
ysr@777 1964 size_t max_live_bytes() { return _max_live_bytes; }
ysr@777 1965 size_t freed_bytes() { return _freed_bytes; }
ysr@777 1966 };
ysr@777 1967
ysr@777 1968 class G1ParScrubRemSetTask: public AbstractGangTask {
ysr@777 1969 protected:
ysr@777 1970 G1RemSet* _g1rs;
ysr@777 1971 BitMap* _region_bm;
ysr@777 1972 BitMap* _card_bm;
ysr@777 1973 public:
ysr@777 1974 G1ParScrubRemSetTask(G1CollectedHeap* g1h,
ysr@777 1975 BitMap* region_bm, BitMap* card_bm) :
ysr@777 1976 AbstractGangTask("G1 ScrubRS"), _g1rs(g1h->g1_rem_set()),
johnc@3463 1977 _region_bm(region_bm), _card_bm(card_bm) { }
ysr@777 1978
jmasa@3357 1979 void work(uint worker_id) {
jmasa@2188 1980 if (G1CollectedHeap::use_parallel_gc_threads()) {
jmasa@3357 1981 _g1rs->scrub_par(_region_bm, _card_bm, worker_id,
tonyp@790 1982 HeapRegion::ScrubRemSetClaimValue);
ysr@777 1983 } else {
ysr@777 1984 _g1rs->scrub(_region_bm, _card_bm);
ysr@777 1985 }
ysr@777 1986 }
ysr@777 1987
ysr@777 1988 };
ysr@777 1989
ysr@777 1990 void ConcurrentMark::cleanup() {
ysr@777 1991 // world is stopped at this checkpoint
ysr@777 1992 assert(SafepointSynchronize::is_at_safepoint(),
ysr@777 1993 "world should be stopped");
ysr@777 1994 G1CollectedHeap* g1h = G1CollectedHeap::heap();
ysr@777 1995
ysr@777 1996 // If a full collection has happened, we shouldn't do this.
ysr@777 1997 if (has_aborted()) {
ysr@777 1998 g1h->set_marking_complete(); // So bitmap clearing isn't confused
ysr@777 1999 return;
ysr@777 2000 }
ysr@777 2001
tonyp@2472 2002 g1h->verify_region_sets_optional();
tonyp@2472 2003
ysr@1280 2004 if (VerifyDuringGC) {
ysr@1280 2005 HandleMark hm; // handle scope
ysr@1280 2006 Universe::heap()->prepare_for_verify();
stefank@5018 2007 Universe::verify(VerifyOption_G1UsePrevMarking,
stefank@5018 2008 " VerifyDuringGC:(before)");
ysr@1280 2009 }
brutisso@7005 2010 g1h->check_bitmaps("Cleanup Start");
ysr@1280 2011
ysr@777 2012 G1CollectorPolicy* g1p = G1CollectedHeap::heap()->g1_policy();
ysr@777 2013 g1p->record_concurrent_mark_cleanup_start();
ysr@777 2014
ysr@777 2015 double start = os::elapsedTime();
ysr@777 2016
tonyp@2493 2017 HeapRegionRemSet::reset_for_cleanup_tasks();
tonyp@2493 2018
jmasa@3357 2019 uint n_workers;
jmasa@3294 2020
ysr@777 2021 // Do counting once more with the world stopped for good measure.
johnc@3463 2022 G1ParFinalCountTask g1_par_count_task(g1h, &_region_bm, &_card_bm);
johnc@3463 2023
jmasa@2188 2024 if (G1CollectedHeap::use_parallel_gc_threads()) {
johnc@3463 2025 assert(g1h->check_heap_region_claim_values(HeapRegion::InitialClaimValue),
tonyp@790 2026 "sanity check");
tonyp@790 2027
johnc@3338 2028 g1h->set_par_threads();
johnc@3338 2029 n_workers = g1h->n_par_threads();
jmasa@3357 2030 assert(g1h->n_par_threads() == n_workers,
johnc@3338 2031 "Should not have been reset");
ysr@777 2032 g1h->workers()->run_task(&g1_par_count_task);
jmasa@3294 2033 // Done with the parallel phase so reset to 0.
ysr@777 2034 g1h->set_par_threads(0);
tonyp@790 2035
johnc@3463 2036 assert(g1h->check_heap_region_claim_values(HeapRegion::FinalCountClaimValue),
tonyp@790 2037 "sanity check");
ysr@777 2038 } else {
johnc@3338 2039 n_workers = 1;
ysr@777 2040 g1_par_count_task.work(0);
ysr@777 2041 }
ysr@777 2042
johnc@3463 2043 if (VerifyDuringGC) {
johnc@3463 2044 // Verify that the counting data accumulated during marking matches
johnc@3463 2045 // that calculated by walking the marking bitmap.
johnc@3463 2046
johnc@3463 2047 // Bitmaps to hold expected values
mgerdin@6977 2048 BitMap expected_region_bm(_region_bm.size(), true);
mgerdin@6977 2049 BitMap expected_card_bm(_card_bm.size(), true);
johnc@3463 2050
johnc@3463 2051 G1ParVerifyFinalCountTask g1_par_verify_task(g1h,
johnc@3463 2052 &_region_bm,
johnc@3463 2053 &_card_bm,
johnc@3463 2054 &expected_region_bm,
johnc@3463 2055 &expected_card_bm);
johnc@3463 2056
johnc@3463 2057 if (G1CollectedHeap::use_parallel_gc_threads()) {
johnc@3463 2058 g1h->set_par_threads((int)n_workers);
johnc@3463 2059 g1h->workers()->run_task(&g1_par_verify_task);
johnc@3463 2060 // Done with the parallel phase so reset to 0.
johnc@3463 2061 g1h->set_par_threads(0);
johnc@3463 2062
johnc@3463 2063 assert(g1h->check_heap_region_claim_values(HeapRegion::VerifyCountClaimValue),
johnc@3463 2064 "sanity check");
johnc@3463 2065 } else {
johnc@3463 2066 g1_par_verify_task.work(0);
johnc@3463 2067 }
johnc@3463 2068
johnc@3463 2069 guarantee(g1_par_verify_task.failures() == 0, "Unexpected accounting failures");
johnc@3463 2070 }
johnc@3463 2071
ysr@777 2072 size_t start_used_bytes = g1h->used();
ysr@777 2073 g1h->set_marking_complete();
ysr@777 2074
ysr@777 2075 double count_end = os::elapsedTime();
ysr@777 2076 double this_final_counting_time = (count_end - start);
ysr@777 2077 _total_counting_time += this_final_counting_time;
ysr@777 2078
tonyp@2717 2079 if (G1PrintRegionLivenessInfo) {
tonyp@2717 2080 G1PrintRegionLivenessInfoClosure cl(gclog_or_tty, "Post-Marking");
tonyp@2717 2081 _g1h->heap_region_iterate(&cl);
tonyp@2717 2082 }
tonyp@2717 2083
ysr@777 2084 // Install newly created mark bitMap as "prev".
ysr@777 2085 swapMarkBitMaps();
ysr@777 2086
ysr@777 2087 g1h->reset_gc_time_stamp();
ysr@777 2088
ysr@777 2089 // Note end of marking in all heap regions.
tonyp@2472 2090 G1ParNoteEndTask g1_par_note_end_task(g1h, &_cleanup_list);
jmasa@2188 2091 if (G1CollectedHeap::use_parallel_gc_threads()) {
jmasa@3294 2092 g1h->set_par_threads((int)n_workers);
ysr@777 2093 g1h->workers()->run_task(&g1_par_note_end_task);
ysr@777 2094 g1h->set_par_threads(0);
tonyp@790 2095
tonyp@790 2096 assert(g1h->check_heap_region_claim_values(HeapRegion::NoteEndClaimValue),
tonyp@790 2097 "sanity check");
ysr@777 2098 } else {
ysr@777 2099 g1_par_note_end_task.work(0);
ysr@777 2100 }
tonyp@3957 2101 g1h->check_gc_time_stamps();
tonyp@2472 2102
tonyp@2472 2103 if (!cleanup_list_is_empty()) {
tonyp@2472 2104 // The cleanup list is not empty, so we'll have to process it
tonyp@2472 2105 // concurrently. Notify anyone else that might be wanting free
tonyp@2472 2106 // regions that there will be more free regions coming soon.
tonyp@2472 2107 g1h->set_free_regions_coming();
tonyp@2472 2108 }
ysr@777 2109
ysr@777 2110 // call below, since it affects the metric by which we sort the heap
ysr@777 2111 // regions.
ysr@777 2112 if (G1ScrubRemSets) {
ysr@777 2113 double rs_scrub_start = os::elapsedTime();
ysr@777 2114 G1ParScrubRemSetTask g1_par_scrub_rs_task(g1h, &_region_bm, &_card_bm);
jmasa@2188 2115 if (G1CollectedHeap::use_parallel_gc_threads()) {
jmasa@3294 2116 g1h->set_par_threads((int)n_workers);
ysr@777 2117 g1h->workers()->run_task(&g1_par_scrub_rs_task);
ysr@777 2118 g1h->set_par_threads(0);
tonyp@790 2119
tonyp@790 2120 assert(g1h->check_heap_region_claim_values(
tonyp@790 2121 HeapRegion::ScrubRemSetClaimValue),
tonyp@790 2122 "sanity check");
ysr@777 2123 } else {
ysr@777 2124 g1_par_scrub_rs_task.work(0);
ysr@777 2125 }
ysr@777 2126
ysr@777 2127 double rs_scrub_end = os::elapsedTime();
ysr@777 2128 double this_rs_scrub_time = (rs_scrub_end - rs_scrub_start);
ysr@777 2129 _total_rs_scrub_time += this_rs_scrub_time;
ysr@777 2130 }
ysr@777 2131
ysr@777 2132 // this will also free any regions totally full of garbage objects,
ysr@777 2133 // and sort the regions.
jmasa@3294 2134 g1h->g1_policy()->record_concurrent_mark_cleanup_end((int)n_workers);
ysr@777 2135
ysr@777 2136 // Statistics.
ysr@777 2137 double end = os::elapsedTime();
ysr@777 2138 _cleanup_times.add((end - start) * 1000.0);
ysr@777 2139
brutisso@3710 2140 if (G1Log::fine()) {
ysr@777 2141 g1h->print_size_transition(gclog_or_tty,
ysr@777 2142 start_used_bytes,
ysr@777 2143 g1h->used(),
ysr@777 2144 g1h->capacity());
ysr@777 2145 }
ysr@777 2146
johnc@3175 2147 // Clean up will have freed any regions completely full of garbage.
johnc@3175 2148 // Update the soft reference policy with the new heap occupancy.
johnc@3175 2149 Universe::update_heap_info_at_gc();
johnc@3175 2150
johnc@1186 2151 if (VerifyDuringGC) {
ysr@1280 2152 HandleMark hm; // handle scope
ysr@1280 2153 Universe::heap()->prepare_for_verify();
stefank@5018 2154 Universe::verify(VerifyOption_G1UsePrevMarking,
stefank@5018 2155 " VerifyDuringGC:(after)");
ysr@777 2156 }
brutisso@7005 2157 g1h->check_bitmaps("Cleanup End");
tonyp@2472 2158
tonyp@2472 2159 g1h->verify_region_sets_optional();
stefank@6992 2160
stefank@6992 2161 // We need to make this be a "collection" so any collection pause that
stefank@6992 2162 // races with it goes around and waits for completeCleanup to finish.
stefank@6992 2163 g1h->increment_total_collections();
stefank@6992 2164
stefank@6992 2165 // Clean out dead classes and update Metaspace sizes.
stefank@6996 2166 if (ClassUnloadingWithConcurrentMark) {
stefank@6996 2167 ClassLoaderDataGraph::purge();
stefank@6996 2168 }
stefank@6992 2169 MetaspaceGC::compute_new_size();
stefank@6992 2170
stefank@6992 2171 // We reclaimed old regions so we should calculate the sizes to make
stefank@6992 2172 // sure we update the old gen/space data.
stefank@6992 2173 g1h->g1mm()->update_sizes();
stefank@6992 2174
sla@5237 2175 g1h->trace_heap_after_concurrent_cycle();
ysr@777 2176 }
ysr@777 2177
ysr@777 2178 void ConcurrentMark::completeCleanup() {
ysr@777 2179 if (has_aborted()) return;
ysr@777 2180
tonyp@2472 2181 G1CollectedHeap* g1h = G1CollectedHeap::heap();
tonyp@2472 2182
jwilhelm@6549 2183 _cleanup_list.verify_optional();
tonyp@2643 2184 FreeRegionList tmp_free_list("Tmp Free List");
tonyp@2472 2185
tonyp@2472 2186 if (G1ConcRegionFreeingVerbose) {
tonyp@2472 2187 gclog_or_tty->print_cr("G1ConcRegionFreeing [complete cleanup] : "
tonyp@3713 2188 "cleanup list has %u entries",
tonyp@2472 2189 _cleanup_list.length());
tonyp@2472 2190 }
tonyp@2472 2191
tschatzl@7051 2192 // No one else should be accessing the _cleanup_list at this point,
tschatzl@7051 2193 // so it is not necessary to take any locks
tonyp@2472 2194 while (!_cleanup_list.is_empty()) {
tschatzl@7050 2195 HeapRegion* hr = _cleanup_list.remove_region(true /* from_head */);
jwilhelm@6422 2196 assert(hr != NULL, "Got NULL from a non-empty list");
tonyp@2849 2197 hr->par_clear();
jwilhelm@6422 2198 tmp_free_list.add_ordered(hr);
tonyp@2472 2199
tonyp@2472 2200 // Instead of adding one region at a time to the secondary_free_list,
tonyp@2472 2201 // we accumulate them in the local list and move them a few at a
tonyp@2472 2202 // time. This also cuts down on the number of notify_all() calls
tonyp@2472 2203 // we do during this process. We'll also append the local list when
tonyp@2472 2204 // _cleanup_list is empty (which means we just removed the last
tonyp@2472 2205 // region from the _cleanup_list).
tonyp@2643 2206 if ((tmp_free_list.length() % G1SecondaryFreeListAppendLength == 0) ||
tonyp@2472 2207 _cleanup_list.is_empty()) {
tonyp@2472 2208 if (G1ConcRegionFreeingVerbose) {
tonyp@2472 2209 gclog_or_tty->print_cr("G1ConcRegionFreeing [complete cleanup] : "
tonyp@3713 2210 "appending %u entries to the secondary_free_list, "
tonyp@3713 2211 "cleanup list still has %u entries",
tonyp@2643 2212 tmp_free_list.length(),
tonyp@2472 2213 _cleanup_list.length());
ysr@777 2214 }
tonyp@2472 2215
tonyp@2472 2216 {
tonyp@2472 2217 MutexLockerEx x(SecondaryFreeList_lock, Mutex::_no_safepoint_check_flag);
jwilhelm@6422 2218 g1h->secondary_free_list_add(&tmp_free_list);
tonyp@2472 2219 SecondaryFreeList_lock->notify_all();
tonyp@2472 2220 }
tonyp@2472 2221
tonyp@2472 2222 if (G1StressConcRegionFreeing) {
tonyp@2472 2223 for (uintx i = 0; i < G1StressConcRegionFreeingDelayMillis; ++i) {
tonyp@2472 2224 os::sleep(Thread::current(), (jlong) 1, false);
tonyp@2472 2225 }
tonyp@2472 2226 }
ysr@777 2227 }
ysr@777 2228 }
tonyp@2643 2229 assert(tmp_free_list.is_empty(), "post-condition");
ysr@777 2230 }
ysr@777 2231
johnc@4555 2232 // Supporting Object and Oop closures for reference discovery
johnc@4555 2233 // and processing in during marking
johnc@2494 2234
johnc@2379 2235 bool G1CMIsAliveClosure::do_object_b(oop obj) {
johnc@2379 2236 HeapWord* addr = (HeapWord*)obj;
johnc@2379 2237 return addr != NULL &&
johnc@2379 2238 (!_g1->is_in_g1_reserved(addr) || !_g1->is_obj_ill(obj));
johnc@2379 2239 }
ysr@777 2240
johnc@4555 2241 // 'Keep Alive' oop closure used by both serial parallel reference processing.
johnc@4555 2242 // Uses the CMTask associated with a worker thread (for serial reference
johnc@4555 2243 // processing the CMTask for worker 0 is used) to preserve (mark) and
johnc@4555 2244 // trace referent objects.
johnc@4555 2245 //
johnc@4555 2246 // Using the CMTask and embedded local queues avoids having the worker
johnc@4555 2247 // threads operating on the global mark stack. This reduces the risk
johnc@4555 2248 // of overflowing the stack - which we would rather avoid at this late
johnc@4555 2249 // state. Also using the tasks' local queues removes the potential
johnc@4555 2250 // of the workers interfering with each other that could occur if
johnc@4555 2251 // operating on the global stack.
johnc@4555 2252
johnc@4555 2253 class G1CMKeepAliveAndDrainClosure: public OopClosure {
johnc@4787 2254 ConcurrentMark* _cm;
johnc@4787 2255 CMTask* _task;
johnc@4787 2256 int _ref_counter_limit;
johnc@4787 2257 int _ref_counter;
johnc@4787 2258 bool _is_serial;
johnc@2494 2259 public:
johnc@4787 2260 G1CMKeepAliveAndDrainClosure(ConcurrentMark* cm, CMTask* task, bool is_serial) :
johnc@4787 2261 _cm(cm), _task(task), _is_serial(is_serial),
johnc@4787 2262 _ref_counter_limit(G1RefProcDrainInterval) {
johnc@2494 2263 assert(_ref_counter_limit > 0, "sanity");
johnc@4787 2264 assert(!_is_serial || _task->worker_id() == 0, "only task 0 for serial code");
johnc@2494 2265 _ref_counter = _ref_counter_limit;
johnc@2494 2266 }
johnc@2494 2267
johnc@2494 2268 virtual void do_oop(narrowOop* p) { do_oop_work(p); }
johnc@2494 2269 virtual void do_oop( oop* p) { do_oop_work(p); }
johnc@2494 2270
johnc@2494 2271 template <class T> void do_oop_work(T* p) {
johnc@2494 2272 if (!_cm->has_overflown()) {
johnc@2494 2273 oop obj = oopDesc::load_decode_heap_oop(p);
tonyp@2973 2274 if (_cm->verbose_high()) {
johnc@4173 2275 gclog_or_tty->print_cr("\t[%u] we're looking at location "
johnc@2494 2276 "*"PTR_FORMAT" = "PTR_FORMAT,
drchase@6680 2277 _task->worker_id(), p2i(p), p2i((void*) obj));
tonyp@2973 2278 }
johnc@2494 2279
johnc@2494 2280 _task->deal_with_reference(obj);
johnc@2494 2281 _ref_counter--;
johnc@2494 2282
johnc@2494 2283 if (_ref_counter == 0) {
johnc@4555 2284 // We have dealt with _ref_counter_limit references, pushing them
johnc@4555 2285 // and objects reachable from them on to the local stack (and
johnc@4555 2286 // possibly the global stack). Call CMTask::do_marking_step() to
johnc@4555 2287 // process these entries.
johnc@4555 2288 //
johnc@4555 2289 // We call CMTask::do_marking_step() in a loop, which we'll exit if
johnc@4555 2290 // there's nothing more to do (i.e. we're done with the entries that
johnc@4555 2291 // were pushed as a result of the CMTask::deal_with_reference() calls
johnc@4555 2292 // above) or we overflow.
johnc@4555 2293 //
johnc@4555 2294 // Note: CMTask::do_marking_step() can set the CMTask::has_aborted()
johnc@4555 2295 // flag while there may still be some work to do. (See the comment at
johnc@4555 2296 // the beginning of CMTask::do_marking_step() for those conditions -
johnc@4555 2297 // one of which is reaching the specified time target.) It is only
johnc@4555 2298 // when CMTask::do_marking_step() returns without setting the
johnc@4555 2299 // has_aborted() flag that the marking step has completed.
johnc@2494 2300 do {
johnc@2494 2301 double mark_step_duration_ms = G1ConcMarkStepDurationMillis;
johnc@2494 2302 _task->do_marking_step(mark_step_duration_ms,
johnc@4787 2303 false /* do_termination */,
johnc@4787 2304 _is_serial);
johnc@2494 2305 } while (_task->has_aborted() && !_cm->has_overflown());
johnc@2494 2306 _ref_counter = _ref_counter_limit;
johnc@2494 2307 }
johnc@2494 2308 } else {
tonyp@2973 2309 if (_cm->verbose_high()) {
johnc@4173 2310 gclog_or_tty->print_cr("\t[%u] CM Overflow", _task->worker_id());
tonyp@2973 2311 }
johnc@2494 2312 }
johnc@2494 2313 }
johnc@2494 2314 };
johnc@2494 2315
johnc@4555 2316 // 'Drain' oop closure used by both serial and parallel reference processing.
johnc@4555 2317 // Uses the CMTask associated with a given worker thread (for serial
johnc@4555 2318 // reference processing the CMtask for worker 0 is used). Calls the
johnc@4555 2319 // do_marking_step routine, with an unbelievably large timeout value,
johnc@4555 2320 // to drain the marking data structures of the remaining entries
johnc@4555 2321 // added by the 'keep alive' oop closure above.
johnc@4555 2322
johnc@4555 2323 class G1CMDrainMarkingStackClosure: public VoidClosure {
johnc@2494 2324 ConcurrentMark* _cm;
johnc@4555 2325 CMTask* _task;
johnc@4787 2326 bool _is_serial;
johnc@2494 2327 public:
johnc@4787 2328 G1CMDrainMarkingStackClosure(ConcurrentMark* cm, CMTask* task, bool is_serial) :
johnc@4787 2329 _cm(cm), _task(task), _is_serial(is_serial) {
johnc@4787 2330 assert(!_is_serial || _task->worker_id() == 0, "only task 0 for serial code");
johnc@4555 2331 }
johnc@2494 2332
johnc@2494 2333 void do_void() {
johnc@2494 2334 do {
tonyp@2973 2335 if (_cm->verbose_high()) {
johnc@4787 2336 gclog_or_tty->print_cr("\t[%u] Drain: Calling do_marking_step - serial: %s",
johnc@4787 2337 _task->worker_id(), BOOL_TO_STR(_is_serial));
tonyp@2973 2338 }
johnc@2494 2339
johnc@4555 2340 // We call CMTask::do_marking_step() to completely drain the local
johnc@4555 2341 // and global marking stacks of entries pushed by the 'keep alive'
johnc@4555 2342 // oop closure (an instance of G1CMKeepAliveAndDrainClosure above).
johnc@4555 2343 //
johnc@4555 2344 // CMTask::do_marking_step() is called in a loop, which we'll exit
johnc@4555 2345 // if there's nothing more to do (i.e. we'completely drained the
johnc@4555 2346 // entries that were pushed as a a result of applying the 'keep alive'
johnc@4555 2347 // closure to the entries on the discovered ref lists) or we overflow
johnc@4555 2348 // the global marking stack.
johnc@4555 2349 //
johnc@4555 2350 // Note: CMTask::do_marking_step() can set the CMTask::has_aborted()
johnc@4555 2351 // flag while there may still be some work to do. (See the comment at
johnc@4555 2352 // the beginning of CMTask::do_marking_step() for those conditions -
johnc@4555 2353 // one of which is reaching the specified time target.) It is only
johnc@4555 2354 // when CMTask::do_marking_step() returns without setting the
johnc@4555 2355 // has_aborted() flag that the marking step has completed.
johnc@2494 2356
johnc@2494 2357 _task->do_marking_step(1000000000.0 /* something very large */,
johnc@4787 2358 true /* do_termination */,
johnc@4787 2359 _is_serial);
johnc@2494 2360 } while (_task->has_aborted() && !_cm->has_overflown());
johnc@2494 2361 }
johnc@2494 2362 };
johnc@2494 2363
johnc@3175 2364 // Implementation of AbstractRefProcTaskExecutor for parallel
johnc@3175 2365 // reference processing at the end of G1 concurrent marking
johnc@3175 2366
johnc@3175 2367 class G1CMRefProcTaskExecutor: public AbstractRefProcTaskExecutor {
johnc@2494 2368 private:
johnc@2494 2369 G1CollectedHeap* _g1h;
johnc@2494 2370 ConcurrentMark* _cm;
johnc@2494 2371 WorkGang* _workers;
johnc@2494 2372 int _active_workers;
johnc@2494 2373
johnc@2494 2374 public:
johnc@3175 2375 G1CMRefProcTaskExecutor(G1CollectedHeap* g1h,
johnc@2494 2376 ConcurrentMark* cm,
johnc@2494 2377 WorkGang* workers,
johnc@2494 2378 int n_workers) :
johnc@3292 2379 _g1h(g1h), _cm(cm),
johnc@3292 2380 _workers(workers), _active_workers(n_workers) { }
johnc@2494 2381
johnc@2494 2382 // Executes the given task using concurrent marking worker threads.
johnc@2494 2383 virtual void execute(ProcessTask& task);
johnc@2494 2384 virtual void execute(EnqueueTask& task);
johnc@2494 2385 };
johnc@2494 2386
johnc@3175 2387 class G1CMRefProcTaskProxy: public AbstractGangTask {
johnc@2494 2388 typedef AbstractRefProcTaskExecutor::ProcessTask ProcessTask;
johnc@2494 2389 ProcessTask& _proc_task;
johnc@2494 2390 G1CollectedHeap* _g1h;
johnc@2494 2391 ConcurrentMark* _cm;
johnc@2494 2392
johnc@2494 2393 public:
johnc@3175 2394 G1CMRefProcTaskProxy(ProcessTask& proc_task,
johnc@2494 2395 G1CollectedHeap* g1h,
johnc@3292 2396 ConcurrentMark* cm) :
johnc@2494 2397 AbstractGangTask("Process reference objects in parallel"),
johnc@4555 2398 _proc_task(proc_task), _g1h(g1h), _cm(cm) {
johnc@4787 2399 ReferenceProcessor* rp = _g1h->ref_processor_cm();
johnc@4787 2400 assert(rp->processing_is_mt(), "shouldn't be here otherwise");
johnc@4787 2401 }
johnc@2494 2402
jmasa@3357 2403 virtual void work(uint worker_id) {
mdoerr@7020 2404 ResourceMark rm;
mdoerr@7020 2405 HandleMark hm;
johnc@4787 2406 CMTask* task = _cm->task(worker_id);
johnc@2494 2407 G1CMIsAliveClosure g1_is_alive(_g1h);
johnc@4787 2408 G1CMKeepAliveAndDrainClosure g1_par_keep_alive(_cm, task, false /* is_serial */);
johnc@4787 2409 G1CMDrainMarkingStackClosure g1_par_drain(_cm, task, false /* is_serial */);
johnc@2494 2410
jmasa@3357 2411 _proc_task.work(worker_id, g1_is_alive, g1_par_keep_alive, g1_par_drain);
johnc@2494 2412 }
johnc@2494 2413 };
johnc@2494 2414
johnc@3175 2415 void G1CMRefProcTaskExecutor::execute(ProcessTask& proc_task) {
johnc@2494 2416 assert(_workers != NULL, "Need parallel worker threads.");
johnc@4555 2417 assert(_g1h->ref_processor_cm()->processing_is_mt(), "processing is not MT");
johnc@2494 2418
johnc@3292 2419 G1CMRefProcTaskProxy proc_task_proxy(proc_task, _g1h, _cm);
johnc@2494 2420
johnc@4788 2421 // We need to reset the concurrency level before each
johnc@4788 2422 // proxy task execution, so that the termination protocol
johnc@4788 2423 // and overflow handling in CMTask::do_marking_step() knows
johnc@4788 2424 // how many workers to wait for.
johnc@4788 2425 _cm->set_concurrency(_active_workers);
johnc@2494 2426 _g1h->set_par_threads(_active_workers);
johnc@2494 2427 _workers->run_task(&proc_task_proxy);
johnc@2494 2428 _g1h->set_par_threads(0);
johnc@2494 2429 }
johnc@2494 2430
johnc@3175 2431 class G1CMRefEnqueueTaskProxy: public AbstractGangTask {
johnc@2494 2432 typedef AbstractRefProcTaskExecutor::EnqueueTask EnqueueTask;
johnc@2494 2433 EnqueueTask& _enq_task;
johnc@2494 2434
johnc@2494 2435 public:
johnc@3175 2436 G1CMRefEnqueueTaskProxy(EnqueueTask& enq_task) :
johnc@2494 2437 AbstractGangTask("Enqueue reference objects in parallel"),
johnc@3292 2438 _enq_task(enq_task) { }
johnc@2494 2439
jmasa@3357 2440 virtual void work(uint worker_id) {
jmasa@3357 2441 _enq_task.work(worker_id);
johnc@2494 2442 }
johnc@2494 2443 };
johnc@2494 2444
johnc@3175 2445 void G1CMRefProcTaskExecutor::execute(EnqueueTask& enq_task) {
johnc@2494 2446 assert(_workers != NULL, "Need parallel worker threads.");
johnc@4555 2447 assert(_g1h->ref_processor_cm()->processing_is_mt(), "processing is not MT");
johnc@2494 2448
johnc@3175 2449 G1CMRefEnqueueTaskProxy enq_task_proxy(enq_task);
johnc@2494 2450
johnc@4788 2451 // Not strictly necessary but...
johnc@4788 2452 //
johnc@4788 2453 // We need to reset the concurrency level before each
johnc@4788 2454 // proxy task execution, so that the termination protocol
johnc@4788 2455 // and overflow handling in CMTask::do_marking_step() knows
johnc@4788 2456 // how many workers to wait for.
johnc@4788 2457 _cm->set_concurrency(_active_workers);
johnc@2494 2458 _g1h->set_par_threads(_active_workers);
johnc@2494 2459 _workers->run_task(&enq_task_proxy);
johnc@2494 2460 _g1h->set_par_threads(0);
johnc@2494 2461 }
johnc@2494 2462
stefank@6992 2463 void ConcurrentMark::weakRefsWorkParallelPart(BoolObjectClosure* is_alive, bool purged_classes) {
stefank@6992 2464 G1CollectedHeap::heap()->parallel_cleaning(is_alive, true, true, purged_classes);
stefank@6992 2465 }
stefank@6992 2466
stefank@6992 2467 // Helper class to get rid of some boilerplate code.
stefank@6992 2468 class G1RemarkGCTraceTime : public GCTraceTime {
stefank@6992 2469 static bool doit_and_prepend(bool doit) {
stefank@6992 2470 if (doit) {
stefank@6992 2471 gclog_or_tty->put(' ');
stefank@6992 2472 }
stefank@6992 2473 return doit;
stefank@6992 2474 }
stefank@6992 2475
stefank@6992 2476 public:
stefank@6992 2477 G1RemarkGCTraceTime(const char* title, bool doit)
stefank@6992 2478 : GCTraceTime(title, doit_and_prepend(doit), false, G1CollectedHeap::heap()->gc_timer_cm(),
stefank@6992 2479 G1CollectedHeap::heap()->concurrent_mark()->concurrent_gc_id()) {
stefank@6992 2480 }
stefank@6992 2481 };
stefank@6992 2482
ysr@777 2483 void ConcurrentMark::weakRefsWork(bool clear_all_soft_refs) {
johnc@4788 2484 if (has_overflown()) {
johnc@4788 2485 // Skip processing the discovered references if we have
johnc@4788 2486 // overflown the global marking stack. Reference objects
johnc@4788 2487 // only get discovered once so it is OK to not
johnc@4788 2488 // de-populate the discovered reference lists. We could have,
johnc@4788 2489 // but the only benefit would be that, when marking restarts,
johnc@4788 2490 // less reference objects are discovered.
johnc@4788 2491 return;
johnc@4788 2492 }
johnc@4788 2493
ysr@777 2494 ResourceMark rm;
ysr@777 2495 HandleMark hm;
johnc@3171 2496
johnc@3171 2497 G1CollectedHeap* g1h = G1CollectedHeap::heap();
johnc@3171 2498
johnc@3171 2499 // Is alive closure.
johnc@3171 2500 G1CMIsAliveClosure g1_is_alive(g1h);
johnc@3171 2501
johnc@3171 2502 // Inner scope to exclude the cleaning of the string and symbol
johnc@3171 2503 // tables from the displayed time.
johnc@3171 2504 {
brutisso@3710 2505 if (G1Log::finer()) {
johnc@3171 2506 gclog_or_tty->put(' ');
johnc@3171 2507 }
brutisso@6904 2508 GCTraceTime t("GC ref-proc", G1Log::finer(), false, g1h->gc_timer_cm(), concurrent_gc_id());
johnc@3171 2509
johnc@3175 2510 ReferenceProcessor* rp = g1h->ref_processor_cm();
johnc@3171 2511
johnc@3171 2512 // See the comment in G1CollectedHeap::ref_processing_init()
johnc@3171 2513 // about how reference processing currently works in G1.
johnc@3171 2514
johnc@4555 2515 // Set the soft reference policy
johnc@3171 2516 rp->setup_policy(clear_all_soft_refs);
johnc@3171 2517 assert(_markStack.isEmpty(), "mark stack should be empty");
johnc@3171 2518
johnc@4787 2519 // Instances of the 'Keep Alive' and 'Complete GC' closures used
johnc@4787 2520 // in serial reference processing. Note these closures are also
johnc@4787 2521 // used for serially processing (by the the current thread) the
johnc@4787 2522 // JNI references during parallel reference processing.
johnc@4787 2523 //
johnc@4787 2524 // These closures do not need to synchronize with the worker
johnc@4787 2525 // threads involved in parallel reference processing as these
johnc@4787 2526 // instances are executed serially by the current thread (e.g.
johnc@4787 2527 // reference processing is not multi-threaded and is thus
johnc@4787 2528 // performed by the current thread instead of a gang worker).
johnc@4787 2529 //
johnc@4787 2530 // The gang tasks involved in parallel reference procssing create
johnc@4787 2531 // their own instances of these closures, which do their own
johnc@4787 2532 // synchronization among themselves.
johnc@4787 2533 G1CMKeepAliveAndDrainClosure g1_keep_alive(this, task(0), true /* is_serial */);
johnc@4787 2534 G1CMDrainMarkingStackClosure g1_drain_mark_stack(this, task(0), true /* is_serial */);
johnc@4787 2535
johnc@4787 2536 // We need at least one active thread. If reference processing
johnc@4787 2537 // is not multi-threaded we use the current (VMThread) thread,
johnc@4787 2538 // otherwise we use the work gang from the G1CollectedHeap and
johnc@4787 2539 // we utilize all the worker threads we can.
johnc@4787 2540 bool processing_is_mt = rp->processing_is_mt() && g1h->workers() != NULL;
johnc@4787 2541 uint active_workers = (processing_is_mt ? g1h->workers()->active_workers() : 1U);
johnc@4173 2542 active_workers = MAX2(MIN2(active_workers, _max_worker_id), 1U);
johnc@3171 2543
johnc@4787 2544 // Parallel processing task executor.
johnc@3292 2545 G1CMRefProcTaskExecutor par_task_executor(g1h, this,
johnc@3175 2546 g1h->workers(), active_workers);
johnc@4787 2547 AbstractRefProcTaskExecutor* executor = (processing_is_mt ? &par_task_executor : NULL);
johnc@4555 2548
johnc@4788 2549 // Set the concurrency level. The phase was already set prior to
johnc@4788 2550 // executing the remark task.
johnc@4788 2551 set_concurrency(active_workers);
johnc@4788 2552
johnc@4555 2553 // Set the degree of MT processing here. If the discovery was done MT,
johnc@4555 2554 // the number of threads involved during discovery could differ from
johnc@4555 2555 // the number of active workers. This is OK as long as the discovered
johnc@4555 2556 // Reference lists are balanced (see balance_all_queues() and balance_queues()).
johnc@4555 2557 rp->set_active_mt_degree(active_workers);
johnc@4555 2558
johnc@4555 2559 // Process the weak references.
sla@5237 2560 const ReferenceProcessorStats& stats =
sla@5237 2561 rp->process_discovered_references(&g1_is_alive,
sla@5237 2562 &g1_keep_alive,
sla@5237 2563 &g1_drain_mark_stack,
sla@5237 2564 executor,
brutisso@6904 2565 g1h->gc_timer_cm(),
brutisso@6904 2566 concurrent_gc_id());
sla@5237 2567 g1h->gc_tracer_cm()->report_gc_reference_stats(stats);
johnc@4555 2568
johnc@4555 2569 // The do_oop work routines of the keep_alive and drain_marking_stack
johnc@4555 2570 // oop closures will set the has_overflown flag if we overflow the
johnc@4555 2571 // global marking stack.
johnc@3171 2572
johnc@3171 2573 assert(_markStack.overflow() || _markStack.isEmpty(),
johnc@3171 2574 "mark stack should be empty (unless it overflowed)");
johnc@4787 2575
johnc@3171 2576 if (_markStack.overflow()) {
johnc@4555 2577 // This should have been done already when we tried to push an
johnc@3171 2578 // entry on to the global mark stack. But let's do it again.
johnc@3171 2579 set_has_overflown();
johnc@3171 2580 }
johnc@3171 2581
johnc@4555 2582 assert(rp->num_q() == active_workers, "why not");
johnc@4555 2583
johnc@4555 2584 rp->enqueue_discovered_references(executor);
johnc@3171 2585
johnc@3171 2586 rp->verify_no_references_recorded();
johnc@3175 2587 assert(!rp->discovery_enabled(), "Post condition");
johnc@2494 2588 }
johnc@2494 2589
pliden@6399 2590 if (has_overflown()) {
pliden@6399 2591 // We can not trust g1_is_alive if the marking stack overflowed
pliden@6399 2592 return;
pliden@6399 2593 }
pliden@6399 2594
stefank@6992 2595 assert(_markStack.isEmpty(), "Marking should have completed");
stefank@6992 2596
stefank@6992 2597 // Unload Klasses, String, Symbols, Code Cache, etc.
stefank@6992 2598 {
stefank@6996 2599 G1RemarkGCTraceTime trace("Unloading", G1Log::finer());
stefank@6996 2600
stefank@6996 2601 if (ClassUnloadingWithConcurrentMark) {
stefank@6996 2602 bool purged_classes;
stefank@6996 2603
stefank@6996 2604 {
stefank@6996 2605 G1RemarkGCTraceTime trace("System Dictionary Unloading", G1Log::finest());
stefank@6996 2606 purged_classes = SystemDictionary::do_unloading(&g1_is_alive);
stefank@6996 2607 }
stefank@6996 2608
stefank@6996 2609 {
stefank@6996 2610 G1RemarkGCTraceTime trace("Parallel Unloading", G1Log::finest());
stefank@6996 2611 weakRefsWorkParallelPart(&g1_is_alive, purged_classes);
stefank@6996 2612 }
stefank@6996 2613 }
stefank@6996 2614
stefank@6996 2615 if (G1StringDedup::is_enabled()) {
stefank@6996 2616 G1RemarkGCTraceTime trace("String Deduplication Unlink", G1Log::finest());
stefank@6996 2617 G1StringDedup::unlink(&g1_is_alive);
stefank@6996 2618 }
stefank@6992 2619 }
ysr@777 2620 }
ysr@777 2621
ysr@777 2622 void ConcurrentMark::swapMarkBitMaps() {
ysr@777 2623 CMBitMapRO* temp = _prevMarkBitMap;
ysr@777 2624 _prevMarkBitMap = (CMBitMapRO*)_nextMarkBitMap;
ysr@777 2625 _nextMarkBitMap = (CMBitMap*) temp;
ysr@777 2626 }
ysr@777 2627
stefank@6992 2628 class CMObjectClosure;
stefank@6992 2629
stefank@6992 2630 // Closure for iterating over objects, currently only used for
stefank@6992 2631 // processing SATB buffers.
stefank@6992 2632 class CMObjectClosure : public ObjectClosure {
stefank@6992 2633 private:
stefank@6992 2634 CMTask* _task;
stefank@6992 2635
stefank@6992 2636 public:
stefank@6992 2637 void do_object(oop obj) {
stefank@6992 2638 _task->deal_with_reference(obj);
stefank@6992 2639 }
stefank@6992 2640
stefank@6992 2641 CMObjectClosure(CMTask* task) : _task(task) { }
stefank@6992 2642 };
stefank@6992 2643
stefank@6992 2644 class G1RemarkThreadsClosure : public ThreadClosure {
stefank@6992 2645 CMObjectClosure _cm_obj;
stefank@6992 2646 G1CMOopClosure _cm_cl;
stefank@6992 2647 MarkingCodeBlobClosure _code_cl;
stefank@6992 2648 int _thread_parity;
stefank@6992 2649 bool _is_par;
stefank@6992 2650
stefank@6992 2651 public:
stefank@6992 2652 G1RemarkThreadsClosure(G1CollectedHeap* g1h, CMTask* task, bool is_par) :
stefank@6992 2653 _cm_obj(task), _cm_cl(g1h, g1h->concurrent_mark(), task), _code_cl(&_cm_cl, !CodeBlobToOopClosure::FixRelocations),
stefank@6992 2654 _thread_parity(SharedHeap::heap()->strong_roots_parity()), _is_par(is_par) {}
stefank@6992 2655
stefank@6992 2656 void do_thread(Thread* thread) {
stefank@6992 2657 if (thread->is_Java_thread()) {
stefank@6992 2658 if (thread->claim_oops_do(_is_par, _thread_parity)) {
stefank@6992 2659 JavaThread* jt = (JavaThread*)thread;
stefank@6992 2660
stefank@6992 2661 // In theory it should not be neccessary to explicitly walk the nmethods to find roots for concurrent marking
stefank@6992 2662 // however the liveness of oops reachable from nmethods have very complex lifecycles:
stefank@6992 2663 // * Alive if on the stack of an executing method
stefank@6992 2664 // * Weakly reachable otherwise
stefank@6992 2665 // Some objects reachable from nmethods, such as the class loader (or klass_holder) of the receiver should be
stefank@6992 2666 // live by the SATB invariant but other oops recorded in nmethods may behave differently.
stefank@6992 2667 jt->nmethods_do(&_code_cl);
stefank@6992 2668
stefank@6992 2669 jt->satb_mark_queue().apply_closure_and_empty(&_cm_obj);
stefank@6992 2670 }
stefank@6992 2671 } else if (thread->is_VM_thread()) {
stefank@6992 2672 if (thread->claim_oops_do(_is_par, _thread_parity)) {
stefank@6992 2673 JavaThread::satb_mark_queue_set().shared_satb_queue()->apply_closure_and_empty(&_cm_obj);
stefank@6992 2674 }
stefank@6992 2675 }
stefank@6992 2676 }
stefank@6992 2677 };
stefank@6992 2678
ysr@777 2679 class CMRemarkTask: public AbstractGangTask {
ysr@777 2680 private:
johnc@4787 2681 ConcurrentMark* _cm;
johnc@4787 2682 bool _is_serial;
ysr@777 2683 public:
jmasa@3357 2684 void work(uint worker_id) {
ysr@777 2685 // Since all available tasks are actually started, we should
ysr@777 2686 // only proceed if we're supposed to be actived.
jmasa@3357 2687 if (worker_id < _cm->active_tasks()) {
jmasa@3357 2688 CMTask* task = _cm->task(worker_id);
ysr@777 2689 task->record_start_time();
stefank@6992 2690 {
stefank@6992 2691 ResourceMark rm;
stefank@6992 2692 HandleMark hm;
stefank@6992 2693
stefank@6992 2694 G1RemarkThreadsClosure threads_f(G1CollectedHeap::heap(), task, !_is_serial);
stefank@6992 2695 Threads::threads_do(&threads_f);
stefank@6992 2696 }
stefank@6992 2697
ysr@777 2698 do {
johnc@2494 2699 task->do_marking_step(1000000000.0 /* something very large */,
johnc@4787 2700 true /* do_termination */,
johnc@4787 2701 _is_serial);
ysr@777 2702 } while (task->has_aborted() && !_cm->has_overflown());
ysr@777 2703 // If we overflow, then we do not want to restart. We instead
ysr@777 2704 // want to abort remark and do concurrent marking again.
ysr@777 2705 task->record_end_time();
ysr@777 2706 }
ysr@777 2707 }
ysr@777 2708
johnc@4787 2709 CMRemarkTask(ConcurrentMark* cm, int active_workers, bool is_serial) :
johnc@4787 2710 AbstractGangTask("Par Remark"), _cm(cm), _is_serial(is_serial) {
johnc@3338 2711 _cm->terminator()->reset_for_reuse(active_workers);
jmasa@3294 2712 }
ysr@777 2713 };
ysr@777 2714
ysr@777 2715 void ConcurrentMark::checkpointRootsFinalWork() {
ysr@777 2716 ResourceMark rm;
ysr@777 2717 HandleMark hm;
ysr@777 2718 G1CollectedHeap* g1h = G1CollectedHeap::heap();
ysr@777 2719
stefank@6992 2720 G1RemarkGCTraceTime trace("Finalize Marking", G1Log::finer());
stefank@6992 2721
ysr@777 2722 g1h->ensure_parsability(false);
ysr@777 2723
jmasa@2188 2724 if (G1CollectedHeap::use_parallel_gc_threads()) {
jrose@1424 2725 G1CollectedHeap::StrongRootsScope srs(g1h);
jmasa@3294 2726 // this is remark, so we'll use up all active threads
jmasa@3357 2727 uint active_workers = g1h->workers()->active_workers();
jmasa@3294 2728 if (active_workers == 0) {
jmasa@3294 2729 assert(active_workers > 0, "Should have been set earlier");
jmasa@3357 2730 active_workers = (uint) ParallelGCThreads;
jmasa@3294 2731 g1h->workers()->set_active_workers(active_workers);
jmasa@3294 2732 }
johnc@4788 2733 set_concurrency_and_phase(active_workers, false /* concurrent */);
jmasa@3294 2734 // Leave _parallel_marking_threads at it's
jmasa@3294 2735 // value originally calculated in the ConcurrentMark
jmasa@3294 2736 // constructor and pass values of the active workers
jmasa@3294 2737 // through the gang in the task.
ysr@777 2738
johnc@4787 2739 CMRemarkTask remarkTask(this, active_workers, false /* is_serial */);
johnc@4787 2740 // We will start all available threads, even if we decide that the
johnc@4787 2741 // active_workers will be fewer. The extra ones will just bail out
johnc@4787 2742 // immediately.
jmasa@3294 2743 g1h->set_par_threads(active_workers);
ysr@777 2744 g1h->workers()->run_task(&remarkTask);
ysr@777 2745 g1h->set_par_threads(0);
ysr@777 2746 } else {
jrose@1424 2747 G1CollectedHeap::StrongRootsScope srs(g1h);
jmasa@3357 2748 uint active_workers = 1;
johnc@4788 2749 set_concurrency_and_phase(active_workers, false /* concurrent */);
ysr@777 2750
johnc@4787 2751 // Note - if there's no work gang then the VMThread will be
johnc@4787 2752 // the thread to execute the remark - serially. We have
johnc@4787 2753 // to pass true for the is_serial parameter so that
johnc@4787 2754 // CMTask::do_marking_step() doesn't enter the sync
johnc@4787 2755 // barriers in the event of an overflow. Doing so will
johnc@4787 2756 // cause an assert that the current thread is not a
johnc@4787 2757 // concurrent GC thread.
johnc@4787 2758 CMRemarkTask remarkTask(this, active_workers, true /* is_serial*/);
ysr@777 2759 remarkTask.work(0);
ysr@777 2760 }
tonyp@1458 2761 SATBMarkQueueSet& satb_mq_set = JavaThread::satb_mark_queue_set();
johnc@4789 2762 guarantee(has_overflown() ||
johnc@4789 2763 satb_mq_set.completed_buffers_num() == 0,
johnc@4789 2764 err_msg("Invariant: has_overflown = %s, num buffers = %d",
johnc@4789 2765 BOOL_TO_STR(has_overflown()),
johnc@4789 2766 satb_mq_set.completed_buffers_num()));
ysr@777 2767
ysr@777 2768 print_stats();
ysr@777 2769 }
ysr@777 2770
tonyp@1479 2771 #ifndef PRODUCT
tonyp@1479 2772
tonyp@1823 2773 class PrintReachableOopClosure: public OopClosure {
ysr@777 2774 private:
ysr@777 2775 G1CollectedHeap* _g1h;
ysr@777 2776 outputStream* _out;
johnc@2969 2777 VerifyOption _vo;
tonyp@1823 2778 bool _all;
ysr@777 2779
ysr@777 2780 public:
johnc@2969 2781 PrintReachableOopClosure(outputStream* out,
johnc@2969 2782 VerifyOption vo,
tonyp@1823 2783 bool all) :
tonyp@1479 2784 _g1h(G1CollectedHeap::heap()),
johnc@2969 2785 _out(out), _vo(vo), _all(all) { }
ysr@777 2786
ysr@1280 2787 void do_oop(narrowOop* p) { do_oop_work(p); }
ysr@1280 2788 void do_oop( oop* p) { do_oop_work(p); }
ysr@1280 2789
ysr@1280 2790 template <class T> void do_oop_work(T* p) {
ysr@1280 2791 oop obj = oopDesc::load_decode_heap_oop(p);
ysr@777 2792 const char* str = NULL;
ysr@777 2793 const char* str2 = "";
ysr@777 2794
tonyp@1823 2795 if (obj == NULL) {
tonyp@1823 2796 str = "";
tonyp@1823 2797 } else if (!_g1h->is_in_g1_reserved(obj)) {
tonyp@1823 2798 str = " O";
tonyp@1823 2799 } else {
ysr@777 2800 HeapRegion* hr = _g1h->heap_region_containing(obj);
tonyp@3957 2801 bool over_tams = _g1h->allocated_since_marking(obj, hr, _vo);
tonyp@3957 2802 bool marked = _g1h->is_marked(obj, _vo);
tonyp@1479 2803
tonyp@1479 2804 if (over_tams) {
tonyp@1823 2805 str = " >";
tonyp@1823 2806 if (marked) {
ysr@777 2807 str2 = " AND MARKED";
tonyp@1479 2808 }
tonyp@1823 2809 } else if (marked) {
tonyp@1823 2810 str = " M";
tonyp@1479 2811 } else {
tonyp@1823 2812 str = " NOT";
tonyp@1479 2813 }
ysr@777 2814 }
ysr@777 2815
tonyp@1823 2816 _out->print_cr(" "PTR_FORMAT": "PTR_FORMAT"%s%s",
drchase@6680 2817 p2i(p), p2i((void*) obj), str, str2);
ysr@777 2818 }
ysr@777 2819 };
ysr@777 2820
tonyp@1823 2821 class PrintReachableObjectClosure : public ObjectClosure {
ysr@777 2822 private:
johnc@2969 2823 G1CollectedHeap* _g1h;
johnc@2969 2824 outputStream* _out;
johnc@2969 2825 VerifyOption _vo;
johnc@2969 2826 bool _all;
johnc@2969 2827 HeapRegion* _hr;
ysr@777 2828
ysr@777 2829 public:
johnc@2969 2830 PrintReachableObjectClosure(outputStream* out,
johnc@2969 2831 VerifyOption vo,
tonyp@1823 2832 bool all,
tonyp@1823 2833 HeapRegion* hr) :
johnc@2969 2834 _g1h(G1CollectedHeap::heap()),
johnc@2969 2835 _out(out), _vo(vo), _all(all), _hr(hr) { }
tonyp@1823 2836
tonyp@1823 2837 void do_object(oop o) {
tonyp@3957 2838 bool over_tams = _g1h->allocated_since_marking(o, _hr, _vo);
tonyp@3957 2839 bool marked = _g1h->is_marked(o, _vo);
tonyp@1823 2840 bool print_it = _all || over_tams || marked;
tonyp@1823 2841
tonyp@1823 2842 if (print_it) {
tonyp@1823 2843 _out->print_cr(" "PTR_FORMAT"%s",
drchase@6680 2844 p2i((void *)o), (over_tams) ? " >" : (marked) ? " M" : "");
johnc@2969 2845 PrintReachableOopClosure oopCl(_out, _vo, _all);
coleenp@4037 2846 o->oop_iterate_no_header(&oopCl);
tonyp@1823 2847 }
ysr@777 2848 }
ysr@777 2849 };
ysr@777 2850
tonyp@1823 2851 class PrintReachableRegionClosure : public HeapRegionClosure {
ysr@777 2852 private:
tonyp@3957 2853 G1CollectedHeap* _g1h;
tonyp@3957 2854 outputStream* _out;
tonyp@3957 2855 VerifyOption _vo;
tonyp@3957 2856 bool _all;
ysr@777 2857
ysr@777 2858 public:
ysr@777 2859 bool doHeapRegion(HeapRegion* hr) {
ysr@777 2860 HeapWord* b = hr->bottom();
ysr@777 2861 HeapWord* e = hr->end();
ysr@777 2862 HeapWord* t = hr->top();
tonyp@3957 2863 HeapWord* p = _g1h->top_at_mark_start(hr, _vo);
ysr@777 2864 _out->print_cr("** ["PTR_FORMAT", "PTR_FORMAT"] top: "PTR_FORMAT" "
drchase@6680 2865 "TAMS: " PTR_FORMAT, p2i(b), p2i(e), p2i(t), p2i(p));
tonyp@1823 2866 _out->cr();
tonyp@1823 2867
tonyp@1823 2868 HeapWord* from = b;
tonyp@1823 2869 HeapWord* to = t;
tonyp@1823 2870
tonyp@1823 2871 if (to > from) {
drchase@6680 2872 _out->print_cr("Objects in [" PTR_FORMAT ", " PTR_FORMAT "]", p2i(from), p2i(to));
tonyp@1823 2873 _out->cr();
johnc@2969 2874 PrintReachableObjectClosure ocl(_out, _vo, _all, hr);
tonyp@1823 2875 hr->object_iterate_mem_careful(MemRegion(from, to), &ocl);
tonyp@1823 2876 _out->cr();
tonyp@1823 2877 }
ysr@777 2878
ysr@777 2879 return false;
ysr@777 2880 }
ysr@777 2881
johnc@2969 2882 PrintReachableRegionClosure(outputStream* out,
johnc@2969 2883 VerifyOption vo,
tonyp@1823 2884 bool all) :
tonyp@3957 2885 _g1h(G1CollectedHeap::heap()), _out(out), _vo(vo), _all(all) { }
ysr@777 2886 };
ysr@777 2887
tonyp@1823 2888 void ConcurrentMark::print_reachable(const char* str,
johnc@2969 2889 VerifyOption vo,
tonyp@1823 2890 bool all) {
tonyp@1823 2891 gclog_or_tty->cr();
tonyp@1823 2892 gclog_or_tty->print_cr("== Doing heap dump... ");
tonyp@1479 2893
tonyp@1479 2894 if (G1PrintReachableBaseFile == NULL) {
tonyp@1479 2895 gclog_or_tty->print_cr(" #### error: no base file defined");
tonyp@1479 2896 return;
tonyp@1479 2897 }
tonyp@1479 2898
tonyp@1479 2899 if (strlen(G1PrintReachableBaseFile) + 1 + strlen(str) >
tonyp@1479 2900 (JVM_MAXPATHLEN - 1)) {
tonyp@1479 2901 gclog_or_tty->print_cr(" #### error: file name too long");
tonyp@1479 2902 return;
tonyp@1479 2903 }
tonyp@1479 2904
tonyp@1479 2905 char file_name[JVM_MAXPATHLEN];
tonyp@1479 2906 sprintf(file_name, "%s.%s", G1PrintReachableBaseFile, str);
tonyp@1479 2907 gclog_or_tty->print_cr(" dumping to file %s", file_name);
tonyp@1479 2908
tonyp@1479 2909 fileStream fout(file_name);
tonyp@1479 2910 if (!fout.is_open()) {
tonyp@1479 2911 gclog_or_tty->print_cr(" #### error: could not open file");
tonyp@1479 2912 return;
tonyp@1479 2913 }
tonyp@1479 2914
tonyp@1479 2915 outputStream* out = &fout;
tonyp@3957 2916 out->print_cr("-- USING %s", _g1h->top_at_mark_start_str(vo));
tonyp@1479 2917 out->cr();
tonyp@1479 2918
tonyp@1823 2919 out->print_cr("--- ITERATING OVER REGIONS");
tonyp@1479 2920 out->cr();
johnc@2969 2921 PrintReachableRegionClosure rcl(out, vo, all);
ysr@777 2922 _g1h->heap_region_iterate(&rcl);
tonyp@1479 2923 out->cr();
tonyp@1479 2924
tonyp@1479 2925 gclog_or_tty->print_cr(" done");
tonyp@1823 2926 gclog_or_tty->flush();
ysr@777 2927 }
ysr@777 2928
tonyp@1479 2929 #endif // PRODUCT
tonyp@1479 2930
tonyp@3416 2931 void ConcurrentMark::clearRangePrevBitmap(MemRegion mr) {
ysr@777 2932 // Note we are overriding the read-only view of the prev map here, via
ysr@777 2933 // the cast.
ysr@777 2934 ((CMBitMap*)_prevMarkBitMap)->clearRange(mr);
tonyp@3416 2935 }
tonyp@3416 2936
tonyp@3416 2937 void ConcurrentMark::clearRangeNextBitmap(MemRegion mr) {
ysr@777 2938 _nextMarkBitMap->clearRange(mr);
ysr@777 2939 }
ysr@777 2940
ysr@777 2941 HeapRegion*
johnc@4173 2942 ConcurrentMark::claim_region(uint worker_id) {
ysr@777 2943 // "checkpoint" the finger
ysr@777 2944 HeapWord* finger = _finger;
ysr@777 2945
ysr@777 2946 // _heap_end will not change underneath our feet; it only changes at
ysr@777 2947 // yield points.
ysr@777 2948 while (finger < _heap_end) {
tonyp@1458 2949 assert(_g1h->is_in_g1_reserved(finger), "invariant");
ysr@777 2950
tonyp@2968 2951 // Note on how this code handles humongous regions. In the
tonyp@2968 2952 // normal case the finger will reach the start of a "starts
tonyp@2968 2953 // humongous" (SH) region. Its end will either be the end of the
tonyp@2968 2954 // last "continues humongous" (CH) region in the sequence, or the
tonyp@2968 2955 // standard end of the SH region (if the SH is the only region in
tonyp@2968 2956 // the sequence). That way claim_region() will skip over the CH
tonyp@2968 2957 // regions. However, there is a subtle race between a CM thread
tonyp@2968 2958 // executing this method and a mutator thread doing a humongous
tonyp@2968 2959 // object allocation. The two are not mutually exclusive as the CM
tonyp@2968 2960 // thread does not need to hold the Heap_lock when it gets
tonyp@2968 2961 // here. So there is a chance that claim_region() will come across
tonyp@2968 2962 // a free region that's in the progress of becoming a SH or a CH
tonyp@2968 2963 // region. In the former case, it will either
tonyp@2968 2964 // a) Miss the update to the region's end, in which case it will
tonyp@2968 2965 // visit every subsequent CH region, will find their bitmaps
tonyp@2968 2966 // empty, and do nothing, or
tonyp@2968 2967 // b) Will observe the update of the region's end (in which case
tonyp@2968 2968 // it will skip the subsequent CH regions).
tonyp@2968 2969 // If it comes across a region that suddenly becomes CH, the
tonyp@2968 2970 // scenario will be similar to b). So, the race between
tonyp@2968 2971 // claim_region() and a humongous object allocation might force us
tonyp@2968 2972 // to do a bit of unnecessary work (due to some unnecessary bitmap
tonyp@2968 2973 // iterations) but it should not introduce and correctness issues.
tschatzl@7051 2974 HeapRegion* curr_region = _g1h->heap_region_containing_raw(finger);
tschatzl@7051 2975
tschatzl@7051 2976 // Above heap_region_containing_raw may return NULL as we always scan claim
tschatzl@7051 2977 // until the end of the heap. In this case, just jump to the next region.
tschatzl@7051 2978 HeapWord* end = curr_region != NULL ? curr_region->end() : finger + HeapRegion::GrainWords;
tonyp@2968 2979
tonyp@2968 2980 // Is the gap between reading the finger and doing the CAS too long?
tonyp@2968 2981 HeapWord* res = (HeapWord*) Atomic::cmpxchg_ptr(end, &_finger, finger);
tschatzl@7051 2982 if (res == finger && curr_region != NULL) {
ysr@777 2983 // we succeeded
tschatzl@7051 2984 HeapWord* bottom = curr_region->bottom();
tschatzl@7051 2985 HeapWord* limit = curr_region->next_top_at_mark_start();
tschatzl@7051 2986
tschatzl@7051 2987 if (verbose_low()) {
tschatzl@7051 2988 gclog_or_tty->print_cr("[%u] curr_region = "PTR_FORMAT" "
tschatzl@7051 2989 "["PTR_FORMAT", "PTR_FORMAT"), "
tschatzl@7051 2990 "limit = "PTR_FORMAT,
tschatzl@7051 2991 worker_id, p2i(curr_region), p2i(bottom), p2i(end), p2i(limit));
tschatzl@7051 2992 }
ysr@777 2993
ysr@777 2994 // notice that _finger == end cannot be guaranteed here since,
ysr@777 2995 // someone else might have moved the finger even further
tonyp@1458 2996 assert(_finger >= end, "the finger should have moved forward");
ysr@777 2997
tonyp@2973 2998 if (verbose_low()) {
johnc@4173 2999 gclog_or_tty->print_cr("[%u] we were successful with region = "
drchase@6680 3000 PTR_FORMAT, worker_id, p2i(curr_region));
tonyp@2973 3001 }
ysr@777 3002
ysr@777 3003 if (limit > bottom) {
tonyp@2973 3004 if (verbose_low()) {
johnc@4173 3005 gclog_or_tty->print_cr("[%u] region "PTR_FORMAT" is not empty, "
drchase@6680 3006 "returning it ", worker_id, p2i(curr_region));
tonyp@2973 3007 }
ysr@777 3008 return curr_region;
ysr@777 3009 } else {
tonyp@1458 3010 assert(limit == bottom,
tonyp@1458 3011 "the region limit should be at bottom");
tonyp@2973 3012 if (verbose_low()) {
johnc@4173 3013 gclog_or_tty->print_cr("[%u] region "PTR_FORMAT" is empty, "
drchase@6680 3014 "returning NULL", worker_id, p2i(curr_region));
tonyp@2973 3015 }
ysr@777 3016 // we return NULL and the caller should try calling
ysr@777 3017 // claim_region() again.
ysr@777 3018 return NULL;
ysr@777 3019 }
ysr@777 3020 } else {
tonyp@1458 3021 assert(_finger > finger, "the finger should have moved forward");
tonyp@2973 3022 if (verbose_low()) {
tschatzl@7051 3023 if (curr_region == NULL) {
tschatzl@7051 3024 gclog_or_tty->print_cr("[%u] found uncommitted region, moving finger, "
tschatzl@7051 3025 "global finger = "PTR_FORMAT", "
tschatzl@7051 3026 "our finger = "PTR_FORMAT,
tschatzl@7051 3027 worker_id, p2i(_finger), p2i(finger));
tschatzl@7051 3028 } else {
tschatzl@7051 3029 gclog_or_tty->print_cr("[%u] somebody else moved the finger, "
tschatzl@7051 3030 "global finger = "PTR_FORMAT", "
tschatzl@7051 3031 "our finger = "PTR_FORMAT,
tschatzl@7051 3032 worker_id, p2i(_finger), p2i(finger));
tschatzl@7051 3033 }
tonyp@2973 3034 }
ysr@777 3035
ysr@777 3036 // read it again
ysr@777 3037 finger = _finger;
ysr@777 3038 }
ysr@777 3039 }
ysr@777 3040
ysr@777 3041 return NULL;
ysr@777 3042 }
ysr@777 3043
tonyp@3416 3044 #ifndef PRODUCT
tonyp@3416 3045 enum VerifyNoCSetOopsPhase {
tonyp@3416 3046 VerifyNoCSetOopsStack,
tonyp@3416 3047 VerifyNoCSetOopsQueues,
tonyp@3416 3048 VerifyNoCSetOopsSATBCompleted,
tonyp@3416 3049 VerifyNoCSetOopsSATBThread
tonyp@3416 3050 };
tonyp@3416 3051
tonyp@3416 3052 class VerifyNoCSetOopsClosure : public OopClosure, public ObjectClosure {
tonyp@3416 3053 private:
tonyp@3416 3054 G1CollectedHeap* _g1h;
tonyp@3416 3055 VerifyNoCSetOopsPhase _phase;
tonyp@3416 3056 int _info;
tonyp@3416 3057
tonyp@3416 3058 const char* phase_str() {
tonyp@3416 3059 switch (_phase) {
tonyp@3416 3060 case VerifyNoCSetOopsStack: return "Stack";
tonyp@3416 3061 case VerifyNoCSetOopsQueues: return "Queue";
tonyp@3416 3062 case VerifyNoCSetOopsSATBCompleted: return "Completed SATB Buffers";
tonyp@3416 3063 case VerifyNoCSetOopsSATBThread: return "Thread SATB Buffers";
tonyp@3416 3064 default: ShouldNotReachHere();
tonyp@3416 3065 }
tonyp@3416 3066 return NULL;
ysr@777 3067 }
johnc@2190 3068
tonyp@3416 3069 void do_object_work(oop obj) {
tonyp@3416 3070 guarantee(!_g1h->obj_in_cs(obj),
tonyp@3416 3071 err_msg("obj: "PTR_FORMAT" in CSet, phase: %s, info: %d",
drchase@6680 3072 p2i((void*) obj), phase_str(), _info));
johnc@2190 3073 }
johnc@2190 3074
tonyp@3416 3075 public:
tonyp@3416 3076 VerifyNoCSetOopsClosure() : _g1h(G1CollectedHeap::heap()) { }
tonyp@3416 3077
tonyp@3416 3078 void set_phase(VerifyNoCSetOopsPhase phase, int info = -1) {
tonyp@3416 3079 _phase = phase;
tonyp@3416 3080 _info = info;
tonyp@3416 3081 }
tonyp@3416 3082
tonyp@3416 3083 virtual void do_oop(oop* p) {
tonyp@3416 3084 oop obj = oopDesc::load_decode_heap_oop(p);
tonyp@3416 3085 do_object_work(obj);
tonyp@3416 3086 }
tonyp@3416 3087
tonyp@3416 3088 virtual void do_oop(narrowOop* p) {
tonyp@3416 3089 // We should not come across narrow oops while scanning marking
tonyp@3416 3090 // stacks and SATB buffers.
tonyp@3416 3091 ShouldNotReachHere();
tonyp@3416 3092 }
tonyp@3416 3093
tonyp@3416 3094 virtual void do_object(oop obj) {
tonyp@3416 3095 do_object_work(obj);
tonyp@3416 3096 }
tonyp@3416 3097 };
tonyp@3416 3098
tonyp@3416 3099 void ConcurrentMark::verify_no_cset_oops(bool verify_stacks,
tonyp@3416 3100 bool verify_enqueued_buffers,
tonyp@3416 3101 bool verify_thread_buffers,
tonyp@3416 3102 bool verify_fingers) {
tonyp@3416 3103 assert(SafepointSynchronize::is_at_safepoint(), "should be at a safepoint");
tonyp@3416 3104 if (!G1CollectedHeap::heap()->mark_in_progress()) {
tonyp@3416 3105 return;
tonyp@3416 3106 }
tonyp@3416 3107
tonyp@3416 3108 VerifyNoCSetOopsClosure cl;
tonyp@3416 3109
tonyp@3416 3110 if (verify_stacks) {
tonyp@3416 3111 // Verify entries on the global mark stack
tonyp@3416 3112 cl.set_phase(VerifyNoCSetOopsStack);
tonyp@3416 3113 _markStack.oops_do(&cl);
tonyp@3416 3114
tonyp@3416 3115 // Verify entries on the task queues
johnc@4173 3116 for (uint i = 0; i < _max_worker_id; i += 1) {
tonyp@3416 3117 cl.set_phase(VerifyNoCSetOopsQueues, i);
johnc@4333 3118 CMTaskQueue* queue = _task_queues->queue(i);
tonyp@3416 3119 queue->oops_do(&cl);
tonyp@3416 3120 }
tonyp@3416 3121 }
tonyp@3416 3122
tonyp@3416 3123 SATBMarkQueueSet& satb_qs = JavaThread::satb_mark_queue_set();
tonyp@3416 3124
tonyp@3416 3125 // Verify entries on the enqueued SATB buffers
tonyp@3416 3126 if (verify_enqueued_buffers) {
tonyp@3416 3127 cl.set_phase(VerifyNoCSetOopsSATBCompleted);
tonyp@3416 3128 satb_qs.iterate_completed_buffers_read_only(&cl);
tonyp@3416 3129 }
tonyp@3416 3130
tonyp@3416 3131 // Verify entries on the per-thread SATB buffers
tonyp@3416 3132 if (verify_thread_buffers) {
tonyp@3416 3133 cl.set_phase(VerifyNoCSetOopsSATBThread);
tonyp@3416 3134 satb_qs.iterate_thread_buffers_read_only(&cl);
tonyp@3416 3135 }
tonyp@3416 3136
tonyp@3416 3137 if (verify_fingers) {
tonyp@3416 3138 // Verify the global finger
tonyp@3416 3139 HeapWord* global_finger = finger();
tonyp@3416 3140 if (global_finger != NULL && global_finger < _heap_end) {
tonyp@3416 3141 // The global finger always points to a heap region boundary. We
tonyp@3416 3142 // use heap_region_containing_raw() to get the containing region
tonyp@3416 3143 // given that the global finger could be pointing to a free region
tonyp@3416 3144 // which subsequently becomes continues humongous. If that
tonyp@3416 3145 // happens, heap_region_containing() will return the bottom of the
tonyp@3416 3146 // corresponding starts humongous region and the check below will
tonyp@3416 3147 // not hold any more.
tschatzl@7051 3148 // Since we always iterate over all regions, we might get a NULL HeapRegion
tschatzl@7051 3149 // here.
tonyp@3416 3150 HeapRegion* global_hr = _g1h->heap_region_containing_raw(global_finger);
tschatzl@7051 3151 guarantee(global_hr == NULL || global_finger == global_hr->bottom(),
tonyp@3416 3152 err_msg("global finger: "PTR_FORMAT" region: "HR_FORMAT,
drchase@6680 3153 p2i(global_finger), HR_FORMAT_PARAMS(global_hr)));
tonyp@3416 3154 }
tonyp@3416 3155
tonyp@3416 3156 // Verify the task fingers
johnc@4173 3157 assert(parallel_marking_threads() <= _max_worker_id, "sanity");
tonyp@3416 3158 for (int i = 0; i < (int) parallel_marking_threads(); i += 1) {
tonyp@3416 3159 CMTask* task = _tasks[i];
tonyp@3416 3160 HeapWord* task_finger = task->finger();
tonyp@3416 3161 if (task_finger != NULL && task_finger < _heap_end) {
tonyp@3416 3162 // See above note on the global finger verification.
tonyp@3416 3163 HeapRegion* task_hr = _g1h->heap_region_containing_raw(task_finger);
tschatzl@7051 3164 guarantee(task_hr == NULL || task_finger == task_hr->bottom() ||
tonyp@3416 3165 !task_hr->in_collection_set(),
tonyp@3416 3166 err_msg("task finger: "PTR_FORMAT" region: "HR_FORMAT,
drchase@6680 3167 p2i(task_finger), HR_FORMAT_PARAMS(task_hr)));
tonyp@3416 3168 }
tonyp@3416 3169 }
tonyp@3416 3170 }
ysr@777 3171 }
tonyp@3416 3172 #endif // PRODUCT
ysr@777 3173
johnc@3463 3174 // Aggregate the counting data that was constructed concurrently
johnc@3463 3175 // with marking.
johnc@3463 3176 class AggregateCountDataHRClosure: public HeapRegionClosure {
johnc@4123 3177 G1CollectedHeap* _g1h;
johnc@3463 3178 ConcurrentMark* _cm;
johnc@4123 3179 CardTableModRefBS* _ct_bs;
johnc@3463 3180 BitMap* _cm_card_bm;
johnc@4173 3181 uint _max_worker_id;
johnc@3463 3182
johnc@3463 3183 public:
johnc@4123 3184 AggregateCountDataHRClosure(G1CollectedHeap* g1h,
johnc@3463 3185 BitMap* cm_card_bm,
johnc@4173 3186 uint max_worker_id) :
johnc@4123 3187 _g1h(g1h), _cm(g1h->concurrent_mark()),
johnc@4123 3188 _ct_bs((CardTableModRefBS*) (g1h->barrier_set())),
johnc@4173 3189 _cm_card_bm(cm_card_bm), _max_worker_id(max_worker_id) { }
johnc@3463 3190
johnc@3463 3191 bool doHeapRegion(HeapRegion* hr) {
johnc@3463 3192 if (hr->continuesHumongous()) {
johnc@3463 3193 // We will ignore these here and process them when their
johnc@3463 3194 // associated "starts humongous" region is processed.
johnc@3463 3195 // Note that we cannot rely on their associated
johnc@3463 3196 // "starts humongous" region to have their bit set to 1
johnc@3463 3197 // since, due to the region chunking in the parallel region
johnc@3463 3198 // iteration, a "continues humongous" region might be visited
johnc@3463 3199 // before its associated "starts humongous".
johnc@3463 3200 return false;
johnc@3463 3201 }
johnc@3463 3202
johnc@3463 3203 HeapWord* start = hr->bottom();
johnc@3463 3204 HeapWord* limit = hr->next_top_at_mark_start();
johnc@3463 3205 HeapWord* end = hr->end();
johnc@3463 3206
johnc@3463 3207 assert(start <= limit && limit <= hr->top() && hr->top() <= hr->end(),
johnc@3463 3208 err_msg("Preconditions not met - "
johnc@3463 3209 "start: "PTR_FORMAT", limit: "PTR_FORMAT", "
johnc@3463 3210 "top: "PTR_FORMAT", end: "PTR_FORMAT,
drchase@6680 3211 p2i(start), p2i(limit), p2i(hr->top()), p2i(hr->end())));
johnc@3463 3212
johnc@3463 3213 assert(hr->next_marked_bytes() == 0, "Precondition");
johnc@3463 3214
johnc@3463 3215 if (start == limit) {
johnc@3463 3216 // NTAMS of this region has not been set so nothing to do.
johnc@3463 3217 return false;
johnc@3463 3218 }
johnc@3463 3219
johnc@4123 3220 // 'start' should be in the heap.
johnc@4123 3221 assert(_g1h->is_in_g1_reserved(start) && _ct_bs->is_card_aligned(start), "sanity");
johnc@4123 3222 // 'end' *may* be just beyone the end of the heap (if hr is the last region)
johnc@4123 3223 assert(!_g1h->is_in_g1_reserved(end) || _ct_bs->is_card_aligned(end), "sanity");
johnc@3463 3224
johnc@3463 3225 BitMap::idx_t start_idx = _cm->card_bitmap_index_for(start);
johnc@3463 3226 BitMap::idx_t limit_idx = _cm->card_bitmap_index_for(limit);
johnc@3463 3227 BitMap::idx_t end_idx = _cm->card_bitmap_index_for(end);
johnc@3463 3228
johnc@4123 3229 // If ntams is not card aligned then we bump card bitmap index
johnc@4123 3230 // for limit so that we get the all the cards spanned by
johnc@4123 3231 // the object ending at ntams.
johnc@4123 3232 // Note: if this is the last region in the heap then ntams
johnc@4123 3233 // could be actually just beyond the end of the the heap;
johnc@4123 3234 // limit_idx will then correspond to a (non-existent) card
johnc@4123 3235 // that is also outside the heap.
johnc@4123 3236 if (_g1h->is_in_g1_reserved(limit) && !_ct_bs->is_card_aligned(limit)) {
johnc@3463 3237 limit_idx += 1;
johnc@3463 3238 }
johnc@3463 3239
johnc@3463 3240 assert(limit_idx <= end_idx, "or else use atomics");
johnc@3463 3241
johnc@3463 3242 // Aggregate the "stripe" in the count data associated with hr.
tschatzl@7091 3243 uint hrm_index = hr->hrm_index();
johnc@3463 3244 size_t marked_bytes = 0;
johnc@3463 3245
johnc@4173 3246 for (uint i = 0; i < _max_worker_id; i += 1) {
johnc@3463 3247 size_t* marked_bytes_array = _cm->count_marked_bytes_array_for(i);
johnc@3463 3248 BitMap* task_card_bm = _cm->count_card_bitmap_for(i);
johnc@3463 3249
johnc@3463 3250 // Fetch the marked_bytes in this region for task i and
johnc@3463 3251 // add it to the running total for this region.
tschatzl@7091 3252 marked_bytes += marked_bytes_array[hrm_index];
johnc@3463 3253
johnc@4173 3254 // Now union the bitmaps[0,max_worker_id)[start_idx..limit_idx)
johnc@3463 3255 // into the global card bitmap.
johnc@3463 3256 BitMap::idx_t scan_idx = task_card_bm->get_next_one_offset(start_idx, limit_idx);
johnc@3463 3257
johnc@3463 3258 while (scan_idx < limit_idx) {
johnc@3463 3259 assert(task_card_bm->at(scan_idx) == true, "should be");
johnc@3463 3260 _cm_card_bm->set_bit(scan_idx);
johnc@3463 3261 assert(_cm_card_bm->at(scan_idx) == true, "should be");
johnc@3463 3262
johnc@3463 3263 // BitMap::get_next_one_offset() can handle the case when
johnc@3463 3264 // its left_offset parameter is greater than its right_offset
johnc@4123 3265 // parameter. It does, however, have an early exit if
johnc@3463 3266 // left_offset == right_offset. So let's limit the value
johnc@3463 3267 // passed in for left offset here.
johnc@3463 3268 BitMap::idx_t next_idx = MIN2(scan_idx + 1, limit_idx);
johnc@3463 3269 scan_idx = task_card_bm->get_next_one_offset(next_idx, limit_idx);
johnc@3463 3270 }
johnc@3463 3271 }
johnc@3463 3272
johnc@3463 3273 // Update the marked bytes for this region.
johnc@3463 3274 hr->add_to_marked_bytes(marked_bytes);
johnc@3463 3275
johnc@3463 3276 // Next heap region
johnc@3463 3277 return false;
johnc@3463 3278 }
johnc@3463 3279 };
johnc@3463 3280
johnc@3463 3281 class G1AggregateCountDataTask: public AbstractGangTask {
johnc@3463 3282 protected:
johnc@3463 3283 G1CollectedHeap* _g1h;
johnc@3463 3284 ConcurrentMark* _cm;
johnc@3463 3285 BitMap* _cm_card_bm;
johnc@4173 3286 uint _max_worker_id;
johnc@3463 3287 int _active_workers;
johnc@3463 3288
johnc@3463 3289 public:
johnc@3463 3290 G1AggregateCountDataTask(G1CollectedHeap* g1h,
johnc@3463 3291 ConcurrentMark* cm,
johnc@3463 3292 BitMap* cm_card_bm,
johnc@4173 3293 uint max_worker_id,
johnc@3463 3294 int n_workers) :
johnc@3463 3295 AbstractGangTask("Count Aggregation"),
johnc@3463 3296 _g1h(g1h), _cm(cm), _cm_card_bm(cm_card_bm),
johnc@4173 3297 _max_worker_id(max_worker_id),
johnc@3463 3298 _active_workers(n_workers) { }
johnc@3463 3299
johnc@3463 3300 void work(uint worker_id) {
johnc@4173 3301 AggregateCountDataHRClosure cl(_g1h, _cm_card_bm, _max_worker_id);
johnc@3463 3302
johnc@3463 3303 if (G1CollectedHeap::use_parallel_gc_threads()) {
johnc@3463 3304 _g1h->heap_region_par_iterate_chunked(&cl, worker_id,
johnc@3463 3305 _active_workers,
johnc@3463 3306 HeapRegion::AggregateCountClaimValue);
johnc@3463 3307 } else {
johnc@3463 3308 _g1h->heap_region_iterate(&cl);
johnc@3463 3309 }
johnc@3463 3310 }
johnc@3463 3311 };
johnc@3463 3312
johnc@3463 3313
johnc@3463 3314 void ConcurrentMark::aggregate_count_data() {
johnc@3463 3315 int n_workers = (G1CollectedHeap::use_parallel_gc_threads() ?
johnc@3463 3316 _g1h->workers()->active_workers() :
johnc@3463 3317 1);
johnc@3463 3318
johnc@3463 3319 G1AggregateCountDataTask g1_par_agg_task(_g1h, this, &_card_bm,
johnc@4173 3320 _max_worker_id, n_workers);
johnc@3463 3321
johnc@3463 3322 if (G1CollectedHeap::use_parallel_gc_threads()) {
johnc@3463 3323 assert(_g1h->check_heap_region_claim_values(HeapRegion::InitialClaimValue),
johnc@3463 3324 "sanity check");
johnc@3463 3325 _g1h->set_par_threads(n_workers);
johnc@3463 3326 _g1h->workers()->run_task(&g1_par_agg_task);
johnc@3463 3327 _g1h->set_par_threads(0);
johnc@3463 3328
johnc@3463 3329 assert(_g1h->check_heap_region_claim_values(HeapRegion::AggregateCountClaimValue),
johnc@3463 3330 "sanity check");
johnc@3463 3331 _g1h->reset_heap_region_claim_values();
johnc@3463 3332 } else {
johnc@3463 3333 g1_par_agg_task.work(0);
johnc@3463 3334 }
jcoomes@7159 3335 _g1h->allocation_context_stats().update_at_remark();
johnc@3463 3336 }
johnc@3463 3337
johnc@3463 3338 // Clear the per-worker arrays used to store the per-region counting data
johnc@3463 3339 void ConcurrentMark::clear_all_count_data() {
johnc@3463 3340 // Clear the global card bitmap - it will be filled during
johnc@3463 3341 // liveness count aggregation (during remark) and the
johnc@3463 3342 // final counting task.
johnc@3463 3343 _card_bm.clear();
johnc@3463 3344
johnc@3463 3345 // Clear the global region bitmap - it will be filled as part
johnc@3463 3346 // of the final counting task.
johnc@3463 3347 _region_bm.clear();
johnc@3463 3348
tonyp@3713 3349 uint max_regions = _g1h->max_regions();
johnc@4173 3350 assert(_max_worker_id > 0, "uninitialized");
johnc@4173 3351
johnc@4173 3352 for (uint i = 0; i < _max_worker_id; i += 1) {
johnc@3463 3353 BitMap* task_card_bm = count_card_bitmap_for(i);
johnc@3463 3354 size_t* marked_bytes_array = count_marked_bytes_array_for(i);
johnc@3463 3355
johnc@3463 3356 assert(task_card_bm->size() == _card_bm.size(), "size mismatch");
johnc@3463 3357 assert(marked_bytes_array != NULL, "uninitialized");
johnc@3463 3358
tonyp@3713 3359 memset(marked_bytes_array, 0, (size_t) max_regions * sizeof(size_t));
johnc@3463 3360 task_card_bm->clear();
johnc@3463 3361 }
johnc@3463 3362 }
johnc@3463 3363
ysr@777 3364 void ConcurrentMark::print_stats() {
ysr@777 3365 if (verbose_stats()) {
ysr@777 3366 gclog_or_tty->print_cr("---------------------------------------------------------------------");
ysr@777 3367 for (size_t i = 0; i < _active_tasks; ++i) {
ysr@777 3368 _tasks[i]->print_stats();
ysr@777 3369 gclog_or_tty->print_cr("---------------------------------------------------------------------");
ysr@777 3370 }
ysr@777 3371 }
ysr@777 3372 }
ysr@777 3373
ysr@777 3374 // abandon current marking iteration due to a Full GC
ysr@777 3375 void ConcurrentMark::abort() {
tschatzl@7016 3376 // Clear all marks in the next bitmap for the next marking cycle. This will allow us to skip the next
tschatzl@7016 3377 // concurrent bitmap clearing.
ysr@777 3378 _nextMarkBitMap->clearAll();
brutisso@7005 3379
brutisso@7005 3380 // Note we cannot clear the previous marking bitmap here
brutisso@7005 3381 // since VerifyDuringGC verifies the objects marked during
brutisso@7005 3382 // a full GC against the previous bitmap.
brutisso@7005 3383
johnc@3463 3384 // Clear the liveness counting data
johnc@3463 3385 clear_all_count_data();
ysr@777 3386 // Empty mark stack
johnc@4386 3387 reset_marking_state();
johnc@4173 3388 for (uint i = 0; i < _max_worker_id; ++i) {
ysr@777 3389 _tasks[i]->clear_region_fields();
johnc@2190 3390 }
pliden@6692 3391 _first_overflow_barrier_sync.abort();
pliden@6692 3392 _second_overflow_barrier_sync.abort();
brutisso@6904 3393 const GCId& gc_id = _g1h->gc_tracer_cm()->gc_id();
brutisso@6904 3394 if (!gc_id.is_undefined()) {
brutisso@6904 3395 // We can do multiple full GCs before ConcurrentMarkThread::run() gets a chance
brutisso@6904 3396 // to detect that it was aborted. Only keep track of the first GC id that we aborted.
brutisso@6904 3397 _aborted_gc_id = gc_id;
brutisso@6904 3398 }
ysr@777 3399 _has_aborted = true;
ysr@777 3400
ysr@777 3401 SATBMarkQueueSet& satb_mq_set = JavaThread::satb_mark_queue_set();
ysr@777 3402 satb_mq_set.abandon_partial_marking();
tonyp@1752 3403 // This can be called either during or outside marking, we'll read
tonyp@1752 3404 // the expected_active value from the SATB queue set.
tonyp@1752 3405 satb_mq_set.set_active_all_threads(
tonyp@1752 3406 false, /* new active value */
tonyp@1752 3407 satb_mq_set.is_active() /* expected_active */);
sla@5237 3408
sla@5237 3409 _g1h->trace_heap_after_concurrent_cycle();
sla@5237 3410 _g1h->register_concurrent_cycle_end();
ysr@777 3411 }
ysr@777 3412
brutisso@6904 3413 const GCId& ConcurrentMark::concurrent_gc_id() {
brutisso@6904 3414 if (has_aborted()) {
brutisso@6904 3415 return _aborted_gc_id;
brutisso@6904 3416 }
brutisso@6904 3417 return _g1h->gc_tracer_cm()->gc_id();
brutisso@6904 3418 }
brutisso@6904 3419
ysr@777 3420 static void print_ms_time_info(const char* prefix, const char* name,
ysr@777 3421 NumberSeq& ns) {
ysr@777 3422 gclog_or_tty->print_cr("%s%5d %12s: total time = %8.2f s (avg = %8.2f ms).",
ysr@777 3423 prefix, ns.num(), name, ns.sum()/1000.0, ns.avg());
ysr@777 3424 if (ns.num() > 0) {
ysr@777 3425 gclog_or_tty->print_cr("%s [std. dev = %8.2f ms, max = %8.2f ms]",
ysr@777 3426 prefix, ns.sd(), ns.maximum());
ysr@777 3427 }
ysr@777 3428 }
ysr@777 3429
ysr@777 3430 void ConcurrentMark::print_summary_info() {
ysr@777 3431 gclog_or_tty->print_cr(" Concurrent marking:");
ysr@777 3432 print_ms_time_info(" ", "init marks", _init_times);
ysr@777 3433 print_ms_time_info(" ", "remarks", _remark_times);
ysr@777 3434 {
ysr@777 3435 print_ms_time_info(" ", "final marks", _remark_mark_times);
ysr@777 3436 print_ms_time_info(" ", "weak refs", _remark_weak_ref_times);
ysr@777 3437
ysr@777 3438 }
ysr@777 3439 print_ms_time_info(" ", "cleanups", _cleanup_times);
ysr@777 3440 gclog_or_tty->print_cr(" Final counting total time = %8.2f s (avg = %8.2f ms).",
ysr@777 3441 _total_counting_time,
ysr@777 3442 (_cleanup_times.num() > 0 ? _total_counting_time * 1000.0 /
ysr@777 3443 (double)_cleanup_times.num()
ysr@777 3444 : 0.0));
ysr@777 3445 if (G1ScrubRemSets) {
ysr@777 3446 gclog_or_tty->print_cr(" RS scrub total time = %8.2f s (avg = %8.2f ms).",
ysr@777 3447 _total_rs_scrub_time,
ysr@777 3448 (_cleanup_times.num() > 0 ? _total_rs_scrub_time * 1000.0 /
ysr@777 3449 (double)_cleanup_times.num()
ysr@777 3450 : 0.0));
ysr@777 3451 }
ysr@777 3452 gclog_or_tty->print_cr(" Total stop_world time = %8.2f s.",
ysr@777 3453 (_init_times.sum() + _remark_times.sum() +
ysr@777 3454 _cleanup_times.sum())/1000.0);
ysr@777 3455 gclog_or_tty->print_cr(" Total concurrent time = %8.2f s "
johnc@3463 3456 "(%8.2f s marking).",
ysr@777 3457 cmThread()->vtime_accum(),
johnc@3463 3458 cmThread()->vtime_mark_accum());
ysr@777 3459 }
ysr@777 3460
tonyp@1454 3461 void ConcurrentMark::print_worker_threads_on(outputStream* st) const {
johnc@4549 3462 if (use_parallel_marking_threads()) {
johnc@4549 3463 _parallel_workers->print_worker_threads_on(st);
johnc@4549 3464 }
tonyp@1454 3465 }
tonyp@1454 3466
stefank@4904 3467 void ConcurrentMark::print_on_error(outputStream* st) const {
stefank@4904 3468 st->print_cr("Marking Bits (Prev, Next): (CMBitMap*) " PTR_FORMAT ", (CMBitMap*) " PTR_FORMAT,
drchase@6680 3469 p2i(_prevMarkBitMap), p2i(_nextMarkBitMap));
stefank@4904 3470 _prevMarkBitMap->print_on_error(st, " Prev Bits: ");
stefank@4904 3471 _nextMarkBitMap->print_on_error(st, " Next Bits: ");
stefank@4904 3472 }
stefank@4904 3473
ysr@777 3474 // We take a break if someone is trying to stop the world.
jmasa@3357 3475 bool ConcurrentMark::do_yield_check(uint worker_id) {
pliden@6906 3476 if (SuspendibleThreadSet::should_yield()) {
jmasa@3357 3477 if (worker_id == 0) {
ysr@777 3478 _g1h->g1_policy()->record_concurrent_pause();
tonyp@2973 3479 }
pliden@6906 3480 SuspendibleThreadSet::yield();
ysr@777 3481 return true;
ysr@777 3482 } else {
ysr@777 3483 return false;
ysr@777 3484 }
ysr@777 3485 }
ysr@777 3486
ysr@777 3487 #ifndef PRODUCT
ysr@777 3488 // for debugging purposes
ysr@777 3489 void ConcurrentMark::print_finger() {
ysr@777 3490 gclog_or_tty->print_cr("heap ["PTR_FORMAT", "PTR_FORMAT"), global finger = "PTR_FORMAT,
drchase@6680 3491 p2i(_heap_start), p2i(_heap_end), p2i(_finger));
johnc@4173 3492 for (uint i = 0; i < _max_worker_id; ++i) {
drchase@6680 3493 gclog_or_tty->print(" %u: " PTR_FORMAT, i, p2i(_tasks[i]->finger()));
ysr@777 3494 }
drchase@6680 3495 gclog_or_tty->cr();
ysr@777 3496 }
ysr@777 3497 #endif
ysr@777 3498
tonyp@2968 3499 void CMTask::scan_object(oop obj) {
tonyp@2968 3500 assert(_nextMarkBitMap->isMarked((HeapWord*) obj), "invariant");
tonyp@2968 3501
tonyp@2968 3502 if (_cm->verbose_high()) {
johnc@4173 3503 gclog_or_tty->print_cr("[%u] we're scanning object "PTR_FORMAT,
drchase@6680 3504 _worker_id, p2i((void*) obj));
tonyp@2968 3505 }
tonyp@2968 3506
tonyp@2968 3507 size_t obj_size = obj->size();
tonyp@2968 3508 _words_scanned += obj_size;
tonyp@2968 3509
tonyp@2968 3510 obj->oop_iterate(_cm_oop_closure);
tonyp@2968 3511 statsOnly( ++_objs_scanned );
tonyp@2968 3512 check_limits();
tonyp@2968 3513 }
tonyp@2968 3514
ysr@777 3515 // Closure for iteration over bitmaps
ysr@777 3516 class CMBitMapClosure : public BitMapClosure {
ysr@777 3517 private:
ysr@777 3518 // the bitmap that is being iterated over
ysr@777 3519 CMBitMap* _nextMarkBitMap;
ysr@777 3520 ConcurrentMark* _cm;
ysr@777 3521 CMTask* _task;
ysr@777 3522
ysr@777 3523 public:
tonyp@3691 3524 CMBitMapClosure(CMTask *task, ConcurrentMark* cm, CMBitMap* nextMarkBitMap) :
tonyp@3691 3525 _task(task), _cm(cm), _nextMarkBitMap(nextMarkBitMap) { }
ysr@777 3526
ysr@777 3527 bool do_bit(size_t offset) {
ysr@777 3528 HeapWord* addr = _nextMarkBitMap->offsetToHeapWord(offset);
tonyp@1458 3529 assert(_nextMarkBitMap->isMarked(addr), "invariant");
tonyp@1458 3530 assert( addr < _cm->finger(), "invariant");
ysr@777 3531
tonyp@3691 3532 statsOnly( _task->increase_objs_found_on_bitmap() );
tonyp@3691 3533 assert(addr >= _task->finger(), "invariant");
tonyp@3691 3534
tonyp@3691 3535 // We move that task's local finger along.
tonyp@3691 3536 _task->move_finger_to(addr);
ysr@777 3537
ysr@777 3538 _task->scan_object(oop(addr));
ysr@777 3539 // we only partially drain the local queue and global stack
ysr@777 3540 _task->drain_local_queue(true);
ysr@777 3541 _task->drain_global_stack(true);
ysr@777 3542
ysr@777 3543 // if the has_aborted flag has been raised, we need to bail out of
ysr@777 3544 // the iteration
ysr@777 3545 return !_task->has_aborted();
ysr@777 3546 }
ysr@777 3547 };
ysr@777 3548
tonyp@2968 3549 G1CMOopClosure::G1CMOopClosure(G1CollectedHeap* g1h,
tonyp@2968 3550 ConcurrentMark* cm,
tonyp@2968 3551 CMTask* task)
tonyp@2968 3552 : _g1h(g1h), _cm(cm), _task(task) {
tonyp@2968 3553 assert(_ref_processor == NULL, "should be initialized to NULL");
tonyp@2968 3554
tonyp@2968 3555 if (G1UseConcMarkReferenceProcessing) {
johnc@3175 3556 _ref_processor = g1h->ref_processor_cm();
tonyp@2968 3557 assert(_ref_processor != NULL, "should not be NULL");
ysr@777 3558 }
tonyp@2968 3559 }
ysr@777 3560
ysr@777 3561 void CMTask::setup_for_region(HeapRegion* hr) {
tonyp@1458 3562 assert(hr != NULL,
brutisso@7049 3563 "claim_region() should have filtered out NULL regions");
tonyp@1458 3564 assert(!hr->continuesHumongous(),
tonyp@1458 3565 "claim_region() should have filtered out continues humongous regions");
ysr@777 3566
tonyp@2973 3567 if (_cm->verbose_low()) {
johnc@4173 3568 gclog_or_tty->print_cr("[%u] setting up for region "PTR_FORMAT,
drchase@6680 3569 _worker_id, p2i(hr));
tonyp@2973 3570 }
ysr@777 3571
ysr@777 3572 _curr_region = hr;
ysr@777 3573 _finger = hr->bottom();
ysr@777 3574 update_region_limit();
ysr@777 3575 }
ysr@777 3576
ysr@777 3577 void CMTask::update_region_limit() {
ysr@777 3578 HeapRegion* hr = _curr_region;
ysr@777 3579 HeapWord* bottom = hr->bottom();
ysr@777 3580 HeapWord* limit = hr->next_top_at_mark_start();
ysr@777 3581
ysr@777 3582 if (limit == bottom) {
tonyp@2973 3583 if (_cm->verbose_low()) {
johnc@4173 3584 gclog_or_tty->print_cr("[%u] found an empty region "
ysr@777 3585 "["PTR_FORMAT", "PTR_FORMAT")",
drchase@6680 3586 _worker_id, p2i(bottom), p2i(limit));
tonyp@2973 3587 }
ysr@777 3588 // The region was collected underneath our feet.
ysr@777 3589 // We set the finger to bottom to ensure that the bitmap
ysr@777 3590 // iteration that will follow this will not do anything.
ysr@777 3591 // (this is not a condition that holds when we set the region up,
ysr@777 3592 // as the region is not supposed to be empty in the first place)
ysr@777 3593 _finger = bottom;
ysr@777 3594 } else if (limit >= _region_limit) {
tonyp@1458 3595 assert(limit >= _finger, "peace of mind");
ysr@777 3596 } else {
tonyp@1458 3597 assert(limit < _region_limit, "only way to get here");
ysr@777 3598 // This can happen under some pretty unusual circumstances. An
ysr@777 3599 // evacuation pause empties the region underneath our feet (NTAMS
ysr@777 3600 // at bottom). We then do some allocation in the region (NTAMS
ysr@777 3601 // stays at bottom), followed by the region being used as a GC
ysr@777 3602 // alloc region (NTAMS will move to top() and the objects
ysr@777 3603 // originally below it will be grayed). All objects now marked in
ysr@777 3604 // the region are explicitly grayed, if below the global finger,
ysr@777 3605 // and we do not need in fact to scan anything else. So, we simply
ysr@777 3606 // set _finger to be limit to ensure that the bitmap iteration
ysr@777 3607 // doesn't do anything.
ysr@777 3608 _finger = limit;
ysr@777 3609 }
ysr@777 3610
ysr@777 3611 _region_limit = limit;
ysr@777 3612 }
ysr@777 3613
ysr@777 3614 void CMTask::giveup_current_region() {
tonyp@1458 3615 assert(_curr_region != NULL, "invariant");
tonyp@2973 3616 if (_cm->verbose_low()) {
johnc@4173 3617 gclog_or_tty->print_cr("[%u] giving up region "PTR_FORMAT,
drchase@6680 3618 _worker_id, p2i(_curr_region));
tonyp@2973 3619 }
ysr@777 3620 clear_region_fields();
ysr@777 3621 }
ysr@777 3622
ysr@777 3623 void CMTask::clear_region_fields() {
ysr@777 3624 // Values for these three fields that indicate that we're not
ysr@777 3625 // holding on to a region.
ysr@777 3626 _curr_region = NULL;
ysr@777 3627 _finger = NULL;
ysr@777 3628 _region_limit = NULL;
ysr@777 3629 }
ysr@777 3630
tonyp@2968 3631 void CMTask::set_cm_oop_closure(G1CMOopClosure* cm_oop_closure) {
tonyp@2968 3632 if (cm_oop_closure == NULL) {
tonyp@2968 3633 assert(_cm_oop_closure != NULL, "invariant");
tonyp@2968 3634 } else {
tonyp@2968 3635 assert(_cm_oop_closure == NULL, "invariant");
tonyp@2968 3636 }
tonyp@2968 3637 _cm_oop_closure = cm_oop_closure;
tonyp@2968 3638 }
tonyp@2968 3639
ysr@777 3640 void CMTask::reset(CMBitMap* nextMarkBitMap) {
tonyp@1458 3641 guarantee(nextMarkBitMap != NULL, "invariant");
ysr@777 3642
tonyp@2973 3643 if (_cm->verbose_low()) {
johnc@4173 3644 gclog_or_tty->print_cr("[%u] resetting", _worker_id);
tonyp@2973 3645 }
ysr@777 3646
ysr@777 3647 _nextMarkBitMap = nextMarkBitMap;
ysr@777 3648 clear_region_fields();
ysr@777 3649
ysr@777 3650 _calls = 0;
ysr@777 3651 _elapsed_time_ms = 0.0;
ysr@777 3652 _termination_time_ms = 0.0;
ysr@777 3653 _termination_start_time_ms = 0.0;
ysr@777 3654
ysr@777 3655 #if _MARKING_STATS_
ysr@777 3656 _local_pushes = 0;
ysr@777 3657 _local_pops = 0;
ysr@777 3658 _local_max_size = 0;
ysr@777 3659 _objs_scanned = 0;
ysr@777 3660 _global_pushes = 0;
ysr@777 3661 _global_pops = 0;
ysr@777 3662 _global_max_size = 0;
ysr@777 3663 _global_transfers_to = 0;
ysr@777 3664 _global_transfers_from = 0;
ysr@777 3665 _regions_claimed = 0;
ysr@777 3666 _objs_found_on_bitmap = 0;
ysr@777 3667 _satb_buffers_processed = 0;
ysr@777 3668 _steal_attempts = 0;
ysr@777 3669 _steals = 0;
ysr@777 3670 _aborted = 0;
ysr@777 3671 _aborted_overflow = 0;
ysr@777 3672 _aborted_cm_aborted = 0;
ysr@777 3673 _aborted_yield = 0;
ysr@777 3674 _aborted_timed_out = 0;
ysr@777 3675 _aborted_satb = 0;
ysr@777 3676 _aborted_termination = 0;
ysr@777 3677 #endif // _MARKING_STATS_
ysr@777 3678 }
ysr@777 3679
ysr@777 3680 bool CMTask::should_exit_termination() {
ysr@777 3681 regular_clock_call();
ysr@777 3682 // This is called when we are in the termination protocol. We should
ysr@777 3683 // quit if, for some reason, this task wants to abort or the global
ysr@777 3684 // stack is not empty (this means that we can get work from it).
ysr@777 3685 return !_cm->mark_stack_empty() || has_aborted();
ysr@777 3686 }
ysr@777 3687
ysr@777 3688 void CMTask::reached_limit() {
tonyp@1458 3689 assert(_words_scanned >= _words_scanned_limit ||
tonyp@1458 3690 _refs_reached >= _refs_reached_limit ,
tonyp@1458 3691 "shouldn't have been called otherwise");
ysr@777 3692 regular_clock_call();
ysr@777 3693 }
ysr@777 3694
ysr@777 3695 void CMTask::regular_clock_call() {
tonyp@2973 3696 if (has_aborted()) return;
ysr@777 3697
ysr@777 3698 // First, we need to recalculate the words scanned and refs reached
ysr@777 3699 // limits for the next clock call.
ysr@777 3700 recalculate_limits();
ysr@777 3701
ysr@777 3702 // During the regular clock call we do the following
ysr@777 3703
ysr@777 3704 // (1) If an overflow has been flagged, then we abort.
ysr@777 3705 if (_cm->has_overflown()) {
ysr@777 3706 set_has_aborted();
ysr@777 3707 return;
ysr@777 3708 }
ysr@777 3709
ysr@777 3710 // If we are not concurrent (i.e. we're doing remark) we don't need
ysr@777 3711 // to check anything else. The other steps are only needed during
ysr@777 3712 // the concurrent marking phase.
tonyp@2973 3713 if (!concurrent()) return;
ysr@777 3714
ysr@777 3715 // (2) If marking has been aborted for Full GC, then we also abort.
ysr@777 3716 if (_cm->has_aborted()) {
ysr@777 3717 set_has_aborted();
ysr@777 3718 statsOnly( ++_aborted_cm_aborted );
ysr@777 3719 return;
ysr@777 3720 }
ysr@777 3721
ysr@777 3722 double curr_time_ms = os::elapsedVTime() * 1000.0;
ysr@777 3723
ysr@777 3724 // (3) If marking stats are enabled, then we update the step history.
ysr@777 3725 #if _MARKING_STATS_
tonyp@2973 3726 if (_words_scanned >= _words_scanned_limit) {
ysr@777 3727 ++_clock_due_to_scanning;
tonyp@2973 3728 }
tonyp@2973 3729 if (_refs_reached >= _refs_reached_limit) {
ysr@777 3730 ++_clock_due_to_marking;
tonyp@2973 3731 }
ysr@777 3732
ysr@777 3733 double last_interval_ms = curr_time_ms - _interval_start_time_ms;
ysr@777 3734 _interval_start_time_ms = curr_time_ms;
ysr@777 3735 _all_clock_intervals_ms.add(last_interval_ms);
ysr@777 3736
ysr@777 3737 if (_cm->verbose_medium()) {
johnc@4173 3738 gclog_or_tty->print_cr("[%u] regular clock, interval = %1.2lfms, "
tschatzl@7094 3739 "scanned = "SIZE_FORMAT"%s, refs reached = "SIZE_FORMAT"%s",
johnc@4173 3740 _worker_id, last_interval_ms,
tonyp@2973 3741 _words_scanned,
tonyp@2973 3742 (_words_scanned >= _words_scanned_limit) ? " (*)" : "",
tonyp@2973 3743 _refs_reached,
tonyp@2973 3744 (_refs_reached >= _refs_reached_limit) ? " (*)" : "");
ysr@777 3745 }
ysr@777 3746 #endif // _MARKING_STATS_
ysr@777 3747
ysr@777 3748 // (4) We check whether we should yield. If we have to, then we abort.
pliden@6906 3749 if (SuspendibleThreadSet::should_yield()) {
ysr@777 3750 // We should yield. To do this we abort the task. The caller is
ysr@777 3751 // responsible for yielding.
ysr@777 3752 set_has_aborted();
ysr@777 3753 statsOnly( ++_aborted_yield );
ysr@777 3754 return;
ysr@777 3755 }
ysr@777 3756
ysr@777 3757 // (5) We check whether we've reached our time quota. If we have,
ysr@777 3758 // then we abort.
ysr@777 3759 double elapsed_time_ms = curr_time_ms - _start_time_ms;
ysr@777 3760 if (elapsed_time_ms > _time_target_ms) {
ysr@777 3761 set_has_aborted();
johnc@2494 3762 _has_timed_out = true;
ysr@777 3763 statsOnly( ++_aborted_timed_out );
ysr@777 3764 return;
ysr@777 3765 }
ysr@777 3766
ysr@777 3767 // (6) Finally, we check whether there are enough completed STAB
ysr@777 3768 // buffers available for processing. If there are, we abort.
ysr@777 3769 SATBMarkQueueSet& satb_mq_set = JavaThread::satb_mark_queue_set();
ysr@777 3770 if (!_draining_satb_buffers && satb_mq_set.process_completed_buffers()) {
tonyp@2973 3771 if (_cm->verbose_low()) {
johnc@4173 3772 gclog_or_tty->print_cr("[%u] aborting to deal with pending SATB buffers",
johnc@4173 3773 _worker_id);
tonyp@2973 3774 }
ysr@777 3775 // we do need to process SATB buffers, we'll abort and restart
ysr@777 3776 // the marking task to do so
ysr@777 3777 set_has_aborted();
ysr@777 3778 statsOnly( ++_aborted_satb );
ysr@777 3779 return;
ysr@777 3780 }
ysr@777 3781 }
ysr@777 3782
ysr@777 3783 void CMTask::recalculate_limits() {
ysr@777 3784 _real_words_scanned_limit = _words_scanned + words_scanned_period;
ysr@777 3785 _words_scanned_limit = _real_words_scanned_limit;
ysr@777 3786
ysr@777 3787 _real_refs_reached_limit = _refs_reached + refs_reached_period;
ysr@777 3788 _refs_reached_limit = _real_refs_reached_limit;
ysr@777 3789 }
ysr@777 3790
ysr@777 3791 void CMTask::decrease_limits() {
ysr@777 3792 // This is called when we believe that we're going to do an infrequent
ysr@777 3793 // operation which will increase the per byte scanned cost (i.e. move
ysr@777 3794 // entries to/from the global stack). It basically tries to decrease the
ysr@777 3795 // scanning limit so that the clock is called earlier.
ysr@777 3796
tonyp@2973 3797 if (_cm->verbose_medium()) {
johnc@4173 3798 gclog_or_tty->print_cr("[%u] decreasing limits", _worker_id);
tonyp@2973 3799 }
ysr@777 3800
ysr@777 3801 _words_scanned_limit = _real_words_scanned_limit -
ysr@777 3802 3 * words_scanned_period / 4;
ysr@777 3803 _refs_reached_limit = _real_refs_reached_limit -
ysr@777 3804 3 * refs_reached_period / 4;
ysr@777 3805 }
ysr@777 3806
ysr@777 3807 void CMTask::move_entries_to_global_stack() {
ysr@777 3808 // local array where we'll store the entries that will be popped
ysr@777 3809 // from the local queue
ysr@777 3810 oop buffer[global_stack_transfer_size];
ysr@777 3811
ysr@777 3812 int n = 0;
ysr@777 3813 oop obj;
ysr@777 3814 while (n < global_stack_transfer_size && _task_queue->pop_local(obj)) {
ysr@777 3815 buffer[n] = obj;
ysr@777 3816 ++n;
ysr@777 3817 }
ysr@777 3818
ysr@777 3819 if (n > 0) {
ysr@777 3820 // we popped at least one entry from the local queue
ysr@777 3821
ysr@777 3822 statsOnly( ++_global_transfers_to; _local_pops += n );
ysr@777 3823
ysr@777 3824 if (!_cm->mark_stack_push(buffer, n)) {
tonyp@2973 3825 if (_cm->verbose_low()) {
johnc@4173 3826 gclog_or_tty->print_cr("[%u] aborting due to global stack overflow",
johnc@4173 3827 _worker_id);
tonyp@2973 3828 }
ysr@777 3829 set_has_aborted();
ysr@777 3830 } else {
ysr@777 3831 // the transfer was successful
ysr@777 3832
tonyp@2973 3833 if (_cm->verbose_medium()) {
johnc@4173 3834 gclog_or_tty->print_cr("[%u] pushed %d entries to the global stack",
johnc@4173 3835 _worker_id, n);
tonyp@2973 3836 }
ysr@777 3837 statsOnly( int tmp_size = _cm->mark_stack_size();
tonyp@2973 3838 if (tmp_size > _global_max_size) {
ysr@777 3839 _global_max_size = tmp_size;
tonyp@2973 3840 }
ysr@777 3841 _global_pushes += n );
ysr@777 3842 }
ysr@777 3843 }
ysr@777 3844
ysr@777 3845 // this operation was quite expensive, so decrease the limits
ysr@777 3846 decrease_limits();
ysr@777 3847 }
ysr@777 3848
ysr@777 3849 void CMTask::get_entries_from_global_stack() {
ysr@777 3850 // local array where we'll store the entries that will be popped
ysr@777 3851 // from the global stack.
ysr@777 3852 oop buffer[global_stack_transfer_size];
ysr@777 3853 int n;
ysr@777 3854 _cm->mark_stack_pop(buffer, global_stack_transfer_size, &n);
tonyp@1458 3855 assert(n <= global_stack_transfer_size,
tonyp@1458 3856 "we should not pop more than the given limit");
ysr@777 3857 if (n > 0) {
ysr@777 3858 // yes, we did actually pop at least one entry
ysr@777 3859
ysr@777 3860 statsOnly( ++_global_transfers_from; _global_pops += n );
tonyp@2973 3861 if (_cm->verbose_medium()) {
johnc@4173 3862 gclog_or_tty->print_cr("[%u] popped %d entries from the global stack",
johnc@4173 3863 _worker_id, n);
tonyp@2973 3864 }
ysr@777 3865 for (int i = 0; i < n; ++i) {
ysr@777 3866 bool success = _task_queue->push(buffer[i]);
ysr@777 3867 // We only call this when the local queue is empty or under a
ysr@777 3868 // given target limit. So, we do not expect this push to fail.
tonyp@1458 3869 assert(success, "invariant");
ysr@777 3870 }
ysr@777 3871
ysr@777 3872 statsOnly( int tmp_size = _task_queue->size();
tonyp@2973 3873 if (tmp_size > _local_max_size) {
ysr@777 3874 _local_max_size = tmp_size;
tonyp@2973 3875 }
ysr@777 3876 _local_pushes += n );
ysr@777 3877 }
ysr@777 3878
ysr@777 3879 // this operation was quite expensive, so decrease the limits
ysr@777 3880 decrease_limits();
ysr@777 3881 }
ysr@777 3882
ysr@777 3883 void CMTask::drain_local_queue(bool partially) {
tonyp@2973 3884 if (has_aborted()) return;
ysr@777 3885
ysr@777 3886 // Decide what the target size is, depending whether we're going to
ysr@777 3887 // drain it partially (so that other tasks can steal if they run out
ysr@777 3888 // of things to do) or totally (at the very end).
ysr@777 3889 size_t target_size;
tonyp@2973 3890 if (partially) {
ysr@777 3891 target_size = MIN2((size_t)_task_queue->max_elems()/3, GCDrainStackTargetSize);
tonyp@2973 3892 } else {
ysr@777 3893 target_size = 0;
tonyp@2973 3894 }
ysr@777 3895
ysr@777 3896 if (_task_queue->size() > target_size) {
tonyp@2973 3897 if (_cm->verbose_high()) {
drchase@6680 3898 gclog_or_tty->print_cr("[%u] draining local queue, target size = " SIZE_FORMAT,
johnc@4173 3899 _worker_id, target_size);
tonyp@2973 3900 }
ysr@777 3901
ysr@777 3902 oop obj;
ysr@777 3903 bool ret = _task_queue->pop_local(obj);
ysr@777 3904 while (ret) {
ysr@777 3905 statsOnly( ++_local_pops );
ysr@777 3906
tonyp@2973 3907 if (_cm->verbose_high()) {
johnc@4173 3908 gclog_or_tty->print_cr("[%u] popped "PTR_FORMAT, _worker_id,
drchase@6680 3909 p2i((void*) obj));
tonyp@2973 3910 }
ysr@777 3911
tonyp@1458 3912 assert(_g1h->is_in_g1_reserved((HeapWord*) obj), "invariant" );
tonyp@2643 3913 assert(!_g1h->is_on_master_free_list(
tonyp@2472 3914 _g1h->heap_region_containing((HeapWord*) obj)), "invariant");
ysr@777 3915
ysr@777 3916 scan_object(obj);
ysr@777 3917
tonyp@2973 3918 if (_task_queue->size() <= target_size || has_aborted()) {
ysr@777 3919 ret = false;
tonyp@2973 3920 } else {
ysr@777 3921 ret = _task_queue->pop_local(obj);
tonyp@2973 3922 }
ysr@777 3923 }
ysr@777 3924
tonyp@2973 3925 if (_cm->verbose_high()) {
johnc@4173 3926 gclog_or_tty->print_cr("[%u] drained local queue, size = %d",
johnc@4173 3927 _worker_id, _task_queue->size());
tonyp@2973 3928 }
ysr@777 3929 }
ysr@777 3930 }
ysr@777 3931
ysr@777 3932 void CMTask::drain_global_stack(bool partially) {
tonyp@2973 3933 if (has_aborted()) return;
ysr@777 3934
ysr@777 3935 // We have a policy to drain the local queue before we attempt to
ysr@777 3936 // drain the global stack.
tonyp@1458 3937 assert(partially || _task_queue->size() == 0, "invariant");
ysr@777 3938
ysr@777 3939 // Decide what the target size is, depending whether we're going to
ysr@777 3940 // drain it partially (so that other tasks can steal if they run out
ysr@777 3941 // of things to do) or totally (at the very end). Notice that,
ysr@777 3942 // because we move entries from the global stack in chunks or
ysr@777 3943 // because another task might be doing the same, we might in fact
ysr@777 3944 // drop below the target. But, this is not a problem.
ysr@777 3945 size_t target_size;
tonyp@2973 3946 if (partially) {
ysr@777 3947 target_size = _cm->partial_mark_stack_size_target();
tonyp@2973 3948 } else {
ysr@777 3949 target_size = 0;
tonyp@2973 3950 }
ysr@777 3951
ysr@777 3952 if (_cm->mark_stack_size() > target_size) {
tonyp@2973 3953 if (_cm->verbose_low()) {
drchase@6680 3954 gclog_or_tty->print_cr("[%u] draining global_stack, target size " SIZE_FORMAT,
johnc@4173 3955 _worker_id, target_size);
tonyp@2973 3956 }
ysr@777 3957
ysr@777 3958 while (!has_aborted() && _cm->mark_stack_size() > target_size) {
ysr@777 3959 get_entries_from_global_stack();
ysr@777 3960 drain_local_queue(partially);
ysr@777 3961 }
ysr@777 3962
tonyp@2973 3963 if (_cm->verbose_low()) {
drchase@6680 3964 gclog_or_tty->print_cr("[%u] drained global stack, size = " SIZE_FORMAT,
johnc@4173 3965 _worker_id, _cm->mark_stack_size());
tonyp@2973 3966 }
ysr@777 3967 }
ysr@777 3968 }
ysr@777 3969
ysr@777 3970 // SATB Queue has several assumptions on whether to call the par or
ysr@777 3971 // non-par versions of the methods. this is why some of the code is
ysr@777 3972 // replicated. We should really get rid of the single-threaded version
ysr@777 3973 // of the code to simplify things.
ysr@777 3974 void CMTask::drain_satb_buffers() {
tonyp@2973 3975 if (has_aborted()) return;
ysr@777 3976
ysr@777 3977 // We set this so that the regular clock knows that we're in the
ysr@777 3978 // middle of draining buffers and doesn't set the abort flag when it
ysr@777 3979 // notices that SATB buffers are available for draining. It'd be
ysr@777 3980 // very counter productive if it did that. :-)
ysr@777 3981 _draining_satb_buffers = true;
ysr@777 3982
ysr@777 3983 CMObjectClosure oc(this);
ysr@777 3984 SATBMarkQueueSet& satb_mq_set = JavaThread::satb_mark_queue_set();
tonyp@2973 3985 if (G1CollectedHeap::use_parallel_gc_threads()) {
johnc@4173 3986 satb_mq_set.set_par_closure(_worker_id, &oc);
tonyp@2973 3987 } else {
ysr@777 3988 satb_mq_set.set_closure(&oc);
tonyp@2973 3989 }
ysr@777 3990
ysr@777 3991 // This keeps claiming and applying the closure to completed buffers
ysr@777 3992 // until we run out of buffers or we need to abort.
jmasa@2188 3993 if (G1CollectedHeap::use_parallel_gc_threads()) {
ysr@777 3994 while (!has_aborted() &&
johnc@4173 3995 satb_mq_set.par_apply_closure_to_completed_buffer(_worker_id)) {
tonyp@2973 3996 if (_cm->verbose_medium()) {
johnc@4173 3997 gclog_or_tty->print_cr("[%u] processed an SATB buffer", _worker_id);
tonyp@2973 3998 }
ysr@777 3999 statsOnly( ++_satb_buffers_processed );
ysr@777 4000 regular_clock_call();
ysr@777 4001 }
ysr@777 4002 } else {
ysr@777 4003 while (!has_aborted() &&
ysr@777 4004 satb_mq_set.apply_closure_to_completed_buffer()) {
tonyp@2973 4005 if (_cm->verbose_medium()) {
johnc@4173 4006 gclog_or_tty->print_cr("[%u] processed an SATB buffer", _worker_id);
tonyp@2973 4007 }
ysr@777 4008 statsOnly( ++_satb_buffers_processed );
ysr@777 4009 regular_clock_call();
ysr@777 4010 }
ysr@777 4011 }
ysr@777 4012
ysr@777 4013 _draining_satb_buffers = false;
ysr@777 4014
tonyp@1458 4015 assert(has_aborted() ||
tonyp@1458 4016 concurrent() ||
tonyp@1458 4017 satb_mq_set.completed_buffers_num() == 0, "invariant");
ysr@777 4018
tonyp@2973 4019 if (G1CollectedHeap::use_parallel_gc_threads()) {
johnc@4173 4020 satb_mq_set.set_par_closure(_worker_id, NULL);
tonyp@2973 4021 } else {
ysr@777 4022 satb_mq_set.set_closure(NULL);
tonyp@2973 4023 }
ysr@777 4024
ysr@777 4025 // again, this was a potentially expensive operation, decrease the
ysr@777 4026 // limits to get the regular clock call early
ysr@777 4027 decrease_limits();
ysr@777 4028 }
ysr@777 4029
ysr@777 4030 void CMTask::print_stats() {
johnc@4173 4031 gclog_or_tty->print_cr("Marking Stats, task = %u, calls = %d",
johnc@4173 4032 _worker_id, _calls);
ysr@777 4033 gclog_or_tty->print_cr(" Elapsed time = %1.2lfms, Termination time = %1.2lfms",
ysr@777 4034 _elapsed_time_ms, _termination_time_ms);
ysr@777 4035 gclog_or_tty->print_cr(" Step Times (cum): num = %d, avg = %1.2lfms, sd = %1.2lfms",
ysr@777 4036 _step_times_ms.num(), _step_times_ms.avg(),
ysr@777 4037 _step_times_ms.sd());
ysr@777 4038 gclog_or_tty->print_cr(" max = %1.2lfms, total = %1.2lfms",
ysr@777 4039 _step_times_ms.maximum(), _step_times_ms.sum());
ysr@777 4040
ysr@777 4041 #if _MARKING_STATS_
ysr@777 4042 gclog_or_tty->print_cr(" Clock Intervals (cum): num = %d, avg = %1.2lfms, sd = %1.2lfms",
ysr@777 4043 _all_clock_intervals_ms.num(), _all_clock_intervals_ms.avg(),
ysr@777 4044 _all_clock_intervals_ms.sd());
ysr@777 4045 gclog_or_tty->print_cr(" max = %1.2lfms, total = %1.2lfms",
ysr@777 4046 _all_clock_intervals_ms.maximum(),
ysr@777 4047 _all_clock_intervals_ms.sum());
ysr@777 4048 gclog_or_tty->print_cr(" Clock Causes (cum): scanning = %d, marking = %d",
ysr@777 4049 _clock_due_to_scanning, _clock_due_to_marking);
ysr@777 4050 gclog_or_tty->print_cr(" Objects: scanned = %d, found on the bitmap = %d",
ysr@777 4051 _objs_scanned, _objs_found_on_bitmap);
ysr@777 4052 gclog_or_tty->print_cr(" Local Queue: pushes = %d, pops = %d, max size = %d",
ysr@777 4053 _local_pushes, _local_pops, _local_max_size);
ysr@777 4054 gclog_or_tty->print_cr(" Global Stack: pushes = %d, pops = %d, max size = %d",
ysr@777 4055 _global_pushes, _global_pops, _global_max_size);
ysr@777 4056 gclog_or_tty->print_cr(" transfers to = %d, transfers from = %d",
ysr@777 4057 _global_transfers_to,_global_transfers_from);
tonyp@3691 4058 gclog_or_tty->print_cr(" Regions: claimed = %d", _regions_claimed);
ysr@777 4059 gclog_or_tty->print_cr(" SATB buffers: processed = %d", _satb_buffers_processed);
ysr@777 4060 gclog_or_tty->print_cr(" Steals: attempts = %d, successes = %d",
ysr@777 4061 _steal_attempts, _steals);
ysr@777 4062 gclog_or_tty->print_cr(" Aborted: %d, due to", _aborted);
ysr@777 4063 gclog_or_tty->print_cr(" overflow: %d, global abort: %d, yield: %d",
ysr@777 4064 _aborted_overflow, _aborted_cm_aborted, _aborted_yield);
ysr@777 4065 gclog_or_tty->print_cr(" time out: %d, SATB: %d, termination: %d",
ysr@777 4066 _aborted_timed_out, _aborted_satb, _aborted_termination);
ysr@777 4067 #endif // _MARKING_STATS_
ysr@777 4068 }
ysr@777 4069
ysr@777 4070 /*****************************************************************************
ysr@777 4071
johnc@4787 4072 The do_marking_step(time_target_ms, ...) method is the building
johnc@4787 4073 block of the parallel marking framework. It can be called in parallel
ysr@777 4074 with other invocations of do_marking_step() on different tasks
ysr@777 4075 (but only one per task, obviously) and concurrently with the
ysr@777 4076 mutator threads, or during remark, hence it eliminates the need
ysr@777 4077 for two versions of the code. When called during remark, it will
ysr@777 4078 pick up from where the task left off during the concurrent marking
ysr@777 4079 phase. Interestingly, tasks are also claimable during evacuation
ysr@777 4080 pauses too, since do_marking_step() ensures that it aborts before
ysr@777 4081 it needs to yield.
ysr@777 4082
johnc@4787 4083 The data structures that it uses to do marking work are the
ysr@777 4084 following:
ysr@777 4085
ysr@777 4086 (1) Marking Bitmap. If there are gray objects that appear only
ysr@777 4087 on the bitmap (this happens either when dealing with an overflow
ysr@777 4088 or when the initial marking phase has simply marked the roots
ysr@777 4089 and didn't push them on the stack), then tasks claim heap
ysr@777 4090 regions whose bitmap they then scan to find gray objects. A
ysr@777 4091 global finger indicates where the end of the last claimed region
ysr@777 4092 is. A local finger indicates how far into the region a task has
ysr@777 4093 scanned. The two fingers are used to determine how to gray an
ysr@777 4094 object (i.e. whether simply marking it is OK, as it will be
ysr@777 4095 visited by a task in the future, or whether it needs to be also
ysr@777 4096 pushed on a stack).
ysr@777 4097
ysr@777 4098 (2) Local Queue. The local queue of the task which is accessed
ysr@777 4099 reasonably efficiently by the task. Other tasks can steal from
ysr@777 4100 it when they run out of work. Throughout the marking phase, a
ysr@777 4101 task attempts to keep its local queue short but not totally
ysr@777 4102 empty, so that entries are available for stealing by other
ysr@777 4103 tasks. Only when there is no more work, a task will totally
ysr@777 4104 drain its local queue.
ysr@777 4105
ysr@777 4106 (3) Global Mark Stack. This handles local queue overflow. During
ysr@777 4107 marking only sets of entries are moved between it and the local
ysr@777 4108 queues, as access to it requires a mutex and more fine-grain
ysr@777 4109 interaction with it which might cause contention. If it
ysr@777 4110 overflows, then the marking phase should restart and iterate
ysr@777 4111 over the bitmap to identify gray objects. Throughout the marking
ysr@777 4112 phase, tasks attempt to keep the global mark stack at a small
ysr@777 4113 length but not totally empty, so that entries are available for
ysr@777 4114 popping by other tasks. Only when there is no more work, tasks
ysr@777 4115 will totally drain the global mark stack.
ysr@777 4116
tonyp@3691 4117 (4) SATB Buffer Queue. This is where completed SATB buffers are
ysr@777 4118 made available. Buffers are regularly removed from this queue
ysr@777 4119 and scanned for roots, so that the queue doesn't get too
ysr@777 4120 long. During remark, all completed buffers are processed, as
ysr@777 4121 well as the filled in parts of any uncompleted buffers.
ysr@777 4122
ysr@777 4123 The do_marking_step() method tries to abort when the time target
ysr@777 4124 has been reached. There are a few other cases when the
ysr@777 4125 do_marking_step() method also aborts:
ysr@777 4126
ysr@777 4127 (1) When the marking phase has been aborted (after a Full GC).
ysr@777 4128
tonyp@3691 4129 (2) When a global overflow (on the global stack) has been
tonyp@3691 4130 triggered. Before the task aborts, it will actually sync up with
tonyp@3691 4131 the other tasks to ensure that all the marking data structures
johnc@4788 4132 (local queues, stacks, fingers etc.) are re-initialized so that
tonyp@3691 4133 when do_marking_step() completes, the marking phase can
tonyp@3691 4134 immediately restart.
ysr@777 4135
ysr@777 4136 (3) When enough completed SATB buffers are available. The
ysr@777 4137 do_marking_step() method only tries to drain SATB buffers right
ysr@777 4138 at the beginning. So, if enough buffers are available, the
ysr@777 4139 marking step aborts and the SATB buffers are processed at
ysr@777 4140 the beginning of the next invocation.
ysr@777 4141
ysr@777 4142 (4) To yield. when we have to yield then we abort and yield
ysr@777 4143 right at the end of do_marking_step(). This saves us from a lot
ysr@777 4144 of hassle as, by yielding we might allow a Full GC. If this
ysr@777 4145 happens then objects will be compacted underneath our feet, the
ysr@777 4146 heap might shrink, etc. We save checking for this by just
ysr@777 4147 aborting and doing the yield right at the end.
ysr@777 4148
ysr@777 4149 From the above it follows that the do_marking_step() method should
ysr@777 4150 be called in a loop (or, otherwise, regularly) until it completes.
ysr@777 4151
ysr@777 4152 If a marking step completes without its has_aborted() flag being
ysr@777 4153 true, it means it has completed the current marking phase (and
ysr@777 4154 also all other marking tasks have done so and have all synced up).
ysr@777 4155
ysr@777 4156 A method called regular_clock_call() is invoked "regularly" (in
ysr@777 4157 sub ms intervals) throughout marking. It is this clock method that
ysr@777 4158 checks all the abort conditions which were mentioned above and
ysr@777 4159 decides when the task should abort. A work-based scheme is used to
ysr@777 4160 trigger this clock method: when the number of object words the
ysr@777 4161 marking phase has scanned or the number of references the marking
ysr@777 4162 phase has visited reach a given limit. Additional invocations to
ysr@777 4163 the method clock have been planted in a few other strategic places
ysr@777 4164 too. The initial reason for the clock method was to avoid calling
ysr@777 4165 vtime too regularly, as it is quite expensive. So, once it was in
ysr@777 4166 place, it was natural to piggy-back all the other conditions on it
ysr@777 4167 too and not constantly check them throughout the code.
ysr@777 4168
johnc@4787 4169 If do_termination is true then do_marking_step will enter its
johnc@4787 4170 termination protocol.
johnc@4787 4171
johnc@4787 4172 The value of is_serial must be true when do_marking_step is being
johnc@4787 4173 called serially (i.e. by the VMThread) and do_marking_step should
johnc@4787 4174 skip any synchronization in the termination and overflow code.
johnc@4787 4175 Examples include the serial remark code and the serial reference
johnc@4787 4176 processing closures.
johnc@4787 4177
johnc@4787 4178 The value of is_serial must be false when do_marking_step is
johnc@4787 4179 being called by any of the worker threads in a work gang.
johnc@4787 4180 Examples include the concurrent marking code (CMMarkingTask),
johnc@4787 4181 the MT remark code, and the MT reference processing closures.
johnc@4787 4182
ysr@777 4183 *****************************************************************************/
ysr@777 4184
johnc@2494 4185 void CMTask::do_marking_step(double time_target_ms,
johnc@4787 4186 bool do_termination,
johnc@4787 4187 bool is_serial) {
tonyp@1458 4188 assert(time_target_ms >= 1.0, "minimum granularity is 1ms");
tonyp@1458 4189 assert(concurrent() == _cm->concurrent(), "they should be the same");
tonyp@1458 4190
ysr@777 4191 G1CollectorPolicy* g1_policy = _g1h->g1_policy();
tonyp@1458 4192 assert(_task_queues != NULL, "invariant");
tonyp@1458 4193 assert(_task_queue != NULL, "invariant");
johnc@4173 4194 assert(_task_queues->queue(_worker_id) == _task_queue, "invariant");
tonyp@1458 4195
tonyp@1458 4196 assert(!_claimed,
tonyp@1458 4197 "only one thread should claim this task at any one time");
ysr@777 4198
ysr@777 4199 // OK, this doesn't safeguard again all possible scenarios, as it is
ysr@777 4200 // possible for two threads to set the _claimed flag at the same
ysr@777 4201 // time. But it is only for debugging purposes anyway and it will
ysr@777 4202 // catch most problems.
ysr@777 4203 _claimed = true;
ysr@777 4204
ysr@777 4205 _start_time_ms = os::elapsedVTime() * 1000.0;
ysr@777 4206 statsOnly( _interval_start_time_ms = _start_time_ms );
ysr@777 4207
johnc@4787 4208 // If do_stealing is true then do_marking_step will attempt to
johnc@4787 4209 // steal work from the other CMTasks. It only makes sense to
johnc@4787 4210 // enable stealing when the termination protocol is enabled
johnc@4787 4211 // and do_marking_step() is not being called serially.
johnc@4787 4212 bool do_stealing = do_termination && !is_serial;
johnc@4787 4213
ysr@777 4214 double diff_prediction_ms =
ysr@777 4215 g1_policy->get_new_prediction(&_marking_step_diffs_ms);
ysr@777 4216 _time_target_ms = time_target_ms - diff_prediction_ms;
ysr@777 4217
ysr@777 4218 // set up the variables that are used in the work-based scheme to
ysr@777 4219 // call the regular clock method
ysr@777 4220 _words_scanned = 0;
ysr@777 4221 _refs_reached = 0;
ysr@777 4222 recalculate_limits();
ysr@777 4223
ysr@777 4224 // clear all flags
ysr@777 4225 clear_has_aborted();
johnc@2494 4226 _has_timed_out = false;
ysr@777 4227 _draining_satb_buffers = false;
ysr@777 4228
ysr@777 4229 ++_calls;
ysr@777 4230
tonyp@2973 4231 if (_cm->verbose_low()) {
johnc@4173 4232 gclog_or_tty->print_cr("[%u] >>>>>>>>>> START, call = %d, "
ysr@777 4233 "target = %1.2lfms >>>>>>>>>>",
johnc@4173 4234 _worker_id, _calls, _time_target_ms);
tonyp@2973 4235 }
ysr@777 4236
ysr@777 4237 // Set up the bitmap and oop closures. Anything that uses them is
ysr@777 4238 // eventually called from this method, so it is OK to allocate these
ysr@777 4239 // statically.
ysr@777 4240 CMBitMapClosure bitmap_closure(this, _cm, _nextMarkBitMap);
tonyp@2968 4241 G1CMOopClosure cm_oop_closure(_g1h, _cm, this);
tonyp@2968 4242 set_cm_oop_closure(&cm_oop_closure);
ysr@777 4243
ysr@777 4244 if (_cm->has_overflown()) {
tonyp@3691 4245 // This can happen if the mark stack overflows during a GC pause
tonyp@3691 4246 // and this task, after a yield point, restarts. We have to abort
tonyp@3691 4247 // as we need to get into the overflow protocol which happens
tonyp@3691 4248 // right at the end of this task.
ysr@777 4249 set_has_aborted();
ysr@777 4250 }
ysr@777 4251
ysr@777 4252 // First drain any available SATB buffers. After this, we will not
ysr@777 4253 // look at SATB buffers before the next invocation of this method.
ysr@777 4254 // If enough completed SATB buffers are queued up, the regular clock
ysr@777 4255 // will abort this task so that it restarts.
ysr@777 4256 drain_satb_buffers();
ysr@777 4257 // ...then partially drain the local queue and the global stack
ysr@777 4258 drain_local_queue(true);
ysr@777 4259 drain_global_stack(true);
ysr@777 4260
ysr@777 4261 do {
ysr@777 4262 if (!has_aborted() && _curr_region != NULL) {
ysr@777 4263 // This means that we're already holding on to a region.
tonyp@1458 4264 assert(_finger != NULL, "if region is not NULL, then the finger "
tonyp@1458 4265 "should not be NULL either");
ysr@777 4266
ysr@777 4267 // We might have restarted this task after an evacuation pause
ysr@777 4268 // which might have evacuated the region we're holding on to
ysr@777 4269 // underneath our feet. Let's read its limit again to make sure
ysr@777 4270 // that we do not iterate over a region of the heap that
ysr@777 4271 // contains garbage (update_region_limit() will also move
ysr@777 4272 // _finger to the start of the region if it is found empty).
ysr@777 4273 update_region_limit();
ysr@777 4274 // We will start from _finger not from the start of the region,
ysr@777 4275 // as we might be restarting this task after aborting half-way
ysr@777 4276 // through scanning this region. In this case, _finger points to
ysr@777 4277 // the address where we last found a marked object. If this is a
ysr@777 4278 // fresh region, _finger points to start().
ysr@777 4279 MemRegion mr = MemRegion(_finger, _region_limit);
ysr@777 4280
tonyp@2973 4281 if (_cm->verbose_low()) {
johnc@4173 4282 gclog_or_tty->print_cr("[%u] we're scanning part "
ysr@777 4283 "["PTR_FORMAT", "PTR_FORMAT") "
johnc@4580 4284 "of region "HR_FORMAT,
drchase@6680 4285 _worker_id, p2i(_finger), p2i(_region_limit),
johnc@4580 4286 HR_FORMAT_PARAMS(_curr_region));
tonyp@2973 4287 }
ysr@777 4288
johnc@4580 4289 assert(!_curr_region->isHumongous() || mr.start() == _curr_region->bottom(),
johnc@4580 4290 "humongous regions should go around loop once only");
johnc@4580 4291
johnc@4580 4292 // Some special cases:
johnc@4580 4293 // If the memory region is empty, we can just give up the region.
johnc@4580 4294 // If the current region is humongous then we only need to check
johnc@4580 4295 // the bitmap for the bit associated with the start of the object,
johnc@4580 4296 // scan the object if it's live, and give up the region.
johnc@4580 4297 // Otherwise, let's iterate over the bitmap of the part of the region
johnc@4580 4298 // that is left.
johnc@4575 4299 // If the iteration is successful, give up the region.
johnc@4580 4300 if (mr.is_empty()) {
johnc@4580 4301 giveup_current_region();
johnc@4580 4302 regular_clock_call();
johnc@4580 4303 } else if (_curr_region->isHumongous() && mr.start() == _curr_region->bottom()) {
johnc@4580 4304 if (_nextMarkBitMap->isMarked(mr.start())) {
johnc@4580 4305 // The object is marked - apply the closure
johnc@4580 4306 BitMap::idx_t offset = _nextMarkBitMap->heapWordToOffset(mr.start());
johnc@4580 4307 bitmap_closure.do_bit(offset);
johnc@4580 4308 }
johnc@4580 4309 // Even if this task aborted while scanning the humongous object
johnc@4580 4310 // we can (and should) give up the current region.
johnc@4580 4311 giveup_current_region();
johnc@4580 4312 regular_clock_call();
johnc@4580 4313 } else if (_nextMarkBitMap->iterate(&bitmap_closure, mr)) {
ysr@777 4314 giveup_current_region();
ysr@777 4315 regular_clock_call();
ysr@777 4316 } else {
tonyp@1458 4317 assert(has_aborted(), "currently the only way to do so");
ysr@777 4318 // The only way to abort the bitmap iteration is to return
ysr@777 4319 // false from the do_bit() method. However, inside the
ysr@777 4320 // do_bit() method we move the _finger to point to the
ysr@777 4321 // object currently being looked at. So, if we bail out, we
ysr@777 4322 // have definitely set _finger to something non-null.
tonyp@1458 4323 assert(_finger != NULL, "invariant");
ysr@777 4324
ysr@777 4325 // Region iteration was actually aborted. So now _finger
ysr@777 4326 // points to the address of the object we last scanned. If we
ysr@777 4327 // leave it there, when we restart this task, we will rescan
ysr@777 4328 // the object. It is easy to avoid this. We move the finger by
ysr@777 4329 // enough to point to the next possible object header (the
ysr@777 4330 // bitmap knows by how much we need to move it as it knows its
ysr@777 4331 // granularity).
apetrusenko@1749 4332 assert(_finger < _region_limit, "invariant");
tamao@4733 4333 HeapWord* new_finger = _nextMarkBitMap->nextObject(_finger);
apetrusenko@1749 4334 // Check if bitmap iteration was aborted while scanning the last object
apetrusenko@1749 4335 if (new_finger >= _region_limit) {
tonyp@3691 4336 giveup_current_region();
apetrusenko@1749 4337 } else {
tonyp@3691 4338 move_finger_to(new_finger);
apetrusenko@1749 4339 }
ysr@777 4340 }
ysr@777 4341 }
ysr@777 4342 // At this point we have either completed iterating over the
ysr@777 4343 // region we were holding on to, or we have aborted.
ysr@777 4344
ysr@777 4345 // We then partially drain the local queue and the global stack.
ysr@777 4346 // (Do we really need this?)
ysr@777 4347 drain_local_queue(true);
ysr@777 4348 drain_global_stack(true);
ysr@777 4349
ysr@777 4350 // Read the note on the claim_region() method on why it might
ysr@777 4351 // return NULL with potentially more regions available for
ysr@777 4352 // claiming and why we have to check out_of_regions() to determine
ysr@777 4353 // whether we're done or not.
ysr@777 4354 while (!has_aborted() && _curr_region == NULL && !_cm->out_of_regions()) {
ysr@777 4355 // We are going to try to claim a new region. We should have
ysr@777 4356 // given up on the previous one.
tonyp@1458 4357 // Separated the asserts so that we know which one fires.
tonyp@1458 4358 assert(_curr_region == NULL, "invariant");
tonyp@1458 4359 assert(_finger == NULL, "invariant");
tonyp@1458 4360 assert(_region_limit == NULL, "invariant");
tonyp@2973 4361 if (_cm->verbose_low()) {
johnc@4173 4362 gclog_or_tty->print_cr("[%u] trying to claim a new region", _worker_id);
tonyp@2973 4363 }
johnc@4173 4364 HeapRegion* claimed_region = _cm->claim_region(_worker_id);
ysr@777 4365 if (claimed_region != NULL) {
ysr@777 4366 // Yes, we managed to claim one
ysr@777 4367 statsOnly( ++_regions_claimed );
ysr@777 4368
tonyp@2973 4369 if (_cm->verbose_low()) {
johnc@4173 4370 gclog_or_tty->print_cr("[%u] we successfully claimed "
ysr@777 4371 "region "PTR_FORMAT,
drchase@6680 4372 _worker_id, p2i(claimed_region));
tonyp@2973 4373 }
ysr@777 4374
ysr@777 4375 setup_for_region(claimed_region);
tonyp@1458 4376 assert(_curr_region == claimed_region, "invariant");
ysr@777 4377 }
ysr@777 4378 // It is important to call the regular clock here. It might take
ysr@777 4379 // a while to claim a region if, for example, we hit a large
ysr@777 4380 // block of empty regions. So we need to call the regular clock
ysr@777 4381 // method once round the loop to make sure it's called
ysr@777 4382 // frequently enough.
ysr@777 4383 regular_clock_call();
ysr@777 4384 }
ysr@777 4385
ysr@777 4386 if (!has_aborted() && _curr_region == NULL) {
tonyp@1458 4387 assert(_cm->out_of_regions(),
tonyp@1458 4388 "at this point we should be out of regions");
ysr@777 4389 }
ysr@777 4390 } while ( _curr_region != NULL && !has_aborted());
ysr@777 4391
ysr@777 4392 if (!has_aborted()) {
ysr@777 4393 // We cannot check whether the global stack is empty, since other
tonyp@3691 4394 // tasks might be pushing objects to it concurrently.
tonyp@1458 4395 assert(_cm->out_of_regions(),
tonyp@1458 4396 "at this point we should be out of regions");
ysr@777 4397
tonyp@2973 4398 if (_cm->verbose_low()) {
johnc@4173 4399 gclog_or_tty->print_cr("[%u] all regions claimed", _worker_id);
tonyp@2973 4400 }
ysr@777 4401
ysr@777 4402 // Try to reduce the number of available SATB buffers so that
ysr@777 4403 // remark has less work to do.
ysr@777 4404 drain_satb_buffers();
ysr@777 4405 }
ysr@777 4406
ysr@777 4407 // Since we've done everything else, we can now totally drain the
ysr@777 4408 // local queue and global stack.
ysr@777 4409 drain_local_queue(false);
ysr@777 4410 drain_global_stack(false);
ysr@777 4411
ysr@777 4412 // Attempt at work stealing from other task's queues.
johnc@2494 4413 if (do_stealing && !has_aborted()) {
ysr@777 4414 // We have not aborted. This means that we have finished all that
ysr@777 4415 // we could. Let's try to do some stealing...
ysr@777 4416
ysr@777 4417 // We cannot check whether the global stack is empty, since other
tonyp@3691 4418 // tasks might be pushing objects to it concurrently.
tonyp@1458 4419 assert(_cm->out_of_regions() && _task_queue->size() == 0,
tonyp@1458 4420 "only way to reach here");
ysr@777 4421
tonyp@2973 4422 if (_cm->verbose_low()) {
johnc@4173 4423 gclog_or_tty->print_cr("[%u] starting to steal", _worker_id);
tonyp@2973 4424 }
ysr@777 4425
ysr@777 4426 while (!has_aborted()) {
ysr@777 4427 oop obj;
ysr@777 4428 statsOnly( ++_steal_attempts );
ysr@777 4429
johnc@4173 4430 if (_cm->try_stealing(_worker_id, &_hash_seed, obj)) {
tonyp@2973 4431 if (_cm->verbose_medium()) {
johnc@4173 4432 gclog_or_tty->print_cr("[%u] stolen "PTR_FORMAT" successfully",
drchase@6680 4433 _worker_id, p2i((void*) obj));
tonyp@2973 4434 }
ysr@777 4435
ysr@777 4436 statsOnly( ++_steals );
ysr@777 4437
tonyp@1458 4438 assert(_nextMarkBitMap->isMarked((HeapWord*) obj),
tonyp@1458 4439 "any stolen object should be marked");
ysr@777 4440 scan_object(obj);
ysr@777 4441
ysr@777 4442 // And since we're towards the end, let's totally drain the
ysr@777 4443 // local queue and global stack.
ysr@777 4444 drain_local_queue(false);
ysr@777 4445 drain_global_stack(false);
ysr@777 4446 } else {
ysr@777 4447 break;
ysr@777 4448 }
ysr@777 4449 }
ysr@777 4450 }
ysr@777 4451
tonyp@2848 4452 // If we are about to wrap up and go into termination, check if we
tonyp@2848 4453 // should raise the overflow flag.
tonyp@2848 4454 if (do_termination && !has_aborted()) {
tonyp@2848 4455 if (_cm->force_overflow()->should_force()) {
tonyp@2848 4456 _cm->set_has_overflown();
tonyp@2848 4457 regular_clock_call();
tonyp@2848 4458 }
tonyp@2848 4459 }
tonyp@2848 4460
ysr@777 4461 // We still haven't aborted. Now, let's try to get into the
ysr@777 4462 // termination protocol.
johnc@2494 4463 if (do_termination && !has_aborted()) {
ysr@777 4464 // We cannot check whether the global stack is empty, since other
tonyp@3691 4465 // tasks might be concurrently pushing objects on it.
tonyp@1458 4466 // Separated the asserts so that we know which one fires.
tonyp@1458 4467 assert(_cm->out_of_regions(), "only way to reach here");
tonyp@1458 4468 assert(_task_queue->size() == 0, "only way to reach here");
ysr@777 4469
tonyp@2973 4470 if (_cm->verbose_low()) {
johnc@4173 4471 gclog_or_tty->print_cr("[%u] starting termination protocol", _worker_id);
tonyp@2973 4472 }
ysr@777 4473
ysr@777 4474 _termination_start_time_ms = os::elapsedVTime() * 1000.0;
johnc@4787 4475
ysr@777 4476 // The CMTask class also extends the TerminatorTerminator class,
ysr@777 4477 // hence its should_exit_termination() method will also decide
ysr@777 4478 // whether to exit the termination protocol or not.
johnc@4787 4479 bool finished = (is_serial ||
johnc@4787 4480 _cm->terminator()->offer_termination(this));
ysr@777 4481 double termination_end_time_ms = os::elapsedVTime() * 1000.0;
ysr@777 4482 _termination_time_ms +=
ysr@777 4483 termination_end_time_ms - _termination_start_time_ms;
ysr@777 4484
ysr@777 4485 if (finished) {
ysr@777 4486 // We're all done.
ysr@777 4487
johnc@4173 4488 if (_worker_id == 0) {
ysr@777 4489 // let's allow task 0 to do this
ysr@777 4490 if (concurrent()) {
tonyp@1458 4491 assert(_cm->concurrent_marking_in_progress(), "invariant");
ysr@777 4492 // we need to set this to false before the next
ysr@777 4493 // safepoint. This way we ensure that the marking phase
ysr@777 4494 // doesn't observe any more heap expansions.
ysr@777 4495 _cm->clear_concurrent_marking_in_progress();
ysr@777 4496 }
ysr@777 4497 }
ysr@777 4498
ysr@777 4499 // We can now guarantee that the global stack is empty, since
tonyp@1458 4500 // all other tasks have finished. We separated the guarantees so
tonyp@1458 4501 // that, if a condition is false, we can immediately find out
tonyp@1458 4502 // which one.
tonyp@1458 4503 guarantee(_cm->out_of_regions(), "only way to reach here");
tonyp@1458 4504 guarantee(_cm->mark_stack_empty(), "only way to reach here");
tonyp@1458 4505 guarantee(_task_queue->size() == 0, "only way to reach here");
tonyp@1458 4506 guarantee(!_cm->has_overflown(), "only way to reach here");
tonyp@1458 4507 guarantee(!_cm->mark_stack_overflow(), "only way to reach here");
ysr@777 4508
tonyp@2973 4509 if (_cm->verbose_low()) {
johnc@4173 4510 gclog_or_tty->print_cr("[%u] all tasks terminated", _worker_id);
tonyp@2973 4511 }
ysr@777 4512 } else {
ysr@777 4513 // Apparently there's more work to do. Let's abort this task. It
ysr@777 4514 // will restart it and we can hopefully find more things to do.
ysr@777 4515
tonyp@2973 4516 if (_cm->verbose_low()) {
johnc@4173 4517 gclog_or_tty->print_cr("[%u] apparently there is more work to do",
johnc@4173 4518 _worker_id);
tonyp@2973 4519 }
ysr@777 4520
ysr@777 4521 set_has_aborted();
ysr@777 4522 statsOnly( ++_aborted_termination );
ysr@777 4523 }
ysr@777 4524 }
ysr@777 4525
ysr@777 4526 // Mainly for debugging purposes to make sure that a pointer to the
ysr@777 4527 // closure which was statically allocated in this frame doesn't
ysr@777 4528 // escape it by accident.
tonyp@2968 4529 set_cm_oop_closure(NULL);
ysr@777 4530 double end_time_ms = os::elapsedVTime() * 1000.0;
ysr@777 4531 double elapsed_time_ms = end_time_ms - _start_time_ms;
ysr@777 4532 // Update the step history.
ysr@777 4533 _step_times_ms.add(elapsed_time_ms);
ysr@777 4534
ysr@777 4535 if (has_aborted()) {
ysr@777 4536 // The task was aborted for some reason.
ysr@777 4537
ysr@777 4538 statsOnly( ++_aborted );
ysr@777 4539
johnc@2494 4540 if (_has_timed_out) {
ysr@777 4541 double diff_ms = elapsed_time_ms - _time_target_ms;
ysr@777 4542 // Keep statistics of how well we did with respect to hitting
ysr@777 4543 // our target only if we actually timed out (if we aborted for
ysr@777 4544 // other reasons, then the results might get skewed).
ysr@777 4545 _marking_step_diffs_ms.add(diff_ms);
ysr@777 4546 }
ysr@777 4547
ysr@777 4548 if (_cm->has_overflown()) {
ysr@777 4549 // This is the interesting one. We aborted because a global
ysr@777 4550 // overflow was raised. This means we have to restart the
ysr@777 4551 // marking phase and start iterating over regions. However, in
ysr@777 4552 // order to do this we have to make sure that all tasks stop
ysr@777 4553 // what they are doing and re-initialise in a safe manner. We
ysr@777 4554 // will achieve this with the use of two barrier sync points.
ysr@777 4555
tonyp@2973 4556 if (_cm->verbose_low()) {
johnc@4173 4557 gclog_or_tty->print_cr("[%u] detected overflow", _worker_id);
tonyp@2973 4558 }
ysr@777 4559
johnc@4787 4560 if (!is_serial) {
johnc@4787 4561 // We only need to enter the sync barrier if being called
johnc@4787 4562 // from a parallel context
johnc@4787 4563 _cm->enter_first_sync_barrier(_worker_id);
johnc@4787 4564
johnc@4787 4565 // When we exit this sync barrier we know that all tasks have
johnc@4787 4566 // stopped doing marking work. So, it's now safe to
johnc@4787 4567 // re-initialise our data structures. At the end of this method,
johnc@4787 4568 // task 0 will clear the global data structures.
johnc@4787 4569 }
ysr@777 4570
ysr@777 4571 statsOnly( ++_aborted_overflow );
ysr@777 4572
ysr@777 4573 // We clear the local state of this task...
ysr@777 4574 clear_region_fields();
ysr@777 4575
johnc@4787 4576 if (!is_serial) {
johnc@4787 4577 // ...and enter the second barrier.
johnc@4787 4578 _cm->enter_second_sync_barrier(_worker_id);
johnc@4787 4579 }
johnc@4788 4580 // At this point, if we're during the concurrent phase of
johnc@4788 4581 // marking, everything has been re-initialized and we're
ysr@777 4582 // ready to restart.
ysr@777 4583 }
ysr@777 4584
ysr@777 4585 if (_cm->verbose_low()) {
johnc@4173 4586 gclog_or_tty->print_cr("[%u] <<<<<<<<<< ABORTING, target = %1.2lfms, "
ysr@777 4587 "elapsed = %1.2lfms <<<<<<<<<<",
johnc@4173 4588 _worker_id, _time_target_ms, elapsed_time_ms);
tonyp@2973 4589 if (_cm->has_aborted()) {
johnc@4173 4590 gclog_or_tty->print_cr("[%u] ========== MARKING ABORTED ==========",
johnc@4173 4591 _worker_id);
tonyp@2973 4592 }
ysr@777 4593 }
ysr@777 4594 } else {
tonyp@2973 4595 if (_cm->verbose_low()) {
johnc@4173 4596 gclog_or_tty->print_cr("[%u] <<<<<<<<<< FINISHED, target = %1.2lfms, "
ysr@777 4597 "elapsed = %1.2lfms <<<<<<<<<<",
johnc@4173 4598 _worker_id, _time_target_ms, elapsed_time_ms);
tonyp@2973 4599 }
ysr@777 4600 }
ysr@777 4601
ysr@777 4602 _claimed = false;
ysr@777 4603 }
ysr@777 4604
johnc@4173 4605 CMTask::CMTask(uint worker_id,
ysr@777 4606 ConcurrentMark* cm,
johnc@3463 4607 size_t* marked_bytes,
johnc@3463 4608 BitMap* card_bm,
ysr@777 4609 CMTaskQueue* task_queue,
ysr@777 4610 CMTaskQueueSet* task_queues)
ysr@777 4611 : _g1h(G1CollectedHeap::heap()),
johnc@4173 4612 _worker_id(worker_id), _cm(cm),
ysr@777 4613 _claimed(false),
ysr@777 4614 _nextMarkBitMap(NULL), _hash_seed(17),
ysr@777 4615 _task_queue(task_queue),
ysr@777 4616 _task_queues(task_queues),
tonyp@2968 4617 _cm_oop_closure(NULL),
johnc@3463 4618 _marked_bytes_array(marked_bytes),
johnc@3463 4619 _card_bm(card_bm) {
tonyp@1458 4620 guarantee(task_queue != NULL, "invariant");
tonyp@1458 4621 guarantee(task_queues != NULL, "invariant");
ysr@777 4622
ysr@777 4623 statsOnly( _clock_due_to_scanning = 0;
ysr@777 4624 _clock_due_to_marking = 0 );
ysr@777 4625
ysr@777 4626 _marking_step_diffs_ms.add(0.5);
ysr@777 4627 }
tonyp@2717 4628
tonyp@2717 4629 // These are formatting macros that are used below to ensure
tonyp@2717 4630 // consistent formatting. The *_H_* versions are used to format the
tonyp@2717 4631 // header for a particular value and they should be kept consistent
tonyp@2717 4632 // with the corresponding macro. Also note that most of the macros add
tonyp@2717 4633 // the necessary white space (as a prefix) which makes them a bit
tonyp@2717 4634 // easier to compose.
tonyp@2717 4635
tonyp@2717 4636 // All the output lines are prefixed with this string to be able to
tonyp@2717 4637 // identify them easily in a large log file.
tonyp@2717 4638 #define G1PPRL_LINE_PREFIX "###"
tonyp@2717 4639
tonyp@2717 4640 #define G1PPRL_ADDR_BASE_FORMAT " "PTR_FORMAT"-"PTR_FORMAT
tonyp@2717 4641 #ifdef _LP64
tonyp@2717 4642 #define G1PPRL_ADDR_BASE_H_FORMAT " %37s"
tonyp@2717 4643 #else // _LP64
tonyp@2717 4644 #define G1PPRL_ADDR_BASE_H_FORMAT " %21s"
tonyp@2717 4645 #endif // _LP64
tonyp@2717 4646
tonyp@2717 4647 // For per-region info
tonyp@2717 4648 #define G1PPRL_TYPE_FORMAT " %-4s"
tonyp@2717 4649 #define G1PPRL_TYPE_H_FORMAT " %4s"
tonyp@2717 4650 #define G1PPRL_BYTE_FORMAT " "SIZE_FORMAT_W(9)
tonyp@2717 4651 #define G1PPRL_BYTE_H_FORMAT " %9s"
tonyp@2717 4652 #define G1PPRL_DOUBLE_FORMAT " %14.1f"
tonyp@2717 4653 #define G1PPRL_DOUBLE_H_FORMAT " %14s"
tonyp@2717 4654
tonyp@2717 4655 // For summary info
tonyp@2717 4656 #define G1PPRL_SUM_ADDR_FORMAT(tag) " "tag":"G1PPRL_ADDR_BASE_FORMAT
tonyp@2717 4657 #define G1PPRL_SUM_BYTE_FORMAT(tag) " "tag": "SIZE_FORMAT
tonyp@2717 4658 #define G1PPRL_SUM_MB_FORMAT(tag) " "tag": %1.2f MB"
tonyp@2717 4659 #define G1PPRL_SUM_MB_PERC_FORMAT(tag) G1PPRL_SUM_MB_FORMAT(tag)" / %1.2f %%"
tonyp@2717 4660
tonyp@2717 4661 G1PrintRegionLivenessInfoClosure::
tonyp@2717 4662 G1PrintRegionLivenessInfoClosure(outputStream* out, const char* phase_name)
tonyp@2717 4663 : _out(out),
tonyp@2717 4664 _total_used_bytes(0), _total_capacity_bytes(0),
tonyp@2717 4665 _total_prev_live_bytes(0), _total_next_live_bytes(0),
tonyp@2717 4666 _hum_used_bytes(0), _hum_capacity_bytes(0),
tschatzl@5122 4667 _hum_prev_live_bytes(0), _hum_next_live_bytes(0),
johnc@5548 4668 _total_remset_bytes(0), _total_strong_code_roots_bytes(0) {
tonyp@2717 4669 G1CollectedHeap* g1h = G1CollectedHeap::heap();
tonyp@2717 4670 MemRegion g1_reserved = g1h->g1_reserved();
tonyp@2717 4671 double now = os::elapsedTime();
tonyp@2717 4672
tonyp@2717 4673 // Print the header of the output.
tonyp@2717 4674 _out->cr();
tonyp@2717 4675 _out->print_cr(G1PPRL_LINE_PREFIX" PHASE %s @ %1.3f", phase_name, now);
tonyp@2717 4676 _out->print_cr(G1PPRL_LINE_PREFIX" HEAP"
tonyp@2717 4677 G1PPRL_SUM_ADDR_FORMAT("reserved")
tonyp@2717 4678 G1PPRL_SUM_BYTE_FORMAT("region-size"),
drchase@6680 4679 p2i(g1_reserved.start()), p2i(g1_reserved.end()),
johnc@3182 4680 HeapRegion::GrainBytes);
tonyp@2717 4681 _out->print_cr(G1PPRL_LINE_PREFIX);
tonyp@2717 4682 _out->print_cr(G1PPRL_LINE_PREFIX
tschatzl@5122 4683 G1PPRL_TYPE_H_FORMAT
tschatzl@5122 4684 G1PPRL_ADDR_BASE_H_FORMAT
tschatzl@5122 4685 G1PPRL_BYTE_H_FORMAT
tschatzl@5122 4686 G1PPRL_BYTE_H_FORMAT
tschatzl@5122 4687 G1PPRL_BYTE_H_FORMAT
tschatzl@5122 4688 G1PPRL_DOUBLE_H_FORMAT
johnc@5548 4689 G1PPRL_BYTE_H_FORMAT
tschatzl@5122 4690 G1PPRL_BYTE_H_FORMAT,
tschatzl@5122 4691 "type", "address-range",
johnc@5548 4692 "used", "prev-live", "next-live", "gc-eff",
johnc@5548 4693 "remset", "code-roots");
johnc@3173 4694 _out->print_cr(G1PPRL_LINE_PREFIX
tschatzl@5122 4695 G1PPRL_TYPE_H_FORMAT
tschatzl@5122 4696 G1PPRL_ADDR_BASE_H_FORMAT
tschatzl@5122 4697 G1PPRL_BYTE_H_FORMAT
tschatzl@5122 4698 G1PPRL_BYTE_H_FORMAT
tschatzl@5122 4699 G1PPRL_BYTE_H_FORMAT
tschatzl@5122 4700 G1PPRL_DOUBLE_H_FORMAT
johnc@5548 4701 G1PPRL_BYTE_H_FORMAT
tschatzl@5122 4702 G1PPRL_BYTE_H_FORMAT,
tschatzl@5122 4703 "", "",
johnc@5548 4704 "(bytes)", "(bytes)", "(bytes)", "(bytes/ms)",
johnc@5548 4705 "(bytes)", "(bytes)");
tonyp@2717 4706 }
tonyp@2717 4707
tonyp@2717 4708 // It takes as a parameter a reference to one of the _hum_* fields, it
tonyp@2717 4709 // deduces the corresponding value for a region in a humongous region
tonyp@2717 4710 // series (either the region size, or what's left if the _hum_* field
tonyp@2717 4711 // is < the region size), and updates the _hum_* field accordingly.
tonyp@2717 4712 size_t G1PrintRegionLivenessInfoClosure::get_hum_bytes(size_t* hum_bytes) {
tonyp@2717 4713 size_t bytes = 0;
tonyp@2717 4714 // The > 0 check is to deal with the prev and next live bytes which
tonyp@2717 4715 // could be 0.
tonyp@2717 4716 if (*hum_bytes > 0) {
johnc@3182 4717 bytes = MIN2(HeapRegion::GrainBytes, *hum_bytes);
tonyp@2717 4718 *hum_bytes -= bytes;
tonyp@2717 4719 }
tonyp@2717 4720 return bytes;
tonyp@2717 4721 }
tonyp@2717 4722
tonyp@2717 4723 // It deduces the values for a region in a humongous region series
tonyp@2717 4724 // from the _hum_* fields and updates those accordingly. It assumes
tonyp@2717 4725 // that that _hum_* fields have already been set up from the "starts
tonyp@2717 4726 // humongous" region and we visit the regions in address order.
tonyp@2717 4727 void G1PrintRegionLivenessInfoClosure::get_hum_bytes(size_t* used_bytes,
tonyp@2717 4728 size_t* capacity_bytes,
tonyp@2717 4729 size_t* prev_live_bytes,
tonyp@2717 4730 size_t* next_live_bytes) {
tonyp@2717 4731 assert(_hum_used_bytes > 0 && _hum_capacity_bytes > 0, "pre-condition");
tonyp@2717 4732 *used_bytes = get_hum_bytes(&_hum_used_bytes);
tonyp@2717 4733 *capacity_bytes = get_hum_bytes(&_hum_capacity_bytes);
tonyp@2717 4734 *prev_live_bytes = get_hum_bytes(&_hum_prev_live_bytes);
tonyp@2717 4735 *next_live_bytes = get_hum_bytes(&_hum_next_live_bytes);
tonyp@2717 4736 }
tonyp@2717 4737
tonyp@2717 4738 bool G1PrintRegionLivenessInfoClosure::doHeapRegion(HeapRegion* r) {
tonyp@2717 4739 const char* type = "";
tonyp@2717 4740 HeapWord* bottom = r->bottom();
tonyp@2717 4741 HeapWord* end = r->end();
tonyp@2717 4742 size_t capacity_bytes = r->capacity();
tonyp@2717 4743 size_t used_bytes = r->used();
tonyp@2717 4744 size_t prev_live_bytes = r->live_bytes();
tonyp@2717 4745 size_t next_live_bytes = r->next_live_bytes();
tonyp@2717 4746 double gc_eff = r->gc_efficiency();
tschatzl@5122 4747 size_t remset_bytes = r->rem_set()->mem_size();
johnc@5548 4748 size_t strong_code_roots_bytes = r->rem_set()->strong_code_roots_mem_size();
johnc@5548 4749
tonyp@2717 4750 if (r->used() == 0) {
tonyp@2717 4751 type = "FREE";
tonyp@2717 4752 } else if (r->is_survivor()) {
tonyp@2717 4753 type = "SURV";
tonyp@2717 4754 } else if (r->is_young()) {
tonyp@2717 4755 type = "EDEN";
tonyp@2717 4756 } else if (r->startsHumongous()) {
tonyp@2717 4757 type = "HUMS";
tonyp@2717 4758
tonyp@2717 4759 assert(_hum_used_bytes == 0 && _hum_capacity_bytes == 0 &&
tonyp@2717 4760 _hum_prev_live_bytes == 0 && _hum_next_live_bytes == 0,
tonyp@2717 4761 "they should have been zeroed after the last time we used them");
tonyp@2717 4762 // Set up the _hum_* fields.
tonyp@2717 4763 _hum_capacity_bytes = capacity_bytes;
tonyp@2717 4764 _hum_used_bytes = used_bytes;
tonyp@2717 4765 _hum_prev_live_bytes = prev_live_bytes;
tonyp@2717 4766 _hum_next_live_bytes = next_live_bytes;
tonyp@2717 4767 get_hum_bytes(&used_bytes, &capacity_bytes,
tonyp@2717 4768 &prev_live_bytes, &next_live_bytes);
tonyp@2717 4769 end = bottom + HeapRegion::GrainWords;
tonyp@2717 4770 } else if (r->continuesHumongous()) {
tonyp@2717 4771 type = "HUMC";
tonyp@2717 4772 get_hum_bytes(&used_bytes, &capacity_bytes,
tonyp@2717 4773 &prev_live_bytes, &next_live_bytes);
tonyp@2717 4774 assert(end == bottom + HeapRegion::GrainWords, "invariant");
tonyp@2717 4775 } else {
tonyp@2717 4776 type = "OLD";
tonyp@2717 4777 }
tonyp@2717 4778
tonyp@2717 4779 _total_used_bytes += used_bytes;
tonyp@2717 4780 _total_capacity_bytes += capacity_bytes;
tonyp@2717 4781 _total_prev_live_bytes += prev_live_bytes;
tonyp@2717 4782 _total_next_live_bytes += next_live_bytes;
tschatzl@5122 4783 _total_remset_bytes += remset_bytes;
johnc@5548 4784 _total_strong_code_roots_bytes += strong_code_roots_bytes;
tonyp@2717 4785
tonyp@2717 4786 // Print a line for this particular region.
tonyp@2717 4787 _out->print_cr(G1PPRL_LINE_PREFIX
tonyp@2717 4788 G1PPRL_TYPE_FORMAT
tonyp@2717 4789 G1PPRL_ADDR_BASE_FORMAT
tonyp@2717 4790 G1PPRL_BYTE_FORMAT
tonyp@2717 4791 G1PPRL_BYTE_FORMAT
tonyp@2717 4792 G1PPRL_BYTE_FORMAT
tschatzl@5122 4793 G1PPRL_DOUBLE_FORMAT
johnc@5548 4794 G1PPRL_BYTE_FORMAT
tschatzl@5122 4795 G1PPRL_BYTE_FORMAT,
drchase@6680 4796 type, p2i(bottom), p2i(end),
johnc@5548 4797 used_bytes, prev_live_bytes, next_live_bytes, gc_eff,
johnc@5548 4798 remset_bytes, strong_code_roots_bytes);
tonyp@2717 4799
tonyp@2717 4800 return false;
tonyp@2717 4801 }
tonyp@2717 4802
tonyp@2717 4803 G1PrintRegionLivenessInfoClosure::~G1PrintRegionLivenessInfoClosure() {
tschatzl@5122 4804 // add static memory usages to remembered set sizes
tschatzl@5122 4805 _total_remset_bytes += HeapRegionRemSet::fl_mem_size() + HeapRegionRemSet::static_mem_size();
tonyp@2717 4806 // Print the footer of the output.
tonyp@2717 4807 _out->print_cr(G1PPRL_LINE_PREFIX);
tonyp@2717 4808 _out->print_cr(G1PPRL_LINE_PREFIX
tonyp@2717 4809 " SUMMARY"
tonyp@2717 4810 G1PPRL_SUM_MB_FORMAT("capacity")
tonyp@2717 4811 G1PPRL_SUM_MB_PERC_FORMAT("used")
tonyp@2717 4812 G1PPRL_SUM_MB_PERC_FORMAT("prev-live")
tschatzl@5122 4813 G1PPRL_SUM_MB_PERC_FORMAT("next-live")
johnc@5548 4814 G1PPRL_SUM_MB_FORMAT("remset")
johnc@5548 4815 G1PPRL_SUM_MB_FORMAT("code-roots"),
tonyp@2717 4816 bytes_to_mb(_total_capacity_bytes),
tonyp@2717 4817 bytes_to_mb(_total_used_bytes),
tonyp@2717 4818 perc(_total_used_bytes, _total_capacity_bytes),
tonyp@2717 4819 bytes_to_mb(_total_prev_live_bytes),
tonyp@2717 4820 perc(_total_prev_live_bytes, _total_capacity_bytes),
tonyp@2717 4821 bytes_to_mb(_total_next_live_bytes),
tschatzl@5122 4822 perc(_total_next_live_bytes, _total_capacity_bytes),
johnc@5548 4823 bytes_to_mb(_total_remset_bytes),
johnc@5548 4824 bytes_to_mb(_total_strong_code_roots_bytes));
tonyp@2717 4825 _out->cr();
tonyp@2717 4826 }

mercurial