Thu, 04 Oct 2012 10:04:13 -0700
8000311: G1: ParallelGCThreads==0 broken
Summary: Divide by zero error, if ParallelGCThreads is 0, when adjusting the PLAB size.
Reviewed-by: jmasa, jcoomes
duke@435 | 1 | /* |
katleman@3058 | 2 | * Copyright (c) 2007, 2011, Oracle and/or its affiliates. All rights reserved. |
duke@435 | 3 | * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. |
duke@435 | 4 | * |
duke@435 | 5 | * This code is free software; you can redistribute it and/or modify it |
duke@435 | 6 | * under the terms of the GNU General Public License version 2 only, as |
duke@435 | 7 | * published by the Free Software Foundation. |
duke@435 | 8 | * |
duke@435 | 9 | * This code is distributed in the hope that it will be useful, but WITHOUT |
duke@435 | 10 | * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or |
duke@435 | 11 | * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License |
duke@435 | 12 | * version 2 for more details (a copy is included in the LICENSE file that |
duke@435 | 13 | * accompanied this code). |
duke@435 | 14 | * |
duke@435 | 15 | * You should have received a copy of the GNU General Public License version |
duke@435 | 16 | * 2 along with this work; if not, write to the Free Software Foundation, |
duke@435 | 17 | * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA. |
duke@435 | 18 | * |
trims@1907 | 19 | * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA |
trims@1907 | 20 | * or visit www.oracle.com if you need additional information or have any |
trims@1907 | 21 | * questions. |
duke@435 | 22 | * |
duke@435 | 23 | */ |
duke@435 | 24 | |
stefank@2314 | 25 | #include "precompiled.hpp" |
stefank@2314 | 26 | #include "memory/allocation.inline.hpp" |
stefank@2314 | 27 | #include "memory/cardTableModRefBS.hpp" |
stefank@2314 | 28 | #include "memory/cardTableRS.hpp" |
stefank@2314 | 29 | #include "memory/sharedHeap.hpp" |
stefank@2314 | 30 | #include "memory/space.inline.hpp" |
stefank@2314 | 31 | #include "memory/universe.hpp" |
ysr@2889 | 32 | #include "oops/oop.inline.hpp" |
stefank@2314 | 33 | #include "runtime/java.hpp" |
stefank@2314 | 34 | #include "runtime/mutexLocker.hpp" |
stefank@2314 | 35 | #include "runtime/virtualspace.hpp" |
jmasa@3294 | 36 | #include "runtime/vmThread.hpp" |
duke@435 | 37 | |
ysr@2819 | 38 | void CardTableModRefBS::non_clean_card_iterate_parallel_work(Space* sp, MemRegion mr, |
ysr@2889 | 39 | OopsInGenClosure* cl, |
ysr@2889 | 40 | CardTableRS* ct, |
ysr@2819 | 41 | int n_threads) { |
ysr@2819 | 42 | assert(n_threads > 0, "Error: expected n_threads > 0"); |
ysr@2819 | 43 | assert((n_threads == 1 && ParallelGCThreads == 0) || |
ysr@2819 | 44 | n_threads <= (int)ParallelGCThreads, |
ysr@2819 | 45 | "# worker threads != # requested!"); |
jmasa@3294 | 46 | assert(!Thread::current()->is_VM_thread() || (n_threads == 1), "There is only 1 VM thread"); |
jmasa@3294 | 47 | assert(UseDynamicNumberOfGCThreads || |
jmasa@3294 | 48 | !FLAG_IS_DEFAULT(ParallelGCThreads) || |
jmasa@3294 | 49 | n_threads == (int)ParallelGCThreads, |
jmasa@3294 | 50 | "# worker threads != # requested!"); |
ysr@2819 | 51 | // Make sure the LNC array is valid for the space. |
ysr@2819 | 52 | jbyte** lowest_non_clean; |
ysr@2819 | 53 | uintptr_t lowest_non_clean_base_chunk_index; |
ysr@2819 | 54 | size_t lowest_non_clean_chunk_size; |
ysr@2819 | 55 | get_LNC_array_for_space(sp, lowest_non_clean, |
ysr@2819 | 56 | lowest_non_clean_base_chunk_index, |
ysr@2819 | 57 | lowest_non_clean_chunk_size); |
duke@435 | 58 | |
jmasa@3357 | 59 | uint n_strides = n_threads * ParGCStridesPerThread; |
ysr@2819 | 60 | SequentialSubTasksDone* pst = sp->par_seq_tasks(); |
jmasa@3294 | 61 | // Sets the condition for completion of the subtask (how many threads |
jmasa@3294 | 62 | // need to finish in order to be done). |
ysr@2819 | 63 | pst->set_n_threads(n_threads); |
ysr@2819 | 64 | pst->set_n_tasks(n_strides); |
duke@435 | 65 | |
jmasa@3357 | 66 | uint stride = 0; |
ysr@2819 | 67 | while (!pst->is_task_claimed(/* reference */ stride)) { |
ysr@2889 | 68 | process_stride(sp, mr, stride, n_strides, cl, ct, |
ysr@2819 | 69 | lowest_non_clean, |
ysr@2819 | 70 | lowest_non_clean_base_chunk_index, |
ysr@2819 | 71 | lowest_non_clean_chunk_size); |
ysr@2819 | 72 | } |
ysr@2819 | 73 | if (pst->all_tasks_completed()) { |
ysr@2819 | 74 | // Clear lowest_non_clean array for next time. |
ysr@2819 | 75 | intptr_t first_chunk_index = addr_to_chunk_index(mr.start()); |
ysr@2819 | 76 | uintptr_t last_chunk_index = addr_to_chunk_index(mr.last()); |
ysr@2819 | 77 | for (uintptr_t ch = first_chunk_index; ch <= last_chunk_index; ch++) { |
ysr@2819 | 78 | intptr_t ind = ch - lowest_non_clean_base_chunk_index; |
ysr@2819 | 79 | assert(0 <= ind && ind < (intptr_t)lowest_non_clean_chunk_size, |
ysr@2819 | 80 | "Bounds error"); |
ysr@2819 | 81 | lowest_non_clean[ind] = NULL; |
duke@435 | 82 | } |
duke@435 | 83 | } |
duke@435 | 84 | } |
duke@435 | 85 | |
duke@435 | 86 | void |
duke@435 | 87 | CardTableModRefBS:: |
duke@435 | 88 | process_stride(Space* sp, |
duke@435 | 89 | MemRegion used, |
duke@435 | 90 | jint stride, int n_strides, |
ysr@2889 | 91 | OopsInGenClosure* cl, |
ysr@2889 | 92 | CardTableRS* ct, |
duke@435 | 93 | jbyte** lowest_non_clean, |
duke@435 | 94 | uintptr_t lowest_non_clean_base_chunk_index, |
duke@435 | 95 | size_t lowest_non_clean_chunk_size) { |
ysr@2889 | 96 | // We go from higher to lower addresses here; it wouldn't help that much |
ysr@2889 | 97 | // because of the strided parallelism pattern used here. |
duke@435 | 98 | |
duke@435 | 99 | // Find the first card address of the first chunk in the stride that is |
duke@435 | 100 | // at least "bottom" of the used region. |
duke@435 | 101 | jbyte* start_card = byte_for(used.start()); |
duke@435 | 102 | jbyte* end_card = byte_after(used.last()); |
duke@435 | 103 | uintptr_t start_chunk = addr_to_chunk_index(used.start()); |
duke@435 | 104 | uintptr_t start_chunk_stride_num = start_chunk % n_strides; |
duke@435 | 105 | jbyte* chunk_card_start; |
duke@435 | 106 | |
duke@435 | 107 | if ((uintptr_t)stride >= start_chunk_stride_num) { |
duke@435 | 108 | chunk_card_start = (jbyte*)(start_card + |
duke@435 | 109 | (stride - start_chunk_stride_num) * |
ysr@2889 | 110 | ParGCCardsPerStrideChunk); |
duke@435 | 111 | } else { |
duke@435 | 112 | // Go ahead to the next chunk group boundary, then to the requested stride. |
duke@435 | 113 | chunk_card_start = (jbyte*)(start_card + |
duke@435 | 114 | (n_strides - start_chunk_stride_num + stride) * |
ysr@2889 | 115 | ParGCCardsPerStrideChunk); |
duke@435 | 116 | } |
duke@435 | 117 | |
duke@435 | 118 | while (chunk_card_start < end_card) { |
ysr@2889 | 119 | // Even though we go from lower to higher addresses below, the |
ysr@2889 | 120 | // strided parallelism can interleave the actual processing of the |
ysr@2889 | 121 | // dirty pages in various ways. For a specific chunk within this |
ysr@2889 | 122 | // stride, we take care to avoid double scanning or missing a card |
ysr@2889 | 123 | // by suitably initializing the "min_done" field in process_chunk_boundaries() |
ysr@2889 | 124 | // below, together with the dirty region extension accomplished in |
ysr@2889 | 125 | // DirtyCardToOopClosure::do_MemRegion(). |
ysr@2889 | 126 | jbyte* chunk_card_end = chunk_card_start + ParGCCardsPerStrideChunk; |
duke@435 | 127 | // Invariant: chunk_mr should be fully contained within the "used" region. |
duke@435 | 128 | MemRegion chunk_mr = MemRegion(addr_for(chunk_card_start), |
duke@435 | 129 | chunk_card_end >= end_card ? |
duke@435 | 130 | used.end() : addr_for(chunk_card_end)); |
duke@435 | 131 | assert(chunk_mr.word_size() > 0, "[chunk_card_start > used_end)"); |
duke@435 | 132 | assert(used.contains(chunk_mr), "chunk_mr should be subset of used"); |
duke@435 | 133 | |
ysr@2889 | 134 | DirtyCardToOopClosure* dcto_cl = sp->new_dcto_cl(cl, precision(), |
ysr@2889 | 135 | cl->gen_boundary()); |
ysr@2889 | 136 | ClearNoncleanCardWrapper clear_cl(dcto_cl, ct); |
ysr@2889 | 137 | |
ysr@2889 | 138 | |
duke@435 | 139 | // Process the chunk. |
duke@435 | 140 | process_chunk_boundaries(sp, |
duke@435 | 141 | dcto_cl, |
duke@435 | 142 | chunk_mr, |
duke@435 | 143 | used, |
duke@435 | 144 | lowest_non_clean, |
duke@435 | 145 | lowest_non_clean_base_chunk_index, |
duke@435 | 146 | lowest_non_clean_chunk_size); |
duke@435 | 147 | |
ysr@2889 | 148 | // We want the LNC array updates above in process_chunk_boundaries |
ysr@2889 | 149 | // to be visible before any of the card table value changes as a |
ysr@2889 | 150 | // result of the dirty card iteration below. |
ysr@2889 | 151 | OrderAccess::storestore(); |
ysr@2889 | 152 | |
ysr@2819 | 153 | // We do not call the non_clean_card_iterate_serial() version because |
ysr@2889 | 154 | // we want to clear the cards: clear_cl here does the work of finding |
ysr@2889 | 155 | // contiguous dirty ranges of cards to process and clear. |
ysr@2889 | 156 | clear_cl.do_MemRegion(chunk_mr); |
duke@435 | 157 | |
duke@435 | 158 | // Find the next chunk of the stride. |
ysr@2889 | 159 | chunk_card_start += ParGCCardsPerStrideChunk * n_strides; |
duke@435 | 160 | } |
duke@435 | 161 | } |
duke@435 | 162 | |
ysr@2889 | 163 | |
ysr@2889 | 164 | // If you want a talkative process_chunk_boundaries, |
ysr@2889 | 165 | // then #define NOISY(x) x |
ysr@2889 | 166 | #ifdef NOISY |
ysr@2889 | 167 | #error "Encountered a global preprocessor flag, NOISY, which might clash with local definition to follow" |
ysr@2889 | 168 | #else |
ysr@2889 | 169 | #define NOISY(x) |
ysr@2889 | 170 | #endif |
ysr@2889 | 171 | |
duke@435 | 172 | void |
duke@435 | 173 | CardTableModRefBS:: |
duke@435 | 174 | process_chunk_boundaries(Space* sp, |
duke@435 | 175 | DirtyCardToOopClosure* dcto_cl, |
duke@435 | 176 | MemRegion chunk_mr, |
duke@435 | 177 | MemRegion used, |
duke@435 | 178 | jbyte** lowest_non_clean, |
duke@435 | 179 | uintptr_t lowest_non_clean_base_chunk_index, |
duke@435 | 180 | size_t lowest_non_clean_chunk_size) |
duke@435 | 181 | { |
ysr@2889 | 182 | // We must worry about non-array objects that cross chunk boundaries, |
ysr@2889 | 183 | // because such objects are both precisely and imprecisely marked: |
ysr@2889 | 184 | // .. if the head of such an object is dirty, the entire object |
ysr@2889 | 185 | // needs to be scanned, under the interpretation that this |
ysr@2889 | 186 | // was an imprecise mark |
ysr@2889 | 187 | // .. if the head of such an object is not dirty, we can assume |
ysr@2889 | 188 | // precise marking and it's efficient to scan just the dirty |
ysr@2889 | 189 | // cards. |
ysr@2889 | 190 | // In either case, each scanned reference must be scanned precisely |
ysr@2889 | 191 | // once so as to avoid cloning of a young referent. For efficiency, |
ysr@2889 | 192 | // our closures depend on this property and do not protect against |
ysr@2889 | 193 | // double scans. |
duke@435 | 194 | |
duke@435 | 195 | uintptr_t cur_chunk_index = addr_to_chunk_index(chunk_mr.start()); |
duke@435 | 196 | cur_chunk_index = cur_chunk_index - lowest_non_clean_base_chunk_index; |
duke@435 | 197 | |
ysr@2889 | 198 | NOISY(tty->print_cr("===========================================================================");) |
ysr@2889 | 199 | NOISY(tty->print_cr(" process_chunk_boundary: Called with [" PTR_FORMAT "," PTR_FORMAT ")", |
ysr@2889 | 200 | chunk_mr.start(), chunk_mr.end());) |
ysr@2889 | 201 | |
ysr@2889 | 202 | // First, set "our" lowest_non_clean entry, which would be |
ysr@2889 | 203 | // used by the thread scanning an adjoining left chunk with |
ysr@2889 | 204 | // a non-array object straddling the mutual boundary. |
ysr@2889 | 205 | // Find the object that spans our boundary, if one exists. |
ysr@2889 | 206 | // first_block is the block possibly straddling our left boundary. |
ysr@2889 | 207 | HeapWord* first_block = sp->block_start(chunk_mr.start()); |
ysr@2889 | 208 | assert((chunk_mr.start() != used.start()) || (first_block == chunk_mr.start()), |
ysr@2889 | 209 | "First chunk should always have a co-initial block"); |
ysr@2889 | 210 | // Does the block straddle the chunk's left boundary, and is it |
ysr@2889 | 211 | // a non-array object? |
ysr@2889 | 212 | if (first_block < chunk_mr.start() // first block straddles left bdry |
ysr@2889 | 213 | && sp->block_is_obj(first_block) // first block is an object |
ysr@2889 | 214 | && !(oop(first_block)->is_objArray() // first block is not an array (arrays are precisely dirtied) |
ysr@2889 | 215 | || oop(first_block)->is_typeArray())) { |
ysr@2889 | 216 | // Find our least non-clean card, so that a left neighbour |
ysr@2889 | 217 | // does not scan an object straddling the mutual boundary |
ysr@2889 | 218 | // too far to the right, and attempt to scan a portion of |
ysr@2889 | 219 | // that object twice. |
ysr@2889 | 220 | jbyte* first_dirty_card = NULL; |
ysr@2889 | 221 | jbyte* last_card_of_first_obj = |
ysr@2889 | 222 | byte_for(first_block + sp->block_size(first_block) - 1); |
ysr@2889 | 223 | jbyte* first_card_of_cur_chunk = byte_for(chunk_mr.start()); |
ysr@2889 | 224 | jbyte* last_card_of_cur_chunk = byte_for(chunk_mr.last()); |
ysr@2889 | 225 | jbyte* last_card_to_check = |
ysr@2889 | 226 | (jbyte*) MIN2((intptr_t) last_card_of_cur_chunk, |
ysr@2889 | 227 | (intptr_t) last_card_of_first_obj); |
ysr@2889 | 228 | // Note that this does not need to go beyond our last card |
ysr@2889 | 229 | // if our first object completely straddles this chunk. |
ysr@2889 | 230 | for (jbyte* cur = first_card_of_cur_chunk; |
ysr@2889 | 231 | cur <= last_card_to_check; cur++) { |
ysr@2889 | 232 | jbyte val = *cur; |
ysr@2889 | 233 | if (card_will_be_scanned(val)) { |
ysr@2889 | 234 | first_dirty_card = cur; break; |
ysr@2889 | 235 | } else { |
ysr@2889 | 236 | assert(!card_may_have_been_dirty(val), "Error"); |
ysr@2889 | 237 | } |
ysr@2889 | 238 | } |
ysr@2889 | 239 | if (first_dirty_card != NULL) { |
ysr@2889 | 240 | NOISY(tty->print_cr(" LNC: Found a dirty card at " PTR_FORMAT " in current chunk", |
ysr@2889 | 241 | first_dirty_card);) |
ysr@2889 | 242 | assert(0 <= cur_chunk_index && cur_chunk_index < lowest_non_clean_chunk_size, |
ysr@2889 | 243 | "Bounds error."); |
ysr@2889 | 244 | assert(lowest_non_clean[cur_chunk_index] == NULL, |
ysr@2889 | 245 | "Write exactly once : value should be stable hereafter for this round"); |
ysr@2889 | 246 | lowest_non_clean[cur_chunk_index] = first_dirty_card; |
ysr@2889 | 247 | } NOISY(else { |
ysr@2889 | 248 | tty->print_cr(" LNC: Found no dirty card in current chunk; leaving LNC entry NULL"); |
ysr@2889 | 249 | // In the future, we could have this thread look for a non-NULL value to copy from its |
ysr@2889 | 250 | // right neighbour (up to the end of the first object). |
ysr@2889 | 251 | if (last_card_of_cur_chunk < last_card_of_first_obj) { |
ysr@2889 | 252 | tty->print_cr(" LNC: BEWARE!!! first obj straddles past right end of chunk:\n" |
ysr@2889 | 253 | " might be efficient to get value from right neighbour?"); |
ysr@2889 | 254 | } |
ysr@2889 | 255 | }) |
ysr@2889 | 256 | } else { |
ysr@2889 | 257 | // In this case we can help our neighbour by just asking them |
ysr@2889 | 258 | // to stop at our first card (even though it may not be dirty). |
ysr@2889 | 259 | NOISY(tty->print_cr(" LNC: first block is not a non-array object; setting LNC to first card of current chunk");) |
ysr@2889 | 260 | assert(lowest_non_clean[cur_chunk_index] == NULL, "Write once : value should be stable hereafter"); |
ysr@2889 | 261 | jbyte* first_card_of_cur_chunk = byte_for(chunk_mr.start()); |
ysr@2889 | 262 | lowest_non_clean[cur_chunk_index] = first_card_of_cur_chunk; |
ysr@2889 | 263 | } |
ysr@2889 | 264 | NOISY(tty->print_cr(" process_chunk_boundary: lowest_non_clean[" INTPTR_FORMAT "] = " PTR_FORMAT |
ysr@2889 | 265 | " which corresponds to the heap address " PTR_FORMAT, |
ysr@2889 | 266 | cur_chunk_index, lowest_non_clean[cur_chunk_index], |
ysr@2889 | 267 | (lowest_non_clean[cur_chunk_index] != NULL) |
ysr@2889 | 268 | ? addr_for(lowest_non_clean[cur_chunk_index]) |
ysr@2889 | 269 | : NULL);) |
ysr@2889 | 270 | NOISY(tty->print_cr("---------------------------------------------------------------------------");) |
ysr@2889 | 271 | |
ysr@2889 | 272 | // Next, set our own max_to_do, which will strictly/exclusively bound |
ysr@2889 | 273 | // the highest address that we will scan past the right end of our chunk. |
ysr@2889 | 274 | HeapWord* max_to_do = NULL; |
duke@435 | 275 | if (chunk_mr.end() < used.end()) { |
ysr@2889 | 276 | // This is not the last chunk in the used region. |
ysr@2889 | 277 | // What is our last block? We check the first block of |
ysr@2889 | 278 | // the next (right) chunk rather than strictly check our last block |
ysr@2889 | 279 | // because it's potentially more efficient to do so. |
ysr@2889 | 280 | HeapWord* const last_block = sp->block_start(chunk_mr.end()); |
duke@435 | 281 | assert(last_block <= chunk_mr.end(), "In case this property changes."); |
ysr@2889 | 282 | if ((last_block == chunk_mr.end()) // our last block does not straddle boundary |
ysr@2889 | 283 | || !sp->block_is_obj(last_block) // last_block isn't an object |
ysr@2889 | 284 | || oop(last_block)->is_objArray() // last_block is an array (precisely marked) |
ysr@2889 | 285 | || oop(last_block)->is_typeArray()) { |
duke@435 | 286 | max_to_do = chunk_mr.end(); |
ysr@2889 | 287 | NOISY(tty->print_cr(" process_chunk_boundary: Last block on this card is not a non-array object;\n" |
ysr@2889 | 288 | " max_to_do left at " PTR_FORMAT, max_to_do);) |
duke@435 | 289 | } else { |
ysr@2889 | 290 | assert(last_block < chunk_mr.end(), "Tautology"); |
ysr@2889 | 291 | // It is a non-array object that straddles the right boundary of this chunk. |
duke@435 | 292 | // last_obj_card is the card corresponding to the start of the last object |
duke@435 | 293 | // in the chunk. Note that the last object may not start in |
duke@435 | 294 | // the chunk. |
ysr@2889 | 295 | jbyte* const last_obj_card = byte_for(last_block); |
ysr@2889 | 296 | const jbyte val = *last_obj_card; |
ysr@2889 | 297 | if (!card_will_be_scanned(val)) { |
ysr@2889 | 298 | assert(!card_may_have_been_dirty(val), "Error"); |
ysr@2889 | 299 | // The card containing the head is not dirty. Any marks on |
duke@435 | 300 | // subsequent cards still in this chunk must have been made |
ysr@2889 | 301 | // precisely; we can cap processing at the end of our chunk. |
duke@435 | 302 | max_to_do = chunk_mr.end(); |
ysr@2889 | 303 | NOISY(tty->print_cr(" process_chunk_boundary: Head of last object on this card is not dirty;\n" |
ysr@2889 | 304 | " max_to_do left at " PTR_FORMAT, |
ysr@2889 | 305 | max_to_do);) |
duke@435 | 306 | } else { |
duke@435 | 307 | // The last object must be considered dirty, and extends onto the |
duke@435 | 308 | // following chunk. Look for a dirty card in that chunk that will |
duke@435 | 309 | // bound our processing. |
duke@435 | 310 | jbyte* limit_card = NULL; |
ysr@2889 | 311 | const size_t last_block_size = sp->block_size(last_block); |
ysr@2889 | 312 | jbyte* const last_card_of_last_obj = |
duke@435 | 313 | byte_for(last_block + last_block_size - 1); |
ysr@2889 | 314 | jbyte* const first_card_of_next_chunk = byte_for(chunk_mr.end()); |
duke@435 | 315 | // This search potentially goes a long distance looking |
ysr@2889 | 316 | // for the next card that will be scanned, terminating |
ysr@2889 | 317 | // at the end of the last_block, if no earlier dirty card |
ysr@2889 | 318 | // is found. |
ysr@2889 | 319 | assert(byte_for(chunk_mr.end()) - byte_for(chunk_mr.start()) == ParGCCardsPerStrideChunk, |
ysr@2889 | 320 | "last card of next chunk may be wrong"); |
duke@435 | 321 | for (jbyte* cur = first_card_of_next_chunk; |
ysr@2889 | 322 | cur <= last_card_of_last_obj; cur++) { |
ysr@2889 | 323 | const jbyte val = *cur; |
ysr@2889 | 324 | if (card_will_be_scanned(val)) { |
ysr@2889 | 325 | NOISY(tty->print_cr(" Found a non-clean card " PTR_FORMAT " with value 0x%x", |
ysr@2889 | 326 | cur, (int)val);) |
duke@435 | 327 | limit_card = cur; break; |
ysr@2889 | 328 | } else { |
ysr@2889 | 329 | assert(!card_may_have_been_dirty(val), "Error: card can't be skipped"); |
duke@435 | 330 | } |
duke@435 | 331 | } |
ysr@2889 | 332 | if (limit_card != NULL) { |
ysr@2889 | 333 | max_to_do = addr_for(limit_card); |
ysr@2889 | 334 | assert(limit_card != NULL && max_to_do != NULL, "Error"); |
ysr@2889 | 335 | NOISY(tty->print_cr(" process_chunk_boundary: Found a dirty card at " PTR_FORMAT |
ysr@2889 | 336 | " max_to_do set at " PTR_FORMAT " which is before end of last block in chunk: " |
ysr@2889 | 337 | PTR_FORMAT " + " PTR_FORMAT " = " PTR_FORMAT, |
ysr@2889 | 338 | limit_card, max_to_do, last_block, last_block_size, (last_block+last_block_size));) |
ysr@2889 | 339 | } else { |
ysr@2889 | 340 | // The following is a pessimistic value, because it's possible |
ysr@2889 | 341 | // that a dirty card on a subsequent chunk has been cleared by |
ysr@2889 | 342 | // the time we get to look at it; we'll correct for that further below, |
ysr@2889 | 343 | // using the LNC array which records the least non-clean card |
ysr@2889 | 344 | // before cards were cleared in a particular chunk. |
ysr@2889 | 345 | limit_card = last_card_of_last_obj; |
ysr@2889 | 346 | max_to_do = last_block + last_block_size; |
ysr@2889 | 347 | assert(limit_card != NULL && max_to_do != NULL, "Error"); |
ysr@2889 | 348 | NOISY(tty->print_cr(" process_chunk_boundary: Found no dirty card before end of last block in chunk\n" |
ysr@2889 | 349 | " Setting limit_card to " PTR_FORMAT |
ysr@2889 | 350 | " and max_to_do " PTR_FORMAT " + " PTR_FORMAT " = " PTR_FORMAT, |
ysr@2889 | 351 | limit_card, last_block, last_block_size, max_to_do);) |
ysr@2889 | 352 | } |
ysr@2889 | 353 | assert(0 < cur_chunk_index+1 && cur_chunk_index+1 < lowest_non_clean_chunk_size, |
duke@435 | 354 | "Bounds error."); |
ysr@2889 | 355 | // It is possible that a dirty card for the last object may have been |
ysr@2889 | 356 | // cleared before we had a chance to examine it. In that case, the value |
ysr@2889 | 357 | // will have been logged in the LNC for that chunk. |
ysr@2889 | 358 | // We need to examine as many chunks to the right as this object |
ysr@2959 | 359 | // covers. However, we need to bound this checking to the largest |
ysr@2959 | 360 | // entry in the LNC array: this is because the heap may expand |
ysr@2959 | 361 | // after the LNC array has been created but before we reach this point, |
ysr@2959 | 362 | // and the last block in our chunk may have been expanded to include |
ysr@2959 | 363 | // the expansion delta (and possibly subsequently allocated from, so |
ysr@2959 | 364 | // it wouldn't be sufficient to check whether that last block was |
ysr@2959 | 365 | // or was not an object at this point). |
ysr@2959 | 366 | uintptr_t last_chunk_index_to_check = addr_to_chunk_index(last_block + last_block_size - 1) |
ysr@2959 | 367 | - lowest_non_clean_base_chunk_index; |
ysr@2959 | 368 | const uintptr_t last_chunk_index = addr_to_chunk_index(used.last()) |
ysr@2959 | 369 | - lowest_non_clean_base_chunk_index; |
ysr@2959 | 370 | if (last_chunk_index_to_check > last_chunk_index) { |
ysr@2959 | 371 | assert(last_block + last_block_size > used.end(), |
ysr@2959 | 372 | err_msg("Inconsistency detected: last_block [" PTR_FORMAT "," PTR_FORMAT "]" |
ysr@2959 | 373 | " does not exceed used.end() = " PTR_FORMAT "," |
ysr@2959 | 374 | " yet last_chunk_index_to_check " INTPTR_FORMAT |
ysr@2959 | 375 | " exceeds last_chunk_index " INTPTR_FORMAT, |
ysr@2959 | 376 | last_chunk_index_to_check, last_chunk_index)); |
ysr@2959 | 377 | assert(sp->used_region().end() > used.end(), |
ysr@2959 | 378 | err_msg("Expansion did not happen: " |
ysr@2959 | 379 | "[" PTR_FORMAT "," PTR_FORMAT ") -> [" PTR_FORMAT "," PTR_FORMAT ")", |
ysr@2959 | 380 | sp->used_region().start(), sp->used_region().end(), used.start(), used.end())); |
ysr@2959 | 381 | NOISY(tty->print_cr(" process_chunk_boundary: heap expanded; explicitly bounding last_chunk");) |
ysr@2959 | 382 | last_chunk_index_to_check = last_chunk_index; |
ysr@2959 | 383 | } |
ysr@2889 | 384 | for (uintptr_t lnc_index = cur_chunk_index + 1; |
ysr@2889 | 385 | lnc_index <= last_chunk_index_to_check; |
ysr@2889 | 386 | lnc_index++) { |
ysr@2889 | 387 | jbyte* lnc_card = lowest_non_clean[lnc_index]; |
ysr@2889 | 388 | if (lnc_card != NULL) { |
ysr@2889 | 389 | // we can stop at the first non-NULL entry we find |
ysr@2889 | 390 | if (lnc_card <= limit_card) { |
ysr@2889 | 391 | NOISY(tty->print_cr(" process_chunk_boundary: LNC card " PTR_FORMAT " is lower than limit_card " PTR_FORMAT, |
ysr@2889 | 392 | " max_to_do will be lowered to " PTR_FORMAT " from " PTR_FORMAT, |
ysr@2889 | 393 | lnc_card, limit_card, addr_for(lnc_card), max_to_do);) |
ysr@2889 | 394 | limit_card = lnc_card; |
ysr@2889 | 395 | max_to_do = addr_for(limit_card); |
ysr@2889 | 396 | assert(limit_card != NULL && max_to_do != NULL, "Error"); |
ysr@2889 | 397 | } |
ysr@2889 | 398 | // In any case, we break now |
ysr@2889 | 399 | break; |
ysr@2889 | 400 | } // else continue to look for a non-NULL entry if any |
duke@435 | 401 | } |
ysr@2889 | 402 | assert(limit_card != NULL && max_to_do != NULL, "Error"); |
duke@435 | 403 | } |
ysr@2889 | 404 | assert(max_to_do != NULL, "OOPS 1 !"); |
duke@435 | 405 | } |
ysr@2889 | 406 | assert(max_to_do != NULL, "OOPS 2!"); |
duke@435 | 407 | } else { |
duke@435 | 408 | max_to_do = used.end(); |
ysr@2889 | 409 | NOISY(tty->print_cr(" process_chunk_boundary: Last chunk of this space;\n" |
ysr@2889 | 410 | " max_to_do left at " PTR_FORMAT, |
ysr@2889 | 411 | max_to_do);) |
duke@435 | 412 | } |
ysr@2889 | 413 | assert(max_to_do != NULL, "OOPS 3!"); |
duke@435 | 414 | // Now we can set the closure we're using so it doesn't to beyond |
duke@435 | 415 | // max_to_do. |
duke@435 | 416 | dcto_cl->set_min_done(max_to_do); |
duke@435 | 417 | #ifndef PRODUCT |
duke@435 | 418 | dcto_cl->set_last_bottom(max_to_do); |
duke@435 | 419 | #endif |
ysr@2889 | 420 | NOISY(tty->print_cr("===========================================================================\n");) |
ysr@2889 | 421 | } |
duke@435 | 422 | |
ysr@2889 | 423 | #undef NOISY |
duke@435 | 424 | |
duke@435 | 425 | void |
duke@435 | 426 | CardTableModRefBS:: |
duke@435 | 427 | get_LNC_array_for_space(Space* sp, |
duke@435 | 428 | jbyte**& lowest_non_clean, |
duke@435 | 429 | uintptr_t& lowest_non_clean_base_chunk_index, |
duke@435 | 430 | size_t& lowest_non_clean_chunk_size) { |
duke@435 | 431 | |
duke@435 | 432 | int i = find_covering_region_containing(sp->bottom()); |
duke@435 | 433 | MemRegion covered = _covered[i]; |
duke@435 | 434 | size_t n_chunks = chunks_to_cover(covered); |
duke@435 | 435 | |
duke@435 | 436 | // Only the first thread to obtain the lock will resize the |
duke@435 | 437 | // LNC array for the covered region. Any later expansion can't affect |
duke@435 | 438 | // the used_at_save_marks region. |
duke@435 | 439 | // (I observed a bug in which the first thread to execute this would |
ysr@2889 | 440 | // resize, and then it would cause "expand_and_allocate" that would |
ysr@2889 | 441 | // increase the number of chunks in the covered region. Then a second |
duke@435 | 442 | // thread would come and execute this, see that the size didn't match, |
duke@435 | 443 | // and free and allocate again. So the first thread would be using a |
duke@435 | 444 | // freed "_lowest_non_clean" array.) |
duke@435 | 445 | |
duke@435 | 446 | // Do a dirty read here. If we pass the conditional then take the rare |
duke@435 | 447 | // event lock and do the read again in case some other thread had already |
duke@435 | 448 | // succeeded and done the resize. |
duke@435 | 449 | int cur_collection = Universe::heap()->total_collections(); |
duke@435 | 450 | if (_last_LNC_resizing_collection[i] != cur_collection) { |
duke@435 | 451 | MutexLocker x(ParGCRareEvent_lock); |
duke@435 | 452 | if (_last_LNC_resizing_collection[i] != cur_collection) { |
duke@435 | 453 | if (_lowest_non_clean[i] == NULL || |
duke@435 | 454 | n_chunks != _lowest_non_clean_chunk_size[i]) { |
duke@435 | 455 | |
duke@435 | 456 | // Should we delete the old? |
duke@435 | 457 | if (_lowest_non_clean[i] != NULL) { |
duke@435 | 458 | assert(n_chunks != _lowest_non_clean_chunk_size[i], |
duke@435 | 459 | "logical consequence"); |
zgu@3900 | 460 | FREE_C_HEAP_ARRAY(CardPtr, _lowest_non_clean[i], mtGC); |
duke@435 | 461 | _lowest_non_clean[i] = NULL; |
duke@435 | 462 | } |
duke@435 | 463 | // Now allocate a new one if necessary. |
duke@435 | 464 | if (_lowest_non_clean[i] == NULL) { |
zgu@3900 | 465 | _lowest_non_clean[i] = NEW_C_HEAP_ARRAY(CardPtr, n_chunks, mtGC); |
duke@435 | 466 | _lowest_non_clean_chunk_size[i] = n_chunks; |
duke@435 | 467 | _lowest_non_clean_base_chunk_index[i] = addr_to_chunk_index(covered.start()); |
duke@435 | 468 | for (int j = 0; j < (int)n_chunks; j++) |
duke@435 | 469 | _lowest_non_clean[i][j] = NULL; |
duke@435 | 470 | } |
duke@435 | 471 | } |
duke@435 | 472 | _last_LNC_resizing_collection[i] = cur_collection; |
duke@435 | 473 | } |
duke@435 | 474 | } |
duke@435 | 475 | // In any case, now do the initialization. |
duke@435 | 476 | lowest_non_clean = _lowest_non_clean[i]; |
duke@435 | 477 | lowest_non_clean_base_chunk_index = _lowest_non_clean_base_chunk_index[i]; |
duke@435 | 478 | lowest_non_clean_chunk_size = _lowest_non_clean_chunk_size[i]; |
duke@435 | 479 | } |