src/share/vm/gc_implementation/shared/mutableNUMASpace.hpp

author:      jprovino
date:        Wed, 23 Jan 2013 13:02:39 -0500
changeset:   4542:db9981fd3124
parent:      3900:d2a62e0f25eb
child:       6198:55fb97c4c58d
permissions: -rw-r--r--

8005915: Unify SERIALGC and INCLUDE_ALTERNATE_GCS
Summary: Rename INCLUDE_ALTERNATE_GCS to INCLUDE_ALL_GCS and replace SERIALGC with INCLUDE_ALL_GCS.
Reviewed-by: coleenp, stefank

/*
 * Copyright (c) 2006, 2012, Oracle and/or its affiliates. All rights reserved.
 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
 *
 * This code is free software; you can redistribute it and/or modify it
 * under the terms of the GNU General Public License version 2 only, as
 * published by the Free Software Foundation.
 *
 * This code is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
 * version 2 for more details (a copy is included in the LICENSE file that
 * accompanied this code).
 *
 * You should have received a copy of the GNU General Public License version
 * 2 along with this work; if not, write to the Free Software Foundation,
 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
 *
 * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
 * or visit www.oracle.com if you need additional information or have any
 * questions.
 *
 */

#ifndef SHARE_VM_GC_IMPLEMENTATION_SHARED_MUTABLENUMASPACE_HPP
#define SHARE_VM_GC_IMPLEMENTATION_SHARED_MUTABLENUMASPACE_HPP

#include "utilities/macros.hpp"
#if INCLUDE_ALL_GCS
#include "gc_implementation/shared/gcUtil.hpp"
#include "gc_implementation/shared/mutableSpace.hpp"
#endif // INCLUDE_ALL_GCS

/*
 * The NUMA-aware allocator (MutableNUMASpace) is basically a modification
 * of MutableSpace which preserves interfaces but implements different
 * functionality. The space is split into chunks, one for each locality group
 * (resizing for adaptive size policy is also supported). For each thread,
 * allocations are performed in the chunk corresponding to the thread's home
 * locality group. Whenever any chunk fills up, a young generation collection
 * occurs.
 * The chunks can also be adaptively resized. The idea behind the adaptive
 * sizing is to reduce the loss of space in the eden due to fragmentation.
 * The main cause of fragmentation is uneven allocation rates across threads.
 * The allocation rate difference between locality groups may be caused either
 * by application specifics or by uneven LWP distribution by the OS. Moreover,
 * the application can have fewer threads than the number of locality groups.
 * In order to resize the chunks we measure the allocation rate of the
 * application between collections. After that we reshape the chunks to reflect
 * the allocation rate pattern. The AdaptiveWeightedAverage exponentially
 * decaying average is used to smooth the measurements. The NUMASpaceResizeRate
 * parameter controls the adaptation speed by restricting the number of
 * bytes that can be moved during the adaptation phase.
 * Chunks may contain pages from the wrong locality group. The page-scanner has
 * been introduced to address this problem. Remote pages typically appear due to
 * memory shortage in the target locality group. Moreover, Solaris may allocate
 * a large page from a remote locality group even if small local pages are
 * available. The page-scanner scans the pages right after the collection and
 * frees remote pages in the hope that subsequent reallocation will be more
 * successful. This approach proved to be useful on heavily loaded systems
 * where multiple processes compete for memory.
 */

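// A minimal sketch of the rate-proportional resizing idea described above.
// The names here are hypothetical; the real logic lives in
// adaptive_chunk_size() below, which additionally bounds the per-cycle
// change by NUMASpaceResizeRate and aligns chunk boundaries to page_size().
//
//   size_t sketch_chunk_size(size_t eden_bytes, int lgrp_count,
//                            float lgrp_rate, float total_rate) {
//     if (total_rate == 0.0f) {
//       return eden_bytes / lgrp_count;  // no samples yet: divide equally
//     }
//     // Give each locality group a share of the eden proportional to its
//     // smoothed allocation rate.
//     return (size_t)(eden_bytes * (lgrp_rate / total_rate));
//   }
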
class MutableNUMASpace : public MutableSpace {
  friend class VMStructs;

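  // One per-locality-group chunk of the space: a MutableSpace of its own
  // plus the bookkeeping (allocation rate, invalid pages, page statistics)
  // needed to resize and scan it.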
  class LGRPSpace : public CHeapObj<mtGC> {
    int _lgrp_id;
    MutableSpace* _space;
    MemRegion _invalid_region;
    AdaptiveWeightedAverage *_alloc_rate;
    bool _allocation_failed;

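    // Page placement statistics for this chunk, filled in by
    // accumulate_statistics(): bytes backed by local, remote, unbiased
    // (not yet bound to a group) and uncommitted pages, plus page counts
    // by size.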
    struct SpaceStats {
      size_t _local_space, _remote_space, _unbiased_space, _uncommited_space;
      size_t _large_pages, _small_pages;

      SpaceStats() {
        _local_space = 0;
        _remote_space = 0;
        _unbiased_space = 0;
        _uncommited_space = 0;
        _large_pages = 0;
        _small_pages = 0;
      }
    };

    SpaceStats _space_stats;

    char* _last_page_scanned;
    char* last_page_scanned() { return _last_page_scanned; }
    void set_last_page_scanned(char* p) { _last_page_scanned = p; }
   public:
    LGRPSpace(int l, size_t alignment) : _lgrp_id(l), _last_page_scanned(NULL), _allocation_failed(false) {
      _space = new MutableSpace(alignment);
      _alloc_rate = new AdaptiveWeightedAverage(NUMAChunkResizeWeight);
    }
    ~LGRPSpace() {
      delete _space;
      delete _alloc_rate;
    }

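    // Record that the pages in r may have wrong placement. Only a single
    // interval is kept per chunk, so the stored region is widened to the
    // smallest interval covering both the old region and r.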
    void add_invalid_region(MemRegion r) {
      if (!_invalid_region.is_empty()) {
        _invalid_region.set_start(MIN2(_invalid_region.start(), r.start()));
        _invalid_region.set_end(MAX2(_invalid_region.end(), r.end()));
      } else {
        _invalid_region = r;
      }
    }

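    // Matcher for GrowableArray::find(): lgrp_id_value points at the
    // locality group id being searched for.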
    static bool equals(void* lgrp_id_value, LGRPSpace* p) {
      return *(int*)lgrp_id_value == p->lgrp_id();
    }

    // Report a failed allocation.
    void set_allocation_failed() { _allocation_failed = true; }

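    // Feed the current interval's allocation into the decaying average.
    // AdaptiveWeightedAverage with weight w (NUMAChunkResizeWeight, a
    // percentage) updates roughly as
    //   avg' = (1 - w/100) * avg + (w/100) * sample,
    // so recent intervals dominate while older history decays geometrically.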
    void sample() {
      // If there was a failed allocation, make the allocation rate sample
      // equal to the size of the whole chunk. This ensures the progress of
      // the adaptation process.
      size_t alloc_rate_sample;
      if (_allocation_failed) {
        alloc_rate_sample = space()->capacity_in_bytes();
        _allocation_failed = false;
      } else {
        alloc_rate_sample = space()->used_in_bytes();
      }
      alloc_rate()->sample(alloc_rate_sample);
    }

    MemRegion invalid_region() const { return _invalid_region; }
    void set_invalid_region(MemRegion r) { _invalid_region = r; }
    int lgrp_id() const { return _lgrp_id; }
    MutableSpace* space() const { return _space; }
    AdaptiveWeightedAverage* alloc_rate() const { return _alloc_rate; }
    void clear_alloc_rate() { _alloc_rate->clear(); }
    SpaceStats* space_stats() { return &_space_stats; }
    void clear_space_stats() { _space_stats = SpaceStats(); }

    void accumulate_statistics(size_t page_size);
    void scan_pages(size_t page_size, size_t page_count);
  };

  GrowableArray<LGRPSpace*>* _lgrp_spaces;
  size_t _page_size;
  unsigned _adaptation_cycles, _samples_count;

  void set_page_size(size_t psz) { _page_size = psz; }
  size_t page_size() const { return _page_size; }

  unsigned adaptation_cycles() { return _adaptation_cycles; }
  void set_adaptation_cycles(int v) { _adaptation_cycles = v; }

  unsigned samples_count() { return _samples_count; }
  void increment_samples_count() { ++_samples_count; }

  size_t _base_space_size;
  void set_base_space_size(size_t v) { _base_space_size = v; }
  size_t base_space_size() const { return _base_space_size; }

  // Check if the NUMA topology has changed. Add and remove spaces if needed.
  // The update can be forced by setting the force parameter to true.
  bool update_layout(bool force);
  // Bias region towards the lgrp.
  void bias_region(MemRegion mr, int lgrp_id);
  // Free pages in a given region.
  void free_region(MemRegion mr);
  // Get the current chunk size.
  size_t current_chunk_size(int i);
  // Get the default chunk size (divides the space equally).
  size_t default_chunk_size();
  // Adapt the chunk size to follow the allocation rate.
  size_t adaptive_chunk_size(int i, size_t limit);
  // Scan and free invalid pages.
  void scan_pages(size_t page_count);
  // Return the bottom_region and the top_region, aligned to page_size() boundaries.
  // |------------------new_region---------------------------------|
  // |----bottom_region--|---intersection---|------top_region------|
  void select_tails(MemRegion new_region, MemRegion intersection,
                    MemRegion* bottom_region, MemRegion *top_region);
  // Try to merge the invalid region with the bottom or top region by decreasing
  // the intersection area. If the invalid region lies inside the intersection,
  // return it non-empty and aligned to the page_size() boundary.
  // |------------------new_region---------------------------------|
  // |----------------|-------invalid---|--------------------------|
  // |----bottom_region--|---intersection---|------top_region------|
  void merge_regions(MemRegion new_region, MemRegion* intersection,
                     MemRegion *invalid_region);

 public:
  GrowableArray<LGRPSpace*>* lgrp_spaces() const { return _lgrp_spaces; }
  MutableNUMASpace(size_t alignment);
  virtual ~MutableNUMASpace();
  // Space initialization.
  virtual void initialize(MemRegion mr, bool clear_space, bool mangle_space, bool setup_pages = SetupPages);
  // Update the space layout if necessary. Do all the adaptive resizing work.
  virtual void update();
  // Update allocation rate averages.
  virtual void accumulate_statistics();

  virtual void clear(bool mangle_space);
  virtual void mangle_unused_area() PRODUCT_RETURN;
  virtual void mangle_unused_area_complete() PRODUCT_RETURN;
  virtual void mangle_region(MemRegion mr) PRODUCT_RETURN;
  virtual void check_mangled_unused_area(HeapWord* limit) PRODUCT_RETURN;
  virtual void check_mangled_unused_area_complete() PRODUCT_RETURN;
  virtual void set_top_for_allocations(HeapWord* v) PRODUCT_RETURN;
  virtual void set_top_for_allocations() PRODUCT_RETURN;

  virtual void ensure_parsability();
  virtual size_t used_in_words() const;
  virtual size_t free_in_words() const;

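  // Per-thread variants: for a NUMA space the capacity a thread can use is
  // (at most) the chunk of its home locality group, not the whole space.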
  using MutableSpace::capacity_in_words;
  virtual size_t capacity_in_words(Thread* thr) const;
  virtual size_t tlab_capacity(Thread* thr) const;
  virtual size_t unsafe_max_tlab_alloc(Thread* thr) const;

  // Allocation (return NULL if full)
  virtual HeapWord* allocate(size_t word_size);
  virtual HeapWord* cas_allocate(size_t word_size);

  // Debugging
  virtual void print_on(outputStream* st) const;
  virtual void print_short_on(outputStream* st) const;
  virtual void verify();

  virtual void set_top(HeapWord* value);
};
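
// Note: the ParallelScavenge young generation creates its eden as a
// MutableNUMASpace instead of a plain MutableSpace when -XX:+UseNUMA is
// enabled (see the ParallelScavenge generation setup code).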

#endif // SHARE_VM_GC_IMPLEMENTATION_SHARED_MUTABLENUMASPACE_HPP
