Tue, 28 Jun 2016 15:59:50 +0800
Added support for the PrintBiasedLockingStatistics flag.
For example,
the output of -XX:+PrintBiasedLockingStatistics looks like:
# total entries: 0
# biased lock entries: 7620231
# anonymously biased lock entries: 1258240
# rebiased lock entries: 11652
# revoked lock entries: 2
# fast path lock entries: 14836092
# slow path lock entries: 109781
aoqi@1 | 1 | /* |
aoqi@1 | 2 | * Copyright (c) 1999, 2013, Oracle and/or its affiliates. All rights reserved. |
aoqi@1 | 3 | * Copyright (c) 2015, 2016, Loongson Technology. All rights reserved. |
aoqi@1 | 4 | * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. |
aoqi@1 | 5 | * |
aoqi@1 | 6 | * This code is free software; you can redistribute it and/or modify it |
aoqi@1 | 7 | * under the terms of the GNU General Public License version 2 only, as |
aoqi@1 | 8 | * published by the Free Software Foundation. |
aoqi@1 | 9 | * |
aoqi@1 | 10 | * This code is distributed in the hope that it will be useful, but WITHOUT |
aoqi@1 | 11 | * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or |
aoqi@1 | 12 | * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License |
aoqi@1 | 13 | * version 2 for more details (a copy is included in the LICENSE file that |
aoqi@1 | 14 | * accompanied this code). |
aoqi@1 | 15 | * |
aoqi@1 | 16 | * You should have received a copy of the GNU General Public License version |
aoqi@1 | 17 | * 2 along with this work; if not, write to the Free Software Foundation, |
aoqi@1 | 18 | * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA. |
aoqi@1 | 19 | * |
aoqi@1 | 20 | * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA |
aoqi@1 | 21 | * or visit www.oracle.com if you need additional information or have any |
aoqi@1 | 22 | * questions. |
aoqi@1 | 23 | * |
aoqi@1 | 24 | */ |
aoqi@1 | 25 | |
aoqi@1 | 26 | #include "precompiled.hpp" |
aoqi@1 | 27 | #include "c1/c1_MacroAssembler.hpp" |
aoqi@1 | 28 | #include "c1/c1_Runtime1.hpp" |
aoqi@1 | 29 | #include "classfile/systemDictionary.hpp" |
aoqi@1 | 30 | #include "gc_interface/collectedHeap.hpp" |
aoqi@1 | 31 | #include "interpreter/interpreter.hpp" |
aoqi@1 | 32 | #include "oops/arrayOop.hpp" |
aoqi@1 | 33 | #include "oops/markOop.hpp" |
aoqi@1 | 34 | #include "runtime/basicLock.hpp" |
aoqi@1 | 35 | #include "runtime/biasedLocking.hpp" |
aoqi@1 | 36 | #include "runtime/os.hpp" |
aoqi@1 | 37 | #include "runtime/stubRoutines.hpp" |
aoqi@1 | 38 | |
aoqi@1 | 39 | int C1_MacroAssembler::lock_object(Register hdr, Register obj, Register disp_hdr,Register scratch, Label& slow_case) { |
aoqi@1 | 40 | const int aligned_mask = BytesPerWord -1; |
aoqi@1 | 41 | const int hdr_offset = oopDesc::mark_offset_in_bytes(); |
aoqi@1 | 42 | |
aoqi@1 | 43 | // hdr is just a temperary register, it cannot be AT, however |
aoqi@1 | 44 | if ( hdr == NOREG ) { |
aoqi@1 | 45 | hdr = T8; |
aoqi@1 | 46 | } |
aoqi@1 | 47 | |
aoqi@1 | 48 | assert_different_registers(hdr, obj, disp_hdr); |
aoqi@1 | 49 | Label done; |
aoqi@1 | 50 | // The following move must be the first instruction of emitted since debug |
aoqi@1 | 51 | // information may be generated for it. |
aoqi@1 | 52 | // Load object header |
aoqi@1 | 53 | int null_check_offset = -1; |
aoqi@1 | 54 | verify_oop(obj); |
aoqi@1 | 55 | |
aoqi@1 | 56 | // save object being locked into the BasicObjectLock |
aoqi@1 | 57 | st_ptr(obj, disp_hdr, BasicObjectLock::obj_offset_in_bytes()); |
aoqi@1 | 58 | if (UseBiasedLocking) { |
aoqi@1 | 59 | assert(scratch != noreg, "should have scratch register at this point"); |
aoqi@1 | 60 | null_check_offset = biased_locking_enter(disp_hdr, obj, hdr, scratch, false, |
aoqi@1 | 61 | done, &slow_case); |
aoqi@1 | 62 | } else { |
aoqi@1 | 63 | null_check_offset = offset(); |
aoqi@1 | 64 | } |
aoqi@1 | 65 | |
aoqi@1 | 66 | // Load object header |
aoqi@1 | 67 | ld_ptr(hdr, obj, hdr_offset); |
aoqi@1 | 68 | // and mark it as unlocked |
aoqi@1 | 69 | ori(hdr, hdr, markOopDesc::unlocked_value); |
aoqi@1 | 70 | // save unlocked object header into the displaced header location on the stack |
aoqi@1 | 71 | sd(hdr, disp_hdr, 0); |
aoqi@1 | 72 | |
aoqi@1 | 73 | // test if object header is still the same (i.e. unlocked), and if so, store the |
aoqi@1 | 74 | // displaced header address in the object header - if it is not the same, get the |
aoqi@1 | 75 | // object header instead |
aoqi@1 | 76 | //if (os::is_MP()) MacroAssembler::lock(); // must be immediately before cmpxchg! |
aoqi@1 | 77 | cmpxchg(disp_hdr, Address(obj, hdr_offset), hdr); |
aoqi@1 | 78 | // if the object header was the same, we're done |
aoqi@1 | 79 | if (PrintBiasedLockingStatistics) { |
aoqi@29 | 80 | Label L; |
aoqi@29 | 81 | beq(AT, R0, L); |
aoqi@29 | 82 | delayed()->nop(); |
aoqi@29 | 83 | push(T0); |
aoqi@29 | 84 | push(T1); |
aoqi@29 | 85 | li(T0, (address) BiasedLocking::fast_path_entry_count_addr()); |
aoqi@29 | 86 | lw(T1, T0, 0); |
aoqi@29 | 87 | addi(T1, T1, 1); |
aoqi@29 | 88 | sw(T1, T0, 0); |
aoqi@29 | 89 | pop(T1); |
aoqi@29 | 90 | pop(T0); |
aoqi@29 | 91 | bind(L); |
aoqi@1 | 92 | } |
aoqi@1 | 93 | |
aoqi@1 | 94 | |
aoqi@1 | 95 | bne(AT, R0, done); |
aoqi@1 | 96 | delayed()->nop(); |
aoqi@1 | 97 | // if the object header was not the same, it is now in the hdr register |
aoqi@1 | 98 | // => test if it is a stack pointer into the same stack (recursive locking), i.e.: |
aoqi@1 | 99 | // |
aoqi@1 | 100 | // 1) (hdr & aligned_mask) == 0 |
aoqi@1 | 101 | // 2) SP <= hdr |
aoqi@1 | 102 | // 3) hdr <= SP + page_size |
aoqi@1 | 103 | // |
aoqi@1 | 104 | // these 3 tests can be done by evaluating the following expression: |
aoqi@1 | 105 | // |
aoqi@1 | 106 | // (hdr - SP) & (aligned_mask - page_size) |
aoqi@1 | 107 | // |
aoqi@1 | 108 | // assuming both the stack pointer and page_size have their least |
aoqi@1 | 109 | // significant 2 bits cleared and page_size is a power of 2 |
aoqi@1 | 110 | sub(hdr, hdr, SP); |
aoqi@1 | 111 | move(AT, aligned_mask - os::vm_page_size()); |
aoqi@1 | 112 | andr(hdr, hdr, AT); |
aoqi@1 | 113 | // for recursive locking, the result is zero => save it in the displaced header |
aoqi@1 | 114 | // location (NULL in the displaced hdr location indicates recursive locking) |
aoqi@1 | 115 | st_ptr(hdr, disp_hdr, 0); |
aoqi@1 | 116 | // otherwise we don't care about the result and handle locking via runtime call |
aoqi@1 | 117 | bne_far(hdr, R0, slow_case); |
aoqi@1 | 118 | delayed()->nop(); |
aoqi@1 | 119 | // done |
aoqi@1 | 120 | bind(done); |
aoqi@1 | 121 | return null_check_offset; |
aoqi@1 | 122 | } |
aoqi@1 | 123 | |
aoqi@1 | 124 | |
aoqi@1 | 125 | void C1_MacroAssembler::unlock_object(Register hdr, Register obj, Register disp_hdr, Label& slow_case) { |
aoqi@1 | 126 | const int aligned_mask = BytesPerWord -1; |
aoqi@1 | 127 | const int hdr_offset = oopDesc::mark_offset_in_bytes(); |
aoqi@1 | 128 | |
aoqi@1 | 129 | // hdr is just a temparay register, however, it cannot be AT |
aoqi@1 | 130 | if ( hdr == NOREG ) { |
aoqi@1 | 131 | hdr = T8; |
aoqi@1 | 132 | } |
aoqi@1 | 133 | |
aoqi@1 | 134 | assert_different_registers(hdr, obj, disp_hdr); |
aoqi@1 | 135 | assert(BytesPerWord == 8, "adjust aligned_mask and code"); |
aoqi@1 | 136 | Label done; |
aoqi@1 | 137 | if (UseBiasedLocking) { |
aoqi@1 | 138 | // load object |
aoqi@1 | 139 | ld_ptr(obj, Address(disp_hdr, BasicObjectLock::obj_offset_in_bytes())); |
aoqi@1 | 140 | biased_locking_exit(obj, hdr, done); |
aoqi@1 | 141 | } |
aoqi@1 | 142 | |
aoqi@1 | 143 | |
aoqi@1 | 144 | |
aoqi@1 | 145 | // load displaced header |
aoqi@1 | 146 | ld_ptr(hdr, disp_hdr, 0); |
aoqi@1 | 147 | // if the loaded hdr is NULL we had recursive locking |
aoqi@1 | 148 | // if we had recursive locking, we are done |
aoqi@1 | 149 | beq(hdr, R0, done); |
aoqi@1 | 150 | delayed()->nop(); |
aoqi@1 | 151 | // load object |
aoqi@1 | 152 | if(!UseBiasedLocking){ |
aoqi@1 | 153 | ld_ptr(obj, disp_hdr, BasicObjectLock::obj_offset_in_bytes()); |
aoqi@1 | 154 | } |
aoqi@1 | 155 | |
aoqi@1 | 156 | verify_oop(obj); |
aoqi@1 | 157 | // test if object header is pointing to the displaced header, and if so, restore |
aoqi@1 | 158 | // the displaced header in the object - if the object header is not pointing to |
aoqi@1 | 159 | // the displaced header, get the object header instead |
aoqi@1 | 160 | //if (os::is_MP()) MacroAssembler::lock(); // must be immediately before cmpxchg! |
aoqi@1 | 161 | cmpxchg(hdr, Address(obj, hdr_offset), disp_hdr); |
aoqi@1 | 162 | // if the object header was not pointing to the displaced header, |
aoqi@1 | 163 | // we do unlocking via runtime call |
aoqi@1 | 164 | beq_far(AT, R0, slow_case); |
aoqi@1 | 165 | delayed()->nop(); |
aoqi@1 | 166 | // done |
aoqi@1 | 167 | bind(done); |
aoqi@1 | 168 | } |
aoqi@1 | 169 | |
aoqi@1 | 170 | |
aoqi@1 | 171 | |
aoqi@1 | 172 | // Defines obj, preserves var_size_in_bytes |
aoqi@1 | 173 | void C1_MacroAssembler::try_allocate(Register obj, Register var_size_in_bytes, int con_size_in_bytes, Register t1, Register t2, Label& slow_case) { |
aoqi@1 | 174 | if (UseTLAB) { |
aoqi@1 | 175 | tlab_allocate(obj, var_size_in_bytes, con_size_in_bytes, t1, t2, slow_case); |
aoqi@1 | 176 | } else { |
aoqi@1 | 177 | eden_allocate(obj, var_size_in_bytes, con_size_in_bytes, t1, t2, slow_case); |
aoqi@1 | 178 | } |
aoqi@1 | 179 | } |
aoqi@1 | 180 | |
aoqi@1 | 181 | void C1_MacroAssembler::initialize_header(Register obj, Register klass, Register len, Register t1 , Register t2) { |
aoqi@1 | 182 | assert_different_registers(obj, klass, len, AT); |
aoqi@1 | 183 | |
aoqi@1 | 184 | if (UseBiasedLocking && !len->is_valid()) { |
aoqi@1 | 185 | assert_different_registers(obj, klass, len, t1, t2); |
aoqi@1 | 186 | ld_ptr(t1, klass, in_bytes(Klass::prototype_header_offset())); |
aoqi@1 | 187 | st_ptr(t1, obj, oopDesc::mark_offset_in_bytes()); |
aoqi@1 | 188 | } else { |
aoqi@1 | 189 | li(AT, (intptr_t)markOopDesc::prototype()); |
aoqi@1 | 190 | st_ptr(AT, obj, oopDesc::mark_offset_in_bytes()); |
aoqi@1 | 191 | } |
aoqi@1 | 192 | //st_ptr(klass, obj, oopDesc::klass_offset_in_bytes()); |
aoqi@1 | 193 | #ifdef _LP64 |
aoqi@1 | 194 | if (UseCompressedOops) { |
aoqi@1 | 195 | move(AT, klass); |
aoqi@1 | 196 | store_klass(obj, AT); |
aoqi@1 | 197 | } else |
aoqi@1 | 198 | #endif |
aoqi@1 | 199 | { |
aoqi@1 | 200 | st_ptr(klass, obj, oopDesc::klass_offset_in_bytes()); |
aoqi@1 | 201 | } |
aoqi@1 | 202 | |
aoqi@1 | 203 | if (len->is_valid()) { |
aoqi@1 | 204 | sw(len, obj, arrayOopDesc::length_offset_in_bytes()); |
aoqi@1 | 205 | } |
aoqi@1 | 206 | #ifdef _LP64 |
aoqi@1 | 207 | else if (UseCompressedOops) { |
aoqi@1 | 208 | store_klass_gap(obj, R0); |
aoqi@1 | 209 | } |
aoqi@1 | 210 | |
aoqi@1 | 211 | #endif |
aoqi@1 | 212 | } |
aoqi@1 | 213 | |
aoqi@1 | 214 | // preserves obj, destroys len_in_bytes |
aoqi@1 | 215 | void C1_MacroAssembler::initialize_body(Register obj, Register len_in_bytes, int hdr_size_in_bytes, Register t1) { |
aoqi@1 | 216 | Label done; |
aoqi@1 | 217 | Register ptr = t1; |
aoqi@1 | 218 | assert_different_registers(obj, ptr, len_in_bytes); |
aoqi@1 | 219 | assert((hdr_size_in_bytes & (BytesPerWord - 1)) == 0, |
aoqi@1 | 220 | "header size is not a multiple of BytesPerWord"); |
aoqi@1 | 221 | Register index = len_in_bytes; |
aoqi@1 | 222 | |
aoqi@1 | 223 | //tty->print_cr("C1_MacroAssembler::initialize_body LEN=0x%x, hdr_size=0x%x", len_in_bytes, hdr_size_in_bytes); |
aoqi@1 | 224 | assert(is_simm16(hdr_size_in_bytes), "change this code"); |
aoqi@1 | 225 | addi(index, index, - hdr_size_in_bytes); |
aoqi@1 | 226 | beq(index, R0, done); |
aoqi@1 | 227 | delayed(); |
aoqi@1 | 228 | |
aoqi@1 | 229 | // initialize topmost word, divide index by 2, check if odd and test if zero |
aoqi@1 | 230 | // note: for the remaining code to work, index must be a multiple of BytesPerWord |
aoqi@1 | 231 | #ifdef ASSERT |
aoqi@1 | 232 | { |
aoqi@1 | 233 | Label L; |
aoqi@1 | 234 | andi(AT, index, BytesPerWord - 1); |
aoqi@1 | 235 | beq(AT, R0, L); |
aoqi@1 | 236 | delayed()->nop(); |
aoqi@1 | 237 | stop("index is not a multiple of BytesPerWord"); |
aoqi@1 | 238 | bind(L); |
aoqi@1 | 239 | } |
aoqi@1 | 240 | #endif |
aoqi@1 | 241 | // index could have been not a multiple of 8 (i.e., bit 2 was set) |
aoqi@1 | 242 | { |
aoqi@1 | 243 | Label even; |
aoqi@1 | 244 | // note: if index was a multiple of 8, than it cannot |
aoqi@1 | 245 | // be 0 now otherwise it must have been 0 before |
aoqi@1 | 246 | // => if it is even, we don't need to check for 0 again |
aoqi@1 | 247 | #ifdef _LP64 |
aoqi@1 | 248 | andi(AT, index, 8); |
aoqi@1 | 249 | shr(index, 4); |
aoqi@1 | 250 | shl(index, 4); |
aoqi@1 | 251 | #else |
aoqi@1 | 252 | andi(AT, index, 4); |
aoqi@1 | 253 | shr(index, 3); |
aoqi@1 | 254 | shl(index, 3); |
aoqi@1 | 255 | #endif |
aoqi@1 | 256 | beq(AT, R0, even); |
aoqi@1 | 257 | delayed()->add(ptr, obj, index); |
aoqi@1 | 258 | // clear topmost word (no jump needed if conditional assignment would work here) |
aoqi@1 | 259 | st_ptr(R0, ptr, hdr_size_in_bytes); |
aoqi@1 | 260 | // index could be 0 now, need to check again |
aoqi@1 | 261 | beq(index, R0, done); |
aoqi@1 | 262 | delayed()->nop(); |
aoqi@1 | 263 | bind(even); |
aoqi@1 | 264 | } |
aoqi@1 | 265 | // initialize remaining object fields: edx is a multiple of 2 now |
aoqi@1 | 266 | { |
aoqi@1 | 267 | Label loop; |
aoqi@1 | 268 | bind(loop); |
aoqi@1 | 269 | st_ptr(R0, ptr, hdr_size_in_bytes - 1*BytesPerWord); |
aoqi@1 | 270 | st_ptr(R0, ptr, hdr_size_in_bytes - 2*BytesPerWord); |
aoqi@1 | 271 | |
aoqi@1 | 272 | addi(index, index, - 2 * wordSize); |
aoqi@1 | 273 | bne(index, R0, loop); |
aoqi@1 | 274 | delayed()->addi(ptr, ptr, - 2 * wordSize); |
aoqi@1 | 275 | } |
aoqi@1 | 276 | |
aoqi@1 | 277 | // done |
aoqi@1 | 278 | bind(done); |
aoqi@1 | 279 | } |
aoqi@1 | 280 | |
aoqi@1 | 281 | void C1_MacroAssembler::allocate_object(Register obj, Register t1, Register t2, int header_size, int object_size, Register klass, Label& slow_case) { |
aoqi@1 | 282 | //assert(obj == rax, "obj must be in rax, for cmpxchg"); |
aoqi@1 | 283 | assert(obj != t1 && obj != t2 && t1 != t2, "registers must be different"); // XXX really? |
aoqi@1 | 284 | assert(header_size >= 0 && object_size >= header_size, "illegal sizes"); |
aoqi@1 | 285 | |
aoqi@1 | 286 | try_allocate(obj, noreg, object_size * BytesPerWord, t1, t2, slow_case); |
aoqi@1 | 287 | |
aoqi@1 | 288 | initialize_object(obj, klass, noreg, object_size * HeapWordSize, t1, t2); |
aoqi@1 | 289 | } |
aoqi@1 | 290 | |
aoqi@1 | 291 | void C1_MacroAssembler::initialize_object(Register obj, Register klass, Register var_size_in_bytes, int con_size_in_bytes, Register t1, Register t2) { |
aoqi@1 | 292 | assert((con_size_in_bytes & MinObjAlignmentInBytesMask) == 0, |
aoqi@1 | 293 | "con_size_in_bytes is not multiple of alignment"); |
aoqi@1 | 294 | //Merged from b25 |
aoqi@1 | 295 | const int hdr_size_in_bytes = instanceOopDesc::header_size() * HeapWordSize; |
aoqi@1 | 296 | |
aoqi@1 | 297 | // initialize_header(obj, klass, NOREG); |
aoqi@1 | 298 | initialize_header(obj, klass, NOREG,t1,t2); |
aoqi@1 | 299 | |
aoqi@1 | 300 | // clear rest of allocated space |
aoqi@1 | 301 | const Register index = t2; |
aoqi@1 | 302 | //FIXME, x86 changed the value in jdk6 |
aoqi@1 | 303 | // const int threshold = hdr_size_in_bytes + 36; |
aoqi@1 | 304 | // // approximate break even point for code size (see comments below) |
aoqi@1 | 305 | const int threshold = 6 * BytesPerWord; |
aoqi@1 | 306 | // approximate break even point for code size (see comments below) |
aoqi@1 | 307 | if (var_size_in_bytes != NOREG) { |
aoqi@1 | 308 | move(index, var_size_in_bytes); |
aoqi@1 | 309 | initialize_body(obj, index, hdr_size_in_bytes, t1); |
aoqi@1 | 310 | } else if (con_size_in_bytes <= threshold) { |
aoqi@1 | 311 | // use explicit null stores |
aoqi@1 | 312 | // code size = 4*n bytes (n = number of fields to clear) |
aoqi@1 | 313 | |
aoqi@1 | 314 | for (int i = hdr_size_in_bytes; i < con_size_in_bytes; i += BytesPerWord) { |
aoqi@1 | 315 | st_ptr(R0, obj, i); |
aoqi@1 | 316 | } |
aoqi@1 | 317 | |
aoqi@1 | 318 | |
aoqi@1 | 319 | |
aoqi@1 | 320 | } else if(con_size_in_bytes > hdr_size_in_bytes) { |
aoqi@1 | 321 | // use loop to null out the fields |
aoqi@1 | 322 | // code size = 32 bytes for even n (n = number of fields to clear) |
aoqi@1 | 323 | // initialize last object field first if odd number of fields |
aoqi@1 | 324 | assert( ((con_size_in_bytes - hdr_size_in_bytes) >> 3)!=0, "change code here"); |
aoqi@1 | 325 | |
aoqi@1 | 326 | #ifdef _LP64 |
aoqi@1 | 327 | move(index, (con_size_in_bytes - hdr_size_in_bytes) >> 4); |
aoqi@1 | 328 | sll(t1, index, 4); |
aoqi@1 | 329 | #else |
aoqi@1 | 330 | move(index, (con_size_in_bytes - hdr_size_in_bytes) >> 3); |
aoqi@1 | 331 | sll(t1, index, 3); |
aoqi@1 | 332 | #endif |
aoqi@1 | 333 | add(t1, obj, t1); |
aoqi@1 | 334 | |
aoqi@1 | 335 | // initialize last object field if constant size is odd |
aoqi@1 | 336 | #ifdef _LP64 |
aoqi@1 | 337 | if (! UseCompressedOops) |
aoqi@1 | 338 | { |
aoqi@1 | 339 | if (((con_size_in_bytes - hdr_size_in_bytes) & 8) != 0) { |
aoqi@1 | 340 | sd(R0, t1, hdr_size_in_bytes); |
aoqi@1 | 341 | } |
aoqi@1 | 342 | } else if (UseCompressedOops) { |
aoqi@1 | 343 | int extra = (con_size_in_bytes - hdr_size_in_bytes) % 16; |
aoqi@1 | 344 | while (extra != 0) { |
aoqi@1 | 345 | sw(R0, t1, hdr_size_in_bytes + extra - 4); |
aoqi@1 | 346 | extra -= 4; |
aoqi@1 | 347 | } |
aoqi@1 | 348 | } |
aoqi@1 | 349 | #else |
aoqi@1 | 350 | if (((con_size_in_bytes - hdr_size_in_bytes) & 4) != 0) { |
aoqi@1 | 351 | sw(R0, t1, hdr_size_in_bytes); |
aoqi@1 | 352 | } |
aoqi@1 | 353 | #endif |
aoqi@1 | 354 | // initialize remaining object fields: edx is a multiple of 2 |
aoqi@1 | 355 | { |
aoqi@1 | 356 | Label loop; |
aoqi@1 | 357 | bind(loop); |
aoqi@1 | 358 | st_ptr(R0, t1, hdr_size_in_bytes - (1*BytesPerWord)); |
aoqi@1 | 359 | st_ptr(R0, t1, hdr_size_in_bytes - (2*BytesPerWord)); |
aoqi@1 | 360 | addi(index, index, -1); |
aoqi@1 | 361 | bne(index, R0, loop); |
aoqi@1 | 362 | delayed()->addi(t1, t1, - 2 * wordSize); |
aoqi@1 | 363 | } |
aoqi@1 | 364 | } |
aoqi@1 | 365 | |
aoqi@1 | 366 | if (DTraceAllocProbes) { |
aoqi@1 | 367 | //assert(obj == eax, "must be"); |
aoqi@1 | 368 | call(CAST_FROM_FN_PTR(address, |
aoqi@1 | 369 | Runtime1::entry_for(Runtime1::dtrace_object_alloc_id)), relocInfo::runtime_call_type); |
aoqi@1 | 370 | delayed()->nop(); |
aoqi@1 | 371 | } |
aoqi@1 | 372 | verify_oop(obj); |
aoqi@1 | 373 | } |
aoqi@1 | 374 | |
aoqi@1 | 375 | void C1_MacroAssembler::allocate_array(Register obj, Register len, Register t1, Register t2, Register t3,int header_size, |
aoqi@1 | 376 | int scale, Register klass, Label& slow_case) { |
aoqi@1 | 377 | assert(obj == V0, "obj must be in V0 for cmpxchg"); |
aoqi@1 | 378 | assert_different_registers(obj, len, t1, t2, t3,klass, AT); |
aoqi@1 | 379 | |
aoqi@1 | 380 | // determine alignment mask |
aoqi@1 | 381 | assert(BytesPerWord == 8, "must be a multiple of 2 for masking code to work"); |
aoqi@1 | 382 | |
aoqi@1 | 383 | // check for negative or excessive length |
aoqi@1 | 384 | //const int max_length = 0x00FFFFFF; |
aoqi@1 | 385 | // move(AT, max_length); |
aoqi@1 | 386 | move(AT, max_array_allocation_length); |
aoqi@1 | 387 | sltu(AT, AT, len); |
aoqi@1 | 388 | bne_far(AT, R0, slow_case); |
aoqi@1 | 389 | delayed()->nop(); |
aoqi@1 | 390 | |
aoqi@1 | 391 | const Register arr_size = t3; |
aoqi@1 | 392 | // align object end |
aoqi@1 | 393 | move(arr_size, header_size * BytesPerWord + MinObjAlignmentInBytesMask); |
aoqi@1 | 394 | sll(AT, len, scale); |
aoqi@1 | 395 | add(arr_size, arr_size, AT); |
aoqi@1 | 396 | move(AT, ~MinObjAlignmentInBytesMask); |
aoqi@1 | 397 | andr(arr_size, arr_size, AT); |
aoqi@1 | 398 | |
aoqi@1 | 399 | try_allocate(obj, arr_size, 0, t1, t2, slow_case); |
aoqi@1 | 400 | |
aoqi@1 | 401 | initialize_header(obj, klass, len,t1,t2); |
aoqi@1 | 402 | |
aoqi@1 | 403 | // clear rest of allocated space |
aoqi@1 | 404 | const Register len_zero = len; |
aoqi@1 | 405 | initialize_body(obj, arr_size, header_size * BytesPerWord, len_zero); |
aoqi@1 | 406 | if (DTraceAllocProbes) { |
aoqi@1 | 407 | // assert(obj == eax, "must be"); |
aoqi@1 | 408 | call(CAST_FROM_FN_PTR(address, |
aoqi@1 | 409 | Runtime1::entry_for(Runtime1::dtrace_object_alloc_id)), |
aoqi@1 | 410 | relocInfo::runtime_call_type); |
aoqi@1 | 411 | delayed()->nop(); |
aoqi@1 | 412 | } |
aoqi@1 | 413 | |
aoqi@1 | 414 | verify_oop(obj); |
aoqi@1 | 415 | } |
aoqi@1 | 416 | |
aoqi@1 | 417 | |
aoqi@1 | 418 | void C1_MacroAssembler::inline_cache_check(Register receiver, Register iCache) { |
aoqi@1 | 419 | verify_oop(receiver); |
aoqi@1 | 420 | // explicit NULL check not needed since load from [klass_offset] causes a trap |
aoqi@1 | 421 | // check against inline cache |
aoqi@1 | 422 | assert(!MacroAssembler::needs_explicit_null_check(oopDesc::klass_offset_in_bytes()), "must add explicit null check"); |
aoqi@1 | 423 | ///cmpl(iCache, Address(receiver, oopDesc::klass_offset_in_bytes())); |
aoqi@1 | 424 | // if icache check fails, then jump to runtime routine |
aoqi@1 | 425 | // Note: RECEIVER must still contain the receiver! |
aoqi@1 | 426 | Label L; |
aoqi@1 | 427 | #ifdef _LP64 |
aoqi@1 | 428 | //ld_ptr(AT, receiver, oopDesc::klass_offset_in_bytes()); |
aoqi@1 | 429 | //add for compressedoops |
aoqi@1 | 430 | load_klass(AT, receiver); |
aoqi@1 | 431 | #else |
aoqi@1 | 432 | lw(AT, receiver, oopDesc::klass_offset_in_bytes()); |
aoqi@1 | 433 | #endif |
aoqi@1 | 434 | beq(AT, iCache, L); |
aoqi@1 | 435 | delayed()->nop(); |
aoqi@1 | 436 | // jmp(Runtime1::entry_for(Runtime1::handle_ic_miss_id), relocInfo::runtime_call_type); |
aoqi@1 | 437 | jmp(SharedRuntime::get_ic_miss_stub(), relocInfo::runtime_call_type); |
aoqi@1 | 438 | delayed()->nop(); |
aoqi@1 | 439 | bind(L); |
aoqi@1 | 440 | // assert(UseCompressedOops, "check alignment in emit_method_entry"); |
aoqi@1 | 441 | } |
aoqi@1 | 442 | /* |
aoqi@1 | 443 | void C1_MacroAssembler::method_exit(bool restore_frame) { |
aoqi@1 | 444 | if (restore_frame) { |
aoqi@1 | 445 | leave(); |
aoqi@1 | 446 | } |
aoqi@1 | 447 | jr(RA); |
aoqi@1 | 448 | delayed()->nop(); |
aoqi@1 | 449 | }*/ |
aoqi@1 | 450 | |
aoqi@1 | 451 | |
aoqi@1 | 452 | void C1_MacroAssembler::build_frame(int frame_size_in_bytes, int bang_size_in_bytes) { |
aoqi@1 | 453 | // Make sure there is enough stack space for this method's activation. |
aoqi@1 | 454 | // Note that we do this before doing an enter(). This matches the |
aoqi@1 | 455 | // ordering of C2's stack overflow check / esp decrement and allows |
aoqi@1 | 456 | // the SharedRuntime stack overflow handling to be consistent |
aoqi@1 | 457 | // between the two compilers. |
aoqi@1 | 458 | generate_stack_overflow_check(frame_size_in_bytes); |
aoqi@1 | 459 | |
aoqi@1 | 460 | enter(); |
aoqi@1 | 461 | //FIXME |
aoqi@1 | 462 | #ifdef TIERED |
aoqi@1 | 463 | // c2 leaves fpu stack dirty. Clean it on entry |
aoqi@1 | 464 | // if (UseSSE < 2 ) { |
aoqi@1 | 465 | empty_FPU_stack(); |
aoqi@1 | 466 | // } |
aoqi@1 | 467 | #endif // TIERED |
aoqi@1 | 468 | |
aoqi@1 | 469 | decrement(SP, frame_size_in_bytes); // does not emit code for frame_size == 0 |
aoqi@1 | 470 | } |
aoqi@1 | 471 | |
aoqi@1 | 472 | void C1_MacroAssembler::unverified_entry(Register receiver, Register ic_klass) { |
aoqi@1 | 473 | if (C1Breakpoint) int3(); |
aoqi@1 | 474 | inline_cache_check(receiver, ic_klass); |
aoqi@1 | 475 | } |
aoqi@1 | 476 | |
aoqi@1 | 477 | |
aoqi@1 | 478 | void C1_MacroAssembler::verified_entry() { |
aoqi@1 | 479 | if (C1Breakpoint)int3(); |
aoqi@1 | 480 | // build frame |
aoqi@1 | 481 | verify_FPU(0, "method_entry"); |
aoqi@1 | 482 | } |
aoqi@1 | 483 | |
aoqi@1 | 484 | |
aoqi@1 | 485 | #ifndef PRODUCT |
aoqi@1 | 486 | void C1_MacroAssembler::verify_stack_oop(int stack_offset) { |
aoqi@1 | 487 | if (!VerifyOops) return; |
aoqi@1 | 488 | // verify_oop_addr(Address(esp, stack_offset)); |
aoqi@1 | 489 | verify_oop_addr(Address(SP, stack_offset)); |
aoqi@1 | 490 | } |
aoqi@1 | 491 | |
aoqi@1 | 492 | void C1_MacroAssembler::verify_not_null_oop(Register r) { |
aoqi@1 | 493 | if (!VerifyOops) return; |
aoqi@1 | 494 | Label not_null; |
aoqi@1 | 495 | // testl(r, r); |
aoqi@1 | 496 | //jcc(Assembler::notZero, not_null); |
aoqi@1 | 497 | bne(r,R0,not_null); |
aoqi@1 | 498 | delayed()->nop(); |
aoqi@1 | 499 | stop("non-null oop required"); |
aoqi@1 | 500 | bind(not_null); |
aoqi@1 | 501 | verify_oop(r); |
aoqi@1 | 502 | } |
aoqi@1 | 503 | |
aoqi@1 | 504 | void C1_MacroAssembler::invalidate_registers(bool inv_v0, bool inv_v1, bool inv_t3, bool inv_t7, bool inv_s0, bool inv_s7) { |
aoqi@1 | 505 | #ifdef ASSERT |
aoqi@1 | 506 | /* if (inv_eax) movl(eax, 0xDEAD); |
aoqi@1 | 507 | if (inv_ebx) movl(ebx, 0xDEAD); |
aoqi@1 | 508 | if (inv_ecx) movl(ecx, 0xDEAD); |
aoqi@1 | 509 | if (inv_edx) movl(edx, 0xDEAD); |
aoqi@1 | 510 | if (inv_esi) movl(esi, 0xDEAD); |
aoqi@1 | 511 | if (inv_edi) movl(edi, 0xDEAD); |
aoqi@1 | 512 | */ |
aoqi@1 | 513 | //if (inv_v0) move(V0, 0xDEAD); |
aoqi@1 | 514 | //if (inv_v1) move(V1, 0xDEAD); |
aoqi@1 | 515 | //if (inv_t3) move(T3, 0xDEAD); |
aoqi@1 | 516 | //if (inv_t7) move(T7, 0xDEAD); |
aoqi@1 | 517 | //if (inv_s0) move(S0, 0xDEAD); |
aoqi@1 | 518 | //if (inv_s7) move(S7, 0xDEAD); |
aoqi@1 | 519 | #endif |
aoqi@1 | 520 | } |
aoqi@1 | 521 | #endif // ifndef PRODUCT |
aoqi@1 | 522 | |
aoqi@1 | 523 |