Thu, 24 May 2018 19:49:50 +0800
some C1 fix
Contributed-by: chenhaoxuan, zhaixiang, aoqi
aoqi@1 | 1 | /* |
aoqi@1 | 2 | * Copyright (c) 1999, 2013, Oracle and/or its affiliates. All rights reserved. |
aoqi@1 | 3 | * Copyright (c) 2015, 2016, Loongson Technology. All rights reserved. |
aoqi@1 | 4 | * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. |
aoqi@1 | 5 | * |
aoqi@1 | 6 | * This code is free software; you can redistribute it and/or modify it |
aoqi@1 | 7 | * under the terms of the GNU General Public License version 2 only, as |
aoqi@1 | 8 | * published by the Free Software Foundation. |
aoqi@1 | 9 | * |
aoqi@1 | 10 | * This code is distributed in the hope that it will be useful, but WITHOUT |
aoqi@1 | 11 | * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or |
aoqi@1 | 12 | * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License |
aoqi@1 | 13 | * version 2 for more details (a copy is included in the LICENSE file that |
aoqi@1 | 14 | * accompanied this code). |
aoqi@1 | 15 | * |
aoqi@1 | 16 | * You should have received a copy of the GNU General Public License version |
aoqi@1 | 17 | * 2 along with this work; if not, write to the Free Software Foundation, |
aoqi@1 | 18 | * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA. |
aoqi@1 | 19 | * |
aoqi@1 | 20 | * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA |
aoqi@1 | 21 | * or visit www.oracle.com if you need additional information or have any |
aoqi@1 | 22 | * questions. |
aoqi@1 | 23 | * |
aoqi@1 | 24 | */ |
aoqi@1 | 25 | |
aoqi@1 | 26 | #include "precompiled.hpp" |
aoqi@1 | 27 | #include "c1/c1_MacroAssembler.hpp" |
aoqi@1 | 28 | #include "c1/c1_Runtime1.hpp" |
aoqi@1 | 29 | #include "classfile/systemDictionary.hpp" |
aoqi@1 | 30 | #include "gc_interface/collectedHeap.hpp" |
aoqi@1 | 31 | #include "interpreter/interpreter.hpp" |
aoqi@1 | 32 | #include "oops/arrayOop.hpp" |
aoqi@1 | 33 | #include "oops/markOop.hpp" |
aoqi@1 | 34 | #include "runtime/basicLock.hpp" |
aoqi@1 | 35 | #include "runtime/biasedLocking.hpp" |
aoqi@1 | 36 | #include "runtime/os.hpp" |
aoqi@1 | 37 | #include "runtime/stubRoutines.hpp" |
aoqi@1 | 38 | |
aoqi@1 | 39 | int C1_MacroAssembler::lock_object(Register hdr, Register obj, Register disp_hdr,Register scratch, Label& slow_case) { |
aoqi@1 | 40 | const int aligned_mask = BytesPerWord -1; |
aoqi@1 | 41 | const int hdr_offset = oopDesc::mark_offset_in_bytes(); |
aoqi@1 | 42 | |
aoqi@1 | 43 | // hdr is just a temperary register, it cannot be AT, however |
aoqi@1 | 44 | if ( hdr == NOREG ) { |
aoqi@1 | 45 | hdr = T8; |
aoqi@1 | 46 | } |
aoqi@1 | 47 | |
aoqi@1 | 48 | assert_different_registers(hdr, obj, disp_hdr); |
aoqi@1 | 49 | Label done; |
aoqi@1 | 50 | // The following move must be the first instruction of emitted since debug |
aoqi@1 | 51 | // information may be generated for it. |
aoqi@1 | 52 | // Load object header |
aoqi@1 | 53 | int null_check_offset = -1; |
aoqi@1 | 54 | verify_oop(obj); |
aoqi@1 | 55 | |
aoqi@1 | 56 | // save object being locked into the BasicObjectLock |
aoqi@1 | 57 | st_ptr(obj, disp_hdr, BasicObjectLock::obj_offset_in_bytes()); |
aoqi@1 | 58 | if (UseBiasedLocking) { |
aoqi@1 | 59 | assert(scratch != noreg, "should have scratch register at this point"); |
aoqi@6880 | 60 | null_check_offset = biased_locking_enter(disp_hdr, obj, hdr, scratch, false, |
aoqi@6880 | 61 | done, &slow_case); |
aoqi@1 | 62 | } else { |
aoqi@1 | 63 | null_check_offset = offset(); |
aoqi@1 | 64 | } |
aoqi@1 | 65 | |
aoqi@1 | 66 | // Load object header |
aoqi@6880 | 67 | ld_ptr(hdr, obj, hdr_offset); |
aoqi@1 | 68 | // and mark it as unlocked |
aoqi@1 | 69 | ori(hdr, hdr, markOopDesc::unlocked_value); |
aoqi@1 | 70 | // save unlocked object header into the displaced header location on the stack |
aoqi@1 | 71 | sd(hdr, disp_hdr, 0); |
aoqi@1 | 72 | |
aoqi@1 | 73 | // test if object header is still the same (i.e. unlocked), and if so, store the |
aoqi@1 | 74 | // displaced header address in the object header - if it is not the same, get the |
aoqi@1 | 75 | // object header instead |
aoqi@1 | 76 | //if (os::is_MP()) MacroAssembler::lock(); // must be immediately before cmpxchg! |
aoqi@1 | 77 | cmpxchg(disp_hdr, Address(obj, hdr_offset), hdr); |
aoqi@1 | 78 | // if the object header was the same, we're done |
aoqi@1 | 79 | if (PrintBiasedLockingStatistics) { |
aoqi@29 | 80 | Label L; |
aoqi@29 | 81 | beq(AT, R0, L); |
aoqi@29 | 82 | delayed()->nop(); |
aoqi@29 | 83 | push(T0); |
aoqi@29 | 84 | push(T1); |
aoqi@29 | 85 | li(T0, (address) BiasedLocking::fast_path_entry_count_addr()); |
aoqi@29 | 86 | lw(T1, T0, 0); |
aoqi@29 | 87 | addi(T1, T1, 1); |
aoqi@29 | 88 | sw(T1, T0, 0); |
aoqi@29 | 89 | pop(T1); |
aoqi@29 | 90 | pop(T0); |
aoqi@29 | 91 | bind(L); |
aoqi@1 | 92 | } |
aoqi@1 | 93 | |
aoqi@1 | 94 | |
aoqi@1 | 95 | bne(AT, R0, done); |
aoqi@1 | 96 | delayed()->nop(); |
aoqi@1 | 97 | // if the object header was not the same, it is now in the hdr register |
aoqi@1 | 98 | // => test if it is a stack pointer into the same stack (recursive locking), i.e.: |
aoqi@1 | 99 | // |
aoqi@1 | 100 | // 1) (hdr & aligned_mask) == 0 |
aoqi@1 | 101 | // 2) SP <= hdr |
aoqi@1 | 102 | // 3) hdr <= SP + page_size |
aoqi@1 | 103 | // |
aoqi@1 | 104 | // these 3 tests can be done by evaluating the following expression: |
aoqi@1 | 105 | // |
aoqi@1 | 106 | // (hdr - SP) & (aligned_mask - page_size) |
aoqi@1 | 107 | // |
aoqi@1 | 108 | // assuming both the stack pointer and page_size have their least |
aoqi@1 | 109 | // significant 2 bits cleared and page_size is a power of 2 |
aoqi@1 | 110 | sub(hdr, hdr, SP); |
aoqi@1 | 111 | move(AT, aligned_mask - os::vm_page_size()); |
aoqi@1 | 112 | andr(hdr, hdr, AT); |
aoqi@1 | 113 | // for recursive locking, the result is zero => save it in the displaced header |
aoqi@1 | 114 | // location (NULL in the displaced hdr location indicates recursive locking) |
aoqi@1 | 115 | st_ptr(hdr, disp_hdr, 0); |
aoqi@1 | 116 | // otherwise we don't care about the result and handle locking via runtime call |
aoqi@1 | 117 | bne_far(hdr, R0, slow_case); |
aoqi@1 | 118 | delayed()->nop(); |
aoqi@1 | 119 | // done |
aoqi@1 | 120 | bind(done); |
aoqi@1 | 121 | return null_check_offset; |
aoqi@1 | 122 | } |
aoqi@1 | 123 | |
aoqi@1 | 124 | |
aoqi@1 | 125 | void C1_MacroAssembler::unlock_object(Register hdr, Register obj, Register disp_hdr, Label& slow_case) { |
aoqi@1 | 126 | const int aligned_mask = BytesPerWord -1; |
aoqi@1 | 127 | const int hdr_offset = oopDesc::mark_offset_in_bytes(); |
aoqi@1 | 128 | |
aoqi@1 | 129 | // hdr is just a temparay register, however, it cannot be AT |
aoqi@1 | 130 | if ( hdr == NOREG ) { |
aoqi@1 | 131 | hdr = T8; |
aoqi@1 | 132 | } |
aoqi@1 | 133 | |
aoqi@1 | 134 | assert_different_registers(hdr, obj, disp_hdr); |
aoqi@1 | 135 | assert(BytesPerWord == 8, "adjust aligned_mask and code"); |
aoqi@1 | 136 | Label done; |
aoqi@1 | 137 | if (UseBiasedLocking) { |
aoqi@1 | 138 | // load object |
aoqi@1 | 139 | ld_ptr(obj, Address(disp_hdr, BasicObjectLock::obj_offset_in_bytes())); |
aoqi@1 | 140 | biased_locking_exit(obj, hdr, done); |
aoqi@1 | 141 | } |
aoqi@1 | 142 | |
aoqi@1 | 143 | // load displaced header |
aoqi@1 | 144 | ld_ptr(hdr, disp_hdr, 0); |
aoqi@1 | 145 | // if the loaded hdr is NULL we had recursive locking |
aoqi@1 | 146 | // if we had recursive locking, we are done |
aoqi@1 | 147 | beq(hdr, R0, done); |
aoqi@1 | 148 | delayed()->nop(); |
aoqi@1 | 149 | // load object |
aoqi@1 | 150 | if(!UseBiasedLocking){ |
aoqi@1 | 151 | ld_ptr(obj, disp_hdr, BasicObjectLock::obj_offset_in_bytes()); |
aoqi@1 | 152 | } |
aoqi@1 | 153 | |
aoqi@1 | 154 | verify_oop(obj); |
aoqi@1 | 155 | // test if object header is pointing to the displaced header, and if so, restore |
aoqi@1 | 156 | // the displaced header in the object - if the object header is not pointing to |
aoqi@1 | 157 | // the displaced header, get the object header instead |
aoqi@1 | 158 | //if (os::is_MP()) MacroAssembler::lock(); // must be immediately before cmpxchg! |
aoqi@1 | 159 | cmpxchg(hdr, Address(obj, hdr_offset), disp_hdr); |
aoqi@1 | 160 | // if the object header was not pointing to the displaced header, |
aoqi@1 | 161 | // we do unlocking via runtime call |
aoqi@1 | 162 | beq_far(AT, R0, slow_case); |
aoqi@1 | 163 | delayed()->nop(); |
aoqi@1 | 164 | // done |
aoqi@1 | 165 | bind(done); |
aoqi@1 | 166 | } |
aoqi@1 | 167 | |
aoqi@1 | 168 | |
aoqi@1 | 169 | // Defines obj, preserves var_size_in_bytes |
aoqi@1 | 170 | void C1_MacroAssembler::try_allocate(Register obj, Register var_size_in_bytes, int con_size_in_bytes, Register t1, Register t2, Label& slow_case) { |
aoqi@1 | 171 | if (UseTLAB) { |
aoqi@1 | 172 | tlab_allocate(obj, var_size_in_bytes, con_size_in_bytes, t1, t2, slow_case); |
aoqi@1 | 173 | } else { |
aoqi@1 | 174 | eden_allocate(obj, var_size_in_bytes, con_size_in_bytes, t1, t2, slow_case); |
aoqi@1 | 175 | } |
aoqi@1 | 176 | } |
aoqi@1 | 177 | |
aoqi@1 | 178 | void C1_MacroAssembler::initialize_header(Register obj, Register klass, Register len, Register t1 , Register t2) { |
aoqi@8865 | 179 | assert_different_registers(obj, klass, len, T9); |
aoqi@1 | 180 | |
aoqi@1 | 181 | if (UseBiasedLocking && !len->is_valid()) { |
aoqi@1 | 182 | assert_different_registers(obj, klass, len, t1, t2); |
aoqi@1 | 183 | ld_ptr(t1, klass, in_bytes(Klass::prototype_header_offset())); |
aoqi@1 | 184 | st_ptr(t1, obj, oopDesc::mark_offset_in_bytes()); |
aoqi@1 | 185 | } else { |
aoqi@8865 | 186 | li(T9, (intptr_t)markOopDesc::prototype()); |
aoqi@8865 | 187 | st_ptr(T9, obj, oopDesc::mark_offset_in_bytes()); |
aoqi@6880 | 188 | } |
aoqi@1 | 189 | //st_ptr(klass, obj, oopDesc::klass_offset_in_bytes()); |
aoqi@1 | 190 | #ifdef _LP64 |
aoqi@8865 | 191 | if (UseCompressedClassPointers) { |
aoqi@8865 | 192 | move(T9, klass); |
aoqi@8865 | 193 | store_klass(obj, T9); |
aoqi@1 | 194 | } else |
aoqi@1 | 195 | #endif |
aoqi@1 | 196 | { |
aoqi@1 | 197 | st_ptr(klass, obj, oopDesc::klass_offset_in_bytes()); |
aoqi@1 | 198 | } |
aoqi@1 | 199 | |
aoqi@1 | 200 | if (len->is_valid()) { |
aoqi@1 | 201 | sw(len, obj, arrayOopDesc::length_offset_in_bytes()); |
aoqi@1 | 202 | } |
aoqi@1 | 203 | #ifdef _LP64 |
aoqi@8865 | 204 | else if (UseCompressedClassPointers) { |
aoqi@1 | 205 | store_klass_gap(obj, R0); |
aoqi@1 | 206 | } |
aoqi@1 | 207 | #endif |
aoqi@1 | 208 | } |
aoqi@1 | 209 | |
aoqi@6880 | 210 | |
aoqi@1 | 211 | // preserves obj, destroys len_in_bytes |
aoqi@1 | 212 | void C1_MacroAssembler::initialize_body(Register obj, Register len_in_bytes, int hdr_size_in_bytes, Register t1) { |
aoqi@1 | 213 | Label done; |
aoqi@1 | 214 | Register ptr = t1; |
aoqi@1 | 215 | assert_different_registers(obj, ptr, len_in_bytes); |
aoqi@6880 | 216 | assert((hdr_size_in_bytes & (BytesPerWord - 1)) == 0, |
aoqi@1 | 217 | "header size is not a multiple of BytesPerWord"); |
aoqi@1 | 218 | Register index = len_in_bytes; |
aoqi@1 | 219 | |
aoqi@1 | 220 | //tty->print_cr("C1_MacroAssembler::initialize_body LEN=0x%x, hdr_size=0x%x", len_in_bytes, hdr_size_in_bytes); |
aoqi@1 | 221 | assert(is_simm16(hdr_size_in_bytes), "change this code"); |
aoqi@1 | 222 | addi(index, index, - hdr_size_in_bytes); |
aoqi@1 | 223 | beq(index, R0, done); |
aoqi@1 | 224 | delayed(); |
aoqi@1 | 225 | |
aoqi@1 | 226 | // initialize topmost word, divide index by 2, check if odd and test if zero |
aoqi@1 | 227 | // note: for the remaining code to work, index must be a multiple of BytesPerWord |
aoqi@1 | 228 | #ifdef ASSERT |
aoqi@6880 | 229 | { |
aoqi@1 | 230 | Label L; |
aoqi@1 | 231 | andi(AT, index, BytesPerWord - 1); |
aoqi@1 | 232 | beq(AT, R0, L); |
aoqi@1 | 233 | delayed()->nop(); |
aoqi@1 | 234 | stop("index is not a multiple of BytesPerWord"); |
aoqi@1 | 235 | bind(L); |
aoqi@1 | 236 | } |
aoqi@1 | 237 | #endif |
aoqi@1 | 238 | // index could have been not a multiple of 8 (i.e., bit 2 was set) |
aoqi@6880 | 239 | { |
aoqi@1 | 240 | Label even; |
aoqi@1 | 241 | // note: if index was a multiple of 8, than it cannot |
aoqi@1 | 242 | // be 0 now otherwise it must have been 0 before |
aoqi@1 | 243 | // => if it is even, we don't need to check for 0 again |
aoqi@1 | 244 | #ifdef _LP64 |
aoqi@1 | 245 | andi(AT, index, 8); |
aoqi@1 | 246 | shr(index, 4); |
aoqi@1 | 247 | shl(index, 4); |
aoqi@1 | 248 | #else |
aoqi@1 | 249 | andi(AT, index, 4); |
aoqi@1 | 250 | shr(index, 3); |
aoqi@1 | 251 | shl(index, 3); |
aoqi@1 | 252 | #endif |
aoqi@1 | 253 | beq(AT, R0, even); |
aoqi@1 | 254 | delayed()->add(ptr, obj, index); |
aoqi@1 | 255 | // clear topmost word (no jump needed if conditional assignment would work here) |
aoqi@6880 | 256 | st_ptr(R0, ptr, hdr_size_in_bytes); |
aoqi@1 | 257 | // index could be 0 now, need to check again |
aoqi@1 | 258 | beq(index, R0, done); |
aoqi@1 | 259 | delayed()->nop(); |
aoqi@1 | 260 | bind(even); |
aoqi@1 | 261 | } |
aoqi@1 | 262 | // initialize remaining object fields: edx is a multiple of 2 now |
aoqi@6880 | 263 | { |
aoqi@1 | 264 | Label loop; |
aoqi@1 | 265 | bind(loop); |
aoqi@1 | 266 | st_ptr(R0, ptr, hdr_size_in_bytes - 1*BytesPerWord); |
aoqi@1 | 267 | st_ptr(R0, ptr, hdr_size_in_bytes - 2*BytesPerWord); |
aoqi@1 | 268 | |
aoqi@1 | 269 | addi(index, index, - 2 * wordSize); |
aoqi@1 | 270 | bne(index, R0, loop); |
aoqi@1 | 271 | delayed()->addi(ptr, ptr, - 2 * wordSize); |
aoqi@1 | 272 | } |
aoqi@1 | 273 | |
aoqi@1 | 274 | // done |
aoqi@1 | 275 | bind(done); |
aoqi@1 | 276 | } |
aoqi@1 | 277 | |
aoqi@1 | 278 | void C1_MacroAssembler::allocate_object(Register obj, Register t1, Register t2, int header_size, int object_size, Register klass, Label& slow_case) { |
aoqi@1 | 279 | //assert(obj == rax, "obj must be in rax, for cmpxchg"); |
aoqi@1 | 280 | assert(obj != t1 && obj != t2 && t1 != t2, "registers must be different"); // XXX really? |
aoqi@1 | 281 | assert(header_size >= 0 && object_size >= header_size, "illegal sizes"); |
aoqi@1 | 282 | |
aoqi@1 | 283 | try_allocate(obj, noreg, object_size * BytesPerWord, t1, t2, slow_case); |
aoqi@1 | 284 | |
aoqi@1 | 285 | initialize_object(obj, klass, noreg, object_size * HeapWordSize, t1, t2); |
aoqi@1 | 286 | } |
aoqi@1 | 287 | |
aoqi@1 | 288 | void C1_MacroAssembler::initialize_object(Register obj, Register klass, Register var_size_in_bytes, int con_size_in_bytes, Register t1, Register t2) { |
aoqi@6880 | 289 | assert((con_size_in_bytes & MinObjAlignmentInBytesMask) == 0, |
aoqi@6880 | 290 | "con_size_in_bytes is not multiple of alignment"); |
aoqi@6880 | 291 | //Merged from b25 |
aoqi@6880 | 292 | const int hdr_size_in_bytes = instanceOopDesc::header_size() * HeapWordSize; |
aoqi@1 | 293 | |
aoqi@6880 | 294 | // initialize_header(obj, klass, NOREG); |
aoqi@6880 | 295 | initialize_header(obj, klass, NOREG,t1,t2); |
aoqi@1 | 296 | |
aoqi@6880 | 297 | // clear rest of allocated space |
aoqi@6880 | 298 | const Register index = t2; |
aoqi@6880 | 299 | //FIXME, x86 changed the value in jdk6 |
aoqi@6880 | 300 | // const int threshold = hdr_size_in_bytes + 36; |
aoqi@6880 | 301 | // // approximate break even point for code size (see comments below) |
aoqi@6880 | 302 | const int threshold = 6 * BytesPerWord; |
aoqi@6880 | 303 | // approximate break even point for code size (see comments below) |
aoqi@6880 | 304 | if (var_size_in_bytes != NOREG) { |
aoqi@6880 | 305 | move(index, var_size_in_bytes); |
aoqi@6880 | 306 | initialize_body(obj, index, hdr_size_in_bytes, t1); |
aoqi@6880 | 307 | } else if (con_size_in_bytes <= threshold) { |
aoqi@6880 | 308 | // use explicit null stores |
aoqi@6880 | 309 | // code size = 4*n bytes (n = number of fields to clear) |
aoqi@1 | 310 | |
aoqi@6880 | 311 | for (int i = hdr_size_in_bytes; i < con_size_in_bytes; i += BytesPerWord) { |
aoqi@6880 | 312 | st_ptr(R0, obj, i); |
aoqi@6880 | 313 | } |
aoqi@6880 | 314 | |
aoqi@6880 | 315 | |
aoqi@6880 | 316 | |
aoqi@6880 | 317 | } else if(con_size_in_bytes > hdr_size_in_bytes) { |
aoqi@6880 | 318 | // use loop to null out the fields |
aoqi@6880 | 319 | // code size = 32 bytes for even n (n = number of fields to clear) |
aoqi@6880 | 320 | // initialize last object field first if odd number of fields |
aoqi@6880 | 321 | assert( ((con_size_in_bytes - hdr_size_in_bytes) >> 3)!=0, "change code here"); |
aoqi@1 | 322 | |
aoqi@1 | 323 | #ifdef _LP64 |
aoqi@6880 | 324 | move(index, (con_size_in_bytes - hdr_size_in_bytes) >> 4); |
aoqi@6880 | 325 | sll(t1, index, 4); |
aoqi@1 | 326 | #else |
aoqi@6880 | 327 | move(index, (con_size_in_bytes - hdr_size_in_bytes) >> 3); |
aoqi@6880 | 328 | sll(t1, index, 3); |
aoqi@1 | 329 | #endif |
aoqi@6880 | 330 | add(t1, obj, t1); |
aoqi@1 | 331 | |
aoqi@6880 | 332 | // initialize last object field if constant size is odd |
aoqi@1 | 333 | #ifdef _LP64 |
aoqi@6880 | 334 | if (! UseCompressedOops) |
aoqi@6880 | 335 | { |
aoqi@6880 | 336 | if (((con_size_in_bytes - hdr_size_in_bytes) & 8) != 0) { |
aoqi@6880 | 337 | sd(R0, t1, hdr_size_in_bytes); |
aoqi@6880 | 338 | } |
aoqi@6880 | 339 | } else if (UseCompressedOops) { |
aoqi@6880 | 340 | int extra = (con_size_in_bytes - hdr_size_in_bytes) % 16; |
aoqi@6880 | 341 | while (extra != 0) { |
aoqi@6880 | 342 | sw(R0, t1, hdr_size_in_bytes + extra - 4); |
aoqi@6880 | 343 | extra -= 4; |
aoqi@6880 | 344 | } |
aoqi@6880 | 345 | } |
aoqi@1 | 346 | #else |
aoqi@6880 | 347 | if (((con_size_in_bytes - hdr_size_in_bytes) & 4) != 0) { |
aoqi@6880 | 348 | sw(R0, t1, hdr_size_in_bytes); |
aoqi@6880 | 349 | } |
aoqi@1 | 350 | #endif |
aoqi@6880 | 351 | // initialize remaining object fields: edx is a multiple of 2 |
aoqi@6880 | 352 | { |
aoqi@6880 | 353 | Label loop; |
aoqi@6880 | 354 | bind(loop); |
aoqi@6880 | 355 | st_ptr(R0, t1, hdr_size_in_bytes - (1*BytesPerWord)); |
aoqi@6880 | 356 | st_ptr(R0, t1, hdr_size_in_bytes - (2*BytesPerWord)); |
aoqi@6880 | 357 | addi(index, index, -1); |
aoqi@6880 | 358 | bne(index, R0, loop); |
aoqi@6880 | 359 | delayed()->addi(t1, t1, - 2 * wordSize); |
aoqi@6880 | 360 | } |
aoqi@6880 | 361 | } |
aoqi@1 | 362 | |
aoqi@6880 | 363 | if (DTraceAllocProbes) { |
aoqi@6880 | 364 | //assert(obj == eax, "must be"); |
aoqi@6880 | 365 | call(CAST_FROM_FN_PTR(address, |
aoqi@6880 | 366 | Runtime1::entry_for(Runtime1::dtrace_object_alloc_id)), relocInfo::runtime_call_type); |
aoqi@6880 | 367 | delayed()->nop(); |
aoqi@6880 | 368 | } |
aoqi@6880 | 369 | verify_oop(obj); |
aoqi@1 | 370 | } |
aoqi@1 | 371 | |
aoqi@6880 | 372 | void C1_MacroAssembler::allocate_array(Register obj, Register len, Register t1, Register t2, Register t3,int header_size, |
aoqi@6880 | 373 | int scale, Register klass, Label& slow_case) { |
aoqi@6880 | 374 | assert(obj == V0, "obj must be in V0 for cmpxchg"); |
aoqi@6880 | 375 | assert_different_registers(obj, len, t1, t2, t3,klass, AT); |
aoqi@1 | 376 | |
aoqi@1 | 377 | // determine alignment mask |
aoqi@6880 | 378 | assert(BytesPerWord == 8, "must be a multiple of 2 for masking code to work"); |
aoqi@1 | 379 | |
aoqi@1 | 380 | // check for negative or excessive length |
aoqi@1 | 381 | //const int max_length = 0x00FFFFFF; |
aoqi@1 | 382 | // move(AT, max_length); |
aoqi@1 | 383 | move(AT, max_array_allocation_length); |
aoqi@6880 | 384 | sltu(AT, AT, len); |
aoqi@6880 | 385 | bne_far(AT, R0, slow_case); |
aoqi@6880 | 386 | delayed()->nop(); |
aoqi@1 | 387 | |
aoqi@6880 | 388 | const Register arr_size = t3; |
aoqi@6880 | 389 | // align object end |
aoqi@6880 | 390 | move(arr_size, header_size * BytesPerWord + MinObjAlignmentInBytesMask); |
aoqi@6880 | 391 | sll(AT, len, scale); |
aoqi@6880 | 392 | add(arr_size, arr_size, AT); |
aoqi@6880 | 393 | move(AT, ~MinObjAlignmentInBytesMask); |
aoqi@6880 | 394 | andr(arr_size, arr_size, AT); |
aoqi@1 | 395 | |
aoqi@6880 | 396 | try_allocate(obj, arr_size, 0, t1, t2, slow_case); |
aoqi@1 | 397 | |
aoqi@6880 | 398 | initialize_header(obj, klass, len,t1,t2); |
aoqi@1 | 399 | |
aoqi@1 | 400 | // clear rest of allocated space |
aoqi@6880 | 401 | const Register len_zero = len; |
aoqi@6880 | 402 | initialize_body(obj, arr_size, header_size * BytesPerWord, len_zero); |
aoqi@6880 | 403 | if (DTraceAllocProbes) { |
aoqi@6880 | 404 | // assert(obj == eax, "must be"); |
aoqi@6880 | 405 | call(CAST_FROM_FN_PTR(address, |
aoqi@6880 | 406 | Runtime1::entry_for(Runtime1::dtrace_object_alloc_id)), |
aoqi@6880 | 407 | relocInfo::runtime_call_type); |
aoqi@6880 | 408 | delayed()->nop(); |
aoqi@6880 | 409 | } |
aoqi@1 | 410 | |
aoqi@6880 | 411 | verify_oop(obj); |
aoqi@1 | 412 | } |
aoqi@1 | 413 | |
aoqi@1 | 414 | |
aoqi@1 | 415 | void C1_MacroAssembler::inline_cache_check(Register receiver, Register iCache) { |
aoqi@6880 | 416 | verify_oop(receiver); |
aoqi@6880 | 417 | // explicit NULL check not needed since load from [klass_offset] causes a trap |
aoqi@6880 | 418 | // check against inline cache |
aoqi@6880 | 419 | assert(!MacroAssembler::needs_explicit_null_check(oopDesc::klass_offset_in_bytes()), "must add explicit null check"); |
aoqi@6880 | 420 | ///cmpl(iCache, Address(receiver, oopDesc::klass_offset_in_bytes())); |
aoqi@6880 | 421 | // if icache check fails, then jump to runtime routine |
aoqi@6880 | 422 | // Note: RECEIVER must still contain the receiver! |
aoqi@6880 | 423 | Label L; |
aoqi@1 | 424 | #ifdef _LP64 |
aoqi@6880 | 425 | //ld_ptr(AT, receiver, oopDesc::klass_offset_in_bytes()); |
aoqi@6880 | 426 | //add for compressedoops |
aoqi@8865 | 427 | load_klass(T9, receiver); |
aoqi@1 | 428 | #else |
aoqi@8865 | 429 | lw(T9, receiver, oopDesc::klass_offset_in_bytes()); |
aoqi@1 | 430 | #endif |
aoqi@8865 | 431 | beq(T9, iCache, L); |
aoqi@6880 | 432 | delayed()->nop(); |
aoqi@6880 | 433 | // jmp(Runtime1::entry_for(Runtime1::handle_ic_miss_id), relocInfo::runtime_call_type); |
aoqi@8865 | 434 | jmp(SharedRuntime::get_ic_miss_stub(), relocInfo::runtime_call_type); |
aoqi@6880 | 435 | delayed()->nop(); |
aoqi@6880 | 436 | bind(L); |
aoqi@6880 | 437 | // assert(UseCompressedOops, "check alignment in emit_method_entry"); |
aoqi@1 | 438 | } |
aoqi@1 | 439 | /* |
aoqi@1 | 440 | void C1_MacroAssembler::method_exit(bool restore_frame) { |
aoqi@6880 | 441 | if (restore_frame) { |
aoqi@6880 | 442 | leave(); |
aoqi@6880 | 443 | } |
aoqi@6880 | 444 | jr(RA); |
aoqi@6880 | 445 | delayed()->nop(); |
aoqi@1 | 446 | }*/ |
aoqi@1 | 447 | |
aoqi@1 | 448 | |
aoqi@1 | 449 | void C1_MacroAssembler::build_frame(int frame_size_in_bytes, int bang_size_in_bytes) { |
aoqi@1 | 450 | // Make sure there is enough stack space for this method's activation. |
aoqi@1 | 451 | // Note that we do this before doing an enter(). This matches the |
aoqi@1 | 452 | // ordering of C2's stack overflow check / esp decrement and allows |
aoqi@1 | 453 | // the SharedRuntime stack overflow handling to be consistent |
aoqi@1 | 454 | // between the two compilers. |
aoqi@8865 | 455 | generate_stack_overflow_check(bang_size_in_bytes); |
aoqi@1 | 456 | |
aoqi@6880 | 457 | enter(); |
aoqi@1 | 458 | //FIXME |
aoqi@1 | 459 | #ifdef TIERED |
aoqi@8865 | 460 | // c2 leaves fpu stack dirty. Clean it on entry |
aoqi@8865 | 461 | // if (UseSSE < 2 ) { |
aoqi@8865 | 462 | empty_FPU_stack(); |
aoqi@8865 | 463 | // } |
aoqi@1 | 464 | #endif // TIERED |
aoqi@6880 | 465 | |
aoqi@1 | 466 | decrement(SP, frame_size_in_bytes); // does not emit code for frame_size == 0 |
aoqi@1 | 467 | } |
aoqi@1 | 468 | |
aoqi@8865 | 469 | void C1_MacroAssembler::remove_frame(int frame_size_in_bytes) { |
aoqi@8865 | 470 | increment(SP, frame_size_in_bytes); // Does not emit code for frame_size == 0 |
aoqi@8865 | 471 | pop(FP); |
aoqi@8865 | 472 | } |
aoqi@8865 | 473 | |
aoqi@1 | 474 | void C1_MacroAssembler::unverified_entry(Register receiver, Register ic_klass) { |
aoqi@1 | 475 | if (C1Breakpoint) int3(); |
aoqi@1 | 476 | inline_cache_check(receiver, ic_klass); |
aoqi@1 | 477 | } |
aoqi@1 | 478 | |
aoqi@1 | 479 | |
aoqi@1 | 480 | void C1_MacroAssembler::verified_entry() { |
aoqi@1 | 481 | if (C1Breakpoint)int3(); |
aoqi@1 | 482 | // build frame |
aoqi@1 | 483 | verify_FPU(0, "method_entry"); |
aoqi@1 | 484 | } |
aoqi@1 | 485 | |
aoqi@1 | 486 | |
aoqi@1 | 487 | #ifndef PRODUCT |
aoqi@1 | 488 | void C1_MacroAssembler::verify_stack_oop(int stack_offset) { |
aoqi@6880 | 489 | if (!VerifyOops) return; |
aoqi@6880 | 490 | // verify_oop_addr(Address(esp, stack_offset)); |
aoqi@6880 | 491 | verify_oop_addr(Address(SP, stack_offset)); |
aoqi@1 | 492 | } |
aoqi@1 | 493 | |
aoqi@1 | 494 | void C1_MacroAssembler::verify_not_null_oop(Register r) { |
aoqi@6880 | 495 | if (!VerifyOops) return; |
aoqi@6880 | 496 | Label not_null; |
aoqi@6880 | 497 | // testl(r, r); |
aoqi@6880 | 498 | //jcc(Assembler::notZero, not_null); |
aoqi@6880 | 499 | bne(r,R0,not_null); |
aoqi@6880 | 500 | delayed()->nop(); |
aoqi@6880 | 501 | stop("non-null oop required"); |
aoqi@6880 | 502 | bind(not_null); |
aoqi@6880 | 503 | verify_oop(r); |
aoqi@1 | 504 | } |
aoqi@1 | 505 | |
aoqi@1 | 506 | void C1_MacroAssembler::invalidate_registers(bool inv_v0, bool inv_v1, bool inv_t3, bool inv_t7, bool inv_s0, bool inv_s7) { |
aoqi@1 | 507 | #ifdef ASSERT |
aoqi@6880 | 508 | /* if (inv_eax) movl(eax, 0xDEAD); |
aoqi@6880 | 509 | if (inv_ebx) movl(ebx, 0xDEAD); |
aoqi@6880 | 510 | if (inv_ecx) movl(ecx, 0xDEAD); |
aoqi@6880 | 511 | if (inv_edx) movl(edx, 0xDEAD); |
aoqi@6880 | 512 | if (inv_esi) movl(esi, 0xDEAD); |
aoqi@6880 | 513 | if (inv_edi) movl(edi, 0xDEAD); |
aoqi@6880 | 514 | */ |
aoqi@6880 | 515 | //if (inv_v0) move(V0, 0xDEAD); |
aoqi@6880 | 516 | //if (inv_v1) move(V1, 0xDEAD); |
aoqi@6880 | 517 | //if (inv_t3) move(T3, 0xDEAD); |
aoqi@6880 | 518 | //if (inv_t7) move(T7, 0xDEAD); |
aoqi@6880 | 519 | //if (inv_s0) move(S0, 0xDEAD); |
aoqi@6880 | 520 | //if (inv_s7) move(S7, 0xDEAD); |
aoqi@1 | 521 | #endif |
aoqi@1 | 522 | } |
aoqi@1 | 523 | #endif // ifndef PRODUCT |