Thu, 03 Jan 2013 16:30:47 -0800
8005544: Use 256bit YMM registers in arraycopy stubs on x86
Summary: Use YMM registers in arraycopy and array_fill stubs.
Reviewed-by: roland, twisti
duke@435 | 1 | /* |
coleenp@4037 | 2 | * Copyright (c) 1997, 2012, Oracle and/or its affiliates. All rights reserved. |
duke@435 | 3 | * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. |
duke@435 | 4 | * |
duke@435 | 5 | * This code is free software; you can redistribute it and/or modify it |
duke@435 | 6 | * under the terms of the GNU General Public License version 2 only, as |
duke@435 | 7 | * published by the Free Software Foundation. |
duke@435 | 8 | * |
duke@435 | 9 | * This code is distributed in the hope that it will be useful, but WITHOUT |
duke@435 | 10 | * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or |
duke@435 | 11 | * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License |
duke@435 | 12 | * version 2 for more details (a copy is included in the LICENSE file that |
duke@435 | 13 | * accompanied this code). |
duke@435 | 14 | * |
duke@435 | 15 | * You should have received a copy of the GNU General Public License version |
duke@435 | 16 | * 2 along with this work; if not, write to the Free Software Foundation, |
duke@435 | 17 | * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA. |
duke@435 | 18 | * |
trims@1907 | 19 | * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA |
trims@1907 | 20 | * or visit www.oracle.com if you need additional information or have any |
trims@1907 | 21 | * questions. |
duke@435 | 22 | * |
duke@435 | 23 | */ |
duke@435 | 24 | |
stefank@2314 | 25 | #include "precompiled.hpp" |
stefank@2314 | 26 | #include "interp_masm_x86_32.hpp" |
stefank@2314 | 27 | #include "interpreter/interpreter.hpp" |
stefank@2314 | 28 | #include "interpreter/interpreterRuntime.hpp" |
stefank@2314 | 29 | #include "oops/arrayOop.hpp" |
stefank@2314 | 30 | #include "oops/markOop.hpp" |
coleenp@4037 | 31 | #include "oops/methodData.hpp" |
coleenp@4037 | 32 | #include "oops/method.hpp" |
stefank@2314 | 33 | #include "prims/jvmtiExport.hpp" |
stefank@2314 | 34 | #include "prims/jvmtiRedefineClassesTrace.hpp" |
stefank@2314 | 35 | #include "prims/jvmtiThreadState.hpp" |
stefank@2314 | 36 | #include "runtime/basicLock.hpp" |
stefank@2314 | 37 | #include "runtime/biasedLocking.hpp" |
stefank@2314 | 38 | #include "runtime/sharedRuntime.hpp" |
stefank@4299 | 39 | #include "runtime/thread.inline.hpp" |
duke@435 | 40 | |
duke@435 | 41 | |
duke@435 | 42 | // Implementation of InterpreterMacroAssembler |
duke@435 | 43 | #ifdef CC_INTERP |
duke@435 | 44 | void InterpreterMacroAssembler::get_method(Register reg) { |
never@739 | 45 | movptr(reg, Address(rbp, -(sizeof(BytecodeInterpreter) + 2 * wordSize))); |
never@739 | 46 | movptr(reg, Address(reg, byte_offset_of(BytecodeInterpreter, _method))); |
duke@435 | 47 | } |
duke@435 | 48 | #endif // CC_INTERP |
duke@435 | 49 | |
duke@435 | 50 | |
duke@435 | 51 | #ifndef CC_INTERP |
duke@435 | 52 | void InterpreterMacroAssembler::call_VM_leaf_base( |
duke@435 | 53 | address entry_point, |
duke@435 | 54 | int number_of_arguments |
duke@435 | 55 | ) { |
duke@435 | 56 | // interpreter specific |
duke@435 | 57 | // |
duke@435 | 58 | // Note: No need to save/restore bcp & locals (rsi & rdi) pointer |
duke@435 | 59 | // since these are callee saved registers and no blocking/ |
duke@435 | 60 | // GC can happen in leaf calls. |
duke@435 | 61 | // Further Note: DO NOT save/restore bcp/locals. If a caller has |
duke@435 | 62 | // already saved them so that it can use rsi/rdi as temporaries |
duke@435 | 63 | // then a save/restore here will DESTROY the copy the caller |
duke@435 | 64 | // saved! There used to be a save_bcp() that only happened in |
duke@435 | 65 | // the ASSERT path (no restore_bcp). Which caused bizarre failures |
duke@435 | 66 | // when jvm built with ASSERTs. |
duke@435 | 67 | #ifdef ASSERT |
duke@435 | 68 | { Label L; |
never@739 | 69 | cmpptr(Address(rbp, frame::interpreter_frame_last_sp_offset * wordSize), (int32_t)NULL_WORD); |
duke@435 | 70 | jcc(Assembler::equal, L); |
duke@435 | 71 | stop("InterpreterMacroAssembler::call_VM_leaf_base: last_sp != NULL"); |
duke@435 | 72 | bind(L); |
duke@435 | 73 | } |
duke@435 | 74 | #endif |
duke@435 | 75 | // super call |
duke@435 | 76 | MacroAssembler::call_VM_leaf_base(entry_point, number_of_arguments); |
duke@435 | 77 | // interpreter specific |
duke@435 | 78 | |
duke@435 | 79 | // Used to ASSERT that rsi/rdi were equal to frame's bcp/locals |
duke@435 | 80 | // but since they may not have been saved (and we don't want to |
duke@435 | 81 | // save them here (see note above) the assert is invalid. |
duke@435 | 82 | } |
duke@435 | 83 | |
duke@435 | 84 | |
duke@435 | 85 | void InterpreterMacroAssembler::call_VM_base( |
duke@435 | 86 | Register oop_result, |
duke@435 | 87 | Register java_thread, |
duke@435 | 88 | Register last_java_sp, |
duke@435 | 89 | address entry_point, |
duke@435 | 90 | int number_of_arguments, |
duke@435 | 91 | bool check_exceptions |
duke@435 | 92 | ) { |
duke@435 | 93 | #ifdef ASSERT |
duke@435 | 94 | { Label L; |
never@739 | 95 | cmpptr(Address(rbp, frame::interpreter_frame_last_sp_offset * wordSize), (int32_t)NULL_WORD); |
duke@435 | 96 | jcc(Assembler::equal, L); |
duke@435 | 97 | stop("InterpreterMacroAssembler::call_VM_base: last_sp != NULL"); |
duke@435 | 98 | bind(L); |
duke@435 | 99 | } |
duke@435 | 100 | #endif /* ASSERT */ |
duke@435 | 101 | // interpreter specific |
duke@435 | 102 | // |
duke@435 | 103 | // Note: Could avoid restoring locals ptr (callee saved) - however doesn't |
duke@435 | 104 | // really make a difference for these runtime calls, since they are |
duke@435 | 105 | // slow anyway. Btw., bcp must be saved/restored since it may change |
duke@435 | 106 | // due to GC. |
duke@435 | 107 | assert(java_thread == noreg , "not expecting a precomputed java thread"); |
duke@435 | 108 | save_bcp(); |
duke@435 | 109 | // super call |
duke@435 | 110 | MacroAssembler::call_VM_base(oop_result, java_thread, last_java_sp, entry_point, number_of_arguments, check_exceptions); |
duke@435 | 111 | // interpreter specific |
duke@435 | 112 | restore_bcp(); |
duke@435 | 113 | restore_locals(); |
duke@435 | 114 | } |
duke@435 | 115 | |
duke@435 | 116 | |
duke@435 | 117 | void InterpreterMacroAssembler::check_and_handle_popframe(Register java_thread) { |
duke@435 | 118 | if (JvmtiExport::can_pop_frame()) { |
duke@435 | 119 | Label L; |
duke@435 | 120 | // Initiate popframe handling only if it is not already being processed. If the flag |
duke@435 | 121 | // has the popframe_processing bit set, it means that this code is called *during* popframe |
duke@435 | 122 | // handling - we don't want to reenter. |
duke@435 | 123 | Register pop_cond = java_thread; // Not clear if any other register is available... |
duke@435 | 124 | movl(pop_cond, Address(java_thread, JavaThread::popframe_condition_offset())); |
duke@435 | 125 | testl(pop_cond, JavaThread::popframe_pending_bit); |
duke@435 | 126 | jcc(Assembler::zero, L); |
duke@435 | 127 | testl(pop_cond, JavaThread::popframe_processing_bit); |
duke@435 | 128 | jcc(Assembler::notZero, L); |
duke@435 | 129 | // Call Interpreter::remove_activation_preserving_args_entry() to get the |
duke@435 | 130 | // address of the same-named entrypoint in the generated interpreter code. |
duke@435 | 131 | call_VM_leaf(CAST_FROM_FN_PTR(address, Interpreter::remove_activation_preserving_args_entry)); |
duke@435 | 132 | jmp(rax); |
duke@435 | 133 | bind(L); |
duke@435 | 134 | get_thread(java_thread); |
duke@435 | 135 | } |
duke@435 | 136 | } |
duke@435 | 137 | |
duke@435 | 138 | |
duke@435 | 139 | void InterpreterMacroAssembler::load_earlyret_value(TosState state) { |
duke@435 | 140 | get_thread(rcx); |
duke@435 | 141 | movl(rcx, Address(rcx, JavaThread::jvmti_thread_state_offset())); |
duke@435 | 142 | const Address tos_addr (rcx, JvmtiThreadState::earlyret_tos_offset()); |
duke@435 | 143 | const Address oop_addr (rcx, JvmtiThreadState::earlyret_oop_offset()); |
duke@435 | 144 | const Address val_addr (rcx, JvmtiThreadState::earlyret_value_offset()); |
duke@435 | 145 | const Address val_addr1(rcx, JvmtiThreadState::earlyret_value_offset() |
duke@435 | 146 | + in_ByteSize(wordSize)); |
duke@435 | 147 | switch (state) { |
never@739 | 148 | case atos: movptr(rax, oop_addr); |
xlu@947 | 149 | movptr(oop_addr, NULL_WORD); |
duke@435 | 150 | verify_oop(rax, state); break; |
never@739 | 151 | case ltos: |
never@739 | 152 | movl(rdx, val_addr1); // fall through |
duke@435 | 153 | case btos: // fall through |
duke@435 | 154 | case ctos: // fall through |
duke@435 | 155 | case stos: // fall through |
duke@435 | 156 | case itos: movl(rax, val_addr); break; |
duke@435 | 157 | case ftos: fld_s(val_addr); break; |
duke@435 | 158 | case dtos: fld_d(val_addr); break; |
duke@435 | 159 | case vtos: /* nothing to do */ break; |
duke@435 | 160 | default : ShouldNotReachHere(); |
duke@435 | 161 | } |
duke@435 | 162 | // Clean up tos value in the thread object |
never@739 | 163 | movl(tos_addr, (int32_t) ilgl); |
xlu@947 | 164 | movptr(val_addr, NULL_WORD); |
xlu@968 | 165 | NOT_LP64(movptr(val_addr1, NULL_WORD)); |
duke@435 | 166 | } |
duke@435 | 167 | |
duke@435 | 168 | |
duke@435 | 169 | void InterpreterMacroAssembler::check_and_handle_earlyret(Register java_thread) { |
duke@435 | 170 | if (JvmtiExport::can_force_early_return()) { |
duke@435 | 171 | Label L; |
duke@435 | 172 | Register tmp = java_thread; |
never@739 | 173 | movptr(tmp, Address(tmp, JavaThread::jvmti_thread_state_offset())); |
never@739 | 174 | testptr(tmp, tmp); |
duke@435 | 175 | jcc(Assembler::zero, L); // if (thread->jvmti_thread_state() == NULL) exit; |
duke@435 | 176 | |
duke@435 | 177 | // Initiate earlyret handling only if it is not already being processed. |
duke@435 | 178 | // If the flag has the earlyret_processing bit set, it means that this code |
duke@435 | 179 | // is called *during* earlyret handling - we don't want to reenter. |
duke@435 | 180 | movl(tmp, Address(tmp, JvmtiThreadState::earlyret_state_offset())); |
duke@435 | 181 | cmpl(tmp, JvmtiThreadState::earlyret_pending); |
duke@435 | 182 | jcc(Assembler::notEqual, L); |
duke@435 | 183 | |
duke@435 | 184 | // Call Interpreter::remove_activation_early_entry() to get the address of the |
duke@435 | 185 | // same-named entrypoint in the generated interpreter code. |
duke@435 | 186 | get_thread(java_thread); |
never@739 | 187 | movptr(tmp, Address(java_thread, JavaThread::jvmti_thread_state_offset())); |
duke@435 | 188 | pushl(Address(tmp, JvmtiThreadState::earlyret_tos_offset())); |
duke@435 | 189 | call_VM_leaf(CAST_FROM_FN_PTR(address, Interpreter::remove_activation_early_entry), 1); |
duke@435 | 190 | jmp(rax); |
duke@435 | 191 | bind(L); |
duke@435 | 192 | get_thread(java_thread); |
duke@435 | 193 | } |
duke@435 | 194 | } |
duke@435 | 195 | |
duke@435 | 196 | |
duke@435 | 197 | void InterpreterMacroAssembler::get_unsigned_2_byte_index_at_bcp(Register reg, int bcp_offset) { |
duke@435 | 198 | assert(bcp_offset >= 0, "bcp is still pointing to start of bytecode"); |
duke@435 | 199 | movl(reg, Address(rsi, bcp_offset)); |
never@739 | 200 | bswapl(reg); |
duke@435 | 201 | shrl(reg, 16); |
duke@435 | 202 | } |
duke@435 | 203 | |
duke@435 | 204 | |
jrose@1920 | 205 | void InterpreterMacroAssembler::get_cache_index_at_bcp(Register reg, int bcp_offset, size_t index_size) { |
duke@435 | 206 | assert(bcp_offset > 0, "bcp is still pointing to start of bytecode"); |
jrose@1920 | 207 | if (index_size == sizeof(u2)) { |
jrose@1161 | 208 | load_unsigned_short(reg, Address(rsi, bcp_offset)); |
jrose@1920 | 209 | } else if (index_size == sizeof(u4)) { |
twisti@2698 | 210 | assert(EnableInvokeDynamic, "giant index used only for JSR 292"); |
jrose@1161 | 211 | movl(reg, Address(rsi, bcp_offset)); |
twisti@1543 | 212 | // Check if the secondary index definition is still ~x, otherwise |
twisti@1543 | 213 | // we have to change the following assembler code to calculate the |
twisti@1543 | 214 | // plain index. |
coleenp@4037 | 215 | assert(ConstantPool::decode_invokedynamic_index(~123) == 123, "else change next line"); |
jrose@1161 | 216 | notl(reg); // convert to plain index |
jrose@1920 | 217 | } else if (index_size == sizeof(u1)) { |
jrose@1920 | 218 | load_unsigned_byte(reg, Address(rsi, bcp_offset)); |
jrose@1920 | 219 | } else { |
jrose@1920 | 220 | ShouldNotReachHere(); |
jrose@1161 | 221 | } |
jrose@1161 | 222 | } |
jrose@1161 | 223 | |
jrose@1161 | 224 | |
jrose@1161 | 225 | void InterpreterMacroAssembler::get_cache_and_index_at_bcp(Register cache, Register index, |
jrose@1920 | 226 | int bcp_offset, size_t index_size) { |
twisti@3050 | 227 | assert_different_registers(cache, index); |
jrose@1920 | 228 | get_cache_index_at_bcp(index, bcp_offset, index_size); |
never@739 | 229 | movptr(cache, Address(rbp, frame::interpreter_frame_cache_offset * wordSize)); |
duke@435 | 230 | assert(sizeof(ConstantPoolCacheEntry) == 4*wordSize, "adjust code below"); |
coleenp@4037 | 231 | assert(exact_log2(in_words(ConstantPoolCacheEntry::size())) == 2, "else change next line"); |
never@739 | 232 | shlptr(index, 2); // convert from field index to ConstantPoolCacheEntry index |
duke@435 | 233 | } |
duke@435 | 234 | |
duke@435 | 235 | |
twisti@3050 | 236 | void InterpreterMacroAssembler::get_cache_and_index_and_bytecode_at_bcp(Register cache, |
twisti@3050 | 237 | Register index, |
twisti@3050 | 238 | Register bytecode, |
twisti@3050 | 239 | int byte_no, |
twisti@3050 | 240 | int bcp_offset, |
twisti@3050 | 241 | size_t index_size) { |
twisti@3050 | 242 | get_cache_and_index_at_bcp(cache, index, bcp_offset, index_size); |
coleenp@4037 | 243 | movptr(bytecode, Address(cache, index, Address::times_ptr, ConstantPoolCache::base_offset() + ConstantPoolCacheEntry::indices_offset())); |
twisti@3050 | 244 | const int shift_count = (1 + byte_no) * BitsPerByte; |
twisti@3969 | 245 | assert((byte_no == TemplateTable::f1_byte && shift_count == ConstantPoolCacheEntry::bytecode_1_shift) || |
twisti@3969 | 246 | (byte_no == TemplateTable::f2_byte && shift_count == ConstantPoolCacheEntry::bytecode_2_shift), |
twisti@3969 | 247 | "correct shift count"); |
twisti@3050 | 248 | shrptr(bytecode, shift_count); |
twisti@3969 | 249 | assert(ConstantPoolCacheEntry::bytecode_1_mask == ConstantPoolCacheEntry::bytecode_2_mask, "common mask"); |
twisti@3969 | 250 | andptr(bytecode, ConstantPoolCacheEntry::bytecode_1_mask); |
twisti@3050 | 251 | } |
twisti@3050 | 252 | |
twisti@3050 | 253 | |
jrose@1161 | 254 | void InterpreterMacroAssembler::get_cache_entry_pointer_at_bcp(Register cache, Register tmp, |
jrose@1920 | 255 | int bcp_offset, size_t index_size) { |
duke@435 | 256 | assert(cache != tmp, "must use different register"); |
jrose@1920 | 257 | get_cache_index_at_bcp(tmp, bcp_offset, index_size); |
duke@435 | 258 | assert(sizeof(ConstantPoolCacheEntry) == 4*wordSize, "adjust code below"); |
duke@435 | 259 | // convert from field index to ConstantPoolCacheEntry index |
duke@435 | 260 | // and from word offset to byte offset |
coleenp@4037 | 261 | assert(exact_log2(in_bytes(ConstantPoolCacheEntry::size_in_bytes())) == 2 + LogBytesPerWord, "else change next line"); |
duke@435 | 262 | shll(tmp, 2 + LogBytesPerWord); |
never@739 | 263 | movptr(cache, Address(rbp, frame::interpreter_frame_cache_offset * wordSize)); |
duke@435 | 264 | // skip past the header |
coleenp@4037 | 265 | addptr(cache, in_bytes(ConstantPoolCache::base_offset())); |
never@739 | 266 | addptr(cache, tmp); // construct pointer to cache entry |
duke@435 | 267 | } |
duke@435 | 268 | |
coleenp@4037 | 269 | // Load object from cpool->resolved_references(index) |
coleenp@4037 | 270 | void InterpreterMacroAssembler::load_resolved_reference_at_index( |
coleenp@4037 | 271 | Register result, Register index) { |
coleenp@4037 | 272 | assert_different_registers(result, index); |
coleenp@4037 | 273 | // convert from field index to resolved_references() index and from |
coleenp@4037 | 274 | // word index to byte offset. Since this is a java object, it can be compressed |
coleenp@4037 | 275 | Register tmp = index; // reuse |
coleenp@4037 | 276 | shll(tmp, LogBytesPerHeapOop); |
coleenp@4037 | 277 | |
coleenp@4037 | 278 | get_constant_pool(result); |
coleenp@4037 | 279 | // load pointer for resolved_references[] objArray |
coleenp@4037 | 280 | movptr(result, Address(result, ConstantPool::resolved_references_offset_in_bytes())); |
coleenp@4037 | 281 | // JNIHandles::resolve(obj); |
coleenp@4037 | 282 | movptr(result, Address(result, 0)); |
coleenp@4037 | 283 | // Add in the index |
coleenp@4037 | 284 | addptr(result, tmp); |
coleenp@4037 | 285 | load_heap_oop(result, Address(result, arrayOopDesc::base_offset_in_bytes(T_OBJECT))); |
coleenp@4037 | 286 | } |
duke@435 | 287 | |
duke@435 | 288 | // Generate a subtype check: branch to ok_is_subtype if sub_klass is |
duke@435 | 289 | // a subtype of super_klass. EAX holds the super_klass. Blows ECX. |
duke@435 | 290 | // Resets EDI to locals. Register sub_klass cannot be any of the above. |
duke@435 | 291 | void InterpreterMacroAssembler::gen_subtype_check( Register Rsub_klass, Label &ok_is_subtype ) { |
duke@435 | 292 | assert( Rsub_klass != rax, "rax, holds superklass" ); |
jrose@1079 | 293 | assert( Rsub_klass != rcx, "used as a temp" ); |
jrose@1079 | 294 | assert( Rsub_klass != rdi, "used as a temp, restored from locals" ); |
duke@435 | 295 | |
duke@435 | 296 | // Profile the not-null value's klass. |
jrose@1079 | 297 | profile_typecheck(rcx, Rsub_klass, rdi); // blows rcx, reloads rdi |
duke@435 | 298 | |
jrose@1079 | 299 | // Do the check. |
jrose@1079 | 300 | check_klass_subtype(Rsub_klass, rax, rcx, ok_is_subtype); // blows rcx |
duke@435 | 301 | |
jrose@1079 | 302 | // Profile the failure of the check. |
duke@435 | 303 | profile_typecheck_failed(rcx); // blows rcx |
duke@435 | 304 | } |
duke@435 | 305 | |
duke@435 | 306 | void InterpreterMacroAssembler::f2ieee() { |
duke@435 | 307 | if (IEEEPrecision) { |
duke@435 | 308 | fstp_s(Address(rsp, 0)); |
duke@435 | 309 | fld_s(Address(rsp, 0)); |
duke@435 | 310 | } |
duke@435 | 311 | } |
duke@435 | 312 | |
duke@435 | 313 | |
duke@435 | 314 | void InterpreterMacroAssembler::d2ieee() { |
duke@435 | 315 | if (IEEEPrecision) { |
duke@435 | 316 | fstp_d(Address(rsp, 0)); |
duke@435 | 317 | fld_d(Address(rsp, 0)); |
duke@435 | 318 | } |
duke@435 | 319 | } |
duke@435 | 320 | |
duke@435 | 321 | // Java Expression Stack |
duke@435 | 322 | |
duke@435 | 323 | void InterpreterMacroAssembler::pop_ptr(Register r) { |
never@739 | 324 | pop(r); |
duke@435 | 325 | } |
duke@435 | 326 | |
duke@435 | 327 | void InterpreterMacroAssembler::pop_i(Register r) { |
never@739 | 328 | pop(r); |
duke@435 | 329 | } |
duke@435 | 330 | |
duke@435 | 331 | void InterpreterMacroAssembler::pop_l(Register lo, Register hi) { |
never@739 | 332 | pop(lo); |
never@739 | 333 | pop(hi); |
duke@435 | 334 | } |
duke@435 | 335 | |
duke@435 | 336 | void InterpreterMacroAssembler::pop_f() { |
duke@435 | 337 | fld_s(Address(rsp, 0)); |
never@739 | 338 | addptr(rsp, 1 * wordSize); |
duke@435 | 339 | } |
duke@435 | 340 | |
duke@435 | 341 | void InterpreterMacroAssembler::pop_d() { |
duke@435 | 342 | fld_d(Address(rsp, 0)); |
never@739 | 343 | addptr(rsp, 2 * wordSize); |
duke@435 | 344 | } |
duke@435 | 345 | |
duke@435 | 346 | |
duke@435 | 347 | void InterpreterMacroAssembler::pop(TosState state) { |
duke@435 | 348 | switch (state) { |
duke@435 | 349 | case atos: pop_ptr(rax); break; |
duke@435 | 350 | case btos: // fall through |
duke@435 | 351 | case ctos: // fall through |
duke@435 | 352 | case stos: // fall through |
duke@435 | 353 | case itos: pop_i(rax); break; |
duke@435 | 354 | case ltos: pop_l(rax, rdx); break; |
duke@435 | 355 | case ftos: pop_f(); break; |
duke@435 | 356 | case dtos: pop_d(); break; |
duke@435 | 357 | case vtos: /* nothing to do */ break; |
duke@435 | 358 | default : ShouldNotReachHere(); |
duke@435 | 359 | } |
duke@435 | 360 | verify_oop(rax, state); |
duke@435 | 361 | } |
duke@435 | 362 | |
duke@435 | 363 | void InterpreterMacroAssembler::push_ptr(Register r) { |
never@739 | 364 | push(r); |
duke@435 | 365 | } |
duke@435 | 366 | |
duke@435 | 367 | void InterpreterMacroAssembler::push_i(Register r) { |
never@739 | 368 | push(r); |
duke@435 | 369 | } |
duke@435 | 370 | |
duke@435 | 371 | void InterpreterMacroAssembler::push_l(Register lo, Register hi) { |
never@739 | 372 | push(hi); |
never@739 | 373 | push(lo); |
duke@435 | 374 | } |
duke@435 | 375 | |
duke@435 | 376 | void InterpreterMacroAssembler::push_f() { |
duke@435 | 377 | // Do not schedule for no AGI! Never write beyond rsp! |
never@739 | 378 | subptr(rsp, 1 * wordSize); |
duke@435 | 379 | fstp_s(Address(rsp, 0)); |
duke@435 | 380 | } |
duke@435 | 381 | |
duke@435 | 382 | void InterpreterMacroAssembler::push_d(Register r) { |
twisti@1861 | 383 | // Do not schedule for no AGI! Never write beyond rsp! |
twisti@1861 | 384 | subptr(rsp, 2 * wordSize); |
twisti@1861 | 385 | fstp_d(Address(rsp, 0)); |
duke@435 | 386 | } |
duke@435 | 387 | |
duke@435 | 388 | |
duke@435 | 389 | void InterpreterMacroAssembler::push(TosState state) { |
duke@435 | 390 | verify_oop(rax, state); |
duke@435 | 391 | switch (state) { |
duke@435 | 392 | case atos: push_ptr(rax); break; |
duke@435 | 393 | case btos: // fall through |
duke@435 | 394 | case ctos: // fall through |
duke@435 | 395 | case stos: // fall through |
duke@435 | 396 | case itos: push_i(rax); break; |
duke@435 | 397 | case ltos: push_l(rax, rdx); break; |
duke@435 | 398 | case ftos: push_f(); break; |
duke@435 | 399 | case dtos: push_d(rax); break; |
duke@435 | 400 | case vtos: /* nothing to do */ break; |
duke@435 | 401 | default : ShouldNotReachHere(); |
duke@435 | 402 | } |
duke@435 | 403 | } |
duke@435 | 404 | |
duke@435 | 405 | |
twisti@1861 | 406 | // Helpers for swap and dup |
twisti@1861 | 407 | void InterpreterMacroAssembler::load_ptr(int n, Register val) { |
never@739 | 408 | movptr(val, Address(rsp, Interpreter::expr_offset_in_bytes(n))); |
duke@435 | 409 | } |
duke@435 | 410 | |
twisti@1861 | 411 | void InterpreterMacroAssembler::store_ptr(int n, Register val) { |
never@739 | 412 | movptr(Address(rsp, Interpreter::expr_offset_in_bytes(n)), val); |
duke@435 | 413 | } |
duke@435 | 414 | |
jrose@1145 | 415 | void InterpreterMacroAssembler::prepare_to_jump_from_interpreted() { |
duke@435 | 416 | // set sender sp |
never@739 | 417 | lea(rsi, Address(rsp, wordSize)); |
duke@435 | 418 | // record last_sp |
never@739 | 419 | movptr(Address(rbp, frame::interpreter_frame_last_sp_offset * wordSize), rsi); |
jrose@1145 | 420 | } |
jrose@1145 | 421 | |
jrose@1145 | 422 | |
jrose@1145 | 423 | // Jump to from_interpreted entry of a call unless single stepping is possible |
jrose@1145 | 424 | // in this thread in which case we must call the i2i entry |
jrose@1145 | 425 | void InterpreterMacroAssembler::jump_from_interpreted(Register method, Register temp) { |
jrose@1145 | 426 | prepare_to_jump_from_interpreted(); |
duke@435 | 427 | |
duke@435 | 428 | if (JvmtiExport::can_post_interpreter_events()) { |
duke@435 | 429 | Label run_compiled_code; |
duke@435 | 430 | // JVMTI events, such as single-stepping, are implemented partly by avoiding running |
duke@435 | 431 | // compiled code in threads for which the event is enabled. Check here for |
duke@435 | 432 | // interp_only_mode if these events CAN be enabled. |
duke@435 | 433 | get_thread(temp); |
duke@435 | 434 | // interp_only is an int, on little endian it is sufficient to test the byte only |
never@3005 | 435 | // Is a cmpl faster? |
duke@435 | 436 | cmpb(Address(temp, JavaThread::interp_only_mode_offset()), 0); |
never@3005 | 437 | jccb(Assembler::zero, run_compiled_code); |
coleenp@4037 | 438 | jmp(Address(method, Method::interpreter_entry_offset())); |
duke@435 | 439 | bind(run_compiled_code); |
duke@435 | 440 | } |
duke@435 | 441 | |
coleenp@4037 | 442 | jmp(Address(method, Method::from_interpreted_offset())); |
duke@435 | 443 | |
duke@435 | 444 | } |
duke@435 | 445 | |
duke@435 | 446 | |
duke@435 | 447 | // The following two routines provide a hook so that an implementation |
duke@435 | 448 | // can schedule the dispatch in two parts. Intel does not do this. |
duke@435 | 449 | void InterpreterMacroAssembler::dispatch_prolog(TosState state, int step) { |
duke@435 | 450 | // Nothing Intel-specific to be done here. |
duke@435 | 451 | } |
duke@435 | 452 | |
duke@435 | 453 | void InterpreterMacroAssembler::dispatch_epilog(TosState state, int step) { |
duke@435 | 454 | dispatch_next(state, step); |
duke@435 | 455 | } |
duke@435 | 456 | |
duke@435 | 457 | void InterpreterMacroAssembler::dispatch_base(TosState state, address* table, |
duke@435 | 458 | bool verifyoop) { |
duke@435 | 459 | verify_FPU(1, state); |
duke@435 | 460 | if (VerifyActivationFrameSize) { |
duke@435 | 461 | Label L; |
never@739 | 462 | mov(rcx, rbp); |
never@739 | 463 | subptr(rcx, rsp); |
duke@435 | 464 | int min_frame_size = (frame::link_offset - frame::interpreter_frame_initial_sp_offset) * wordSize; |
never@739 | 465 | cmpptr(rcx, min_frame_size); |
duke@435 | 466 | jcc(Assembler::greaterEqual, L); |
duke@435 | 467 | stop("broken stack frame"); |
duke@435 | 468 | bind(L); |
duke@435 | 469 | } |
duke@435 | 470 | if (verifyoop) verify_oop(rax, state); |
never@739 | 471 | Address index(noreg, rbx, Address::times_ptr); |
duke@435 | 472 | ExternalAddress tbl((address)table); |
duke@435 | 473 | ArrayAddress dispatch(tbl, index); |
duke@435 | 474 | jump(dispatch); |
duke@435 | 475 | } |
duke@435 | 476 | |
duke@435 | 477 | |
duke@435 | 478 | void InterpreterMacroAssembler::dispatch_only(TosState state) { |
duke@435 | 479 | dispatch_base(state, Interpreter::dispatch_table(state)); |
duke@435 | 480 | } |
duke@435 | 481 | |
duke@435 | 482 | |
duke@435 | 483 | void InterpreterMacroAssembler::dispatch_only_normal(TosState state) { |
duke@435 | 484 | dispatch_base(state, Interpreter::normal_table(state)); |
duke@435 | 485 | } |
duke@435 | 486 | |
duke@435 | 487 | void InterpreterMacroAssembler::dispatch_only_noverify(TosState state) { |
duke@435 | 488 | dispatch_base(state, Interpreter::normal_table(state), false); |
duke@435 | 489 | } |
duke@435 | 490 | |
duke@435 | 491 | |
duke@435 | 492 | void InterpreterMacroAssembler::dispatch_next(TosState state, int step) { |
duke@435 | 493 | // load next bytecode (load before advancing rsi to prevent AGI) |
duke@435 | 494 | load_unsigned_byte(rbx, Address(rsi, step)); |
duke@435 | 495 | // advance rsi |
duke@435 | 496 | increment(rsi, step); |
duke@435 | 497 | dispatch_base(state, Interpreter::dispatch_table(state)); |
duke@435 | 498 | } |
duke@435 | 499 | |
duke@435 | 500 | |
duke@435 | 501 | void InterpreterMacroAssembler::dispatch_via(TosState state, address* table) { |
duke@435 | 502 | // load current bytecode |
duke@435 | 503 | load_unsigned_byte(rbx, Address(rsi, 0)); |
duke@435 | 504 | dispatch_base(state, table); |
duke@435 | 505 | } |
duke@435 | 506 | |
duke@435 | 507 | // remove activation |
duke@435 | 508 | // |
duke@435 | 509 | // Unlock the receiver if this is a synchronized method. |
duke@435 | 510 | // Unlock any Java monitors from syncronized blocks. |
duke@435 | 511 | // Remove the activation from the stack. |
duke@435 | 512 | // |
duke@435 | 513 | // If there are locked Java monitors |
duke@435 | 514 | // If throw_monitor_exception |
duke@435 | 515 | // throws IllegalMonitorStateException |
duke@435 | 516 | // Else if install_monitor_exception |
duke@435 | 517 | // installs IllegalMonitorStateException |
duke@435 | 518 | // Else |
duke@435 | 519 | // no error processing |
duke@435 | 520 | void InterpreterMacroAssembler::remove_activation(TosState state, Register ret_addr, |
duke@435 | 521 | bool throw_monitor_exception, |
duke@435 | 522 | bool install_monitor_exception, |
duke@435 | 523 | bool notify_jvmdi) { |
duke@435 | 524 | // Note: Registers rax, rdx and FPU ST(0) may be in use for the result |
duke@435 | 525 | // check if synchronized method |
duke@435 | 526 | Label unlocked, unlock, no_unlock; |
duke@435 | 527 | |
duke@435 | 528 | get_thread(rcx); |
duke@435 | 529 | const Address do_not_unlock_if_synchronized(rcx, |
duke@435 | 530 | in_bytes(JavaThread::do_not_unlock_if_synchronized_offset())); |
duke@435 | 531 | |
duke@435 | 532 | movbool(rbx, do_not_unlock_if_synchronized); |
never@739 | 533 | mov(rdi,rbx); |
duke@435 | 534 | movbool(do_not_unlock_if_synchronized, false); // reset the flag |
duke@435 | 535 | |
never@739 | 536 | movptr(rbx, Address(rbp, frame::interpreter_frame_method_offset * wordSize)); // get method access flags |
coleenp@4037 | 537 | movl(rcx, Address(rbx, Method::access_flags_offset())); |
duke@435 | 538 | |
duke@435 | 539 | testl(rcx, JVM_ACC_SYNCHRONIZED); |
duke@435 | 540 | jcc(Assembler::zero, unlocked); |
duke@435 | 541 | |
duke@435 | 542 | // Don't unlock anything if the _do_not_unlock_if_synchronized flag |
duke@435 | 543 | // is set. |
never@739 | 544 | mov(rcx,rdi); |
duke@435 | 545 | testbool(rcx); |
duke@435 | 546 | jcc(Assembler::notZero, no_unlock); |
duke@435 | 547 | |
duke@435 | 548 | // unlock monitor |
duke@435 | 549 | push(state); // save result |
duke@435 | 550 | |
duke@435 | 551 | // BasicObjectLock will be first in list, since this is a synchronized method. However, need |
duke@435 | 552 | // to check that the object has not been unlocked by an explicit monitorexit bytecode. |
duke@435 | 553 | const Address monitor(rbp, frame::interpreter_frame_initial_sp_offset * wordSize - (int)sizeof(BasicObjectLock)); |
never@739 | 554 | lea (rdx, monitor); // address of first monitor |
duke@435 | 555 | |
never@739 | 556 | movptr (rax, Address(rdx, BasicObjectLock::obj_offset_in_bytes())); |
never@739 | 557 | testptr(rax, rax); |
never@739 | 558 | jcc (Assembler::notZero, unlock); |
duke@435 | 559 | |
duke@435 | 560 | pop(state); |
duke@435 | 561 | if (throw_monitor_exception) { |
duke@435 | 562 | empty_FPU_stack(); // remove possible return value from FPU-stack, otherwise stack could overflow |
duke@435 | 563 | |
duke@435 | 564 | // Entry already unlocked, need to throw exception |
duke@435 | 565 | call_VM(noreg, CAST_FROM_FN_PTR(address, InterpreterRuntime::throw_illegal_monitor_state_exception)); |
duke@435 | 566 | should_not_reach_here(); |
duke@435 | 567 | } else { |
duke@435 | 568 | // Monitor already unlocked during a stack unroll. |
duke@435 | 569 | // If requested, install an illegal_monitor_state_exception. |
duke@435 | 570 | // Continue with stack unrolling. |
duke@435 | 571 | if (install_monitor_exception) { |
duke@435 | 572 | empty_FPU_stack(); // remove possible return value from FPU-stack, otherwise stack could overflow |
duke@435 | 573 | call_VM(noreg, CAST_FROM_FN_PTR(address, InterpreterRuntime::new_illegal_monitor_state_exception)); |
duke@435 | 574 | } |
duke@435 | 575 | jmp(unlocked); |
duke@435 | 576 | } |
duke@435 | 577 | |
duke@435 | 578 | bind(unlock); |
duke@435 | 579 | unlock_object(rdx); |
duke@435 | 580 | pop(state); |
duke@435 | 581 | |
duke@435 | 582 | // Check that for block-structured locking (i.e., that all locked objects has been unlocked) |
duke@435 | 583 | bind(unlocked); |
duke@435 | 584 | |
duke@435 | 585 | // rax, rdx: Might contain return value |
duke@435 | 586 | |
duke@435 | 587 | // Check that all monitors are unlocked |
duke@435 | 588 | { |
duke@435 | 589 | Label loop, exception, entry, restart; |
duke@435 | 590 | const int entry_size = frame::interpreter_frame_monitor_size() * wordSize; |
duke@435 | 591 | const Address monitor_block_top(rbp, frame::interpreter_frame_monitor_block_top_offset * wordSize); |
duke@435 | 592 | const Address monitor_block_bot(rbp, frame::interpreter_frame_initial_sp_offset * wordSize); |
duke@435 | 593 | |
duke@435 | 594 | bind(restart); |
never@739 | 595 | movptr(rcx, monitor_block_top); // points to current entry, starting with top-most entry |
never@739 | 596 | lea(rbx, monitor_block_bot); // points to word before bottom of monitor block |
duke@435 | 597 | jmp(entry); |
duke@435 | 598 | |
duke@435 | 599 | // Entry already locked, need to throw exception |
duke@435 | 600 | bind(exception); |
duke@435 | 601 | |
duke@435 | 602 | if (throw_monitor_exception) { |
duke@435 | 603 | empty_FPU_stack(); // remove possible return value from FPU-stack, otherwise stack could overflow |
duke@435 | 604 | |
duke@435 | 605 | // Throw exception |
duke@435 | 606 | call_VM(noreg, CAST_FROM_FN_PTR(address, InterpreterRuntime::throw_illegal_monitor_state_exception)); |
duke@435 | 607 | should_not_reach_here(); |
duke@435 | 608 | } else { |
duke@435 | 609 | // Stack unrolling. Unlock object and install illegal_monitor_exception |
duke@435 | 610 | // Unlock does not block, so don't have to worry about the frame |
duke@435 | 611 | |
duke@435 | 612 | push(state); |
never@739 | 613 | mov(rdx, rcx); |
duke@435 | 614 | unlock_object(rdx); |
duke@435 | 615 | pop(state); |
duke@435 | 616 | |
duke@435 | 617 | if (install_monitor_exception) { |
duke@435 | 618 | empty_FPU_stack(); // remove possible return value from FPU-stack, otherwise stack could overflow |
duke@435 | 619 | call_VM(noreg, CAST_FROM_FN_PTR(address, InterpreterRuntime::new_illegal_monitor_state_exception)); |
duke@435 | 620 | } |
duke@435 | 621 | |
duke@435 | 622 | jmp(restart); |
duke@435 | 623 | } |
duke@435 | 624 | |
duke@435 | 625 | bind(loop); |
never@739 | 626 | cmpptr(Address(rcx, BasicObjectLock::obj_offset_in_bytes()), (int32_t)NULL_WORD); // check if current entry is used |
duke@435 | 627 | jcc(Assembler::notEqual, exception); |
duke@435 | 628 | |
never@739 | 629 | addptr(rcx, entry_size); // otherwise advance to next entry |
duke@435 | 630 | bind(entry); |
never@739 | 631 | cmpptr(rcx, rbx); // check if bottom reached |
duke@435 | 632 | jcc(Assembler::notEqual, loop); // if not at bottom then check this entry |
duke@435 | 633 | } |
duke@435 | 634 | |
duke@435 | 635 | bind(no_unlock); |
duke@435 | 636 | |
duke@435 | 637 | // jvmti support |
duke@435 | 638 | if (notify_jvmdi) { |
duke@435 | 639 | notify_method_exit(state, NotifyJVMTI); // preserve TOSCA |
duke@435 | 640 | } else { |
duke@435 | 641 | notify_method_exit(state, SkipNotifyJVMTI); // preserve TOSCA |
duke@435 | 642 | } |
duke@435 | 643 | |
duke@435 | 644 | // remove activation |
never@739 | 645 | movptr(rbx, Address(rbp, frame::interpreter_frame_sender_sp_offset * wordSize)); // get sender sp |
duke@435 | 646 | leave(); // remove frame anchor |
never@739 | 647 | pop(ret_addr); // get return address |
never@739 | 648 | mov(rsp, rbx); // set sp to sender sp |
duke@435 | 649 | if (UseSSE) { |
duke@435 | 650 | // float and double are returned in xmm register in SSE-mode |
duke@435 | 651 | if (state == ftos && UseSSE >= 1) { |
never@739 | 652 | subptr(rsp, wordSize); |
duke@435 | 653 | fstp_s(Address(rsp, 0)); |
duke@435 | 654 | movflt(xmm0, Address(rsp, 0)); |
never@739 | 655 | addptr(rsp, wordSize); |
duke@435 | 656 | } else if (state == dtos && UseSSE >= 2) { |
never@739 | 657 | subptr(rsp, 2*wordSize); |
duke@435 | 658 | fstp_d(Address(rsp, 0)); |
duke@435 | 659 | movdbl(xmm0, Address(rsp, 0)); |
never@739 | 660 | addptr(rsp, 2*wordSize); |
duke@435 | 661 | } |
duke@435 | 662 | } |
duke@435 | 663 | } |
duke@435 | 664 | |
duke@435 | 665 | #endif /* !CC_INTERP */ |
duke@435 | 666 | |
duke@435 | 667 | |
duke@435 | 668 | // Lock object |
duke@435 | 669 | // |
duke@435 | 670 | // Argument: rdx : Points to BasicObjectLock to be used for locking. Must |
duke@435 | 671 | // be initialized with object to lock |
duke@435 | 672 | void InterpreterMacroAssembler::lock_object(Register lock_reg) { |
duke@435 | 673 | assert(lock_reg == rdx, "The argument is only for looks. It must be rdx"); |
duke@435 | 674 | |
duke@435 | 675 | if (UseHeavyMonitors) { |
duke@435 | 676 | call_VM(noreg, CAST_FROM_FN_PTR(address, InterpreterRuntime::monitorenter), lock_reg); |
duke@435 | 677 | } else { |
duke@435 | 678 | |
duke@435 | 679 | Label done; |
duke@435 | 680 | |
duke@435 | 681 | const Register swap_reg = rax; // Must use rax, for cmpxchg instruction |
duke@435 | 682 | const Register obj_reg = rcx; // Will contain the oop |
duke@435 | 683 | |
duke@435 | 684 | const int obj_offset = BasicObjectLock::obj_offset_in_bytes(); |
duke@435 | 685 | const int lock_offset = BasicObjectLock::lock_offset_in_bytes (); |
duke@435 | 686 | const int mark_offset = lock_offset + BasicLock::displaced_header_offset_in_bytes(); |
duke@435 | 687 | |
duke@435 | 688 | Label slow_case; |
duke@435 | 689 | |
duke@435 | 690 | // Load object pointer into obj_reg %rcx |
never@739 | 691 | movptr(obj_reg, Address(lock_reg, obj_offset)); |
duke@435 | 692 | |
duke@435 | 693 | if (UseBiasedLocking) { |
duke@435 | 694 | // Note: we use noreg for the temporary register since it's hard |
duke@435 | 695 | // to come up with a free register on all incoming code paths |
duke@435 | 696 | biased_locking_enter(lock_reg, obj_reg, swap_reg, noreg, false, done, &slow_case); |
duke@435 | 697 | } |
duke@435 | 698 | |
duke@435 | 699 | // Load immediate 1 into swap_reg %rax, |
never@739 | 700 | movptr(swap_reg, (int32_t)1); |
duke@435 | 701 | |
duke@435 | 702 | // Load (object->mark() | 1) into swap_reg %rax, |
never@739 | 703 | orptr(swap_reg, Address(obj_reg, 0)); |
duke@435 | 704 | |
duke@435 | 705 | // Save (object->mark() | 1) into BasicLock's displaced header |
never@739 | 706 | movptr(Address(lock_reg, mark_offset), swap_reg); |
duke@435 | 707 | |
duke@435 | 708 | assert(lock_offset == 0, "displached header must be first word in BasicObjectLock"); |
duke@435 | 709 | if (os::is_MP()) { |
duke@435 | 710 | lock(); |
duke@435 | 711 | } |
never@739 | 712 | cmpxchgptr(lock_reg, Address(obj_reg, 0)); |
duke@435 | 713 | if (PrintBiasedLockingStatistics) { |
duke@435 | 714 | cond_inc32(Assembler::zero, |
duke@435 | 715 | ExternalAddress((address) BiasedLocking::fast_path_entry_count_addr())); |
duke@435 | 716 | } |
duke@435 | 717 | jcc(Assembler::zero, done); |
duke@435 | 718 | |
duke@435 | 719 | // Test if the oopMark is an obvious stack pointer, i.e., |
duke@435 | 720 | // 1) (mark & 3) == 0, and |
duke@435 | 721 | // 2) rsp <= mark < mark + os::pagesize() |
duke@435 | 722 | // |
duke@435 | 723 | // These 3 tests can be done by evaluating the following |
duke@435 | 724 | // expression: ((mark - rsp) & (3 - os::vm_page_size())), |
duke@435 | 725 | // assuming both stack pointer and pagesize have their |
duke@435 | 726 | // least significant 2 bits clear. |
duke@435 | 727 | // NOTE: the oopMark is in swap_reg %rax, as the result of cmpxchg |
never@739 | 728 | subptr(swap_reg, rsp); |
never@739 | 729 | andptr(swap_reg, 3 - os::vm_page_size()); |
duke@435 | 730 | |
duke@435 | 731 | // Save the test result, for recursive case, the result is zero |
never@739 | 732 | movptr(Address(lock_reg, mark_offset), swap_reg); |
duke@435 | 733 | |
duke@435 | 734 | if (PrintBiasedLockingStatistics) { |
duke@435 | 735 | cond_inc32(Assembler::zero, |
duke@435 | 736 | ExternalAddress((address) BiasedLocking::fast_path_entry_count_addr())); |
duke@435 | 737 | } |
duke@435 | 738 | jcc(Assembler::zero, done); |
duke@435 | 739 | |
duke@435 | 740 | bind(slow_case); |
duke@435 | 741 | |
duke@435 | 742 | // Call the runtime routine for slow case |
duke@435 | 743 | call_VM(noreg, CAST_FROM_FN_PTR(address, InterpreterRuntime::monitorenter), lock_reg); |
duke@435 | 744 | |
duke@435 | 745 | bind(done); |
duke@435 | 746 | } |
duke@435 | 747 | } |
duke@435 | 748 | |
duke@435 | 749 | |
duke@435 | 750 | // Unlocks an object. Used in monitorexit bytecode and remove_activation. |
duke@435 | 751 | // |
duke@435 | 752 | // Argument: rdx : Points to BasicObjectLock structure for lock |
duke@435 | 753 | // Throw an IllegalMonitorException if object is not locked by current thread |
duke@435 | 754 | // |
duke@435 | 755 | // Uses: rax, rbx, rcx, rdx |
duke@435 | 756 | void InterpreterMacroAssembler::unlock_object(Register lock_reg) { |
duke@435 | 757 | assert(lock_reg == rdx, "The argument is only for looks. It must be rdx"); |
duke@435 | 758 | |
duke@435 | 759 | if (UseHeavyMonitors) { |
duke@435 | 760 | call_VM(noreg, CAST_FROM_FN_PTR(address, InterpreterRuntime::monitorexit), lock_reg); |
duke@435 | 761 | } else { |
duke@435 | 762 | Label done; |
duke@435 | 763 | |
duke@435 | 764 | const Register swap_reg = rax; // Must use rax, for cmpxchg instruction |
duke@435 | 765 | const Register header_reg = rbx; // Will contain the old oopMark |
duke@435 | 766 | const Register obj_reg = rcx; // Will contain the oop |
duke@435 | 767 | |
duke@435 | 768 | save_bcp(); // Save in case of exception |
duke@435 | 769 | |
duke@435 | 770 | // Convert from BasicObjectLock structure to object and BasicLock structure |
duke@435 | 771 | // Store the BasicLock address into %rax, |
never@739 | 772 | lea(swap_reg, Address(lock_reg, BasicObjectLock::lock_offset_in_bytes())); |
duke@435 | 773 | |
duke@435 | 774 | // Load oop into obj_reg(%rcx) |
never@739 | 775 | movptr(obj_reg, Address(lock_reg, BasicObjectLock::obj_offset_in_bytes ())); |
duke@435 | 776 | |
duke@435 | 777 | // Free entry |
xlu@947 | 778 | movptr(Address(lock_reg, BasicObjectLock::obj_offset_in_bytes()), NULL_WORD); |
duke@435 | 779 | |
duke@435 | 780 | if (UseBiasedLocking) { |
duke@435 | 781 | biased_locking_exit(obj_reg, header_reg, done); |
duke@435 | 782 | } |
duke@435 | 783 | |
duke@435 | 784 | // Load the old header from BasicLock structure |
never@739 | 785 | movptr(header_reg, Address(swap_reg, BasicLock::displaced_header_offset_in_bytes())); |
duke@435 | 786 | |
duke@435 | 787 | // Test for recursion |
never@739 | 788 | testptr(header_reg, header_reg); |
duke@435 | 789 | |
duke@435 | 790 | // zero for recursive case |
duke@435 | 791 | jcc(Assembler::zero, done); |
duke@435 | 792 | |
duke@435 | 793 | // Atomic swap back the old header |
duke@435 | 794 | if (os::is_MP()) lock(); |
never@739 | 795 | cmpxchgptr(header_reg, Address(obj_reg, 0)); |
duke@435 | 796 | |
duke@435 | 797 | // zero for recursive case |
duke@435 | 798 | jcc(Assembler::zero, done); |
duke@435 | 799 | |
duke@435 | 800 | // Call the runtime routine for slow case. |
never@739 | 801 | movptr(Address(lock_reg, BasicObjectLock::obj_offset_in_bytes()), obj_reg); // restore obj |
duke@435 | 802 | call_VM(noreg, CAST_FROM_FN_PTR(address, InterpreterRuntime::monitorexit), lock_reg); |
duke@435 | 803 | |
duke@435 | 804 | bind(done); |
duke@435 | 805 | |
duke@435 | 806 | restore_bcp(); |
duke@435 | 807 | } |
duke@435 | 808 | } |
duke@435 | 809 | |
duke@435 | 810 | |
duke@435 | 811 | #ifndef CC_INTERP |
duke@435 | 812 | |
duke@435 | 813 | // Test ImethodDataPtr. If it is null, continue at the specified label |
duke@435 | 814 | void InterpreterMacroAssembler::test_method_data_pointer(Register mdp, Label& zero_continue) { |
duke@435 | 815 | assert(ProfileInterpreter, "must be profiling interpreter"); |
never@739 | 816 | movptr(mdp, Address(rbp, frame::interpreter_frame_mdx_offset * wordSize)); |
never@739 | 817 | testptr(mdp, mdp); |
duke@435 | 818 | jcc(Assembler::zero, zero_continue); |
duke@435 | 819 | } |
duke@435 | 820 | |
duke@435 | 821 | |
duke@435 | 822 | // Set the method data pointer for the current bcp. |
duke@435 | 823 | void InterpreterMacroAssembler::set_method_data_pointer_for_bcp() { |
duke@435 | 824 | assert(ProfileInterpreter, "must be profiling interpreter"); |
iveresov@2438 | 825 | Label set_mdp; |
never@739 | 826 | push(rax); |
never@739 | 827 | push(rbx); |
duke@435 | 828 | |
duke@435 | 829 | get_method(rbx); |
duke@435 | 830 | // Test MDO to avoid the call if it is NULL. |
coleenp@4037 | 831 | movptr(rax, Address(rbx, in_bytes(Method::method_data_offset()))); |
never@739 | 832 | testptr(rax, rax); |
iveresov@2438 | 833 | jcc(Assembler::zero, set_mdp); |
duke@435 | 834 | // rbx,: method |
duke@435 | 835 | // rsi: bcp |
duke@435 | 836 | call_VM_leaf(CAST_FROM_FN_PTR(address, InterpreterRuntime::bcp_to_di), rbx, rsi); |
duke@435 | 837 | // rax,: mdi |
iveresov@2438 | 838 | // mdo is guaranteed to be non-zero here, we checked for it before the call. |
coleenp@4037 | 839 | movptr(rbx, Address(rbx, in_bytes(Method::method_data_offset()))); |
coleenp@4037 | 840 | addptr(rbx, in_bytes(MethodData::data_offset())); |
iveresov@2438 | 841 | addptr(rax, rbx); |
iveresov@2438 | 842 | bind(set_mdp); |
iveresov@2438 | 843 | movptr(Address(rbp, frame::interpreter_frame_mdx_offset * wordSize), rax); |
never@739 | 844 | pop(rbx); |
never@739 | 845 | pop(rax); |
duke@435 | 846 | } |
duke@435 | 847 | |
duke@435 | 848 | void InterpreterMacroAssembler::verify_method_data_pointer() { |
duke@435 | 849 | assert(ProfileInterpreter, "must be profiling interpreter"); |
duke@435 | 850 | #ifdef ASSERT |
duke@435 | 851 | Label verify_continue; |
never@739 | 852 | push(rax); |
never@739 | 853 | push(rbx); |
never@739 | 854 | push(rcx); |
never@739 | 855 | push(rdx); |
duke@435 | 856 | test_method_data_pointer(rcx, verify_continue); // If mdp is zero, continue |
duke@435 | 857 | get_method(rbx); |
duke@435 | 858 | |
duke@435 | 859 | // If the mdp is valid, it will point to a DataLayout header which is |
duke@435 | 860 | // consistent with the bcp. The converse is highly probable also. |
jrose@1057 | 861 | load_unsigned_short(rdx, Address(rcx, in_bytes(DataLayout::bci_offset()))); |
coleenp@4037 | 862 | addptr(rdx, Address(rbx, Method::const_offset())); |
coleenp@4037 | 863 | lea(rdx, Address(rdx, ConstMethod::codes_offset())); |
never@739 | 864 | cmpptr(rdx, rsi); |
duke@435 | 865 | jcc(Assembler::equal, verify_continue); |
duke@435 | 866 | // rbx,: method |
duke@435 | 867 | // rsi: bcp |
duke@435 | 868 | // rcx: mdp |
duke@435 | 869 | call_VM_leaf(CAST_FROM_FN_PTR(address, InterpreterRuntime::verify_mdp), rbx, rsi, rcx); |
duke@435 | 870 | bind(verify_continue); |
never@739 | 871 | pop(rdx); |
never@739 | 872 | pop(rcx); |
never@739 | 873 | pop(rbx); |
never@739 | 874 | pop(rax); |
duke@435 | 875 | #endif // ASSERT |
duke@435 | 876 | } |
duke@435 | 877 | |
duke@435 | 878 | |
duke@435 | 879 | void InterpreterMacroAssembler::set_mdp_data_at(Register mdp_in, int constant, Register value) { |
never@739 | 880 | // %%% this seems to be used to store counter data which is surely 32bits |
never@739 | 881 | // however 64bit side stores 64 bits which seems wrong |
duke@435 | 882 | assert(ProfileInterpreter, "must be profiling interpreter"); |
duke@435 | 883 | Address data(mdp_in, constant); |
never@739 | 884 | movptr(data, value); |
duke@435 | 885 | } |
duke@435 | 886 | |
duke@435 | 887 | |
duke@435 | 888 | void InterpreterMacroAssembler::increment_mdp_data_at(Register mdp_in, |
duke@435 | 889 | int constant, |
duke@435 | 890 | bool decrement) { |
duke@435 | 891 | // Counter address |
duke@435 | 892 | Address data(mdp_in, constant); |
duke@435 | 893 | |
duke@435 | 894 | increment_mdp_data_at(data, decrement); |
duke@435 | 895 | } |
duke@435 | 896 | |
duke@435 | 897 | |
duke@435 | 898 | void InterpreterMacroAssembler::increment_mdp_data_at(Address data, |
duke@435 | 899 | bool decrement) { |
duke@435 | 900 | |
duke@435 | 901 | assert( DataLayout::counter_increment==1, "flow-free idiom only works with 1" ); |
duke@435 | 902 | assert(ProfileInterpreter, "must be profiling interpreter"); |
duke@435 | 903 | |
never@739 | 904 | // %%% 64bit treats this as 64 bit which seems unlikely |
duke@435 | 905 | if (decrement) { |
duke@435 | 906 | // Decrement the register. Set condition codes. |
duke@435 | 907 | addl(data, -DataLayout::counter_increment); |
duke@435 | 908 | // If the decrement causes the counter to overflow, stay negative |
duke@435 | 909 | Label L; |
duke@435 | 910 | jcc(Assembler::negative, L); |
duke@435 | 911 | addl(data, DataLayout::counter_increment); |
duke@435 | 912 | bind(L); |
duke@435 | 913 | } else { |
duke@435 | 914 | assert(DataLayout::counter_increment == 1, |
duke@435 | 915 | "flow-free idiom only works with 1"); |
duke@435 | 916 | // Increment the register. Set carry flag. |
duke@435 | 917 | addl(data, DataLayout::counter_increment); |
duke@435 | 918 | // If the increment causes the counter to overflow, pull back by 1. |
duke@435 | 919 | sbbl(data, 0); |
duke@435 | 920 | } |
duke@435 | 921 | } |
duke@435 | 922 | |
duke@435 | 923 | |
duke@435 | 924 | void InterpreterMacroAssembler::increment_mdp_data_at(Register mdp_in, |
duke@435 | 925 | Register reg, |
duke@435 | 926 | int constant, |
duke@435 | 927 | bool decrement) { |
duke@435 | 928 | Address data(mdp_in, reg, Address::times_1, constant); |
duke@435 | 929 | |
duke@435 | 930 | increment_mdp_data_at(data, decrement); |
duke@435 | 931 | } |
duke@435 | 932 | |
duke@435 | 933 | |
duke@435 | 934 | void InterpreterMacroAssembler::set_mdp_flag_at(Register mdp_in, int flag_byte_constant) { |
duke@435 | 935 | assert(ProfileInterpreter, "must be profiling interpreter"); |
duke@435 | 936 | int header_offset = in_bytes(DataLayout::header_offset()); |
duke@435 | 937 | int header_bits = DataLayout::flag_mask_to_header_mask(flag_byte_constant); |
duke@435 | 938 | // Set the flag |
duke@435 | 939 | orl(Address(mdp_in, header_offset), header_bits); |
duke@435 | 940 | } |
duke@435 | 941 | |
duke@435 | 942 | |
duke@435 | 943 | |
duke@435 | 944 | void InterpreterMacroAssembler::test_mdp_data_at(Register mdp_in, |
duke@435 | 945 | int offset, |
duke@435 | 946 | Register value, |
duke@435 | 947 | Register test_value_out, |
duke@435 | 948 | Label& not_equal_continue) { |
duke@435 | 949 | assert(ProfileInterpreter, "must be profiling interpreter"); |
duke@435 | 950 | if (test_value_out == noreg) { |
never@739 | 951 | cmpptr(value, Address(mdp_in, offset)); |
duke@435 | 952 | } else { |
duke@435 | 953 | // Put the test value into a register, so caller can use it: |
never@739 | 954 | movptr(test_value_out, Address(mdp_in, offset)); |
never@739 | 955 | cmpptr(test_value_out, value); |
duke@435 | 956 | } |
duke@435 | 957 | jcc(Assembler::notEqual, not_equal_continue); |
duke@435 | 958 | } |
duke@435 | 959 | |
duke@435 | 960 | |
duke@435 | 961 | void InterpreterMacroAssembler::update_mdp_by_offset(Register mdp_in, int offset_of_disp) { |
duke@435 | 962 | assert(ProfileInterpreter, "must be profiling interpreter"); |
duke@435 | 963 | Address disp_address(mdp_in, offset_of_disp); |
never@739 | 964 | addptr(mdp_in,disp_address); |
never@739 | 965 | movptr(Address(rbp, frame::interpreter_frame_mdx_offset * wordSize), mdp_in); |
duke@435 | 966 | } |
duke@435 | 967 | |
duke@435 | 968 | |
duke@435 | 969 | void InterpreterMacroAssembler::update_mdp_by_offset(Register mdp_in, Register reg, int offset_of_disp) { |
duke@435 | 970 | assert(ProfileInterpreter, "must be profiling interpreter"); |
duke@435 | 971 | Address disp_address(mdp_in, reg, Address::times_1, offset_of_disp); |
never@739 | 972 | addptr(mdp_in, disp_address); |
never@739 | 973 | movptr(Address(rbp, frame::interpreter_frame_mdx_offset * wordSize), mdp_in); |
duke@435 | 974 | } |
duke@435 | 975 | |
duke@435 | 976 | |
duke@435 | 977 | void InterpreterMacroAssembler::update_mdp_by_constant(Register mdp_in, int constant) { |
duke@435 | 978 | assert(ProfileInterpreter, "must be profiling interpreter"); |
never@739 | 979 | addptr(mdp_in, constant); |
never@739 | 980 | movptr(Address(rbp, frame::interpreter_frame_mdx_offset * wordSize), mdp_in); |
duke@435 | 981 | } |
duke@435 | 982 | |
duke@435 | 983 | |
duke@435 | 984 | void InterpreterMacroAssembler::update_mdp_for_ret(Register return_bci) { |
duke@435 | 985 | assert(ProfileInterpreter, "must be profiling interpreter"); |
never@739 | 986 | push(return_bci); // save/restore across call_VM |
duke@435 | 987 | call_VM(noreg, CAST_FROM_FN_PTR(address, InterpreterRuntime::update_mdp_for_ret), return_bci); |
never@739 | 988 | pop(return_bci); |
duke@435 | 989 | } |
duke@435 | 990 | |
duke@435 | 991 | |
duke@435 | 992 | void InterpreterMacroAssembler::profile_taken_branch(Register mdp, Register bumped_count) { |
duke@435 | 993 | if (ProfileInterpreter) { |
duke@435 | 994 | Label profile_continue; |
duke@435 | 995 | |
duke@435 | 996 | // If no method data exists, go to profile_continue. |
duke@435 | 997 | // Otherwise, assign to mdp |
duke@435 | 998 | test_method_data_pointer(mdp, profile_continue); |
duke@435 | 999 | |
duke@435 | 1000 | // We are taking a branch. Increment the taken count. |
duke@435 | 1001 | // We inline increment_mdp_data_at to return bumped_count in a register |
duke@435 | 1002 | //increment_mdp_data_at(mdp, in_bytes(JumpData::taken_offset())); |
duke@435 | 1003 | Address data(mdp, in_bytes(JumpData::taken_offset())); |
never@739 | 1004 | |
never@739 | 1005 | // %%% 64bit treats these cells as 64 bit but they seem to be 32 bit |
duke@435 | 1006 | movl(bumped_count,data); |
duke@435 | 1007 | assert( DataLayout::counter_increment==1, "flow-free idiom only works with 1" ); |
duke@435 | 1008 | addl(bumped_count, DataLayout::counter_increment); |
duke@435 | 1009 | sbbl(bumped_count, 0); |
duke@435 | 1010 | movl(data,bumped_count); // Store back out |
duke@435 | 1011 | |
duke@435 | 1012 | // The method data pointer needs to be updated to reflect the new target. |
duke@435 | 1013 | update_mdp_by_offset(mdp, in_bytes(JumpData::displacement_offset())); |
duke@435 | 1014 | bind (profile_continue); |
duke@435 | 1015 | } |
duke@435 | 1016 | } |
duke@435 | 1017 | |
duke@435 | 1018 | |
duke@435 | 1019 | void InterpreterMacroAssembler::profile_not_taken_branch(Register mdp) { |
duke@435 | 1020 | if (ProfileInterpreter) { |
duke@435 | 1021 | Label profile_continue; |
duke@435 | 1022 | |
duke@435 | 1023 | // If no method data exists, go to profile_continue. |
duke@435 | 1024 | test_method_data_pointer(mdp, profile_continue); |
duke@435 | 1025 | |
duke@435 | 1026 | // We are taking a branch. Increment the not taken count. |
duke@435 | 1027 | increment_mdp_data_at(mdp, in_bytes(BranchData::not_taken_offset())); |
duke@435 | 1028 | |
duke@435 | 1029 | // The method data pointer needs to be updated to correspond to the next bytecode |
duke@435 | 1030 | update_mdp_by_constant(mdp, in_bytes(BranchData::branch_data_size())); |
duke@435 | 1031 | bind (profile_continue); |
duke@435 | 1032 | } |
duke@435 | 1033 | } |
duke@435 | 1034 | |
duke@435 | 1035 | |
duke@435 | 1036 | void InterpreterMacroAssembler::profile_call(Register mdp) { |
duke@435 | 1037 | if (ProfileInterpreter) { |
duke@435 | 1038 | Label profile_continue; |
duke@435 | 1039 | |
duke@435 | 1040 | // If no method data exists, go to profile_continue. |
duke@435 | 1041 | test_method_data_pointer(mdp, profile_continue); |
duke@435 | 1042 | |
duke@435 | 1043 | // We are making a call. Increment the count. |
duke@435 | 1044 | increment_mdp_data_at(mdp, in_bytes(CounterData::count_offset())); |
duke@435 | 1045 | |
duke@435 | 1046 | // The method data pointer needs to be updated to reflect the new target. |
duke@435 | 1047 | update_mdp_by_constant(mdp, in_bytes(CounterData::counter_data_size())); |
duke@435 | 1048 | bind (profile_continue); |
duke@435 | 1049 | } |
duke@435 | 1050 | } |
duke@435 | 1051 | |
duke@435 | 1052 | |
duke@435 | 1053 | void InterpreterMacroAssembler::profile_final_call(Register mdp) { |
duke@435 | 1054 | if (ProfileInterpreter) { |
duke@435 | 1055 | Label profile_continue; |
duke@435 | 1056 | |
duke@435 | 1057 | // If no method data exists, go to profile_continue. |
duke@435 | 1058 | test_method_data_pointer(mdp, profile_continue); |
duke@435 | 1059 | |
duke@435 | 1060 | // We are making a call. Increment the count. |
duke@435 | 1061 | increment_mdp_data_at(mdp, in_bytes(CounterData::count_offset())); |
duke@435 | 1062 | |
duke@435 | 1063 | // The method data pointer needs to be updated to reflect the new target. |
duke@435 | 1064 | update_mdp_by_constant(mdp, in_bytes(VirtualCallData::virtual_call_data_size())); |
duke@435 | 1065 | bind (profile_continue); |
duke@435 | 1066 | } |
duke@435 | 1067 | } |
duke@435 | 1068 | |
duke@435 | 1069 | |
jrose@1161 | 1070 | void InterpreterMacroAssembler::profile_virtual_call(Register receiver, Register mdp, |
jrose@1161 | 1071 | Register reg2, |
jrose@1161 | 1072 | bool receiver_can_be_null) { |
duke@435 | 1073 | if (ProfileInterpreter) { |
duke@435 | 1074 | Label profile_continue; |
duke@435 | 1075 | |
duke@435 | 1076 | // If no method data exists, go to profile_continue. |
duke@435 | 1077 | test_method_data_pointer(mdp, profile_continue); |
duke@435 | 1078 | |
jrose@1161 | 1079 | Label skip_receiver_profile; |
jrose@1161 | 1080 | if (receiver_can_be_null) { |
kvn@1641 | 1081 | Label not_null; |
jrose@1161 | 1082 | testptr(receiver, receiver); |
kvn@1641 | 1083 | jccb(Assembler::notZero, not_null); |
kvn@1641 | 1084 | // We are making a call. Increment the count for null receiver. |
kvn@1641 | 1085 | increment_mdp_data_at(mdp, in_bytes(CounterData::count_offset())); |
kvn@1641 | 1086 | jmp(skip_receiver_profile); |
kvn@1641 | 1087 | bind(not_null); |
jrose@1161 | 1088 | } |
jrose@1161 | 1089 | |
duke@435 | 1090 | // Record the receiver type. |
kvn@1641 | 1091 | record_klass_in_profile(receiver, mdp, reg2, true); |
jrose@1161 | 1092 | bind(skip_receiver_profile); |
duke@435 | 1093 | |
duke@435 | 1094 | // The method data pointer needs to be updated to reflect the new target. |
duke@435 | 1095 | update_mdp_by_constant(mdp, |
duke@435 | 1096 | in_bytes(VirtualCallData:: |
duke@435 | 1097 | virtual_call_data_size())); |
duke@435 | 1098 | bind(profile_continue); |
duke@435 | 1099 | } |
duke@435 | 1100 | } |
duke@435 | 1101 | |
duke@435 | 1102 | |
duke@435 | 1103 | void InterpreterMacroAssembler::record_klass_in_profile_helper( |
duke@435 | 1104 | Register receiver, Register mdp, |
kvn@1641 | 1105 | Register reg2, int start_row, |
kvn@1641 | 1106 | Label& done, bool is_virtual_call) { |
kvn@1641 | 1107 | if (TypeProfileWidth == 0) { |
kvn@1641 | 1108 | if (is_virtual_call) { |
kvn@1641 | 1109 | increment_mdp_data_at(mdp, in_bytes(CounterData::count_offset())); |
kvn@1641 | 1110 | } |
poonam@1402 | 1111 | return; |
kvn@1641 | 1112 | } |
poonam@1402 | 1113 | |
duke@435 | 1114 | int last_row = VirtualCallData::row_limit() - 1; |
duke@435 | 1115 | assert(start_row <= last_row, "must be work left to do"); |
duke@435 | 1116 | // Test this row for both the receiver and for null. |
duke@435 | 1117 | // Take any of three different outcomes: |
duke@435 | 1118 | // 1. found receiver => increment count and goto done |
duke@435 | 1119 | // 2. found null => keep looking for case 1, maybe allocate this cell |
duke@435 | 1120 | // 3. found something else => keep looking for cases 1 and 2 |
duke@435 | 1121 | // Case 3 is handled by a recursive call. |
duke@435 | 1122 | for (int row = start_row; row <= last_row; row++) { |
duke@435 | 1123 | Label next_test; |
duke@435 | 1124 | bool test_for_null_also = (row == start_row); |
duke@435 | 1125 | |
duke@435 | 1126 | // See if the receiver is receiver[n]. |
duke@435 | 1127 | int recvr_offset = in_bytes(VirtualCallData::receiver_offset(row)); |
duke@435 | 1128 | test_mdp_data_at(mdp, recvr_offset, receiver, |
duke@435 | 1129 | (test_for_null_also ? reg2 : noreg), |
duke@435 | 1130 | next_test); |
duke@435 | 1131 | // (Reg2 now contains the receiver from the CallData.) |
duke@435 | 1132 | |
duke@435 | 1133 | // The receiver is receiver[n]. Increment count[n]. |
duke@435 | 1134 | int count_offset = in_bytes(VirtualCallData::receiver_count_offset(row)); |
duke@435 | 1135 | increment_mdp_data_at(mdp, count_offset); |
duke@435 | 1136 | jmp(done); |
duke@435 | 1137 | bind(next_test); |
duke@435 | 1138 | |
duke@435 | 1139 | if (row == start_row) { |
kvn@1641 | 1140 | Label found_null; |
duke@435 | 1141 | // Failed the equality check on receiver[n]... Test for null. |
never@739 | 1142 | testptr(reg2, reg2); |
duke@435 | 1143 | if (start_row == last_row) { |
duke@435 | 1144 | // The only thing left to do is handle the null case. |
kvn@1641 | 1145 | if (is_virtual_call) { |
kvn@1641 | 1146 | jccb(Assembler::zero, found_null); |
kvn@1641 | 1147 | // Receiver did not match any saved receiver and there is no empty row for it. |
kvn@1686 | 1148 | // Increment total counter to indicate polymorphic case. |
kvn@1641 | 1149 | increment_mdp_data_at(mdp, in_bytes(CounterData::count_offset())); |
kvn@1641 | 1150 | jmp(done); |
kvn@1641 | 1151 | bind(found_null); |
kvn@1641 | 1152 | } else { |
kvn@1641 | 1153 | jcc(Assembler::notZero, done); |
kvn@1641 | 1154 | } |
duke@435 | 1155 | break; |
duke@435 | 1156 | } |
duke@435 | 1157 | // Since null is rare, make it be the branch-taken case. |
duke@435 | 1158 | jcc(Assembler::zero, found_null); |
duke@435 | 1159 | |
duke@435 | 1160 | // Put all the "Case 3" tests here. |
kvn@1641 | 1161 | record_klass_in_profile_helper(receiver, mdp, reg2, start_row + 1, done, is_virtual_call); |
duke@435 | 1162 | |
duke@435 | 1163 | // Found a null. Keep searching for a matching receiver, |
duke@435 | 1164 | // but remember that this is an empty (unused) slot. |
duke@435 | 1165 | bind(found_null); |
duke@435 | 1166 | } |
duke@435 | 1167 | } |
duke@435 | 1168 | |
duke@435 | 1169 | // In the fall-through case, we found no matching receiver, but we |
duke@435 | 1170 | // observed the receiver[start_row] is NULL. |
duke@435 | 1171 | |
duke@435 | 1172 | // Fill in the receiver field and increment the count. |
duke@435 | 1173 | int recvr_offset = in_bytes(VirtualCallData::receiver_offset(start_row)); |
duke@435 | 1174 | set_mdp_data_at(mdp, recvr_offset, receiver); |
duke@435 | 1175 | int count_offset = in_bytes(VirtualCallData::receiver_count_offset(start_row)); |
never@3156 | 1176 | movptr(reg2, (intptr_t)DataLayout::counter_increment); |
duke@435 | 1177 | set_mdp_data_at(mdp, count_offset, reg2); |
kvn@1641 | 1178 | if (start_row > 0) { |
kvn@1641 | 1179 | jmp(done); |
kvn@1641 | 1180 | } |
duke@435 | 1181 | } |
duke@435 | 1182 | |
duke@435 | 1183 | void InterpreterMacroAssembler::record_klass_in_profile(Register receiver, |
kvn@1641 | 1184 | Register mdp, Register reg2, |
kvn@1641 | 1185 | bool is_virtual_call) { |
duke@435 | 1186 | assert(ProfileInterpreter, "must be profiling"); |
duke@435 | 1187 | Label done; |
duke@435 | 1188 | |
kvn@1641 | 1189 | record_klass_in_profile_helper(receiver, mdp, reg2, 0, done, is_virtual_call); |
duke@435 | 1190 | |
duke@435 | 1191 | bind (done); |
duke@435 | 1192 | } |
duke@435 | 1193 | |
duke@435 | 1194 | void InterpreterMacroAssembler::profile_ret(Register return_bci, Register mdp) { |
duke@435 | 1195 | if (ProfileInterpreter) { |
duke@435 | 1196 | Label profile_continue; |
duke@435 | 1197 | uint row; |
duke@435 | 1198 | |
duke@435 | 1199 | // If no method data exists, go to profile_continue. |
duke@435 | 1200 | test_method_data_pointer(mdp, profile_continue); |
duke@435 | 1201 | |
duke@435 | 1202 | // Update the total ret count. |
duke@435 | 1203 | increment_mdp_data_at(mdp, in_bytes(CounterData::count_offset())); |
duke@435 | 1204 | |
duke@435 | 1205 | for (row = 0; row < RetData::row_limit(); row++) { |
duke@435 | 1206 | Label next_test; |
duke@435 | 1207 | |
duke@435 | 1208 | // See if return_bci is equal to bci[n]: |
duke@435 | 1209 | test_mdp_data_at(mdp, in_bytes(RetData::bci_offset(row)), return_bci, |
duke@435 | 1210 | noreg, next_test); |
duke@435 | 1211 | |
duke@435 | 1212 | // return_bci is equal to bci[n]. Increment the count. |
duke@435 | 1213 | increment_mdp_data_at(mdp, in_bytes(RetData::bci_count_offset(row))); |
duke@435 | 1214 | |
duke@435 | 1215 | // The method data pointer needs to be updated to reflect the new target. |
duke@435 | 1216 | update_mdp_by_offset(mdp, in_bytes(RetData::bci_displacement_offset(row))); |
duke@435 | 1217 | jmp(profile_continue); |
duke@435 | 1218 | bind(next_test); |
duke@435 | 1219 | } |
duke@435 | 1220 | |
duke@435 | 1221 | update_mdp_for_ret(return_bci); |
duke@435 | 1222 | |
duke@435 | 1223 | bind (profile_continue); |
duke@435 | 1224 | } |
duke@435 | 1225 | } |
duke@435 | 1226 | |
duke@435 | 1227 | |
duke@435 | 1228 | void InterpreterMacroAssembler::profile_null_seen(Register mdp) { |
duke@435 | 1229 | if (ProfileInterpreter) { |
duke@435 | 1230 | Label profile_continue; |
duke@435 | 1231 | |
duke@435 | 1232 | // If no method data exists, go to profile_continue. |
duke@435 | 1233 | test_method_data_pointer(mdp, profile_continue); |
duke@435 | 1234 | |
never@1261 | 1235 | set_mdp_flag_at(mdp, BitData::null_seen_byte_constant()); |
never@1261 | 1236 | |
duke@435 | 1237 | // The method data pointer needs to be updated. |
duke@435 | 1238 | int mdp_delta = in_bytes(BitData::bit_data_size()); |
duke@435 | 1239 | if (TypeProfileCasts) { |
duke@435 | 1240 | mdp_delta = in_bytes(VirtualCallData::virtual_call_data_size()); |
duke@435 | 1241 | } |
duke@435 | 1242 | update_mdp_by_constant(mdp, mdp_delta); |
duke@435 | 1243 | |
duke@435 | 1244 | bind (profile_continue); |
duke@435 | 1245 | } |
duke@435 | 1246 | } |
duke@435 | 1247 | |
duke@435 | 1248 | |
duke@435 | 1249 | void InterpreterMacroAssembler::profile_typecheck_failed(Register mdp) { |
duke@435 | 1250 | if (ProfileInterpreter && TypeProfileCasts) { |
duke@435 | 1251 | Label profile_continue; |
duke@435 | 1252 | |
duke@435 | 1253 | // If no method data exists, go to profile_continue. |
duke@435 | 1254 | test_method_data_pointer(mdp, profile_continue); |
duke@435 | 1255 | |
duke@435 | 1256 | int count_offset = in_bytes(CounterData::count_offset()); |
duke@435 | 1257 | // Back up the address, since we have already bumped the mdp. |
duke@435 | 1258 | count_offset -= in_bytes(VirtualCallData::virtual_call_data_size()); |
duke@435 | 1259 | |
duke@435 | 1260 | // *Decrement* the counter. We expect to see zero or small negatives. |
duke@435 | 1261 | increment_mdp_data_at(mdp, count_offset, true); |
duke@435 | 1262 | |
duke@435 | 1263 | bind (profile_continue); |
duke@435 | 1264 | } |
duke@435 | 1265 | } |
duke@435 | 1266 | |
duke@435 | 1267 | |
duke@435 | 1268 | void InterpreterMacroAssembler::profile_typecheck(Register mdp, Register klass, Register reg2) |
duke@435 | 1269 | { |
duke@435 | 1270 | if (ProfileInterpreter) { |
duke@435 | 1271 | Label profile_continue; |
duke@435 | 1272 | |
duke@435 | 1273 | // If no method data exists, go to profile_continue. |
duke@435 | 1274 | test_method_data_pointer(mdp, profile_continue); |
duke@435 | 1275 | |
duke@435 | 1276 | // The method data pointer needs to be updated. |
duke@435 | 1277 | int mdp_delta = in_bytes(BitData::bit_data_size()); |
duke@435 | 1278 | if (TypeProfileCasts) { |
duke@435 | 1279 | mdp_delta = in_bytes(VirtualCallData::virtual_call_data_size()); |
duke@435 | 1280 | |
duke@435 | 1281 | // Record the object type. |
kvn@1641 | 1282 | record_klass_in_profile(klass, mdp, reg2, false); |
duke@435 | 1283 | assert(reg2 == rdi, "we know how to fix this blown reg"); |
duke@435 | 1284 | restore_locals(); // Restore EDI |
duke@435 | 1285 | } |
duke@435 | 1286 | update_mdp_by_constant(mdp, mdp_delta); |
duke@435 | 1287 | |
duke@435 | 1288 | bind(profile_continue); |
duke@435 | 1289 | } |
duke@435 | 1290 | } |
duke@435 | 1291 | |
duke@435 | 1292 | |
duke@435 | 1293 | void InterpreterMacroAssembler::profile_switch_default(Register mdp) { |
duke@435 | 1294 | if (ProfileInterpreter) { |
duke@435 | 1295 | Label profile_continue; |
duke@435 | 1296 | |
duke@435 | 1297 | // If no method data exists, go to profile_continue. |
duke@435 | 1298 | test_method_data_pointer(mdp, profile_continue); |
duke@435 | 1299 | |
duke@435 | 1300 | // Update the default case count |
duke@435 | 1301 | increment_mdp_data_at(mdp, in_bytes(MultiBranchData::default_count_offset())); |
duke@435 | 1302 | |
duke@435 | 1303 | // The method data pointer needs to be updated. |
duke@435 | 1304 | update_mdp_by_offset(mdp, in_bytes(MultiBranchData::default_displacement_offset())); |
duke@435 | 1305 | |
duke@435 | 1306 | bind (profile_continue); |
duke@435 | 1307 | } |
duke@435 | 1308 | } |
duke@435 | 1309 | |
duke@435 | 1310 | |
duke@435 | 1311 | void InterpreterMacroAssembler::profile_switch_case(Register index, Register mdp, Register reg2) { |
duke@435 | 1312 | if (ProfileInterpreter) { |
duke@435 | 1313 | Label profile_continue; |
duke@435 | 1314 | |
duke@435 | 1315 | // If no method data exists, go to profile_continue. |
duke@435 | 1316 | test_method_data_pointer(mdp, profile_continue); |
duke@435 | 1317 | |
duke@435 | 1318 | // Build the base (index * per_case_size_in_bytes()) + case_array_offset_in_bytes() |
never@3156 | 1319 | movptr(reg2, (intptr_t)in_bytes(MultiBranchData::per_case_size())); |
never@739 | 1320 | // index is positive and so should have correct value if this code were |
never@739 | 1321 | // used on 64bits |
never@739 | 1322 | imulptr(index, reg2); |
never@739 | 1323 | addptr(index, in_bytes(MultiBranchData::case_array_offset())); |
duke@435 | 1324 | |
duke@435 | 1325 | // Update the case count |
duke@435 | 1326 | increment_mdp_data_at(mdp, index, in_bytes(MultiBranchData::relative_count_offset())); |
duke@435 | 1327 | |
duke@435 | 1328 | // The method data pointer needs to be updated. |
duke@435 | 1329 | update_mdp_by_offset(mdp, index, in_bytes(MultiBranchData::relative_displacement_offset())); |
duke@435 | 1330 | |
duke@435 | 1331 | bind (profile_continue); |
duke@435 | 1332 | } |
duke@435 | 1333 | } |
duke@435 | 1334 | |
duke@435 | 1335 | #endif // !CC_INTERP |
duke@435 | 1336 | |
duke@435 | 1337 | |
duke@435 | 1338 | |
duke@435 | 1339 | void InterpreterMacroAssembler::verify_oop(Register reg, TosState state) { |
duke@435 | 1340 | if (state == atos) MacroAssembler::verify_oop(reg); |
duke@435 | 1341 | } |
duke@435 | 1342 | |
duke@435 | 1343 | |
duke@435 | 1344 | #ifndef CC_INTERP |
duke@435 | 1345 | void InterpreterMacroAssembler::verify_FPU(int stack_depth, TosState state) { |
duke@435 | 1346 | if (state == ftos || state == dtos) MacroAssembler::verify_FPU(stack_depth); |
duke@435 | 1347 | } |
duke@435 | 1348 | |
duke@435 | 1349 | #endif /* CC_INTERP */ |
duke@435 | 1350 | |
duke@435 | 1351 | |
duke@435 | 1352 | void InterpreterMacroAssembler::notify_method_entry() { |
duke@435 | 1353 | // Whenever JVMTI is interp_only_mode, method entry/exit events are sent to |
duke@435 | 1354 | // track stack depth. If it is possible to enter interp_only_mode we add |
duke@435 | 1355 | // the code to check if the event should be sent. |
duke@435 | 1356 | if (JvmtiExport::can_post_interpreter_events()) { |
duke@435 | 1357 | Label L; |
duke@435 | 1358 | get_thread(rcx); |
duke@435 | 1359 | movl(rcx, Address(rcx, JavaThread::interp_only_mode_offset())); |
duke@435 | 1360 | testl(rcx,rcx); |
duke@435 | 1361 | jcc(Assembler::zero, L); |
duke@435 | 1362 | call_VM(noreg, CAST_FROM_FN_PTR(address, InterpreterRuntime::post_method_entry)); |
duke@435 | 1363 | bind(L); |
duke@435 | 1364 | } |
duke@435 | 1365 | |
duke@435 | 1366 | { |
duke@435 | 1367 | SkipIfEqual skip_if(this, &DTraceMethodProbes, 0); |
duke@435 | 1368 | get_thread(rcx); |
duke@435 | 1369 | get_method(rbx); |
duke@435 | 1370 | call_VM_leaf( |
duke@435 | 1371 | CAST_FROM_FN_PTR(address, SharedRuntime::dtrace_method_entry), rcx, rbx); |
duke@435 | 1372 | } |
dcubed@1045 | 1373 | |
dcubed@1045 | 1374 | // RedefineClasses() tracing support for obsolete method entry |
dcubed@1045 | 1375 | if (RC_TRACE_IN_RANGE(0x00001000, 0x00002000)) { |
dcubed@1045 | 1376 | get_thread(rcx); |
dcubed@1045 | 1377 | get_method(rbx); |
dcubed@1045 | 1378 | call_VM_leaf( |
dcubed@1045 | 1379 | CAST_FROM_FN_PTR(address, SharedRuntime::rc_trace_method_entry), |
dcubed@1045 | 1380 | rcx, rbx); |
dcubed@1045 | 1381 | } |
duke@435 | 1382 | } |
duke@435 | 1383 | |
duke@435 | 1384 | |
duke@435 | 1385 | void InterpreterMacroAssembler::notify_method_exit( |
duke@435 | 1386 | TosState state, NotifyMethodExitMode mode) { |
duke@435 | 1387 | // Whenever JVMTI is interp_only_mode, method entry/exit events are sent to |
duke@435 | 1388 | // track stack depth. If it is possible to enter interp_only_mode we add |
duke@435 | 1389 | // the code to check if the event should be sent. |
duke@435 | 1390 | if (mode == NotifyJVMTI && JvmtiExport::can_post_interpreter_events()) { |
duke@435 | 1391 | Label L; |
duke@435 | 1392 | // Note: frame::interpreter_frame_result has a dependency on how the |
duke@435 | 1393 | // method result is saved across the call to post_method_exit. If this |
duke@435 | 1394 | // is changed then the interpreter_frame_result implementation will |
duke@435 | 1395 | // need to be updated too. |
duke@435 | 1396 | |
duke@435 | 1397 | // For c++ interpreter the result is always stored at a known location in the frame |
duke@435 | 1398 | // template interpreter will leave it on the top of the stack. |
duke@435 | 1399 | NOT_CC_INTERP(push(state);) |
duke@435 | 1400 | get_thread(rcx); |
duke@435 | 1401 | movl(rcx, Address(rcx, JavaThread::interp_only_mode_offset())); |
duke@435 | 1402 | testl(rcx,rcx); |
duke@435 | 1403 | jcc(Assembler::zero, L); |
duke@435 | 1404 | call_VM(noreg, CAST_FROM_FN_PTR(address, InterpreterRuntime::post_method_exit)); |
duke@435 | 1405 | bind(L); |
duke@435 | 1406 | NOT_CC_INTERP(pop(state);) |
duke@435 | 1407 | } |
duke@435 | 1408 | |
duke@435 | 1409 | { |
duke@435 | 1410 | SkipIfEqual skip_if(this, &DTraceMethodProbes, 0); |
never@739 | 1411 | NOT_CC_INTERP(push(state)); |
duke@435 | 1412 | get_thread(rbx); |
duke@435 | 1413 | get_method(rcx); |
duke@435 | 1414 | call_VM_leaf( |
duke@435 | 1415 | CAST_FROM_FN_PTR(address, SharedRuntime::dtrace_method_exit), |
duke@435 | 1416 | rbx, rcx); |
never@739 | 1417 | NOT_CC_INTERP(pop(state)); |
duke@435 | 1418 | } |
duke@435 | 1419 | } |
iveresov@2138 | 1420 | |
iveresov@2138 | 1421 | // Jump if ((*counter_addr += increment) & mask) satisfies the condition. |
iveresov@2138 | 1422 | void InterpreterMacroAssembler::increment_mask_and_jump(Address counter_addr, |
iveresov@2138 | 1423 | int increment, int mask, |
iveresov@2138 | 1424 | Register scratch, bool preloaded, |
iveresov@2138 | 1425 | Condition cond, Label* where) { |
iveresov@2138 | 1426 | if (!preloaded) { |
iveresov@2138 | 1427 | movl(scratch, counter_addr); |
iveresov@2138 | 1428 | } |
iveresov@2138 | 1429 | incrementl(scratch, increment); |
iveresov@2138 | 1430 | movl(counter_addr, scratch); |
iveresov@2138 | 1431 | andl(scratch, mask); |
iveresov@2138 | 1432 | jcc(cond, *where); |
iveresov@2138 | 1433 | } |