src/cpu/sparc/vm/vtableStubs_sparc.cpp

Tue, 24 Jul 2012 10:51:00 -0700

author
twisti
date
Tue, 24 Jul 2012 10:51:00 -0700
changeset 3969
1d7922586cf6
parent 3310
6729bbc1fcd6
child 4037
da91efe96a93
permissions
-rw-r--r--

7023639: JSR 292 method handle invocation needs a fast path for compiled code
6984705: JSR 292 method handle creation should not go through JNI
Summary: remove assembly code for JDK 7 chained method handles
Reviewed-by: jrose, twisti, kvn, mhaupt
Contributed-by: John Rose <john.r.rose@oracle.com>, Christian Thalinger <christian.thalinger@oracle.com>, Michael Haupt <michael.haupt@oracle.com>

duke@435 1 /*
twisti@3310 2 * Copyright (c) 1997, 2011, Oracle and/or its affiliates. All rights reserved.
duke@435 3 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
duke@435 4 *
duke@435 5 * This code is free software; you can redistribute it and/or modify it
duke@435 6 * under the terms of the GNU General Public License version 2 only, as
duke@435 7 * published by the Free Software Foundation.
duke@435 8 *
duke@435 9 * This code is distributed in the hope that it will be useful, but WITHOUT
duke@435 10 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
duke@435 11 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
duke@435 12 * version 2 for more details (a copy is included in the LICENSE file that
duke@435 13 * accompanied this code).
duke@435 14 *
duke@435 15 * You should have received a copy of the GNU General Public License version
duke@435 16 * 2 along with this work; if not, write to the Free Software Foundation,
duke@435 17 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
duke@435 18 *
trims@1907 19 * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
trims@1907 20 * or visit www.oracle.com if you need additional information or have any
trims@1907 21 * questions.
duke@435 22 *
duke@435 23 */
duke@435 24
stefank@2314 25 #include "precompiled.hpp"
stefank@2314 26 #include "asm/assembler.hpp"
stefank@2314 27 #include "assembler_sparc.inline.hpp"
stefank@2314 28 #include "code/vtableStubs.hpp"
stefank@2314 29 #include "interp_masm_sparc.hpp"
stefank@2314 30 #include "memory/resourceArea.hpp"
stefank@2314 31 #include "oops/instanceKlass.hpp"
stefank@2314 32 #include "oops/klassVtable.hpp"
stefank@2314 33 #include "runtime/sharedRuntime.hpp"
stefank@2314 34 #include "vmreg_sparc.inline.hpp"
stefank@2314 35 #ifdef COMPILER2
stefank@2314 36 #include "opto/runtime.hpp"
stefank@2314 37 #endif
duke@435 38
duke@435 39 // machine-dependent part of VtableStubs: create vtableStub of correct size and
duke@435 40 // initialize its code
duke@435 41
// `__` is shorthand for `masm->`: every `__ foo(...)` in this file is a call on
// the local MacroAssembler* variable named `masm`.
duke@435 42 #define __ masm->
duke@435 43
duke@435 44
// Non-PRODUCT builds only: runtime routine that the DebugVtables check in
// create_vtable_stub calls (via call_VM) when the vtable-length test fails.
duke@435 45 #ifndef PRODUCT
duke@435 46 extern "C" void bad_compiled_vtable_index(JavaThread* thread, oopDesc* receiver, int index);
duke@435 47 #endif
duke@435 48
duke@435 49
duke@435 50 // Used by compiler only; may use only caller saved, non-argument registers
duke@435 51 // NOTE: %%%% if any change is made to this stub make sure that the function
duke@435 52 // pd_code_size_limit is changed to ensure the correct size for VtableStub
//
// Builds the vtable dispatch stub for `vtable_index`.
// The stub is allocated with pd_code_size_limit(true) bytes of code space.
// The emitted code loads the receiver's klass from O0 into G3_scratch, looks up
// the method at `vtable_index` into G5_method, loads the address stored at
// methodOopDesc::from_compiled_offset() and jumps to it.
// Returns the new stub after recording its NPE/AME exception points.
duke@435 53 VtableStub* VtableStubs::create_vtable_stub(int vtable_index) {
duke@435 54 const int sparc_code_length = VtableStub::pd_code_size_limit(true);
duke@435 55 VtableStub* s = new(sparc_code_length) VtableStub(true, vtable_index);
duke@435 56 ResourceMark rm;
duke@435 57 CodeBuffer cb(s->entry_point(), sparc_code_length); // emit directly into the stub's own code area
duke@435 58 MacroAssembler* masm = new MacroAssembler(&cb);
duke@435 59
duke@435 60 #ifndef PRODUCT
duke@435 61 if (CountCompiledCalls) {
twisti@1162 62 __ inc_counter(SharedRuntime::nof_megamorphic_calls_addr(), G5, G3_scratch);
duke@435 63 }
duke@435 64 #endif /* PRODUCT */
duke@435 65
duke@435 66 assert(VtableStub::receiver_location() == O0->as_VMReg(), "receiver expected in O0");
duke@435 67
duke@435 68 // get receiver klass
duke@435 69 address npe_addr = __ pc(); // pc of the klass load below; recorded as the stub's NPE point at the end
coleenp@548 70 __ load_klass(O0, G3_scratch);
duke@435 71
duke@435 72 // set methodOop (in case of interpreted method), and destination address
duke@435 73 #ifndef PRODUCT
duke@435 74 if (DebugVtables) {
duke@435 75 Label L;
duke@435 76 // check offset vs vtable length
duke@435 77 __ ld(G3_scratch, instanceKlass::vtable_length_offset()*wordSize, G5);
// Branch over the error call when the vtable length (G5) is unsigned-greater
// than vtable_index*vtableEntry::size(); otherwise fall into call_VM below.
kvn@3037 78 __ cmp_and_br_short(G5, vtable_index*vtableEntry::size(), Assembler::greaterUnsigned, Assembler::pt, L);
duke@435 79 __ set(vtable_index, O2);
duke@435 80 __ call_VM(noreg, CAST_FROM_FN_PTR(address, bad_compiled_vtable_index), O0, O2);
duke@435 81 __ bind(L);
duke@435 82 }
duke@435 83 #endif
twisti@3969 84
// Inputs: receiver klass (G3_scratch) and vtable index; result goes to G5_method.
twisti@3969 85 __ lookup_virtual_method(G3_scratch, vtable_index, G5_method);
duke@435 86
duke@435 87 #ifndef PRODUCT
duke@435 88 if (DebugVtables) {
duke@435 89 Label L;
kvn@3037 90 __ br_notnull_short(G5_method, Assembler::pt, L);
duke@435 91 __ stop("Vtable entry is ZERO");
duke@435 92 __ bind(L);
duke@435 93 }
duke@435 94 #endif
duke@435 95
duke@435 96 address ame_addr = __ pc(); // if the vtable entry is null, the method is abstract
duke@435 97 // NOTE: for vtable dispatches, the vtable entry will never be null.
duke@435 98
duke@435 99 __ ld_ptr(G5_method, in_bytes(methodOopDesc::from_compiled_offset()), G3_scratch);
duke@435 100
duke@435 101 // jump to target (either compiled code or c2iadapter)
duke@435 102 __ JMP(G3_scratch, 0);
duke@435 103 // delay slot is a nop; G5_method already holds the methodOop (in case we call c2iadapter)
duke@435 104 __ delayed()->nop();
duke@435 105
duke@435 106 masm->flush();
jrose@1058 107
jrose@1058 108 if (PrintMiscellaneous && (WizardMode || Verbose)) {
// Prints the stub address, total code size and unused bytes; this is the
// "left over" figure referred to by the tuning notes in pd_code_size_limit.
jrose@1058 109 tty->print_cr("vtable #%d at "PTR_FORMAT"[%d] left over: %d",
jrose@1058 110 vtable_index, s->entry_point(),
jrose@1058 111 (int)(s->code_end() - s->entry_point()),
jrose@1058 112 (int)(s->code_end() - __ pc()));
jrose@1058 113 }
jrose@1058 114 guarantee(__ pc() <= s->code_end(), "overflowed buffer");
jrose@1144 115 // shut the door on sizing bugs
jrose@1144 116 int slop = 2*BytesPerInstWord; // 32-bit offset is this much larger than a 13-bit one
// Stubs for indices <= 10 must leave `slop` bytes unused, so the size estimate
// still has room for the longer sethi;add form.
jrose@1144 117 assert(vtable_index > 10 || __ pc() + slop <= s->code_end(), "room for sethi;add");
jrose@1058 118
duke@435 119 s->set_exception_points(npe_addr, ame_addr);
duke@435 120 return s;
duke@435 121 }
duke@435 122
duke@435 123
duke@435 124 // NOTE: %%%% if any change is made to this stub make sure that the function
duke@435 125 // pd_code_size_limit is changed to ensure the correct size for VtableStub
//
// Builds the interface (itable) dispatch stub for `itable_index`.
// The stub is allocated with pd_code_size_limit(false) bytes of code space.
// The emitted code:
//   1. loads the receiver's klass from O0 (the implicit null check),
//   2. pushes a register window (save) to get temporaries,
//   3. calls lookup_interface_method, passing throw_icce as its bail-out label,
//   4. pops the window (restore), moving the method into G5_method,
//   5. loads methodOopDesc::from_compiled_offset() and jumps to it.
// The throw_icce path jumps to
// StubRoutines::throw_IncompatibleClassChangeError_entry() and pops the window
// in the delay slot.
// Returns the new stub after recording its NPE/AME exception points.
jrose@1058 126 VtableStub* VtableStubs::create_itable_stub(int itable_index) {
duke@435 127 const int sparc_code_length = VtableStub::pd_code_size_limit(false);
jrose@1058 128 VtableStub* s = new(sparc_code_length) VtableStub(false, itable_index);
duke@435 129 ResourceMark rm;
duke@435 130 CodeBuffer cb(s->entry_point(), sparc_code_length); // emit directly into the stub's own code area
duke@435 131 MacroAssembler* masm = new MacroAssembler(&cb);
duke@435 132
duke@435 133 Register G3_klassOop = G3_scratch;
duke@435 134 Register G5_interface = G5; // Passed in as an argument
duke@435 135 Label search;
duke@435 136
duke@435 137 // Entry arguments:
duke@435 138 // G5_interface: Interface
duke@435 139 // O0: Receiver
duke@435 140 assert(VtableStub::receiver_location() == O0->as_VMReg(), "receiver expected in O0");
duke@435 141
duke@435 142 // get receiver klass (also an implicit null-check)
duke@435 143 address npe_addr = __ pc(); // pc of the klass load below; recorded as the stub's NPE point at the end
coleenp@548 144 __ load_klass(O0, G3_klassOop);
duke@435 145 __ verify_oop(G3_klassOop);
duke@435 146
duke@435 147 // Push a new window to get some temp registers. This chops the head of all
duke@435 148 // my 64-bit %o registers in the LION build, but this is OK because no longs
duke@435 149 // are passed in the %o registers. Instead, longs are passed in G1 and G4
duke@435 150 // and so those registers are not available here.
duke@435 151 __ save(SP,-frame::register_save_words*wordSize,SP);
duke@435 152
duke@435 153 #ifndef PRODUCT
duke@435 154 if (CountCompiledCalls) {
// The window is already pushed here, so L0/L1 serve as the counter temporaries.
twisti@1162 155 __ inc_counter(SharedRuntime::nof_megamorphic_calls_addr(), L0, L1);
duke@435 156 }
duke@435 157 #endif /* PRODUCT */
duke@435 158
jrose@1058 159 Label throw_icce;
duke@435 160
jrose@1058 161 Register L5_method = L5;
jrose@1058 162 __ lookup_interface_method(// inputs: rec. class, interface, itable index
jrose@1058 163 G3_klassOop, G5_interface, itable_index,
jrose@1058 164 // outputs: method, scan temp. reg
jrose@1058 165 L5_method, L2, L3,
jrose@1058 166 throw_icce);
duke@435 167
duke@435 168 #ifndef PRODUCT
duke@435 169 if (DebugVtables) {
duke@435 170 Label L01;
kvn@3037 171 __ br_notnull_short(L5_method, Assembler::pt, L01);
duke@435 172 __ stop("methodOop is null");
duke@435 173 __ bind(L01);
jrose@1058 174 __ verify_oop(L5_method);
duke@435 175 }
duke@435 176 #endif
duke@435 177
duke@435 178 // If the following load is through a NULL pointer, we'll take an OS
duke@435 179 // exception that should translate into an AbstractMethodError. We need the
duke@435 180 // window count to be correct at that time.
jrose@1058 181 __ restore(L5_method, 0, G5_method); // pops the window and copies L5_method into G5_method
jrose@1058 182 // Restore registers *before* the AME point.
duke@435 183
duke@435 184 address ame_addr = __ pc(); // if the vtable entry is null, the method is abstract
duke@435 185 __ ld_ptr(G5_method, in_bytes(methodOopDesc::from_compiled_offset()), G3_scratch);
duke@435 186
duke@435 187 // G5_method: methodOop
duke@435 188 // O0: Receiver
duke@435 189 // G3_scratch: entry point
duke@435 190 __ JMP(G3_scratch, 0);
duke@435 191 __ delayed()->nop();
duke@435 192
// Bail-out path handed to lookup_interface_method above: jump to the shared
// IncompatibleClassChangeError thrower.
dcubed@451 193 __ bind(throw_icce);
twisti@1162 194 AddressLiteral icce(StubRoutines::throw_IncompatibleClassChangeError_entry());
twisti@1162 195 __ jump_to(icce, G3_scratch);
dcubed@451 196 __ delayed()->restore(); // pop the window pushed by save above, in the jump's delay slot
dcubed@451 197
duke@435 198 masm->flush();
dcubed@451 199
jrose@1058 200 if (PrintMiscellaneous && (WizardMode || Verbose)) {
// Prints the stub address, total code size and unused bytes; this is the
// "left over" figure referred to by the tuning notes in pd_code_size_limit.
jrose@1058 201 tty->print_cr("itable #%d at "PTR_FORMAT"[%d] left over: %d",
jrose@1058 202 itable_index, s->entry_point(),
jrose@1058 203 (int)(s->code_end() - s->entry_point()),
jrose@1058 204 (int)(s->code_end() - __ pc()));
jrose@1058 205 }
dcubed@451 206 guarantee(__ pc() <= s->code_end(), "overflowed buffer");
jrose@1144 207 // shut the door on sizing bugs
jrose@1144 208 int slop = 2*BytesPerInstWord; // 32-bit offset is this much larger than a 13-bit one
// Stubs for indices <= 10 must leave `slop` bytes unused, so the size estimate
// still has room for the longer sethi;add form.
jrose@1144 209 assert(itable_index > 10 || __ pc() + slop <= s->code_end(), "room for sethi;add");
dcubed@451 210
duke@435 211 s->set_exception_points(npe_addr, ame_addr);
duke@435 212 return s;
duke@435 213 }
duke@435 214
duke@435 215
// Returns the number of bytes of code space to reserve for a stub.
//   is_vtable_stub: true for vtable stubs, false for itable stubs.
// When any of TraceJumps, DebugVtables, CountCompiledCalls or VerifyOops is
// set, a flat 1000 bytes is returned (presumably because those flags make the
// generators above emit extra, variable-size code -- see the CountCompiledCalls
// and DebugVtables sections and the verify_oop calls).
// Otherwise the result is an instruction count times BytesPerInstWord, plus one
// or two instructions for load_klass under UseCompressedOops, plus `slop`.
duke@435 216 int VtableStub::pd_code_size_limit(bool is_vtable_stub) {
dcubed@451 217 if (TraceJumps || DebugVtables || CountCompiledCalls || VerifyOops) return 1000;
duke@435 218 else {
duke@435 219 const int slop = 2*BytesPerInstWord; // sethi;add (needed for long offsets)
duke@435 220 if (is_vtable_stub) {
coleenp@548 221 // ld;ld;ld,jmp,nop
coleenp@548 222 const int basic = 5*BytesPerInstWord +
kvn@1077 223 // shift;add for load_klass (only shift with zero heap based)
kvn@1077 224 (UseCompressedOops ?
kvn@1077 225 ((Universe::narrow_oop_base() == NULL) ? BytesPerInstWord : 2*BytesPerInstWord) : 0);
duke@435 226 return basic + slop;
duke@435 227 } else {
// 28 instructions for the itable stub, with LP64_ONLY adding 6 more
// (presumably only in 64-bit builds; compare the listing below).
jrose@1058 228 const int basic = (28 LP64_ONLY(+ 6)) * BytesPerInstWord +
kvn@1077 229 // shift;add for load_klass (only shift with zero heap based)
kvn@1077 230 (UseCompressedOops ?
kvn@1077 231 ((Universe::narrow_oop_base() == NULL) ? BytesPerInstWord : 2*BytesPerInstWord) : 0);
duke@435 232 return (basic + slop);
duke@435 233 }
duke@435 234 }
jrose@1144 235
jrose@1144 236 // In order to tune these parameters, run the JVM with VM options
jrose@1144 237 // +PrintMiscellaneous and +WizardMode to see information about
jrose@1144 238 // actual itable stubs. Look for lines like this:
jrose@1144 239 // itable #1 at 0x5551212[116] left over: 8
jrose@1144 240 // Reduce the constants so that the "left over" number is 8.
jrose@1144 241 // Do not aim at a left-over number of zero, because a very
jrose@1144 242 // large vtable or itable offset (> 4K) will require an extra
jrose@1144 243 // sethi/or pair of instructions.
jrose@1144 244 //
jrose@1144 245 // The JVM98 app. _202_jess has a megamorphic interface call.
jrose@1144 246 // The itable code looks like this:
jrose@1144 247 // Decoding VtableStub itbl[1]@16
jrose@1144 248 // ld [ %o0 + 4 ], %g3
jrose@1144 249 // save %sp, -64, %sp
jrose@1144 250 // ld [ %g3 + 0xe8 ], %l2
jrose@1144 251 // sll %l2, 2, %l2
jrose@1144 252 // add %l2, 0x134, %l2
jrose@1144 253 // and %l2, -8, %l2 ! NOT_LP64 only
jrose@1144 254 // add %g3, %l2, %l2
jrose@1144 255 // add %g3, 4, %g3
jrose@1144 256 // ld [ %l2 ], %l5
jrose@1144 257 // brz,pn %l5, throw_icce
jrose@1144 258 // cmp %l5, %g5
jrose@1144 259 // be %icc, success
jrose@1144 260 // add %l2, 8, %l2
jrose@1144 261 // loop:
jrose@1144 262 // ld [ %l2 ], %l5
jrose@1144 263 // brz,pn %l5, throw_icce
jrose@1144 264 // cmp %l5, %g5
jrose@1144 265 // bne,pn %icc, loop
jrose@1144 266 // add %l2, 8, %l2
jrose@1144 267 // success:
jrose@1144 268 // ld [ %l2 + -4 ], %l2
jrose@1144 269 // ld [ %g3 + %l2 ], %l5
jrose@1144 270 // restore %l5, 0, %g5
jrose@1144 271 // ld [ %g5 + 0x44 ], %g3
jrose@1144 272 // jmp %g3
jrose@1144 273 // nop
jrose@1144 274 // throw_icce:
jrose@1144 275 // sethi %hi(throw_ICCE_entry), %g3
jrose@1144 276 // ! 5 more instructions here, LP64_ONLY
jrose@1144 277 // jmp %g3 + %lo(throw_ICCE_entry)
jrose@1144 278 // restore
duke@435 279 }
duke@435 280
duke@435 281
// Returns the alignment for stub code: a constant 32, the instruction-cache
// line size given in the note below.
duke@435 282 int VtableStub::pd_code_alignment() {
duke@435 283 // UltraSPARC cache line size is 8 instructions:
duke@435 284 const unsigned int icache_line_size = 32;
duke@435 285 return icache_line_size;
duke@435 286 }

mercurial