1.1 --- /dev/null Thu Jan 01 00:00:00 1970 +0000 1.2 +++ b/src/cpu/x86/vm/jniFastGetField_x86_32.cpp Sat Dec 01 00:00:00 2007 +0000 1.3 @@ -0,0 +1,356 @@ 1.4 +/* 1.5 + * Copyright 2004-2006 Sun Microsystems, Inc. All Rights Reserved. 1.6 + * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. 1.7 + * 1.8 + * This code is free software; you can redistribute it and/or modify it 1.9 + * under the terms of the GNU General Public License version 2 only, as 1.10 + * published by the Free Software Foundation. 1.11 + * 1.12 + * This code is distributed in the hope that it will be useful, but WITHOUT 1.13 + * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or 1.14 + * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License 1.15 + * version 2 for more details (a copy is included in the LICENSE file that 1.16 + * accompanied this code). 1.17 + * 1.18 + * You should have received a copy of the GNU General Public License version 1.19 + * 2 along with this work; if not, write to the Free Software Foundation, 1.20 + * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA. 1.21 + * 1.22 + * Please contact Sun Microsystems, Inc., 4150 Network Circle, Santa Clara, 1.23 + * CA 95054 USA or visit www.sun.com if you need additional information or 1.24 + * have any questions. 1.25 + * 1.26 + */ 1.27 + 1.28 +# include "incls/_precompiled.incl" 1.29 +# include "incls/_jniFastGetField_x86_32.cpp.incl" 1.30 + 1.31 +#define __ masm-> 1.32 + 1.33 +#define BUFFER_SIZE 30 1.34 + 1.35 +#ifdef _WINDOWS 1.36 +GetBooleanField_t JNI_FastGetField::jni_fast_GetBooleanField_fp; 1.37 +GetByteField_t JNI_FastGetField::jni_fast_GetByteField_fp; 1.38 +GetCharField_t JNI_FastGetField::jni_fast_GetCharField_fp; 1.39 +GetShortField_t JNI_FastGetField::jni_fast_GetShortField_fp; 1.40 +GetIntField_t JNI_FastGetField::jni_fast_GetIntField_fp; 1.41 +GetLongField_t JNI_FastGetField::jni_fast_GetLongField_fp; 1.42 +GetFloatField_t JNI_FastGetField::jni_fast_GetFloatField_fp; 1.43 +GetDoubleField_t JNI_FastGetField::jni_fast_GetDoubleField_fp; 1.44 +#endif 1.45 + 1.46 +// Instead of issuing lfence for LoadLoad barrier, we create data dependency 1.47 +// between loads, which is much more efficient than lfence. 1.48 + 1.49 +address JNI_FastGetField::generate_fast_get_int_field0(BasicType type) { 1.50 + const char *name; 1.51 + switch (type) { 1.52 + case T_BOOLEAN: name = "jni_fast_GetBooleanField"; break; 1.53 + case T_BYTE: name = "jni_fast_GetByteField"; break; 1.54 + case T_CHAR: name = "jni_fast_GetCharField"; break; 1.55 + case T_SHORT: name = "jni_fast_GetShortField"; break; 1.56 + case T_INT: name = "jni_fast_GetIntField"; break; 1.57 + default: ShouldNotReachHere(); 1.58 + } 1.59 + ResourceMark rm; 1.60 + BufferBlob* b = BufferBlob::create(name, BUFFER_SIZE*wordSize); 1.61 + address fast_entry = b->instructions_begin(); 1.62 + CodeBuffer cbuf(fast_entry, b->instructions_size()); 1.63 + MacroAssembler* masm = new MacroAssembler(&cbuf); 1.64 + 1.65 + Label slow; 1.66 + 1.67 + // stack layout: offset from rsp (in words): 1.68 + // return pc 0 1.69 + // jni env 1 1.70 + // obj 2 1.71 + // jfieldID 3 1.72 + 1.73 + ExternalAddress counter(SafepointSynchronize::safepoint_counter_addr()); 1.74 + __ mov32 (rcx, counter); 1.75 + __ testb (rcx, 1); 1.76 + __ jcc (Assembler::notZero, slow); 1.77 + if (os::is_MP()) { 1.78 + __ movl (rax, rcx); 1.79 + __ andl (rax, 1); // rax, must end up 0 1.80 + __ movl (rdx, Address(rsp, rax, Address::times_1, 2*wordSize)); 1.81 + // obj, notice rax, is 0. 1.82 + // rdx is data dependent on rcx. 1.83 + } else { 1.84 + __ movl (rdx, Address(rsp, 2*wordSize)); // obj 1.85 + } 1.86 + __ movl (rax, Address(rsp, 3*wordSize)); // jfieldID 1.87 + __ movl (rdx, Address(rdx, 0)); // *obj 1.88 + __ shrl (rax, 2); // offset 1.89 + 1.90 + assert(count < LIST_CAPACITY, "LIST_CAPACITY too small"); 1.91 + speculative_load_pclist[count] = __ pc(); 1.92 + switch (type) { 1.93 + case T_BOOLEAN: __ movzxb (rax, Address(rdx, rax, Address::times_1)); break; 1.94 + case T_BYTE: __ movsxb (rax, Address(rdx, rax, Address::times_1)); break; 1.95 + case T_CHAR: __ movzxw (rax, Address(rdx, rax, Address::times_1)); break; 1.96 + case T_SHORT: __ movsxw (rax, Address(rdx, rax, Address::times_1)); break; 1.97 + case T_INT: __ movl (rax, Address(rdx, rax, Address::times_1)); break; 1.98 + default: ShouldNotReachHere(); 1.99 + } 1.100 + 1.101 + Address ca1; 1.102 + if (os::is_MP()) { 1.103 + __ lea(rdx, counter); 1.104 + __ xorl(rdx, rax); 1.105 + __ xorl(rdx, rax); 1.106 + __ cmp32(rcx, Address(rdx, 0)); 1.107 + // ca1 is the same as ca because 1.108 + // rax, ^ counter_addr ^ rax, = address 1.109 + // ca1 is data dependent on rax,. 1.110 + } else { 1.111 + __ cmp32(rcx, counter); 1.112 + } 1.113 + __ jcc (Assembler::notEqual, slow); 1.114 + 1.115 +#ifndef _WINDOWS 1.116 + __ ret (0); 1.117 +#else 1.118 + // __stdcall calling convention 1.119 + __ ret (3*wordSize); 1.120 +#endif 1.121 + 1.122 + slowcase_entry_pclist[count++] = __ pc(); 1.123 + __ bind (slow); 1.124 + address slow_case_addr; 1.125 + switch (type) { 1.126 + case T_BOOLEAN: slow_case_addr = jni_GetBooleanField_addr(); break; 1.127 + case T_BYTE: slow_case_addr = jni_GetByteField_addr(); break; 1.128 + case T_CHAR: slow_case_addr = jni_GetCharField_addr(); break; 1.129 + case T_SHORT: slow_case_addr = jni_GetShortField_addr(); break; 1.130 + case T_INT: slow_case_addr = jni_GetIntField_addr(); 1.131 + } 1.132 + // tail call 1.133 + __ jump (ExternalAddress(slow_case_addr)); 1.134 + 1.135 + __ flush (); 1.136 + 1.137 +#ifndef _WINDOWS 1.138 + return fast_entry; 1.139 +#else 1.140 + switch (type) { 1.141 + case T_BOOLEAN: jni_fast_GetBooleanField_fp = (GetBooleanField_t)fast_entry; break; 1.142 + case T_BYTE: jni_fast_GetByteField_fp = (GetByteField_t)fast_entry; break; 1.143 + case T_CHAR: jni_fast_GetCharField_fp = (GetCharField_t)fast_entry; break; 1.144 + case T_SHORT: jni_fast_GetShortField_fp = (GetShortField_t)fast_entry; break; 1.145 + case T_INT: jni_fast_GetIntField_fp = (GetIntField_t)fast_entry; 1.146 + } 1.147 + return os::win32::fast_jni_accessor_wrapper(type); 1.148 +#endif 1.149 +} 1.150 + 1.151 +address JNI_FastGetField::generate_fast_get_boolean_field() { 1.152 + return generate_fast_get_int_field0(T_BOOLEAN); 1.153 +} 1.154 + 1.155 +address JNI_FastGetField::generate_fast_get_byte_field() { 1.156 + return generate_fast_get_int_field0(T_BYTE); 1.157 +} 1.158 + 1.159 +address JNI_FastGetField::generate_fast_get_char_field() { 1.160 + return generate_fast_get_int_field0(T_CHAR); 1.161 +} 1.162 + 1.163 +address JNI_FastGetField::generate_fast_get_short_field() { 1.164 + return generate_fast_get_int_field0(T_SHORT); 1.165 +} 1.166 + 1.167 +address JNI_FastGetField::generate_fast_get_int_field() { 1.168 + return generate_fast_get_int_field0(T_INT); 1.169 +} 1.170 + 1.171 +address JNI_FastGetField::generate_fast_get_long_field() { 1.172 + const char *name = "jni_fast_GetLongField"; 1.173 + ResourceMark rm; 1.174 + BufferBlob* b = BufferBlob::create(name, BUFFER_SIZE*wordSize); 1.175 + address fast_entry = b->instructions_begin(); 1.176 + CodeBuffer cbuf(fast_entry, b->instructions_size()); 1.177 + MacroAssembler* masm = new MacroAssembler(&cbuf); 1.178 + 1.179 + Label slow; 1.180 + 1.181 + // stack layout: offset from rsp (in words): 1.182 + // old rsi 0 1.183 + // return pc 1 1.184 + // jni env 2 1.185 + // obj 3 1.186 + // jfieldID 4 1.187 + 1.188 + ExternalAddress counter(SafepointSynchronize::safepoint_counter_addr()); 1.189 + 1.190 + __ pushl (rsi); 1.191 + __ mov32 (rcx, counter); 1.192 + __ testb (rcx, 1); 1.193 + __ jcc (Assembler::notZero, slow); 1.194 + if (os::is_MP()) { 1.195 + __ movl (rax, rcx); 1.196 + __ andl (rax, 1); // rax, must end up 0 1.197 + __ movl (rdx, Address(rsp, rax, Address::times_1, 3*wordSize)); 1.198 + // obj, notice rax, is 0. 1.199 + // rdx is data dependent on rcx. 1.200 + } else { 1.201 + __ movl (rdx, Address(rsp, 3*wordSize)); // obj 1.202 + } 1.203 + __ movl (rsi, Address(rsp, 4*wordSize)); // jfieldID 1.204 + __ movl (rdx, Address(rdx, 0)); // *obj 1.205 + __ shrl (rsi, 2); // offset 1.206 + 1.207 + assert(count < LIST_CAPACITY-1, "LIST_CAPACITY too small"); 1.208 + speculative_load_pclist[count++] = __ pc(); 1.209 + __ movl (rax, Address(rdx, rsi, Address::times_1)); 1.210 + speculative_load_pclist[count] = __ pc(); 1.211 + __ movl (rdx, Address(rdx, rsi, Address::times_1, 4)); 1.212 + 1.213 + if (os::is_MP()) { 1.214 + __ lea (rsi, counter); 1.215 + __ xorl (rsi, rdx); 1.216 + __ xorl (rsi, rax); 1.217 + __ xorl (rsi, rdx); 1.218 + __ xorl (rsi, rax); 1.219 + __ cmp32(rcx, Address(rsi, 0)); 1.220 + // ca1 is the same as ca because 1.221 + // rax, ^ rdx ^ counter_addr ^ rax, ^ rdx = address 1.222 + // ca1 is data dependent on both rax, and rdx. 1.223 + } else { 1.224 + __ cmp32(rcx, counter); 1.225 + } 1.226 + __ jcc (Assembler::notEqual, slow); 1.227 + 1.228 + __ popl (rsi); 1.229 + 1.230 +#ifndef _WINDOWS 1.231 + __ ret (0); 1.232 +#else 1.233 + // __stdcall calling convention 1.234 + __ ret (3*wordSize); 1.235 +#endif 1.236 + 1.237 + slowcase_entry_pclist[count-1] = __ pc(); 1.238 + slowcase_entry_pclist[count++] = __ pc(); 1.239 + __ bind (slow); 1.240 + __ popl (rsi); 1.241 + address slow_case_addr = jni_GetLongField_addr();; 1.242 + // tail call 1.243 + __ jump (ExternalAddress(slow_case_addr)); 1.244 + 1.245 + __ flush (); 1.246 + 1.247 +#ifndef _WINDOWS 1.248 + return fast_entry; 1.249 +#else 1.250 + jni_fast_GetLongField_fp = (GetLongField_t)fast_entry; 1.251 + return os::win32::fast_jni_accessor_wrapper(T_LONG); 1.252 +#endif 1.253 +} 1.254 + 1.255 +address JNI_FastGetField::generate_fast_get_float_field0(BasicType type) { 1.256 + const char *name; 1.257 + switch (type) { 1.258 + case T_FLOAT: name = "jni_fast_GetFloatField"; break; 1.259 + case T_DOUBLE: name = "jni_fast_GetDoubleField"; break; 1.260 + default: ShouldNotReachHere(); 1.261 + } 1.262 + ResourceMark rm; 1.263 + BufferBlob* b = BufferBlob::create(name, BUFFER_SIZE*wordSize); 1.264 + address fast_entry = b->instructions_begin(); 1.265 + CodeBuffer cbuf(fast_entry, b->instructions_size()); 1.266 + MacroAssembler* masm = new MacroAssembler(&cbuf); 1.267 + 1.268 + Label slow_with_pop, slow; 1.269 + 1.270 + // stack layout: offset from rsp (in words): 1.271 + // return pc 0 1.272 + // jni env 1 1.273 + // obj 2 1.274 + // jfieldID 3 1.275 + 1.276 + ExternalAddress counter(SafepointSynchronize::safepoint_counter_addr()); 1.277 + 1.278 + __ mov32 (rcx, counter); 1.279 + __ testb (rcx, 1); 1.280 + __ jcc (Assembler::notZero, slow); 1.281 + if (os::is_MP()) { 1.282 + __ movl (rax, rcx); 1.283 + __ andl (rax, 1); // rax, must end up 0 1.284 + __ movl (rdx, Address(rsp, rax, Address::times_1, 2*wordSize)); 1.285 + // obj, notice rax, is 0. 1.286 + // rdx is data dependent on rcx. 1.287 + } else { 1.288 + __ movl (rdx, Address(rsp, 2*wordSize)); // obj 1.289 + } 1.290 + __ movl (rax, Address(rsp, 3*wordSize)); // jfieldID 1.291 + __ movl (rdx, Address(rdx, 0)); // *obj 1.292 + __ shrl (rax, 2); // offset 1.293 + 1.294 + assert(count < LIST_CAPACITY, "LIST_CAPACITY too small"); 1.295 + speculative_load_pclist[count] = __ pc(); 1.296 + switch (type) { 1.297 + case T_FLOAT: __ fld_s (Address(rdx, rax, Address::times_1)); break; 1.298 + case T_DOUBLE: __ fld_d (Address(rdx, rax, Address::times_1)); break; 1.299 + default: ShouldNotReachHere(); 1.300 + } 1.301 + 1.302 + Address ca1; 1.303 + if (os::is_MP()) { 1.304 + __ fst_s (Address(rsp, -4)); 1.305 + __ lea(rdx, counter); 1.306 + __ movl (rax, Address(rsp, -4)); 1.307 + __ xorl(rdx, rax); 1.308 + __ xorl(rdx, rax); 1.309 + __ cmp32(rcx, Address(rdx, 0)); 1.310 + // rax, ^ counter_addr ^ rax, = address 1.311 + // ca1 is data dependent on the field 1.312 + // access. 1.313 + } else { 1.314 + __ cmp32(rcx, counter); 1.315 + } 1.316 + __ jcc (Assembler::notEqual, slow_with_pop); 1.317 + 1.318 +#ifndef _WINDOWS 1.319 + __ ret (0); 1.320 +#else 1.321 + // __stdcall calling convention 1.322 + __ ret (3*wordSize); 1.323 +#endif 1.324 + 1.325 + __ bind (slow_with_pop); 1.326 + // invalid load. pop FPU stack. 1.327 + __ fstp_d (0); 1.328 + 1.329 + slowcase_entry_pclist[count++] = __ pc(); 1.330 + __ bind (slow); 1.331 + address slow_case_addr; 1.332 + switch (type) { 1.333 + case T_FLOAT: slow_case_addr = jni_GetFloatField_addr(); break; 1.334 + case T_DOUBLE: slow_case_addr = jni_GetDoubleField_addr(); break; 1.335 + default: ShouldNotReachHere(); 1.336 + } 1.337 + // tail call 1.338 + __ jump (ExternalAddress(slow_case_addr)); 1.339 + 1.340 + __ flush (); 1.341 + 1.342 +#ifndef _WINDOWS 1.343 + return fast_entry; 1.344 +#else 1.345 + switch (type) { 1.346 + case T_FLOAT: jni_fast_GetFloatField_fp = (GetFloatField_t)fast_entry; break; 1.347 + case T_DOUBLE: jni_fast_GetDoubleField_fp = (GetDoubleField_t)fast_entry; 1.348 + } 1.349 + return os::win32::fast_jni_accessor_wrapper(type); 1.350 +#endif 1.351 +} 1.352 + 1.353 +address JNI_FastGetField::generate_fast_get_float_field() { 1.354 + return generate_fast_get_float_field0(T_FLOAT); 1.355 +} 1.356 + 1.357 +address JNI_FastGetField::generate_fast_get_double_field() { 1.358 + return generate_fast_get_float_field0(T_DOUBLE); 1.359 +}