src/cpu/x86/vm/jniFastGetField_x86_64.cpp

Wed, 21 May 2008 16:31:35 -0700

author
kvn
date
Wed, 21 May 2008 16:31:35 -0700
changeset 600
437d03ea40b1
parent 435
a61af66fc99e
child 739
dc7f315e41f7
permissions
-rw-r--r--

6703888: Compressed Oops: use the 32-bits gap after klass in a object
Summary: Use the gap also for a narrow oop field and a boxing object value.
Reviewed-by: coleenp, never

duke@435 1 /*
duke@435 2 * Copyright 2004-2006 Sun Microsystems, Inc. All Rights Reserved.
duke@435 3 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
duke@435 4 *
duke@435 5 * This code is free software; you can redistribute it and/or modify it
duke@435 6 * under the terms of the GNU General Public License version 2 only, as
duke@435 7 * published by the Free Software Foundation.
duke@435 8 *
duke@435 9 * This code is distributed in the hope that it will be useful, but WITHOUT
duke@435 10 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
duke@435 11 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
duke@435 12 * version 2 for more details (a copy is included in the LICENSE file that
duke@435 13 * accompanied this code).
duke@435 14 *
duke@435 15 * You should have received a copy of the GNU General Public License version
duke@435 16 * 2 along with this work; if not, write to the Free Software Foundation,
duke@435 17 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
duke@435 18 *
duke@435 19 * Please contact Sun Microsystems, Inc., 4150 Network Circle, Santa Clara,
duke@435 20 * CA 95054 USA or visit www.sun.com if you need additional information or
duke@435 21 * have any questions.
duke@435 22 *
duke@435 23 */
duke@435 24
duke@435 25 # include "incls/_precompiled.incl"
duke@435 26 # include "incls/_jniFastGetField_x86_64.cpp.incl"
duke@435 27
// Shorthand so emitted instructions read like assembly: `__ movq(...)`.
#define __ masm->

// Size passed to BufferBlob::create() for each generated stub.
// Parenthesized so the macro expands safely inside larger expressions.
#define BUFFER_SIZE (30*wordSize)
duke@435 31
duke@435 32 // Instead of issuing lfence for LoadLoad barrier, we create data dependency
duke@435 33 // between loads, which is more efficient than lfence.
duke@435 34
duke@435 35 // Common register usage:
duke@435 36 // rax/xmm0: result
duke@435 37 // c_rarg0: jni env
duke@435 38 // c_rarg1: obj
duke@435 39 // c_rarg2: jfield id
duke@435 40
// Scratch registers used by the generated stubs below.
// robj: first the jobject handle copied from c_rarg1, then the object it
// refers to once the handle has been dereferenced.
static const Register robj = r9;
// rcounter: value of the safepoint counter read at stub entry.
static const Register rcounter = r10;
// roffset: field offset derived from the jfieldID in c_rarg2.
static const Register roffset = r11;
// rcounter_addr: address of the safepoint counter for the re-check. It shares
// r11 with roffset; the stubs only set it after the field load has consumed
// roffset.
static const Register rcounter_addr = r11;
duke@435 45
duke@435 46 // Warning: do not use rip relative addressing after the first counter load
duke@435 47 // since that may scratch r10!
duke@435 48
duke@435 49 address JNI_FastGetField::generate_fast_get_int_field0(BasicType type) {
duke@435 50 const char *name;
duke@435 51 switch (type) {
duke@435 52 case T_BOOLEAN: name = "jni_fast_GetBooleanField"; break;
duke@435 53 case T_BYTE: name = "jni_fast_GetByteField"; break;
duke@435 54 case T_CHAR: name = "jni_fast_GetCharField"; break;
duke@435 55 case T_SHORT: name = "jni_fast_GetShortField"; break;
duke@435 56 case T_INT: name = "jni_fast_GetIntField"; break;
duke@435 57 case T_LONG: name = "jni_fast_GetLongField"; break;
duke@435 58 default: ShouldNotReachHere();
duke@435 59 }
duke@435 60 ResourceMark rm;
duke@435 61 BufferBlob* b = BufferBlob::create(name, BUFFER_SIZE);
duke@435 62 address fast_entry = b->instructions_begin();
duke@435 63 CodeBuffer cbuf(fast_entry, b->instructions_size());
duke@435 64 MacroAssembler* masm = new MacroAssembler(&cbuf);
duke@435 65
duke@435 66 Label slow;
duke@435 67
duke@435 68 ExternalAddress counter(SafepointSynchronize::safepoint_counter_addr());
duke@435 69 __ mov32 (rcounter, counter);
duke@435 70 __ movq (robj, c_rarg1);
duke@435 71 __ testb (rcounter, 1);
duke@435 72 __ jcc (Assembler::notZero, slow);
duke@435 73 if (os::is_MP()) {
duke@435 74 __ xorq (robj, rcounter);
duke@435 75 __ xorq (robj, rcounter); // obj, since
duke@435 76 // robj ^ rcounter ^ rcounter == robj
duke@435 77 // robj is data dependent on rcounter.
duke@435 78 }
duke@435 79 __ movq (robj, Address(robj, 0)); // *obj
duke@435 80 __ movq (roffset, c_rarg2);
duke@435 81 __ shrq (roffset, 2); // offset
duke@435 82
duke@435 83 assert(count < LIST_CAPACITY, "LIST_CAPACITY too small");
duke@435 84 speculative_load_pclist[count] = __ pc();
duke@435 85 switch (type) {
duke@435 86 case T_BOOLEAN: __ movzbl (rax, Address(robj, roffset, Address::times_1)); break;
duke@435 87 case T_BYTE: __ movsbl (rax, Address(robj, roffset, Address::times_1)); break;
duke@435 88 case T_CHAR: __ movzwl (rax, Address(robj, roffset, Address::times_1)); break;
duke@435 89 case T_SHORT: __ movswl (rax, Address(robj, roffset, Address::times_1)); break;
duke@435 90 case T_INT: __ movl (rax, Address(robj, roffset, Address::times_1)); break;
duke@435 91 case T_LONG: __ movq (rax, Address(robj, roffset, Address::times_1)); break;
duke@435 92 default: ShouldNotReachHere();
duke@435 93 }
duke@435 94
duke@435 95 if (os::is_MP()) {
duke@435 96 __ lea(rcounter_addr, counter);
duke@435 97 // ca is data dependent on rax.
duke@435 98 __ xorq (rcounter_addr, rax);
duke@435 99 __ xorq (rcounter_addr, rax);
duke@435 100 __ cmpl (rcounter, Address(rcounter_addr, 0));
duke@435 101 } else {
duke@435 102 __ cmp32 (rcounter, counter);
duke@435 103 }
duke@435 104 __ jcc (Assembler::notEqual, slow);
duke@435 105
duke@435 106 __ ret (0);
duke@435 107
duke@435 108 slowcase_entry_pclist[count++] = __ pc();
duke@435 109 __ bind (slow);
duke@435 110 address slow_case_addr;
duke@435 111 switch (type) {
duke@435 112 case T_BOOLEAN: slow_case_addr = jni_GetBooleanField_addr(); break;
duke@435 113 case T_BYTE: slow_case_addr = jni_GetByteField_addr(); break;
duke@435 114 case T_CHAR: slow_case_addr = jni_GetCharField_addr(); break;
duke@435 115 case T_SHORT: slow_case_addr = jni_GetShortField_addr(); break;
duke@435 116 case T_INT: slow_case_addr = jni_GetIntField_addr(); break;
duke@435 117 case T_LONG: slow_case_addr = jni_GetLongField_addr();
duke@435 118 }
duke@435 119 // tail call
duke@435 120 __ jump (ExternalAddress(slow_case_addr));
duke@435 121
duke@435 122 __ flush ();
duke@435 123
duke@435 124 return fast_entry;
duke@435 125 }
duke@435 126
duke@435 127 address JNI_FastGetField::generate_fast_get_boolean_field() {
duke@435 128 return generate_fast_get_int_field0(T_BOOLEAN);
duke@435 129 }
duke@435 130
duke@435 131 address JNI_FastGetField::generate_fast_get_byte_field() {
duke@435 132 return generate_fast_get_int_field0(T_BYTE);
duke@435 133 }
duke@435 134
duke@435 135 address JNI_FastGetField::generate_fast_get_char_field() {
duke@435 136 return generate_fast_get_int_field0(T_CHAR);
duke@435 137 }
duke@435 138
duke@435 139 address JNI_FastGetField::generate_fast_get_short_field() {
duke@435 140 return generate_fast_get_int_field0(T_SHORT);
duke@435 141 }
duke@435 142
duke@435 143 address JNI_FastGetField::generate_fast_get_int_field() {
duke@435 144 return generate_fast_get_int_field0(T_INT);
duke@435 145 }
duke@435 146
duke@435 147 address JNI_FastGetField::generate_fast_get_long_field() {
duke@435 148 return generate_fast_get_int_field0(T_LONG);
duke@435 149 }
duke@435 150
duke@435 151 address JNI_FastGetField::generate_fast_get_float_field0(BasicType type) {
duke@435 152 const char *name;
duke@435 153 switch (type) {
duke@435 154 case T_FLOAT: name = "jni_fast_GetFloatField"; break;
duke@435 155 case T_DOUBLE: name = "jni_fast_GetDoubleField"; break;
duke@435 156 default: ShouldNotReachHere();
duke@435 157 }
duke@435 158 ResourceMark rm;
duke@435 159 BufferBlob* b = BufferBlob::create(name, BUFFER_SIZE);
duke@435 160 address fast_entry = b->instructions_begin();
duke@435 161 CodeBuffer cbuf(fast_entry, b->instructions_size());
duke@435 162 MacroAssembler* masm = new MacroAssembler(&cbuf);
duke@435 163
duke@435 164 Label slow;
duke@435 165
duke@435 166 ExternalAddress counter(SafepointSynchronize::safepoint_counter_addr());
duke@435 167 __ mov32 (rcounter, counter);
duke@435 168 __ movq (robj, c_rarg1);
duke@435 169 __ testb (rcounter, 1);
duke@435 170 __ jcc (Assembler::notZero, slow);
duke@435 171 if (os::is_MP()) {
duke@435 172 __ xorq (robj, rcounter);
duke@435 173 __ xorq (robj, rcounter); // obj, since
duke@435 174 // robj ^ rcounter ^ rcounter == robj
duke@435 175 // robj is data dependent on rcounter.
duke@435 176 }
duke@435 177 __ movq (robj, Address(robj, 0)); // *obj
duke@435 178 __ movq (roffset, c_rarg2);
duke@435 179 __ shrq (roffset, 2); // offset
duke@435 180
duke@435 181 assert(count < LIST_CAPACITY, "LIST_CAPACITY too small");
duke@435 182 speculative_load_pclist[count] = __ pc();
duke@435 183 switch (type) {
duke@435 184 case T_FLOAT: __ movflt (xmm0, Address(robj, roffset, Address::times_1)); break;
duke@435 185 case T_DOUBLE: __ movdbl (xmm0, Address(robj, roffset, Address::times_1)); break;
duke@435 186 default: ShouldNotReachHere();
duke@435 187 }
duke@435 188
duke@435 189 if (os::is_MP()) {
duke@435 190 __ lea(rcounter_addr, counter);
duke@435 191 __ movdq (rax, xmm0);
duke@435 192 // counter address is data dependent on xmm0.
duke@435 193 __ xorq (rcounter_addr, rax);
duke@435 194 __ xorq (rcounter_addr, rax);
duke@435 195 __ cmpl (rcounter, Address(rcounter_addr, 0));
duke@435 196 } else {
duke@435 197 __ cmp32 (rcounter, counter);
duke@435 198 }
duke@435 199 __ jcc (Assembler::notEqual, slow);
duke@435 200
duke@435 201 __ ret (0);
duke@435 202
duke@435 203 slowcase_entry_pclist[count++] = __ pc();
duke@435 204 __ bind (slow);
duke@435 205 address slow_case_addr;
duke@435 206 switch (type) {
duke@435 207 case T_FLOAT: slow_case_addr = jni_GetFloatField_addr(); break;
duke@435 208 case T_DOUBLE: slow_case_addr = jni_GetDoubleField_addr();
duke@435 209 }
duke@435 210 // tail call
duke@435 211 __ jump (ExternalAddress(slow_case_addr));
duke@435 212
duke@435 213 __ flush ();
duke@435 214
duke@435 215 return fast_entry;
duke@435 216 }
duke@435 217
duke@435 218 address JNI_FastGetField::generate_fast_get_float_field() {
duke@435 219 return generate_fast_get_float_field0(T_FLOAT);
duke@435 220 }
duke@435 221
duke@435 222 address JNI_FastGetField::generate_fast_get_double_field() {
duke@435 223 return generate_fast_get_float_field0(T_DOUBLE);
duke@435 224 }

mercurial