Tue, 02 Sep 2014 12:48:45 -0700
8055494: Add C2 x86 intrinsic for BigInteger::multiplyToLen() method
Summary: Add new C2 intrinsic for BigInteger::multiplyToLen() on x86 in 64-bit VM.
Reviewed-by: roland
duke@435 | 1 | /* |
mikael@6198 | 2 | * Copyright (c) 1999, 2013, Oracle and/or its affiliates. All rights reserved. |
duke@435 | 3 | * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. |
duke@435 | 4 | * |
duke@435 | 5 | * This code is free software; you can redistribute it and/or modify it |
duke@435 | 6 | * under the terms of the GNU General Public License version 2 only, as |
duke@435 | 7 | * published by the Free Software Foundation. |
duke@435 | 8 | * |
duke@435 | 9 | * This code is distributed in the hope that it will be useful, but WITHOUT |
duke@435 | 10 | * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or |
duke@435 | 11 | * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License |
duke@435 | 12 | * version 2 for more details (a copy is included in the LICENSE file that |
duke@435 | 13 | * accompanied this code). |
duke@435 | 14 | * |
duke@435 | 15 | * You should have received a copy of the GNU General Public License version |
duke@435 | 16 | * 2 along with this work; if not, write to the Free Software Foundation, |
duke@435 | 17 | * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA. |
duke@435 | 18 | * |
trims@1907 | 19 | * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA |
trims@1907 | 20 | * or visit www.oracle.com if you need additional information or have any |
trims@1907 | 21 | * questions. |
duke@435 | 22 | * |
duke@435 | 23 | */ |
duke@435 | 24 | |
stefank@2314 | 25 | #include "precompiled.hpp" |
stefank@2314 | 26 | #include "c1/c1_FrameMap.hpp" |
stefank@2314 | 27 | #include "c1/c1_LIR.hpp" |
stefank@2314 | 28 | #include "runtime/sharedRuntime.hpp" |
stefank@2314 | 29 | #include "vmreg_x86.inline.hpp" |
duke@435 | 30 | |
duke@435 | 31 | const int FrameMap::pd_c_runtime_reserved_arg_size = 0; |
duke@435 | 32 | |
duke@435 | 33 | LIR_Opr FrameMap::map_to_opr(BasicType type, VMRegPair* reg, bool) { |
duke@435 | 34 | LIR_Opr opr = LIR_OprFact::illegalOpr; |
duke@435 | 35 | VMReg r_1 = reg->first(); |
duke@435 | 36 | VMReg r_2 = reg->second(); |
duke@435 | 37 | if (r_1->is_stack()) { |
duke@435 | 38 | // Convert stack slot to an SP offset |
duke@435 | 39 | // The calling convention does not count the SharedRuntime::out_preserve_stack_slots() value |
duke@435 | 40 | // so we must add it in here. |
duke@435 | 41 | int st_off = (r_1->reg2stack() + SharedRuntime::out_preserve_stack_slots()) * VMRegImpl::stack_slot_size; |
duke@435 | 42 | opr = LIR_OprFact::address(new LIR_Address(rsp_opr, st_off, type)); |
duke@435 | 43 | } else if (r_1->is_Register()) { |
duke@435 | 44 | Register reg = r_1->as_Register(); |
never@739 | 45 | if (r_2->is_Register() && (type == T_LONG || type == T_DOUBLE)) { |
duke@435 | 46 | Register reg2 = r_2->as_Register(); |
never@739 | 47 | #ifdef _LP64 |
never@739 | 48 | assert(reg2 == reg, "must be same register"); |
never@739 | 49 | opr = as_long_opr(reg); |
never@739 | 50 | #else |
duke@435 | 51 | opr = as_long_opr(reg2, reg); |
never@739 | 52 | #endif // _LP64 |
never@739 | 53 | } else if (type == T_OBJECT || type == T_ARRAY) { |
duke@435 | 54 | opr = as_oop_opr(reg); |
iveresov@5994 | 55 | } else if (type == T_METADATA) { |
iveresov@5994 | 56 | opr = as_metadata_opr(reg); |
duke@435 | 57 | } else { |
duke@435 | 58 | opr = as_opr(reg); |
duke@435 | 59 | } |
duke@435 | 60 | } else if (r_1->is_FloatRegister()) { |
duke@435 | 61 | assert(type == T_DOUBLE || type == T_FLOAT, "wrong type"); |
duke@435 | 62 | int num = r_1->as_FloatRegister()->encoding(); |
duke@435 | 63 | if (type == T_FLOAT) { |
duke@435 | 64 | opr = LIR_OprFact::single_fpu(num); |
duke@435 | 65 | } else { |
duke@435 | 66 | opr = LIR_OprFact::double_fpu(num); |
duke@435 | 67 | } |
duke@435 | 68 | } else if (r_1->is_XMMRegister()) { |
duke@435 | 69 | assert(type == T_DOUBLE || type == T_FLOAT, "wrong type"); |
duke@435 | 70 | int num = r_1->as_XMMRegister()->encoding(); |
duke@435 | 71 | if (type == T_FLOAT) { |
duke@435 | 72 | opr = LIR_OprFact::single_xmm(num); |
duke@435 | 73 | } else { |
duke@435 | 74 | opr = LIR_OprFact::double_xmm(num); |
duke@435 | 75 | } |
duke@435 | 76 | } else { |
duke@435 | 77 | ShouldNotReachHere(); |
duke@435 | 78 | } |
duke@435 | 79 | return opr; |
duke@435 | 80 | } |
duke@435 | 81 | |
duke@435 | 82 | |
duke@435 | 83 | LIR_Opr FrameMap::rsi_opr; |
duke@435 | 84 | LIR_Opr FrameMap::rdi_opr; |
duke@435 | 85 | LIR_Opr FrameMap::rbx_opr; |
duke@435 | 86 | LIR_Opr FrameMap::rax_opr; |
duke@435 | 87 | LIR_Opr FrameMap::rdx_opr; |
duke@435 | 88 | LIR_Opr FrameMap::rcx_opr; |
duke@435 | 89 | LIR_Opr FrameMap::rsp_opr; |
duke@435 | 90 | LIR_Opr FrameMap::rbp_opr; |
duke@435 | 91 | |
duke@435 | 92 | LIR_Opr FrameMap::receiver_opr; |
duke@435 | 93 | |
duke@435 | 94 | LIR_Opr FrameMap::rsi_oop_opr; |
duke@435 | 95 | LIR_Opr FrameMap::rdi_oop_opr; |
duke@435 | 96 | LIR_Opr FrameMap::rbx_oop_opr; |
duke@435 | 97 | LIR_Opr FrameMap::rax_oop_opr; |
duke@435 | 98 | LIR_Opr FrameMap::rdx_oop_opr; |
duke@435 | 99 | LIR_Opr FrameMap::rcx_oop_opr; |
duke@435 | 100 | |
roland@4051 | 101 | LIR_Opr FrameMap::rsi_metadata_opr; |
roland@4051 | 102 | LIR_Opr FrameMap::rdi_metadata_opr; |
roland@4051 | 103 | LIR_Opr FrameMap::rbx_metadata_opr; |
roland@4051 | 104 | LIR_Opr FrameMap::rax_metadata_opr; |
roland@4051 | 105 | LIR_Opr FrameMap::rdx_metadata_opr; |
roland@4051 | 106 | LIR_Opr FrameMap::rcx_metadata_opr; |
roland@4051 | 107 | |
never@739 | 108 | LIR_Opr FrameMap::long0_opr; |
never@739 | 109 | LIR_Opr FrameMap::long1_opr; |
duke@435 | 110 | LIR_Opr FrameMap::fpu0_float_opr; |
duke@435 | 111 | LIR_Opr FrameMap::fpu0_double_opr; |
duke@435 | 112 | LIR_Opr FrameMap::xmm0_float_opr; |
duke@435 | 113 | LIR_Opr FrameMap::xmm0_double_opr; |
duke@435 | 114 | |
never@739 | 115 | #ifdef _LP64 |
never@739 | 116 | |
never@739 | 117 | LIR_Opr FrameMap::r8_opr; |
never@739 | 118 | LIR_Opr FrameMap::r9_opr; |
never@739 | 119 | LIR_Opr FrameMap::r10_opr; |
never@739 | 120 | LIR_Opr FrameMap::r11_opr; |
never@739 | 121 | LIR_Opr FrameMap::r12_opr; |
never@739 | 122 | LIR_Opr FrameMap::r13_opr; |
never@739 | 123 | LIR_Opr FrameMap::r14_opr; |
never@739 | 124 | LIR_Opr FrameMap::r15_opr; |
never@739 | 125 | |
never@739 | 126 | // r10 and r15 can never contain oops since they aren't available to |
never@739 | 127 | // the allocator |
never@739 | 128 | LIR_Opr FrameMap::r8_oop_opr; |
never@739 | 129 | LIR_Opr FrameMap::r9_oop_opr; |
never@739 | 130 | LIR_Opr FrameMap::r11_oop_opr; |
never@739 | 131 | LIR_Opr FrameMap::r12_oop_opr; |
never@739 | 132 | LIR_Opr FrameMap::r13_oop_opr; |
never@739 | 133 | LIR_Opr FrameMap::r14_oop_opr; |
roland@4051 | 134 | |
roland@4051 | 135 | LIR_Opr FrameMap::r8_metadata_opr; |
roland@4051 | 136 | LIR_Opr FrameMap::r9_metadata_opr; |
roland@4051 | 137 | LIR_Opr FrameMap::r11_metadata_opr; |
roland@4051 | 138 | LIR_Opr FrameMap::r12_metadata_opr; |
roland@4051 | 139 | LIR_Opr FrameMap::r13_metadata_opr; |
roland@4051 | 140 | LIR_Opr FrameMap::r14_metadata_opr; |
never@739 | 141 | #endif // _LP64 |
never@739 | 142 | |
duke@435 | 143 | LIR_Opr FrameMap::_caller_save_cpu_regs[] = { 0, }; |
duke@435 | 144 | LIR_Opr FrameMap::_caller_save_fpu_regs[] = { 0, }; |
duke@435 | 145 | LIR_Opr FrameMap::_caller_save_xmm_regs[] = { 0, }; |
duke@435 | 146 | |
never@739 | 147 | XMMRegister FrameMap::_xmm_regs [] = { 0, }; |
duke@435 | 148 | |
duke@435 | 149 | XMMRegister FrameMap::nr2xmmreg(int rnr) { |
duke@435 | 150 | assert(_init_done, "tables not initialized"); |
duke@435 | 151 | return _xmm_regs[rnr]; |
duke@435 | 152 | } |
duke@435 | 153 | |
duke@435 | 154 | //-------------------------------------------------------- |
duke@435 | 155 | // FrameMap |
duke@435 | 156 | //-------------------------------------------------------- |
duke@435 | 157 | |
iveresov@1939 | 158 | void FrameMap::initialize() { |
iveresov@1939 | 159 | assert(!_init_done, "once"); |
duke@435 | 160 | |
never@739 | 161 | assert(nof_cpu_regs == LP64_ONLY(16) NOT_LP64(8), "wrong number of CPU registers"); |
never@739 | 162 | map_register(0, rsi); rsi_opr = LIR_OprFact::single_cpu(0); |
never@739 | 163 | map_register(1, rdi); rdi_opr = LIR_OprFact::single_cpu(1); |
never@739 | 164 | map_register(2, rbx); rbx_opr = LIR_OprFact::single_cpu(2); |
never@739 | 165 | map_register(3, rax); rax_opr = LIR_OprFact::single_cpu(3); |
never@739 | 166 | map_register(4, rdx); rdx_opr = LIR_OprFact::single_cpu(4); |
never@739 | 167 | map_register(5, rcx); rcx_opr = LIR_OprFact::single_cpu(5); |
duke@435 | 168 | |
never@739 | 169 | #ifndef _LP64 |
never@739 | 170 | // The unallocatable registers are at the end |
never@739 | 171 | map_register(6, rsp); |
never@739 | 172 | map_register(7, rbp); |
never@739 | 173 | #else |
never@739 | 174 | map_register( 6, r8); r8_opr = LIR_OprFact::single_cpu(6); |
never@739 | 175 | map_register( 7, r9); r9_opr = LIR_OprFact::single_cpu(7); |
never@739 | 176 | map_register( 8, r11); r11_opr = LIR_OprFact::single_cpu(8); |
iveresov@2344 | 177 | map_register( 9, r13); r13_opr = LIR_OprFact::single_cpu(9); |
iveresov@2344 | 178 | map_register(10, r14); r14_opr = LIR_OprFact::single_cpu(10); |
iveresov@2344 | 179 | // r12 is allocated conditionally. With compressed oops it holds |
iveresov@2344 | 180 | // the heapbase value and is not visible to the allocator. |
iveresov@2344 | 181 | map_register(11, r12); r12_opr = LIR_OprFact::single_cpu(11); |
never@739 | 182 | // The unallocatable registers are at the end |
never@739 | 183 | map_register(12, r10); r10_opr = LIR_OprFact::single_cpu(12); |
never@739 | 184 | map_register(13, r15); r15_opr = LIR_OprFact::single_cpu(13); |
never@739 | 185 | map_register(14, rsp); |
never@739 | 186 | map_register(15, rbp); |
never@739 | 187 | #endif // _LP64 |
never@739 | 188 | |
never@739 | 189 | #ifdef _LP64 |
never@739 | 190 | long0_opr = LIR_OprFact::double_cpu(3 /*eax*/, 3 /*eax*/); |
never@739 | 191 | long1_opr = LIR_OprFact::double_cpu(2 /*ebx*/, 2 /*ebx*/); |
never@739 | 192 | #else |
never@739 | 193 | long0_opr = LIR_OprFact::double_cpu(3 /*eax*/, 4 /*edx*/); |
never@739 | 194 | long1_opr = LIR_OprFact::double_cpu(2 /*ebx*/, 5 /*ecx*/); |
never@739 | 195 | #endif // _LP64 |
duke@435 | 196 | fpu0_float_opr = LIR_OprFact::single_fpu(0); |
duke@435 | 197 | fpu0_double_opr = LIR_OprFact::double_fpu(0); |
duke@435 | 198 | xmm0_float_opr = LIR_OprFact::single_xmm(0); |
duke@435 | 199 | xmm0_double_opr = LIR_OprFact::double_xmm(0); |
duke@435 | 200 | |
duke@435 | 201 | _caller_save_cpu_regs[0] = rsi_opr; |
duke@435 | 202 | _caller_save_cpu_regs[1] = rdi_opr; |
duke@435 | 203 | _caller_save_cpu_regs[2] = rbx_opr; |
duke@435 | 204 | _caller_save_cpu_regs[3] = rax_opr; |
duke@435 | 205 | _caller_save_cpu_regs[4] = rdx_opr; |
duke@435 | 206 | _caller_save_cpu_regs[5] = rcx_opr; |
duke@435 | 207 | |
never@739 | 208 | #ifdef _LP64 |
never@739 | 209 | _caller_save_cpu_regs[6] = r8_opr; |
never@739 | 210 | _caller_save_cpu_regs[7] = r9_opr; |
never@739 | 211 | _caller_save_cpu_regs[8] = r11_opr; |
iveresov@2344 | 212 | _caller_save_cpu_regs[9] = r13_opr; |
iveresov@2344 | 213 | _caller_save_cpu_regs[10] = r14_opr; |
iveresov@2344 | 214 | _caller_save_cpu_regs[11] = r12_opr; |
never@739 | 215 | #endif // _LP64 |
never@739 | 216 | |
duke@435 | 217 | |
duke@435 | 218 | _xmm_regs[0] = xmm0; |
duke@435 | 219 | _xmm_regs[1] = xmm1; |
duke@435 | 220 | _xmm_regs[2] = xmm2; |
duke@435 | 221 | _xmm_regs[3] = xmm3; |
duke@435 | 222 | _xmm_regs[4] = xmm4; |
duke@435 | 223 | _xmm_regs[5] = xmm5; |
duke@435 | 224 | _xmm_regs[6] = xmm6; |
duke@435 | 225 | _xmm_regs[7] = xmm7; |
duke@435 | 226 | |
never@739 | 227 | #ifdef _LP64 |
never@739 | 228 | _xmm_regs[8] = xmm8; |
never@739 | 229 | _xmm_regs[9] = xmm9; |
never@739 | 230 | _xmm_regs[10] = xmm10; |
never@739 | 231 | _xmm_regs[11] = xmm11; |
never@739 | 232 | _xmm_regs[12] = xmm12; |
never@739 | 233 | _xmm_regs[13] = xmm13; |
never@739 | 234 | _xmm_regs[14] = xmm14; |
never@739 | 235 | _xmm_regs[15] = xmm15; |
never@739 | 236 | #endif // _LP64 |
never@739 | 237 | |
duke@435 | 238 | for (int i = 0; i < 8; i++) { |
duke@435 | 239 | _caller_save_fpu_regs[i] = LIR_OprFact::single_fpu(i); |
never@739 | 240 | } |
never@739 | 241 | |
never@739 | 242 | for (int i = 0; i < nof_caller_save_xmm_regs ; i++) { |
duke@435 | 243 | _caller_save_xmm_regs[i] = LIR_OprFact::single_xmm(i); |
duke@435 | 244 | } |
duke@435 | 245 | |
duke@435 | 246 | _init_done = true; |
duke@435 | 247 | |
never@739 | 248 | rsi_oop_opr = as_oop_opr(rsi); |
never@739 | 249 | rdi_oop_opr = as_oop_opr(rdi); |
never@739 | 250 | rbx_oop_opr = as_oop_opr(rbx); |
never@739 | 251 | rax_oop_opr = as_oop_opr(rax); |
never@739 | 252 | rdx_oop_opr = as_oop_opr(rdx); |
never@739 | 253 | rcx_oop_opr = as_oop_opr(rcx); |
never@739 | 254 | |
roland@4051 | 255 | rsi_metadata_opr = as_metadata_opr(rsi); |
roland@4051 | 256 | rdi_metadata_opr = as_metadata_opr(rdi); |
roland@4051 | 257 | rbx_metadata_opr = as_metadata_opr(rbx); |
roland@4051 | 258 | rax_metadata_opr = as_metadata_opr(rax); |
roland@4051 | 259 | rdx_metadata_opr = as_metadata_opr(rdx); |
roland@4051 | 260 | rcx_metadata_opr = as_metadata_opr(rcx); |
roland@4051 | 261 | |
never@739 | 262 | rsp_opr = as_pointer_opr(rsp); |
never@739 | 263 | rbp_opr = as_pointer_opr(rbp); |
never@739 | 264 | |
never@739 | 265 | #ifdef _LP64 |
never@739 | 266 | r8_oop_opr = as_oop_opr(r8); |
never@739 | 267 | r9_oop_opr = as_oop_opr(r9); |
never@739 | 268 | r11_oop_opr = as_oop_opr(r11); |
never@739 | 269 | r12_oop_opr = as_oop_opr(r12); |
never@739 | 270 | r13_oop_opr = as_oop_opr(r13); |
never@739 | 271 | r14_oop_opr = as_oop_opr(r14); |
roland@4051 | 272 | |
roland@4051 | 273 | r8_metadata_opr = as_metadata_opr(r8); |
roland@4051 | 274 | r9_metadata_opr = as_metadata_opr(r9); |
roland@4051 | 275 | r11_metadata_opr = as_metadata_opr(r11); |
roland@4051 | 276 | r12_metadata_opr = as_metadata_opr(r12); |
roland@4051 | 277 | r13_metadata_opr = as_metadata_opr(r13); |
roland@4051 | 278 | r14_metadata_opr = as_metadata_opr(r14); |
never@739 | 279 | #endif // _LP64 |
never@739 | 280 | |
duke@435 | 281 | VMRegPair regs; |
duke@435 | 282 | BasicType sig_bt = T_OBJECT; |
duke@435 | 283 | SharedRuntime::java_calling_convention(&sig_bt, ®s, 1, true); |
duke@435 | 284 | receiver_opr = as_oop_opr(regs.first()->as_Register()); |
never@739 | 285 | |
duke@435 | 286 | } |
duke@435 | 287 | |
duke@435 | 288 | |
duke@435 | 289 | Address FrameMap::make_new_address(ByteSize sp_offset) const { |
duke@435 | 290 | // for rbp, based address use this: |
duke@435 | 291 | // return Address(rbp, in_bytes(sp_offset) - (framesize() - 2) * 4); |
duke@435 | 292 | return Address(rsp, in_bytes(sp_offset)); |
duke@435 | 293 | } |
duke@435 | 294 | |
duke@435 | 295 | |
duke@435 | 296 | // ----------------mapping----------------------- |
duke@435 | 297 | // all mapping is based on rbp, addressing, except for simple leaf methods where we access |
duke@435 | 298 | // the locals rsp based (and no frame is built) |
duke@435 | 299 | |
duke@435 | 300 | |
duke@435 | 301 | // Frame for simple leaf methods (quick entries) |
duke@435 | 302 | // |
duke@435 | 303 | // +----------+ |
duke@435 | 304 | // | ret addr | <- TOS |
duke@435 | 305 | // +----------+ |
duke@435 | 306 | // | args | |
duke@435 | 307 | // | ...... | |
duke@435 | 308 | |
duke@435 | 309 | // Frame for standard methods |
duke@435 | 310 | // |
duke@435 | 311 | // | .........| <- TOS |
duke@435 | 312 | // | locals | |
duke@435 | 313 | // +----------+ |
duke@435 | 314 | // | old rbp, | <- EBP |
duke@435 | 315 | // +----------+ |
duke@435 | 316 | // | ret addr | |
duke@435 | 317 | // +----------+ |
duke@435 | 318 | // | args | |
duke@435 | 319 | // | .........| |
duke@435 | 320 | |
duke@435 | 321 | |
duke@435 | 322 | // For OopMaps, map a local variable or spill index to an VMRegImpl name. |
duke@435 | 323 | // This is the offset from sp() in the frame of the slot for the index, |
duke@435 | 324 | // skewed by VMRegImpl::stack0 to indicate a stack location (vs.a register.) |
duke@435 | 325 | // |
duke@435 | 326 | // framesize + |
duke@435 | 327 | // stack0 stack0 0 <- VMReg |
duke@435 | 328 | // | | <registers> | |
duke@435 | 329 | // ...........|..............|.............| |
duke@435 | 330 | // 0 1 2 3 x x 4 5 6 ... | <- local indices |
duke@435 | 331 | // ^ ^ sp() ( x x indicate link |
duke@435 | 332 | // | | and return addr) |
duke@435 | 333 | // arguments non-argument locals |
duke@435 | 334 | |
duke@435 | 335 | |
duke@435 | 336 | VMReg FrameMap::fpu_regname (int n) { |
duke@435 | 337 | // Return the OptoReg name for the fpu stack slot "n" |
duke@435 | 338 | // A spilled fpu stack slot comprises to two single-word OptoReg's. |
duke@435 | 339 | return as_FloatRegister(n)->as_VMReg(); |
duke@435 | 340 | } |
duke@435 | 341 | |
duke@435 | 342 | LIR_Opr FrameMap::stack_pointer() { |
duke@435 | 343 | return FrameMap::rsp_opr; |
duke@435 | 344 | } |
duke@435 | 345 | |
duke@435 | 346 | |
twisti@1919 | 347 | // JSR 292 |
twisti@1919 | 348 | LIR_Opr FrameMap::method_handle_invoke_SP_save_opr() { |
twisti@1919 | 349 | assert(rbp == rbp_mh_SP_save, "must be same register"); |
twisti@1919 | 350 | return rbp_opr; |
twisti@1919 | 351 | } |
twisti@1919 | 352 | |
twisti@1919 | 353 | |
duke@435 | 354 | bool FrameMap::validate_frame() { |
duke@435 | 355 | return true; |
duke@435 | 356 | } |