src/cpu/x86/vm/x86.ad

changeset 3390
65149e74c706
child 3577
9b8ce46870df
     1.1 --- /dev/null	Thu Jan 01 00:00:00 1970 +0000
     1.2 +++ b/src/cpu/x86/vm/x86.ad	Tue Dec 20 00:55:02 2011 -0800
     1.3 @@ -0,0 +1,777 @@
     1.4 +//
     1.5 +// Copyright (c) 2011, Oracle and/or its affiliates. All rights reserved.
     1.6 +// DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
     1.7 +//
     1.8 +// This code is free software; you can redistribute it and/or modify it
     1.9 +// under the terms of the GNU General Public License version 2 only, as
    1.10 +// published by the Free Software Foundation.
    1.11 +//
    1.12 +// This code is distributed in the hope that it will be useful, but WITHOUT
    1.13 +// ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
    1.14 +// FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
    1.15 +// version 2 for more details (a copy is included in the LICENSE file that
    1.16 +// accompanied this code).
    1.17 +//
    1.18 +// You should have received a copy of the GNU General Public License version
    1.19 +// 2 along with this work; if not, write to the Free Software Foundation,
    1.20 +// Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
    1.21 +//
    1.22 +// Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
    1.23 +// or visit www.oracle.com if you need additional information or have any
    1.24 +// questions.
    1.25 +//
    1.26 +//
    1.27 +
    1.28 +// X86 Common Architecture Description File
    1.29 +
    1.30 +source %{
    1.31 +  // Float masks come from different places depending on platform.
    1.32 +#ifdef _LP64
    1.33 +  static address float_signmask()  { return StubRoutines::x86::float_sign_mask(); }
    1.34 +  static address float_signflip()  { return StubRoutines::x86::float_sign_flip(); }
    1.35 +  static address double_signmask() { return StubRoutines::x86::double_sign_mask(); }
    1.36 +  static address double_signflip() { return StubRoutines::x86::double_sign_flip(); }
    1.37 +#else
    1.38 +  static address float_signmask()  { return (address)float_signmask_pool; }
    1.39 +  static address float_signflip()  { return (address)float_signflip_pool; }
    1.40 +  static address double_signmask() { return (address)double_signmask_pool; }
    1.41 +  static address double_signflip() { return (address)double_signflip_pool; }
    1.42 +#endif
    1.43 +%}
    1.44 +
    1.45 +// INSTRUCTIONS -- Platform independent definitions (same for 32- and 64-bit)
    1.46 +
    1.47 +instruct addF_reg(regF dst, regF src) %{
    1.48 +  predicate((UseSSE>=1) && (UseAVX == 0));
    1.49 +  match(Set dst (AddF dst src));
    1.50 +
    1.51 +  format %{ "addss   $dst, $src" %}
    1.52 +  ins_cost(150);
    1.53 +  ins_encode %{
    1.54 +    __ addss($dst$$XMMRegister, $src$$XMMRegister);
    1.55 +  %}
    1.56 +  ins_pipe(pipe_slow);
    1.57 +%}
    1.58 +
    1.59 +instruct addF_mem(regF dst, memory src) %{
    1.60 +  predicate((UseSSE>=1) && (UseAVX == 0));
    1.61 +  match(Set dst (AddF dst (LoadF src)));
    1.62 +
    1.63 +  format %{ "addss   $dst, $src" %}
    1.64 +  ins_cost(150);
    1.65 +  ins_encode %{
    1.66 +    __ addss($dst$$XMMRegister, $src$$Address);
    1.67 +  %}
    1.68 +  ins_pipe(pipe_slow);
    1.69 +%}
    1.70 +
    1.71 +instruct addF_imm(regF dst, immF con) %{
    1.72 +  predicate((UseSSE>=1) && (UseAVX == 0));
    1.73 +  match(Set dst (AddF dst con));
    1.74 +  format %{ "addss   $dst, [$constantaddress]\t# load from constant table: float=$con" %}
    1.75 +  ins_cost(150);
    1.76 +  ins_encode %{
    1.77 +    __ addss($dst$$XMMRegister, $constantaddress($con));
    1.78 +  %}
    1.79 +  ins_pipe(pipe_slow);
    1.80 +%}
    1.81 +
    1.82 +instruct vaddF_reg(regF dst, regF src1, regF src2) %{
    1.83 +  predicate(UseAVX > 0);
    1.84 +  match(Set dst (AddF src1 src2));
    1.85 +
    1.86 +  format %{ "vaddss  $dst, $src1, $src2" %}
    1.87 +  ins_cost(150);
    1.88 +  ins_encode %{
    1.89 +    __ vaddss($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister);
    1.90 +  %}
    1.91 +  ins_pipe(pipe_slow);
    1.92 +%}
    1.93 +
    1.94 +instruct vaddF_mem(regF dst, regF src1, memory src2) %{
    1.95 +  predicate(UseAVX > 0);
    1.96 +  match(Set dst (AddF src1 (LoadF src2)));
    1.97 +
    1.98 +  format %{ "vaddss  $dst, $src1, $src2" %}
    1.99 +  ins_cost(150);
   1.100 +  ins_encode %{
   1.101 +    __ vaddss($dst$$XMMRegister, $src1$$XMMRegister, $src2$$Address);
   1.102 +  %}
   1.103 +  ins_pipe(pipe_slow);
   1.104 +%}
   1.105 +
   1.106 +instruct vaddF_imm(regF dst, regF src, immF con) %{
   1.107 +  predicate(UseAVX > 0);
   1.108 +  match(Set dst (AddF src con));
   1.109 +
   1.110 +  format %{ "vaddss  $dst, $src, [$constantaddress]\t# load from constant table: float=$con" %}
   1.111 +  ins_cost(150);
   1.112 +  ins_encode %{
   1.113 +    __ vaddss($dst$$XMMRegister, $src$$XMMRegister, $constantaddress($con));
   1.114 +  %}
   1.115 +  ins_pipe(pipe_slow);
   1.116 +%}
   1.117 +
   1.118 +instruct addD_reg(regD dst, regD src) %{
   1.119 +  predicate((UseSSE>=2) && (UseAVX == 0));
   1.120 +  match(Set dst (AddD dst src));
   1.121 +
   1.122 +  format %{ "addsd   $dst, $src" %}
   1.123 +  ins_cost(150);
   1.124 +  ins_encode %{
   1.125 +    __ addsd($dst$$XMMRegister, $src$$XMMRegister);
   1.126 +  %}
   1.127 +  ins_pipe(pipe_slow);
   1.128 +%}
   1.129 +
   1.130 +instruct addD_mem(regD dst, memory src) %{
   1.131 +  predicate((UseSSE>=2) && (UseAVX == 0));
   1.132 +  match(Set dst (AddD dst (LoadD src)));
   1.133 +
   1.134 +  format %{ "addsd   $dst, $src" %}
   1.135 +  ins_cost(150);
   1.136 +  ins_encode %{
   1.137 +    __ addsd($dst$$XMMRegister, $src$$Address);
   1.138 +  %}
   1.139 +  ins_pipe(pipe_slow);
   1.140 +%}
   1.141 +
   1.142 +instruct addD_imm(regD dst, immD con) %{
   1.143 +  predicate((UseSSE>=2) && (UseAVX == 0));
   1.144 +  match(Set dst (AddD dst con));
   1.145 +  format %{ "addsd   $dst, [$constantaddress]\t# load from constant table: double=$con" %}
   1.146 +  ins_cost(150);
   1.147 +  ins_encode %{
   1.148 +    __ addsd($dst$$XMMRegister, $constantaddress($con));
   1.149 +  %}
   1.150 +  ins_pipe(pipe_slow);
   1.151 +%}
   1.152 +
   1.153 +instruct vaddD_reg(regD dst, regD src1, regD src2) %{
   1.154 +  predicate(UseAVX > 0);
   1.155 +  match(Set dst (AddD src1 src2));
   1.156 +
   1.157 +  format %{ "vaddsd  $dst, $src1, $src2" %}
   1.158 +  ins_cost(150);
   1.159 +  ins_encode %{
   1.160 +    __ vaddsd($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister);
   1.161 +  %}
   1.162 +  ins_pipe(pipe_slow);
   1.163 +%}
   1.164 +
   1.165 +instruct vaddD_mem(regD dst, regD src1, memory src2) %{
   1.166 +  predicate(UseAVX > 0);
   1.167 +  match(Set dst (AddD src1 (LoadD src2)));
   1.168 +
   1.169 +  format %{ "vaddsd  $dst, $src1, $src2" %}
   1.170 +  ins_cost(150);
   1.171 +  ins_encode %{
   1.172 +    __ vaddsd($dst$$XMMRegister, $src1$$XMMRegister, $src2$$Address);
   1.173 +  %}
   1.174 +  ins_pipe(pipe_slow);
   1.175 +%}
   1.176 +
   1.177 +instruct vaddD_imm(regD dst, regD src, immD con) %{
   1.178 +  predicate(UseAVX > 0);
   1.179 +  match(Set dst (AddD src con));
   1.180 +
   1.181 +  format %{ "vaddsd  $dst, $src, [$constantaddress]\t# load from constant table: double=$con" %}
   1.182 +  ins_cost(150);
   1.183 +  ins_encode %{
   1.184 +    __ vaddsd($dst$$XMMRegister, $src$$XMMRegister, $constantaddress($con));
   1.185 +  %}
   1.186 +  ins_pipe(pipe_slow);
   1.187 +%}
   1.188 +
   1.189 +instruct subF_reg(regF dst, regF src) %{
   1.190 +  predicate((UseSSE>=1) && (UseAVX == 0));
   1.191 +  match(Set dst (SubF dst src));
   1.192 +
   1.193 +  format %{ "subss   $dst, $src" %}
   1.194 +  ins_cost(150);
   1.195 +  ins_encode %{
   1.196 +    __ subss($dst$$XMMRegister, $src$$XMMRegister);
   1.197 +  %}
   1.198 +  ins_pipe(pipe_slow);
   1.199 +%}
   1.200 +
   1.201 +instruct subF_mem(regF dst, memory src) %{
   1.202 +  predicate((UseSSE>=1) && (UseAVX == 0));
   1.203 +  match(Set dst (SubF dst (LoadF src)));
   1.204 +
   1.205 +  format %{ "subss   $dst, $src" %}
   1.206 +  ins_cost(150);
   1.207 +  ins_encode %{
   1.208 +    __ subss($dst$$XMMRegister, $src$$Address);
   1.209 +  %}
   1.210 +  ins_pipe(pipe_slow);
   1.211 +%}
   1.212 +
   1.213 +instruct subF_imm(regF dst, immF con) %{
   1.214 +  predicate((UseSSE>=1) && (UseAVX == 0));
   1.215 +  match(Set dst (SubF dst con));
   1.216 +  format %{ "subss   $dst, [$constantaddress]\t# load from constant table: float=$con" %}
   1.217 +  ins_cost(150);
   1.218 +  ins_encode %{
   1.219 +    __ subss($dst$$XMMRegister, $constantaddress($con));
   1.220 +  %}
   1.221 +  ins_pipe(pipe_slow);
   1.222 +%}
   1.223 +
   1.224 +instruct vsubF_reg(regF dst, regF src1, regF src2) %{
   1.225 +  predicate(UseAVX > 0);
   1.226 +  match(Set dst (SubF src1 src2));
   1.227 +
   1.228 +  format %{ "vsubss  $dst, $src1, $src2" %}
   1.229 +  ins_cost(150);
   1.230 +  ins_encode %{
   1.231 +    __ vsubss($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister);
   1.232 +  %}
   1.233 +  ins_pipe(pipe_slow);
   1.234 +%}
   1.235 +
   1.236 +instruct vsubF_mem(regF dst, regF src1, memory src2) %{
   1.237 +  predicate(UseAVX > 0);
   1.238 +  match(Set dst (SubF src1 (LoadF src2)));
   1.239 +
   1.240 +  format %{ "vsubss  $dst, $src1, $src2" %}
   1.241 +  ins_cost(150);
   1.242 +  ins_encode %{
   1.243 +    __ vsubss($dst$$XMMRegister, $src1$$XMMRegister, $src2$$Address);
   1.244 +  %}
   1.245 +  ins_pipe(pipe_slow);
   1.246 +%}
   1.247 +
   1.248 +instruct vsubF_imm(regF dst, regF src, immF con) %{
   1.249 +  predicate(UseAVX > 0);
   1.250 +  match(Set dst (SubF src con));
   1.251 +
   1.252 +  format %{ "vsubss  $dst, $src, [$constantaddress]\t# load from constant table: float=$con" %}
   1.253 +  ins_cost(150);
   1.254 +  ins_encode %{
   1.255 +    __ vsubss($dst$$XMMRegister, $src$$XMMRegister, $constantaddress($con));
   1.256 +  %}
   1.257 +  ins_pipe(pipe_slow);
   1.258 +%}
   1.259 +
   1.260 +instruct subD_reg(regD dst, regD src) %{
   1.261 +  predicate((UseSSE>=2) && (UseAVX == 0));
   1.262 +  match(Set dst (SubD dst src));
   1.263 +
   1.264 +  format %{ "subsd   $dst, $src" %}
   1.265 +  ins_cost(150);
   1.266 +  ins_encode %{
   1.267 +    __ subsd($dst$$XMMRegister, $src$$XMMRegister);
   1.268 +  %}
   1.269 +  ins_pipe(pipe_slow);
   1.270 +%}
   1.271 +
   1.272 +instruct subD_mem(regD dst, memory src) %{
   1.273 +  predicate((UseSSE>=2) && (UseAVX == 0));
   1.274 +  match(Set dst (SubD dst (LoadD src)));
   1.275 +
   1.276 +  format %{ "subsd   $dst, $src" %}
   1.277 +  ins_cost(150);
   1.278 +  ins_encode %{
   1.279 +    __ subsd($dst$$XMMRegister, $src$$Address);
   1.280 +  %}
   1.281 +  ins_pipe(pipe_slow);
   1.282 +%}
   1.283 +
   1.284 +instruct subD_imm(regD dst, immD con) %{
   1.285 +  predicate((UseSSE>=2) && (UseAVX == 0));
   1.286 +  match(Set dst (SubD dst con));
   1.287 +  format %{ "subsd   $dst, [$constantaddress]\t# load from constant table: double=$con" %}
   1.288 +  ins_cost(150);
   1.289 +  ins_encode %{
   1.290 +    __ subsd($dst$$XMMRegister, $constantaddress($con));
   1.291 +  %}
   1.292 +  ins_pipe(pipe_slow);
   1.293 +%}
   1.294 +
   1.295 +instruct vsubD_reg(regD dst, regD src1, regD src2) %{
   1.296 +  predicate(UseAVX > 0);
   1.297 +  match(Set dst (SubD src1 src2));
   1.298 +
   1.299 +  format %{ "vsubsd  $dst, $src1, $src2" %}
   1.300 +  ins_cost(150);
   1.301 +  ins_encode %{
   1.302 +    __ vsubsd($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister);
   1.303 +  %}
   1.304 +  ins_pipe(pipe_slow);
   1.305 +%}
   1.306 +
   1.307 +instruct vsubD_mem(regD dst, regD src1, memory src2) %{
   1.308 +  predicate(UseAVX > 0);
   1.309 +  match(Set dst (SubD src1 (LoadD src2)));
   1.310 +
   1.311 +  format %{ "vsubsd  $dst, $src1, $src2" %}
   1.312 +  ins_cost(150);
   1.313 +  ins_encode %{
   1.314 +    __ vsubsd($dst$$XMMRegister, $src1$$XMMRegister, $src2$$Address);
   1.315 +  %}
   1.316 +  ins_pipe(pipe_slow);
   1.317 +%}
   1.318 +
   1.319 +instruct vsubD_imm(regD dst, regD src, immD con) %{
   1.320 +  predicate(UseAVX > 0);
   1.321 +  match(Set dst (SubD src con));
   1.322 +
   1.323 +  format %{ "vsubsd  $dst, $src, [$constantaddress]\t# load from constant table: double=$con" %}
   1.324 +  ins_cost(150);
   1.325 +  ins_encode %{
   1.326 +    __ vsubsd($dst$$XMMRegister, $src$$XMMRegister, $constantaddress($con));
   1.327 +  %}
   1.328 +  ins_pipe(pipe_slow);
   1.329 +%}
   1.330 +
   1.331 +instruct mulF_reg(regF dst, regF src) %{
   1.332 +  predicate((UseSSE>=1) && (UseAVX == 0));
   1.333 +  match(Set dst (MulF dst src));
   1.334 +
   1.335 +  format %{ "mulss   $dst, $src" %}
   1.336 +  ins_cost(150);
   1.337 +  ins_encode %{
   1.338 +    __ mulss($dst$$XMMRegister, $src$$XMMRegister);
   1.339 +  %}
   1.340 +  ins_pipe(pipe_slow);
   1.341 +%}
   1.342 +
   1.343 +instruct mulF_mem(regF dst, memory src) %{
   1.344 +  predicate((UseSSE>=1) && (UseAVX == 0));
   1.345 +  match(Set dst (MulF dst (LoadF src)));
   1.346 +
   1.347 +  format %{ "mulss   $dst, $src" %}
   1.348 +  ins_cost(150);
   1.349 +  ins_encode %{
   1.350 +    __ mulss($dst$$XMMRegister, $src$$Address);
   1.351 +  %}
   1.352 +  ins_pipe(pipe_slow);
   1.353 +%}
   1.354 +
   1.355 +instruct mulF_imm(regF dst, immF con) %{
   1.356 +  predicate((UseSSE>=1) && (UseAVX == 0));
   1.357 +  match(Set dst (MulF dst con));
   1.358 +  format %{ "mulss   $dst, [$constantaddress]\t# load from constant table: float=$con" %}
   1.359 +  ins_cost(150);
   1.360 +  ins_encode %{
   1.361 +    __ mulss($dst$$XMMRegister, $constantaddress($con));
   1.362 +  %}
   1.363 +  ins_pipe(pipe_slow);
   1.364 +%}
   1.365 +
   1.366 +instruct vmulF_reg(regF dst, regF src1, regF src2) %{
   1.367 +  predicate(UseAVX > 0);
   1.368 +  match(Set dst (MulF src1 src2));
   1.369 +
   1.370 +  format %{ "vmulss  $dst, $src1, $src2" %}
   1.371 +  ins_cost(150);
   1.372 +  ins_encode %{
   1.373 +    __ vmulss($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister);
   1.374 +  %}
   1.375 +  ins_pipe(pipe_slow);
   1.376 +%}
   1.377 +
   1.378 +instruct vmulF_mem(regF dst, regF src1, memory src2) %{
   1.379 +  predicate(UseAVX > 0);
   1.380 +  match(Set dst (MulF src1 (LoadF src2)));
   1.381 +
   1.382 +  format %{ "vmulss  $dst, $src1, $src2" %}
   1.383 +  ins_cost(150);
   1.384 +  ins_encode %{
   1.385 +    __ vmulss($dst$$XMMRegister, $src1$$XMMRegister, $src2$$Address);
   1.386 +  %}
   1.387 +  ins_pipe(pipe_slow);
   1.388 +%}
   1.389 +
   1.390 +instruct vmulF_imm(regF dst, regF src, immF con) %{
   1.391 +  predicate(UseAVX > 0);
   1.392 +  match(Set dst (MulF src con));
   1.393 +
   1.394 +  format %{ "vmulss  $dst, $src, [$constantaddress]\t# load from constant table: float=$con" %}
   1.395 +  ins_cost(150);
   1.396 +  ins_encode %{
   1.397 +    __ vmulss($dst$$XMMRegister, $src$$XMMRegister, $constantaddress($con));
   1.398 +  %}
   1.399 +  ins_pipe(pipe_slow);
   1.400 +%}
   1.401 +
   1.402 +instruct mulD_reg(regD dst, regD src) %{
   1.403 +  predicate((UseSSE>=2) && (UseAVX == 0));
   1.404 +  match(Set dst (MulD dst src));
   1.405 +
   1.406 +  format %{ "mulsd   $dst, $src" %}
   1.407 +  ins_cost(150);
   1.408 +  ins_encode %{
   1.409 +    __ mulsd($dst$$XMMRegister, $src$$XMMRegister);
   1.410 +  %}
   1.411 +  ins_pipe(pipe_slow);
   1.412 +%}
   1.413 +
   1.414 +instruct mulD_mem(regD dst, memory src) %{
   1.415 +  predicate((UseSSE>=2) && (UseAVX == 0));
   1.416 +  match(Set dst (MulD dst (LoadD src)));
   1.417 +
   1.418 +  format %{ "mulsd   $dst, $src" %}
   1.419 +  ins_cost(150);
   1.420 +  ins_encode %{
   1.421 +    __ mulsd($dst$$XMMRegister, $src$$Address);
   1.422 +  %}
   1.423 +  ins_pipe(pipe_slow);
   1.424 +%}
   1.425 +
   1.426 +instruct mulD_imm(regD dst, immD con) %{
   1.427 +  predicate((UseSSE>=2) && (UseAVX == 0));
   1.428 +  match(Set dst (MulD dst con));
   1.429 +  format %{ "mulsd   $dst, [$constantaddress]\t# load from constant table: double=$con" %}
   1.430 +  ins_cost(150);
   1.431 +  ins_encode %{
   1.432 +    __ mulsd($dst$$XMMRegister, $constantaddress($con));
   1.433 +  %}
   1.434 +  ins_pipe(pipe_slow);
   1.435 +%}
   1.436 +
   1.437 +instruct vmulD_reg(regD dst, regD src1, regD src2) %{
   1.438 +  predicate(UseAVX > 0);
   1.439 +  match(Set dst (MulD src1 src2));
   1.440 +
   1.441 +  format %{ "vmulsd  $dst, $src1, $src2" %}
   1.442 +  ins_cost(150);
   1.443 +  ins_encode %{
   1.444 +    __ vmulsd($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister);
   1.445 +  %}
   1.446 +  ins_pipe(pipe_slow);
   1.447 +%}
   1.448 +
   1.449 +instruct vmulD_mem(regD dst, regD src1, memory src2) %{
   1.450 +  predicate(UseAVX > 0);
   1.451 +  match(Set dst (MulD src1 (LoadD src2)));
   1.452 +
   1.453 +  format %{ "vmulsd  $dst, $src1, $src2" %}
   1.454 +  ins_cost(150);
   1.455 +  ins_encode %{
   1.456 +    __ vmulsd($dst$$XMMRegister, $src1$$XMMRegister, $src2$$Address);
   1.457 +  %}
   1.458 +  ins_pipe(pipe_slow);
   1.459 +%}
   1.460 +
   1.461 +instruct vmulD_imm(regD dst, regD src, immD con) %{
   1.462 +  predicate(UseAVX > 0);
   1.463 +  match(Set dst (MulD src con));
   1.464 +
   1.465 +  format %{ "vmulsd  $dst, $src, [$constantaddress]\t# load from constant table: double=$con" %}
   1.466 +  ins_cost(150);
   1.467 +  ins_encode %{
   1.468 +    __ vmulsd($dst$$XMMRegister, $src$$XMMRegister, $constantaddress($con));
   1.469 +  %}
   1.470 +  ins_pipe(pipe_slow);
   1.471 +%}
   1.472 +
   1.473 +instruct divF_reg(regF dst, regF src) %{
   1.474 +  predicate((UseSSE>=1) && (UseAVX == 0));
   1.475 +  match(Set dst (DivF dst src));
   1.476 +
   1.477 +  format %{ "divss   $dst, $src" %}
   1.478 +  ins_cost(150);
   1.479 +  ins_encode %{
   1.480 +    __ divss($dst$$XMMRegister, $src$$XMMRegister);
   1.481 +  %}
   1.482 +  ins_pipe(pipe_slow);
   1.483 +%}
   1.484 +
   1.485 +instruct divF_mem(regF dst, memory src) %{
   1.486 +  predicate((UseSSE>=1) && (UseAVX == 0));
   1.487 +  match(Set dst (DivF dst (LoadF src)));
   1.488 +
   1.489 +  format %{ "divss   $dst, $src" %}
   1.490 +  ins_cost(150);
   1.491 +  ins_encode %{
   1.492 +    __ divss($dst$$XMMRegister, $src$$Address);
   1.493 +  %}
   1.494 +  ins_pipe(pipe_slow);
   1.495 +%}
   1.496 +
   1.497 +instruct divF_imm(regF dst, immF con) %{
   1.498 +  predicate((UseSSE>=1) && (UseAVX == 0));
   1.499 +  match(Set dst (DivF dst con));
   1.500 +  format %{ "divss   $dst, [$constantaddress]\t# load from constant table: float=$con" %}
   1.501 +  ins_cost(150);
   1.502 +  ins_encode %{
   1.503 +    __ divss($dst$$XMMRegister, $constantaddress($con));
   1.504 +  %}
   1.505 +  ins_pipe(pipe_slow);
   1.506 +%}
   1.507 +
   1.508 +instruct vdivF_reg(regF dst, regF src1, regF src2) %{
   1.509 +  predicate(UseAVX > 0);
   1.510 +  match(Set dst (DivF src1 src2));
   1.511 +
   1.512 +  format %{ "vdivss  $dst, $src1, $src2" %}
   1.513 +  ins_cost(150);
   1.514 +  ins_encode %{
   1.515 +    __ vdivss($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister);
   1.516 +  %}
   1.517 +  ins_pipe(pipe_slow);
   1.518 +%}
   1.519 +
   1.520 +instruct vdivF_mem(regF dst, regF src1, memory src2) %{
   1.521 +  predicate(UseAVX > 0);
   1.522 +  match(Set dst (DivF src1 (LoadF src2)));
   1.523 +
   1.524 +  format %{ "vdivss  $dst, $src1, $src2" %}
   1.525 +  ins_cost(150);
   1.526 +  ins_encode %{
   1.527 +    __ vdivss($dst$$XMMRegister, $src1$$XMMRegister, $src2$$Address);
   1.528 +  %}
   1.529 +  ins_pipe(pipe_slow);
   1.530 +%}
   1.531 +
   1.532 +instruct vdivF_imm(regF dst, regF src, immF con) %{
   1.533 +  predicate(UseAVX > 0);
   1.534 +  match(Set dst (DivF src con));
   1.535 +
   1.536 +  format %{ "vdivss  $dst, $src, [$constantaddress]\t# load from constant table: float=$con" %}
   1.537 +  ins_cost(150);
   1.538 +  ins_encode %{
   1.539 +    __ vdivss($dst$$XMMRegister, $src$$XMMRegister, $constantaddress($con));
   1.540 +  %}
   1.541 +  ins_pipe(pipe_slow);
   1.542 +%}
   1.543 +
   1.544 +instruct divD_reg(regD dst, regD src) %{
   1.545 +  predicate((UseSSE>=2) && (UseAVX == 0));
   1.546 +  match(Set dst (DivD dst src));
   1.547 +
   1.548 +  format %{ "divsd   $dst, $src" %}
   1.549 +  ins_cost(150);
   1.550 +  ins_encode %{
   1.551 +    __ divsd($dst$$XMMRegister, $src$$XMMRegister);
   1.552 +  %}
   1.553 +  ins_pipe(pipe_slow);
   1.554 +%}
   1.555 +
   1.556 +instruct divD_mem(regD dst, memory src) %{
   1.557 +  predicate((UseSSE>=2) && (UseAVX == 0));
   1.558 +  match(Set dst (DivD dst (LoadD src)));
   1.559 +
   1.560 +  format %{ "divsd   $dst, $src" %}
   1.561 +  ins_cost(150);
   1.562 +  ins_encode %{
   1.563 +    __ divsd($dst$$XMMRegister, $src$$Address);
   1.564 +  %}
   1.565 +  ins_pipe(pipe_slow);
   1.566 +%}
   1.567 +
   1.568 +instruct divD_imm(regD dst, immD con) %{
   1.569 +  predicate((UseSSE>=2) && (UseAVX == 0));
   1.570 +  match(Set dst (DivD dst con));
   1.571 +  format %{ "divsd   $dst, [$constantaddress]\t# load from constant table: double=$con" %}
   1.572 +  ins_cost(150);
   1.573 +  ins_encode %{
   1.574 +    __ divsd($dst$$XMMRegister, $constantaddress($con));
   1.575 +  %}
   1.576 +  ins_pipe(pipe_slow);
   1.577 +%}
   1.578 +
   1.579 +instruct vdivD_reg(regD dst, regD src1, regD src2) %{
   1.580 +  predicate(UseAVX > 0);
   1.581 +  match(Set dst (DivD src1 src2));
   1.582 +
   1.583 +  format %{ "vdivsd  $dst, $src1, $src2" %}
   1.584 +  ins_cost(150);
   1.585 +  ins_encode %{
   1.586 +    __ vdivsd($dst$$XMMRegister, $src1$$XMMRegister, $src2$$XMMRegister);
   1.587 +  %}
   1.588 +  ins_pipe(pipe_slow);
   1.589 +%}
   1.590 +
   1.591 +instruct vdivD_mem(regD dst, regD src1, memory src2) %{
   1.592 +  predicate(UseAVX > 0);
   1.593 +  match(Set dst (DivD src1 (LoadD src2)));
   1.594 +
   1.595 +  format %{ "vdivsd  $dst, $src1, $src2" %}
   1.596 +  ins_cost(150);
   1.597 +  ins_encode %{
   1.598 +    __ vdivsd($dst$$XMMRegister, $src1$$XMMRegister, $src2$$Address);
   1.599 +  %}
   1.600 +  ins_pipe(pipe_slow);
   1.601 +%}
   1.602 +
   1.603 +instruct vdivD_imm(regD dst, regD src, immD con) %{
   1.604 +  predicate(UseAVX > 0);
   1.605 +  match(Set dst (DivD src con));
   1.606 +
   1.607 +  format %{ "vdivsd  $dst, $src, [$constantaddress]\t# load from constant table: double=$con" %}
   1.608 +  ins_cost(150);
   1.609 +  ins_encode %{
   1.610 +    __ vdivsd($dst$$XMMRegister, $src$$XMMRegister, $constantaddress($con));
   1.611 +  %}
   1.612 +  ins_pipe(pipe_slow);
   1.613 +%}
   1.614 +
   1.615 +instruct absF_reg(regF dst) %{
   1.616 +  predicate((UseSSE>=1) && (UseAVX == 0));
   1.617 +  match(Set dst (AbsF dst));
   1.618 +  ins_cost(150);
   1.619 +  format %{ "andps   $dst, [0x7fffffff]\t# abs float by sign masking" %}
   1.620 +  ins_encode %{
   1.621 +    __ andps($dst$$XMMRegister, ExternalAddress(float_signmask()));
   1.622 +  %}
   1.623 +  ins_pipe(pipe_slow);
   1.624 +%}
   1.625 +
   1.626 +instruct vabsF_reg(regF dst, regF src) %{
   1.627 +  predicate(UseAVX > 0);
   1.628 +  match(Set dst (AbsF src));
   1.629 +  ins_cost(150);
   1.630 +  format %{ "vandps  $dst, $src, [0x7fffffff]\t# abs float by sign masking" %}
   1.631 +  ins_encode %{
   1.632 +    __ vandps($dst$$XMMRegister, $src$$XMMRegister,
   1.633 +              ExternalAddress(float_signmask()));
   1.634 +  %}
   1.635 +  ins_pipe(pipe_slow);
   1.636 +%}
   1.637 +
   1.638 +instruct absD_reg(regD dst) %{
   1.639 +  predicate((UseSSE>=2) && (UseAVX == 0));
   1.640 +  match(Set dst (AbsD dst));
   1.641 +  ins_cost(150);
   1.642 +  format %{ "andpd   $dst, [0x7fffffffffffffff]\t"
   1.643 +            "# abs double by sign masking" %}
   1.644 +  ins_encode %{
   1.645 +    __ andpd($dst$$XMMRegister, ExternalAddress(double_signmask()));
   1.646 +  %}
   1.647 +  ins_pipe(pipe_slow);
   1.648 +%}
   1.649 +
   1.650 +instruct vabsD_reg(regD dst, regD src) %{
   1.651 +  predicate(UseAVX > 0);
   1.652 +  match(Set dst (AbsD src));
   1.653 +  ins_cost(150);
   1.654 +  format %{ "vandpd  $dst, $src, [0x7fffffffffffffff]\t"
   1.655 +            "# abs double by sign masking" %}
   1.656 +  ins_encode %{
   1.657 +    __ vandpd($dst$$XMMRegister, $src$$XMMRegister,
   1.658 +              ExternalAddress(double_signmask()));
   1.659 +  %}
   1.660 +  ins_pipe(pipe_slow);
   1.661 +%}
   1.662 +
   1.663 +instruct negF_reg(regF dst) %{
   1.664 +  predicate((UseSSE>=1) && (UseAVX == 0));
   1.665 +  match(Set dst (NegF dst));
   1.666 +  ins_cost(150);
   1.667 +  format %{ "xorps   $dst, [0x80000000]\t# neg float by sign flipping" %}
   1.668 +  ins_encode %{
   1.669 +    __ xorps($dst$$XMMRegister, ExternalAddress(float_signflip()));
   1.670 +  %}
   1.671 +  ins_pipe(pipe_slow);
   1.672 +%}
   1.673 +
   1.674 +instruct vnegF_reg(regF dst, regF src) %{
   1.675 +  predicate(UseAVX > 0);
   1.676 +  match(Set dst (NegF src));
   1.677 +  ins_cost(150);
   1.678 +  format %{ "vxorps  $dst, $src, [0x80000000]\t# neg float by sign flipping" %}
   1.679 +  ins_encode %{
   1.680 +    __ vxorps($dst$$XMMRegister, $src$$XMMRegister,
   1.681 +              ExternalAddress(float_signflip()));
   1.682 +  %}
   1.683 +  ins_pipe(pipe_slow);
   1.684 +%}
   1.685 +
   1.686 +instruct negD_reg(regD dst) %{
   1.687 +  predicate((UseSSE>=2) && (UseAVX == 0));
   1.688 +  match(Set dst (NegD dst));
   1.689 +  ins_cost(150);
   1.690 +  format %{ "xorpd   $dst, [0x8000000000000000]\t"
   1.691 +            "# neg double by sign flipping" %}
   1.692 +  ins_encode %{
   1.693 +    __ xorpd($dst$$XMMRegister, ExternalAddress(double_signflip()));
   1.694 +  %}
   1.695 +  ins_pipe(pipe_slow);
   1.696 +%}
   1.697 +
   1.698 +instruct vnegD_reg(regD dst, regD src) %{
   1.699 +  predicate(UseAVX > 0);
   1.700 +  match(Set dst (NegD src));
   1.701 +  ins_cost(150);
   1.702 +  format %{ "vxorpd  $dst, $src, [0x8000000000000000]\t"
   1.703 +            "# neg double by sign flipping" %}
   1.704 +  ins_encode %{
   1.705 +    __ vxorpd($dst$$XMMRegister, $src$$XMMRegister,
   1.706 +              ExternalAddress(double_signflip()));
   1.707 +  %}
   1.708 +  ins_pipe(pipe_slow);
   1.709 +%}
   1.710 +
   1.711 +instruct sqrtF_reg(regF dst, regF src) %{
   1.712 +  predicate(UseSSE>=1);
   1.713 +  match(Set dst (ConvD2F (SqrtD (ConvF2D src))));
   1.714 +
   1.715 +  format %{ "sqrtss  $dst, $src" %}
   1.716 +  ins_cost(150);
   1.717 +  ins_encode %{
   1.718 +    __ sqrtss($dst$$XMMRegister, $src$$XMMRegister);
   1.719 +  %}
   1.720 +  ins_pipe(pipe_slow);
   1.721 +%}
   1.722 +
   1.723 +instruct sqrtF_mem(regF dst, memory src) %{
   1.724 +  predicate(UseSSE>=1);
   1.725 +  match(Set dst (ConvD2F (SqrtD (ConvF2D (LoadF src)))));
   1.726 +
   1.727 +  format %{ "sqrtss  $dst, $src" %}
   1.728 +  ins_cost(150);
   1.729 +  ins_encode %{
   1.730 +    __ sqrtss($dst$$XMMRegister, $src$$Address);
   1.731 +  %}
   1.732 +  ins_pipe(pipe_slow);
   1.733 +%}
   1.734 +
   1.735 +instruct sqrtF_imm(regF dst, immF con) %{
   1.736 +  predicate(UseSSE>=1);
   1.737 +  match(Set dst (ConvD2F (SqrtD (ConvF2D con))));
   1.738 +  format %{ "sqrtss  $dst, [$constantaddress]\t# load from constant table: float=$con" %}
   1.739 +  ins_cost(150);
   1.740 +  ins_encode %{
   1.741 +    __ sqrtss($dst$$XMMRegister, $constantaddress($con));
   1.742 +  %}
   1.743 +  ins_pipe(pipe_slow);
   1.744 +%}
   1.745 +
   1.746 +instruct sqrtD_reg(regD dst, regD src) %{
   1.747 +  predicate(UseSSE>=2);
   1.748 +  match(Set dst (SqrtD src));
   1.749 +
   1.750 +  format %{ "sqrtsd  $dst, $src" %}
   1.751 +  ins_cost(150);
   1.752 +  ins_encode %{
   1.753 +    __ sqrtsd($dst$$XMMRegister, $src$$XMMRegister);
   1.754 +  %}
   1.755 +  ins_pipe(pipe_slow);
   1.756 +%}
   1.757 +
   1.758 +instruct sqrtD_mem(regD dst, memory src) %{
   1.759 +  predicate(UseSSE>=2);
   1.760 +  match(Set dst (SqrtD (LoadD src)));
   1.761 +
   1.762 +  format %{ "sqrtsd  $dst, $src" %}
   1.763 +  ins_cost(150);
   1.764 +  ins_encode %{
   1.765 +    __ sqrtsd($dst$$XMMRegister, $src$$Address);
   1.766 +  %}
   1.767 +  ins_pipe(pipe_slow);
   1.768 +%}
   1.769 +
   1.770 +instruct sqrtD_imm(regD dst, immD con) %{
   1.771 +  predicate(UseSSE>=2);
   1.772 +  match(Set dst (SqrtD con));
   1.773 +  format %{ "sqrtsd  $dst, [$constantaddress]\t# load from constant table: double=$con" %}
   1.774 +  ins_cost(150);
   1.775 +  ins_encode %{
   1.776 +    __ sqrtsd($dst$$XMMRegister, $constantaddress($con));
   1.777 +  %}
   1.778 +  ins_pipe(pipe_slow);
   1.779 +%}
   1.780 +

mercurial