Wed, 18 Sep 2013 14:34:56 -0700
8024342: PPC64 (part 111): Support for C calling conventions that require 64-bit ints.
Summary: Some platforms, as ppc and s390x/zArch require that 32-bit ints are passed as 64-bit values to C functions. This change adds support to adapt the signature and to issue proper casts to c2-compiled stubs. The functions are used in generate_native_wrapper(). Adapt signature used by the compiler as in PhaseIdealLoop::intrinsify_fill().
Reviewed-by: kvn
duke@435 | 1 | /* |
coleenp@4037 | 2 | * Copyright (c) 1998, 2012, Oracle and/or its affiliates. All rights reserved. |
duke@435 | 3 | * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. |
duke@435 | 4 | * |
duke@435 | 5 | * This code is free software; you can redistribute it and/or modify it |
duke@435 | 6 | * under the terms of the GNU General Public License version 2 only, as |
duke@435 | 7 | * published by the Free Software Foundation. |
duke@435 | 8 | * |
duke@435 | 9 | * This code is distributed in the hope that it will be useful, but WITHOUT |
duke@435 | 10 | * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or |
duke@435 | 11 | * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License |
duke@435 | 12 | * version 2 for more details (a copy is included in the LICENSE file that |
duke@435 | 13 | * accompanied this code). |
duke@435 | 14 | * |
duke@435 | 15 | * You should have received a copy of the GNU General Public License version |
duke@435 | 16 | * 2 along with this work; if not, write to the Free Software Foundation, |
duke@435 | 17 | * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA. |
duke@435 | 18 | * |
trims@1907 | 19 | * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA |
trims@1907 | 20 | * or visit www.oracle.com if you need additional information or have any |
trims@1907 | 21 | * questions. |
duke@435 | 22 | * |
duke@435 | 23 | */ |
duke@435 | 24 | |
stefank@2314 | 25 | #include "precompiled.hpp" |
stefank@2314 | 26 | #include "ci/ciMethodData.hpp" |
stefank@2314 | 27 | #include "classfile/systemDictionary.hpp" |
stefank@2314 | 28 | #include "classfile/vmSymbols.hpp" |
stefank@2314 | 29 | #include "compiler/compileLog.hpp" |
stefank@2314 | 30 | #include "interpreter/linkResolver.hpp" |
stefank@2314 | 31 | #include "memory/universe.inline.hpp" |
stefank@2314 | 32 | #include "opto/addnode.hpp" |
stefank@2314 | 33 | #include "opto/divnode.hpp" |
stefank@2314 | 34 | #include "opto/idealGraphPrinter.hpp" |
stefank@2314 | 35 | #include "opto/matcher.hpp" |
stefank@2314 | 36 | #include "opto/memnode.hpp" |
stefank@2314 | 37 | #include "opto/mulnode.hpp" |
stefank@2314 | 38 | #include "opto/parse.hpp" |
stefank@2314 | 39 | #include "opto/runtime.hpp" |
stefank@2314 | 40 | #include "runtime/deoptimization.hpp" |
stefank@2314 | 41 | #include "runtime/sharedRuntime.hpp" |
duke@435 | 42 | |
duke@435 | 43 | extern int explicit_null_checks_inserted, |
duke@435 | 44 | explicit_null_checks_elided; |
duke@435 | 45 | |
duke@435 | 46 | //---------------------------------array_load---------------------------------- |
duke@435 | 47 | void Parse::array_load(BasicType elem_type) { |
duke@435 | 48 | const Type* elem = Type::TOP; |
duke@435 | 49 | Node* adr = array_addressing(elem_type, 0, &elem); |
twisti@1040 | 50 | if (stopped()) return; // guaranteed null or range check |
twisti@4313 | 51 | dec_sp(2); // Pop array and index |
duke@435 | 52 | const TypeAryPtr* adr_type = TypeAryPtr::get_array_body_type(elem_type); |
duke@435 | 53 | Node* ld = make_load(control(), adr, elem, elem_type, adr_type); |
duke@435 | 54 | push(ld); |
duke@435 | 55 | } |
duke@435 | 56 | |
duke@435 | 57 | |
duke@435 | 58 | //--------------------------------array_store---------------------------------- |
duke@435 | 59 | void Parse::array_store(BasicType elem_type) { |
duke@435 | 60 | Node* adr = array_addressing(elem_type, 1); |
twisti@1040 | 61 | if (stopped()) return; // guaranteed null or range check |
duke@435 | 62 | Node* val = pop(); |
twisti@4313 | 63 | dec_sp(2); // Pop array and index |
duke@435 | 64 | const TypeAryPtr* adr_type = TypeAryPtr::get_array_body_type(elem_type); |
duke@435 | 65 | store_to_memory(control(), adr, val, elem_type, adr_type); |
duke@435 | 66 | } |
duke@435 | 67 | |
duke@435 | 68 | |
duke@435 | 69 | //------------------------------array_addressing------------------------------- |
duke@435 | 70 | // Pull array and index from the stack. Compute pointer-to-element. |
duke@435 | 71 | Node* Parse::array_addressing(BasicType type, int vals, const Type* *result2) { |
duke@435 | 72 | Node *idx = peek(0+vals); // Get from stack without popping |
duke@435 | 73 | Node *ary = peek(1+vals); // in case of exception |
duke@435 | 74 | |
duke@435 | 75 | // Null check the array base, with correct stack contents |
twisti@4313 | 76 | ary = null_check(ary, T_ARRAY); |
duke@435 | 77 | // Compile-time detect of null-exception? |
duke@435 | 78 | if (stopped()) return top(); |
duke@435 | 79 | |
duke@435 | 80 | const TypeAryPtr* arytype = _gvn.type(ary)->is_aryptr(); |
duke@435 | 81 | const TypeInt* sizetype = arytype->size(); |
duke@435 | 82 | const Type* elemtype = arytype->elem(); |
duke@435 | 83 | |
duke@435 | 84 | if (UseUniqueSubclasses && result2 != NULL) { |
kvn@656 | 85 | const Type* el = elemtype->make_ptr(); |
kvn@656 | 86 | if (el && el->isa_instptr()) { |
kvn@656 | 87 | const TypeInstPtr* toop = el->is_instptr(); |
duke@435 | 88 | if (toop->klass()->as_instance_klass()->unique_concrete_subklass()) { |
duke@435 | 89 | // If we load from "AbstractClass[]" we must see "ConcreteSubClass". |
duke@435 | 90 | const Type* subklass = Type::get_const_type(toop->klass()); |
coleenp@548 | 91 | elemtype = subklass->join(el); |
duke@435 | 92 | } |
duke@435 | 93 | } |
duke@435 | 94 | } |
duke@435 | 95 | |
duke@435 | 96 | // Check for big class initializers with all constant offsets |
duke@435 | 97 | // feeding into a known-size array. |
duke@435 | 98 | const TypeInt* idxtype = _gvn.type(idx)->is_int(); |
duke@435 | 99 | // See if the highest idx value is less than the lowest array bound, |
duke@435 | 100 | // and if the idx value cannot be negative: |
duke@435 | 101 | bool need_range_check = true; |
duke@435 | 102 | if (idxtype->_hi < sizetype->_lo && idxtype->_lo >= 0) { |
duke@435 | 103 | need_range_check = false; |
duke@435 | 104 | if (C->log() != NULL) C->log()->elem("observe that='!need_range_check'"); |
duke@435 | 105 | } |
duke@435 | 106 | |
bharadwaj@4862 | 107 | ciKlass * arytype_klass = arytype->klass(); |
bharadwaj@4862 | 108 | if ((arytype_klass != NULL) && (!arytype_klass->is_loaded())) { |
duke@435 | 109 | // Only fails for some -Xcomp runs |
duke@435 | 110 | // The class is unloaded. We have to run this bytecode in the interpreter. |
duke@435 | 111 | uncommon_trap(Deoptimization::Reason_unloaded, |
duke@435 | 112 | Deoptimization::Action_reinterpret, |
duke@435 | 113 | arytype->klass(), "!loaded array"); |
duke@435 | 114 | return top(); |
duke@435 | 115 | } |
duke@435 | 116 | |
duke@435 | 117 | // Do the range check |
duke@435 | 118 | if (GenerateRangeChecks && need_range_check) { |
rasbold@564 | 119 | Node* tst; |
rasbold@564 | 120 | if (sizetype->_hi <= 0) { |
rasbold@801 | 121 | // The greatest array bound is negative, so we can conclude that we're |
rasbold@564 | 122 | // compiling unreachable code, but the unsigned compare trick used below |
rasbold@564 | 123 | // only works with non-negative lengths. Instead, hack "tst" to be zero so |
rasbold@564 | 124 | // the uncommon_trap path will always be taken. |
rasbold@564 | 125 | tst = _gvn.intcon(0); |
rasbold@564 | 126 | } else { |
rasbold@801 | 127 | // Range is constant in array-oop, so we can use the original state of mem |
rasbold@801 | 128 | Node* len = load_array_length(ary); |
rasbold@801 | 129 | |
rasbold@564 | 130 | // Test length vs index (standard trick using unsigned compare) |
kvn@4115 | 131 | Node* chk = _gvn.transform( new (C) CmpUNode(idx, len) ); |
rasbold@564 | 132 | BoolTest::mask btest = BoolTest::lt; |
kvn@4115 | 133 | tst = _gvn.transform( new (C) BoolNode(chk, btest) ); |
rasbold@564 | 134 | } |
duke@435 | 135 | // Branch to failure if out of bounds |
duke@435 | 136 | { BuildCutout unless(this, tst, PROB_MAX); |
duke@435 | 137 | if (C->allow_range_check_smearing()) { |
duke@435 | 138 | // Do not use builtin_throw, since range checks are sometimes |
duke@435 | 139 | // made more stringent by an optimistic transformation. |
duke@435 | 140 | // This creates "tentative" range checks at this point, |
duke@435 | 141 | // which are not guaranteed to throw exceptions. |
duke@435 | 142 | // See IfNode::Ideal, is_range_check, adjust_check. |
duke@435 | 143 | uncommon_trap(Deoptimization::Reason_range_check, |
duke@435 | 144 | Deoptimization::Action_make_not_entrant, |
duke@435 | 145 | NULL, "range_check"); |
duke@435 | 146 | } else { |
duke@435 | 147 | // If we have already recompiled with the range-check-widening |
duke@435 | 148 | // heroic optimization turned off, then we must really be throwing |
duke@435 | 149 | // range check exceptions. |
duke@435 | 150 | builtin_throw(Deoptimization::Reason_range_check, idx); |
duke@435 | 151 | } |
duke@435 | 152 | } |
duke@435 | 153 | } |
duke@435 | 154 | // Check for always knowing you are throwing a range-check exception |
duke@435 | 155 | if (stopped()) return top(); |
duke@435 | 156 | |
rasbold@801 | 157 | Node* ptr = array_element_address(ary, idx, type, sizetype); |
duke@435 | 158 | |
duke@435 | 159 | if (result2 != NULL) *result2 = elemtype; |
rasbold@801 | 160 | |
rasbold@801 | 161 | assert(ptr != top(), "top should go hand-in-hand with stopped"); |
rasbold@801 | 162 | |
duke@435 | 163 | return ptr; |
duke@435 | 164 | } |
duke@435 | 165 | |
duke@435 | 166 | |
duke@435 | 167 | // returns IfNode |
duke@435 | 168 | IfNode* Parse::jump_if_fork_int(Node* a, Node* b, BoolTest::mask mask) { |
kvn@4115 | 169 | Node *cmp = _gvn.transform( new (C) CmpINode( a, b)); // two cases: shiftcount > 32 and shiftcount <= 32 |
kvn@4115 | 170 | Node *tst = _gvn.transform( new (C) BoolNode( cmp, mask)); |
duke@435 | 171 | IfNode *iff = create_and_map_if( control(), tst, ((mask == BoolTest::eq) ? PROB_STATIC_INFREQUENT : PROB_FAIR), COUNT_UNKNOWN ); |
duke@435 | 172 | return iff; |
duke@435 | 173 | } |
duke@435 | 174 | |
duke@435 | 175 | // return Region node |
duke@435 | 176 | Node* Parse::jump_if_join(Node* iffalse, Node* iftrue) { |
kvn@4115 | 177 | Node *region = new (C) RegionNode(3); // 2 results |
duke@435 | 178 | record_for_igvn(region); |
duke@435 | 179 | region->init_req(1, iffalse); |
duke@435 | 180 | region->init_req(2, iftrue ); |
duke@435 | 181 | _gvn.set_type(region, Type::CONTROL); |
duke@435 | 182 | region = _gvn.transform(region); |
duke@435 | 183 | set_control (region); |
duke@435 | 184 | return region; |
duke@435 | 185 | } |
duke@435 | 186 | |
duke@435 | 187 | |
duke@435 | 188 | //------------------------------helper for tableswitch------------------------- |
duke@435 | 189 | void Parse::jump_if_true_fork(IfNode *iff, int dest_bci_if_true, int prof_table_index) { |
duke@435 | 190 | // True branch, use existing map info |
duke@435 | 191 | { PreserveJVMState pjvms(this); |
kvn@4115 | 192 | Node *iftrue = _gvn.transform( new (C) IfTrueNode (iff) ); |
duke@435 | 193 | set_control( iftrue ); |
duke@435 | 194 | profile_switch_case(prof_table_index); |
duke@435 | 195 | merge_new_path(dest_bci_if_true); |
duke@435 | 196 | } |
duke@435 | 197 | |
duke@435 | 198 | // False branch |
kvn@4115 | 199 | Node *iffalse = _gvn.transform( new (C) IfFalseNode(iff) ); |
duke@435 | 200 | set_control( iffalse ); |
duke@435 | 201 | } |
duke@435 | 202 | |
duke@435 | 203 | void Parse::jump_if_false_fork(IfNode *iff, int dest_bci_if_true, int prof_table_index) { |
duke@435 | 204 | // True branch, use existing map info |
duke@435 | 205 | { PreserveJVMState pjvms(this); |
kvn@4115 | 206 | Node *iffalse = _gvn.transform( new (C) IfFalseNode (iff) ); |
duke@435 | 207 | set_control( iffalse ); |
duke@435 | 208 | profile_switch_case(prof_table_index); |
duke@435 | 209 | merge_new_path(dest_bci_if_true); |
duke@435 | 210 | } |
duke@435 | 211 | |
duke@435 | 212 | // False branch |
kvn@4115 | 213 | Node *iftrue = _gvn.transform( new (C) IfTrueNode(iff) ); |
duke@435 | 214 | set_control( iftrue ); |
duke@435 | 215 | } |
duke@435 | 216 | |
duke@435 | 217 | void Parse::jump_if_always_fork(int dest_bci, int prof_table_index) { |
duke@435 | 218 | // False branch, use existing map and control() |
duke@435 | 219 | profile_switch_case(prof_table_index); |
duke@435 | 220 | merge_new_path(dest_bci); |
duke@435 | 221 | } |
duke@435 | 222 | |
duke@435 | 223 | |
duke@435 | 224 | extern "C" { |
duke@435 | 225 | static int jint_cmp(const void *i, const void *j) { |
duke@435 | 226 | int a = *(jint *)i; |
duke@435 | 227 | int b = *(jint *)j; |
duke@435 | 228 | return a > b ? 1 : a < b ? -1 : 0; |
duke@435 | 229 | } |
duke@435 | 230 | } |
duke@435 | 231 | |
duke@435 | 232 | |
duke@435 | 233 | // Default value for methodData switch indexing. Must be a negative value to avoid |
duke@435 | 234 | // conflict with any legal switch index. |
duke@435 | 235 | #define NullTableIndex -1 |
duke@435 | 236 | |
duke@435 | 237 | class SwitchRange : public StackObj { |
duke@435 | 238 | // a range of integers coupled with a bci destination |
duke@435 | 239 | jint _lo; // inclusive lower limit |
duke@435 | 240 | jint _hi; // inclusive upper limit |
duke@435 | 241 | int _dest; |
duke@435 | 242 | int _table_index; // index into method data table |
duke@435 | 243 | |
duke@435 | 244 | public: |
duke@435 | 245 | jint lo() const { return _lo; } |
duke@435 | 246 | jint hi() const { return _hi; } |
duke@435 | 247 | int dest() const { return _dest; } |
duke@435 | 248 | int table_index() const { return _table_index; } |
duke@435 | 249 | bool is_singleton() const { return _lo == _hi; } |
duke@435 | 250 | |
duke@435 | 251 | void setRange(jint lo, jint hi, int dest, int table_index) { |
duke@435 | 252 | assert(lo <= hi, "must be a non-empty range"); |
duke@435 | 253 | _lo = lo, _hi = hi; _dest = dest; _table_index = table_index; |
duke@435 | 254 | } |
duke@435 | 255 | bool adjoinRange(jint lo, jint hi, int dest, int table_index) { |
duke@435 | 256 | assert(lo <= hi, "must be a non-empty range"); |
duke@435 | 257 | if (lo == _hi+1 && dest == _dest && table_index == _table_index) { |
duke@435 | 258 | _hi = hi; |
duke@435 | 259 | return true; |
duke@435 | 260 | } |
duke@435 | 261 | return false; |
duke@435 | 262 | } |
duke@435 | 263 | |
duke@435 | 264 | void set (jint value, int dest, int table_index) { |
duke@435 | 265 | setRange(value, value, dest, table_index); |
duke@435 | 266 | } |
duke@435 | 267 | bool adjoin(jint value, int dest, int table_index) { |
duke@435 | 268 | return adjoinRange(value, value, dest, table_index); |
duke@435 | 269 | } |
duke@435 | 270 | |
duke@435 | 271 | void print(ciEnv* env) { |
duke@435 | 272 | if (is_singleton()) |
duke@435 | 273 | tty->print(" {%d}=>%d", lo(), dest()); |
duke@435 | 274 | else if (lo() == min_jint) |
duke@435 | 275 | tty->print(" {..%d}=>%d", hi(), dest()); |
duke@435 | 276 | else if (hi() == max_jint) |
duke@435 | 277 | tty->print(" {%d..}=>%d", lo(), dest()); |
duke@435 | 278 | else |
duke@435 | 279 | tty->print(" {%d..%d}=>%d", lo(), hi(), dest()); |
duke@435 | 280 | } |
duke@435 | 281 | }; |
duke@435 | 282 | |
duke@435 | 283 | |
duke@435 | 284 | //-------------------------------do_tableswitch-------------------------------- |
duke@435 | 285 | void Parse::do_tableswitch() { |
duke@435 | 286 | Node* lookup = pop(); |
duke@435 | 287 | |
duke@435 | 288 | // Get information about tableswitch |
duke@435 | 289 | int default_dest = iter().get_dest_table(0); |
duke@435 | 290 | int lo_index = iter().get_int_table(1); |
duke@435 | 291 | int hi_index = iter().get_int_table(2); |
duke@435 | 292 | int len = hi_index - lo_index + 1; |
duke@435 | 293 | |
duke@435 | 294 | if (len < 1) { |
duke@435 | 295 | // If this is a backward branch, add safepoint |
duke@435 | 296 | maybe_add_safepoint(default_dest); |
duke@435 | 297 | merge(default_dest); |
duke@435 | 298 | return; |
duke@435 | 299 | } |
duke@435 | 300 | |
duke@435 | 301 | // generate decision tree, using trichotomy when possible |
duke@435 | 302 | int rnum = len+2; |
duke@435 | 303 | bool makes_backward_branch = false; |
duke@435 | 304 | SwitchRange* ranges = NEW_RESOURCE_ARRAY(SwitchRange, rnum); |
duke@435 | 305 | int rp = -1; |
duke@435 | 306 | if (lo_index != min_jint) { |
duke@435 | 307 | ranges[++rp].setRange(min_jint, lo_index-1, default_dest, NullTableIndex); |
duke@435 | 308 | } |
duke@435 | 309 | for (int j = 0; j < len; j++) { |
duke@435 | 310 | jint match_int = lo_index+j; |
duke@435 | 311 | int dest = iter().get_dest_table(j+3); |
duke@435 | 312 | makes_backward_branch |= (dest <= bci()); |
duke@435 | 313 | int table_index = method_data_update() ? j : NullTableIndex; |
duke@435 | 314 | if (rp < 0 || !ranges[rp].adjoin(match_int, dest, table_index)) { |
duke@435 | 315 | ranges[++rp].set(match_int, dest, table_index); |
duke@435 | 316 | } |
duke@435 | 317 | } |
duke@435 | 318 | jint highest = lo_index+(len-1); |
duke@435 | 319 | assert(ranges[rp].hi() == highest, ""); |
duke@435 | 320 | if (highest != max_jint |
duke@435 | 321 | && !ranges[rp].adjoinRange(highest+1, max_jint, default_dest, NullTableIndex)) { |
duke@435 | 322 | ranges[++rp].setRange(highest+1, max_jint, default_dest, NullTableIndex); |
duke@435 | 323 | } |
duke@435 | 324 | assert(rp < len+2, "not too many ranges"); |
duke@435 | 325 | |
duke@435 | 326 | // Safepoint in case if backward branch observed |
duke@435 | 327 | if( makes_backward_branch && UseLoopSafepoints ) |
duke@435 | 328 | add_safepoint(); |
duke@435 | 329 | |
duke@435 | 330 | jump_switch_ranges(lookup, &ranges[0], &ranges[rp]); |
duke@435 | 331 | } |
duke@435 | 332 | |
duke@435 | 333 | |
duke@435 | 334 | //------------------------------do_lookupswitch-------------------------------- |
duke@435 | 335 | void Parse::do_lookupswitch() { |
duke@435 | 336 | Node *lookup = pop(); // lookup value |
duke@435 | 337 | // Get information about lookupswitch |
duke@435 | 338 | int default_dest = iter().get_dest_table(0); |
duke@435 | 339 | int len = iter().get_int_table(1); |
duke@435 | 340 | |
duke@435 | 341 | if (len < 1) { // If this is a backward branch, add safepoint |
duke@435 | 342 | maybe_add_safepoint(default_dest); |
duke@435 | 343 | merge(default_dest); |
duke@435 | 344 | return; |
duke@435 | 345 | } |
duke@435 | 346 | |
duke@435 | 347 | // generate decision tree, using trichotomy when possible |
duke@435 | 348 | jint* table = NEW_RESOURCE_ARRAY(jint, len*2); |
duke@435 | 349 | { |
duke@435 | 350 | for( int j = 0; j < len; j++ ) { |
duke@435 | 351 | table[j+j+0] = iter().get_int_table(2+j+j); |
duke@435 | 352 | table[j+j+1] = iter().get_dest_table(2+j+j+1); |
duke@435 | 353 | } |
duke@435 | 354 | qsort( table, len, 2*sizeof(table[0]), jint_cmp ); |
duke@435 | 355 | } |
duke@435 | 356 | |
duke@435 | 357 | int rnum = len*2+1; |
duke@435 | 358 | bool makes_backward_branch = false; |
duke@435 | 359 | SwitchRange* ranges = NEW_RESOURCE_ARRAY(SwitchRange, rnum); |
duke@435 | 360 | int rp = -1; |
duke@435 | 361 | for( int j = 0; j < len; j++ ) { |
duke@435 | 362 | jint match_int = table[j+j+0]; |
duke@435 | 363 | int dest = table[j+j+1]; |
duke@435 | 364 | int next_lo = rp < 0 ? min_jint : ranges[rp].hi()+1; |
duke@435 | 365 | int table_index = method_data_update() ? j : NullTableIndex; |
duke@435 | 366 | makes_backward_branch |= (dest <= bci()); |
duke@435 | 367 | if( match_int != next_lo ) { |
duke@435 | 368 | ranges[++rp].setRange(next_lo, match_int-1, default_dest, NullTableIndex); |
duke@435 | 369 | } |
duke@435 | 370 | if( rp < 0 || !ranges[rp].adjoin(match_int, dest, table_index) ) { |
duke@435 | 371 | ranges[++rp].set(match_int, dest, table_index); |
duke@435 | 372 | } |
duke@435 | 373 | } |
duke@435 | 374 | jint highest = table[2*(len-1)]; |
duke@435 | 375 | assert(ranges[rp].hi() == highest, ""); |
duke@435 | 376 | if( highest != max_jint |
duke@435 | 377 | && !ranges[rp].adjoinRange(highest+1, max_jint, default_dest, NullTableIndex) ) { |
duke@435 | 378 | ranges[++rp].setRange(highest+1, max_jint, default_dest, NullTableIndex); |
duke@435 | 379 | } |
duke@435 | 380 | assert(rp < rnum, "not too many ranges"); |
duke@435 | 381 | |
duke@435 | 382 | // Safepoint in case backward branch observed |
duke@435 | 383 | if( makes_backward_branch && UseLoopSafepoints ) |
duke@435 | 384 | add_safepoint(); |
duke@435 | 385 | |
duke@435 | 386 | jump_switch_ranges(lookup, &ranges[0], &ranges[rp]); |
duke@435 | 387 | } |
duke@435 | 388 | |
duke@435 | 389 | //----------------------------create_jump_tables------------------------------- |
duke@435 | 390 | bool Parse::create_jump_tables(Node* key_val, SwitchRange* lo, SwitchRange* hi) { |
duke@435 | 391 | // Are jumptables enabled |
duke@435 | 392 | if (!UseJumpTables) return false; |
duke@435 | 393 | |
duke@435 | 394 | // Are jumptables supported |
duke@435 | 395 | if (!Matcher::has_match_rule(Op_Jump)) return false; |
duke@435 | 396 | |
duke@435 | 397 | // Don't make jump table if profiling |
duke@435 | 398 | if (method_data_update()) return false; |
duke@435 | 399 | |
duke@435 | 400 | // Decide if a guard is needed to lop off big ranges at either (or |
duke@435 | 401 | // both) end(s) of the input set. We'll call this the default target |
duke@435 | 402 | // even though we can't be sure that it is the true "default". |
duke@435 | 403 | |
duke@435 | 404 | bool needs_guard = false; |
duke@435 | 405 | int default_dest; |
duke@435 | 406 | int64 total_outlier_size = 0; |
duke@435 | 407 | int64 hi_size = ((int64)hi->hi()) - ((int64)hi->lo()) + 1; |
duke@435 | 408 | int64 lo_size = ((int64)lo->hi()) - ((int64)lo->lo()) + 1; |
duke@435 | 409 | |
duke@435 | 410 | if (lo->dest() == hi->dest()) { |
duke@435 | 411 | total_outlier_size = hi_size + lo_size; |
duke@435 | 412 | default_dest = lo->dest(); |
duke@435 | 413 | } else if (lo_size > hi_size) { |
duke@435 | 414 | total_outlier_size = lo_size; |
duke@435 | 415 | default_dest = lo->dest(); |
duke@435 | 416 | } else { |
duke@435 | 417 | total_outlier_size = hi_size; |
duke@435 | 418 | default_dest = hi->dest(); |
duke@435 | 419 | } |
duke@435 | 420 | |
duke@435 | 421 | // If a guard test will eliminate very sparse end ranges, then |
duke@435 | 422 | // it is worth the cost of an extra jump. |
duke@435 | 423 | if (total_outlier_size > (MaxJumpTableSparseness * 4)) { |
duke@435 | 424 | needs_guard = true; |
duke@435 | 425 | if (default_dest == lo->dest()) lo++; |
duke@435 | 426 | if (default_dest == hi->dest()) hi--; |
duke@435 | 427 | } |
duke@435 | 428 | |
duke@435 | 429 | // Find the total number of cases and ranges |
duke@435 | 430 | int64 num_cases = ((int64)hi->hi()) - ((int64)lo->lo()) + 1; |
duke@435 | 431 | int num_range = hi - lo + 1; |
duke@435 | 432 | |
duke@435 | 433 | // Don't create table if: too large, too small, or too sparse. |
duke@435 | 434 | if (num_cases < MinJumpTableSize || num_cases > MaxJumpTableSize) |
duke@435 | 435 | return false; |
duke@435 | 436 | if (num_cases > (MaxJumpTableSparseness * num_range)) |
duke@435 | 437 | return false; |
duke@435 | 438 | |
duke@435 | 439 | // Normalize table lookups to zero |
duke@435 | 440 | int lowval = lo->lo(); |
kvn@4115 | 441 | key_val = _gvn.transform( new (C) SubINode(key_val, _gvn.intcon(lowval)) ); |
duke@435 | 442 | |
duke@435 | 443 | // Generate a guard to protect against input keyvals that aren't |
duke@435 | 444 | // in the switch domain. |
duke@435 | 445 | if (needs_guard) { |
duke@435 | 446 | Node* size = _gvn.intcon(num_cases); |
kvn@4115 | 447 | Node* cmp = _gvn.transform( new (C) CmpUNode(key_val, size) ); |
kvn@4115 | 448 | Node* tst = _gvn.transform( new (C) BoolNode(cmp, BoolTest::ge) ); |
duke@435 | 449 | IfNode* iff = create_and_map_if( control(), tst, PROB_FAIR, COUNT_UNKNOWN); |
duke@435 | 450 | jump_if_true_fork(iff, default_dest, NullTableIndex); |
duke@435 | 451 | } |
duke@435 | 452 | |
duke@435 | 453 | // Create an ideal node JumpTable that has projections |
duke@435 | 454 | // of all possible ranges for a switch statement |
duke@435 | 455 | // The key_val input must be converted to a pointer offset and scaled. |
duke@435 | 456 | // Compare Parse::array_addressing above. |
duke@435 | 457 | #ifdef _LP64 |
duke@435 | 458 | // Clean the 32-bit int into a real 64-bit offset. |
duke@435 | 459 | // Otherwise, the jint value 0 might turn into an offset of 0x0800000000. |
duke@435 | 460 | const TypeLong* lkeytype = TypeLong::make(CONST64(0), num_cases-1, Type::WidenMin); |
kvn@4115 | 461 | key_val = _gvn.transform( new (C) ConvI2LNode(key_val, lkeytype) ); |
duke@435 | 462 | #endif |
duke@435 | 463 | // Shift the value by wordsize so we have an index into the table, rather |
duke@435 | 464 | // than a switch value |
duke@435 | 465 | Node *shiftWord = _gvn.MakeConX(wordSize); |
kvn@4115 | 466 | key_val = _gvn.transform( new (C) MulXNode( key_val, shiftWord)); |
duke@435 | 467 | |
duke@435 | 468 | // Create the JumpNode |
kvn@4115 | 469 | Node* jtn = _gvn.transform( new (C) JumpNode(control(), key_val, num_cases) ); |
duke@435 | 470 | |
duke@435 | 471 | // These are the switch destinations hanging off the jumpnode |
duke@435 | 472 | int i = 0; |
duke@435 | 473 | for (SwitchRange* r = lo; r <= hi; r++) { |
duke@435 | 474 | for (int j = r->lo(); j <= r->hi(); j++, i++) { |
kvn@4115 | 475 | Node* input = _gvn.transform(new (C) JumpProjNode(jtn, i, r->dest(), j - lowval)); |
duke@435 | 476 | { |
duke@435 | 477 | PreserveJVMState pjvms(this); |
duke@435 | 478 | set_control(input); |
duke@435 | 479 | jump_if_always_fork(r->dest(), r->table_index()); |
duke@435 | 480 | } |
duke@435 | 481 | } |
duke@435 | 482 | } |
duke@435 | 483 | assert(i == num_cases, "miscount of cases"); |
duke@435 | 484 | stop_and_kill_map(); // no more uses for this JVMS |
duke@435 | 485 | return true; |
duke@435 | 486 | } |
duke@435 | 487 | |
duke@435 | 488 | //----------------------------jump_switch_ranges------------------------------- |
duke@435 | 489 | void Parse::jump_switch_ranges(Node* key_val, SwitchRange *lo, SwitchRange *hi, int switch_depth) { |
duke@435 | 490 | Block* switch_block = block(); |
duke@435 | 491 | |
duke@435 | 492 | if (switch_depth == 0) { |
duke@435 | 493 | // Do special processing for the top-level call. |
duke@435 | 494 | assert(lo->lo() == min_jint, "initial range must exhaust Type::INT"); |
duke@435 | 495 | assert(hi->hi() == max_jint, "initial range must exhaust Type::INT"); |
duke@435 | 496 | |
duke@435 | 497 | // Decrement pred-numbers for the unique set of nodes. |
duke@435 | 498 | #ifdef ASSERT |
duke@435 | 499 | // Ensure that the block's successors are a (duplicate-free) set. |
duke@435 | 500 | int successors_counted = 0; // block occurrences in [hi..lo] |
duke@435 | 501 | int unique_successors = switch_block->num_successors(); |
duke@435 | 502 | for (int i = 0; i < unique_successors; i++) { |
duke@435 | 503 | Block* target = switch_block->successor_at(i); |
duke@435 | 504 | |
duke@435 | 505 | // Check that the set of successors is the same in both places. |
duke@435 | 506 | int successors_found = 0; |
duke@435 | 507 | for (SwitchRange* p = lo; p <= hi; p++) { |
duke@435 | 508 | if (p->dest() == target->start()) successors_found++; |
duke@435 | 509 | } |
duke@435 | 510 | assert(successors_found > 0, "successor must be known"); |
duke@435 | 511 | successors_counted += successors_found; |
duke@435 | 512 | } |
duke@435 | 513 | assert(successors_counted == (hi-lo)+1, "no unexpected successors"); |
duke@435 | 514 | #endif |
duke@435 | 515 | |
duke@435 | 516 | // Maybe prune the inputs, based on the type of key_val. |
duke@435 | 517 | jint min_val = min_jint; |
duke@435 | 518 | jint max_val = max_jint; |
duke@435 | 519 | const TypeInt* ti = key_val->bottom_type()->isa_int(); |
duke@435 | 520 | if (ti != NULL) { |
duke@435 | 521 | min_val = ti->_lo; |
duke@435 | 522 | max_val = ti->_hi; |
duke@435 | 523 | assert(min_val <= max_val, "invalid int type"); |
duke@435 | 524 | } |
duke@435 | 525 | while (lo->hi() < min_val) lo++; |
duke@435 | 526 | if (lo->lo() < min_val) lo->setRange(min_val, lo->hi(), lo->dest(), lo->table_index()); |
duke@435 | 527 | while (hi->lo() > max_val) hi--; |
duke@435 | 528 | if (hi->hi() > max_val) hi->setRange(hi->lo(), max_val, hi->dest(), hi->table_index()); |
duke@435 | 529 | } |
duke@435 | 530 | |
duke@435 | 531 | #ifndef PRODUCT |
duke@435 | 532 | if (switch_depth == 0) { |
duke@435 | 533 | _max_switch_depth = 0; |
duke@435 | 534 | _est_switch_depth = log2_intptr((hi-lo+1)-1)+1; |
duke@435 | 535 | } |
duke@435 | 536 | #endif |
duke@435 | 537 | |
duke@435 | 538 | assert(lo <= hi, "must be a non-empty set of ranges"); |
duke@435 | 539 | if (lo == hi) { |
duke@435 | 540 | jump_if_always_fork(lo->dest(), lo->table_index()); |
duke@435 | 541 | } else { |
duke@435 | 542 | assert(lo->hi() == (lo+1)->lo()-1, "contiguous ranges"); |
duke@435 | 543 | assert(hi->lo() == (hi-1)->hi()+1, "contiguous ranges"); |
duke@435 | 544 | |
duke@435 | 545 | if (create_jump_tables(key_val, lo, hi)) return; |
duke@435 | 546 | |
duke@435 | 547 | int nr = hi - lo + 1; |
duke@435 | 548 | |
duke@435 | 549 | SwitchRange* mid = lo + nr/2; |
duke@435 | 550 | // if there is an easy choice, pivot at a singleton: |
duke@435 | 551 | if (nr > 3 && !mid->is_singleton() && (mid-1)->is_singleton()) mid--; |
duke@435 | 552 | |
duke@435 | 553 | assert(lo < mid && mid <= hi, "good pivot choice"); |
duke@435 | 554 | assert(nr != 2 || mid == hi, "should pick higher of 2"); |
duke@435 | 555 | assert(nr != 3 || mid == hi-1, "should pick middle of 3"); |
duke@435 | 556 | |
duke@435 | 557 | Node *test_val = _gvn.intcon(mid->lo()); |
duke@435 | 558 | |
duke@435 | 559 | if (mid->is_singleton()) { |
duke@435 | 560 | IfNode *iff_ne = jump_if_fork_int(key_val, test_val, BoolTest::ne); |
duke@435 | 561 | jump_if_false_fork(iff_ne, mid->dest(), mid->table_index()); |
duke@435 | 562 | |
duke@435 | 563 | // Special Case: If there are exactly three ranges, and the high |
duke@435 | 564 | // and low range each go to the same place, omit the "gt" test, |
duke@435 | 565 | // since it will not discriminate anything. |
duke@435 | 566 | bool eq_test_only = (hi == lo+2 && hi->dest() == lo->dest()); |
duke@435 | 567 | if (eq_test_only) { |
duke@435 | 568 | assert(mid == hi-1, ""); |
duke@435 | 569 | } |
duke@435 | 570 | |
duke@435 | 571 | // if there is a higher range, test for it and process it: |
duke@435 | 572 | if (mid < hi && !eq_test_only) { |
duke@435 | 573 | // two comparisons of same values--should enable 1 test for 2 branches |
duke@435 | 574 | // Use BoolTest::le instead of BoolTest::gt |
duke@435 | 575 | IfNode *iff_le = jump_if_fork_int(key_val, test_val, BoolTest::le); |
kvn@4115 | 576 | Node *iftrue = _gvn.transform( new (C) IfTrueNode(iff_le) ); |
kvn@4115 | 577 | Node *iffalse = _gvn.transform( new (C) IfFalseNode(iff_le) ); |
duke@435 | 578 | { PreserveJVMState pjvms(this); |
duke@435 | 579 | set_control(iffalse); |
duke@435 | 580 | jump_switch_ranges(key_val, mid+1, hi, switch_depth+1); |
duke@435 | 581 | } |
duke@435 | 582 | set_control(iftrue); |
duke@435 | 583 | } |
duke@435 | 584 | |
duke@435 | 585 | } else { |
duke@435 | 586 | // mid is a range, not a singleton, so treat mid..hi as a unit |
duke@435 | 587 | IfNode *iff_ge = jump_if_fork_int(key_val, test_val, BoolTest::ge); |
duke@435 | 588 | |
duke@435 | 589 | // if there is a higher range, test for it and process it: |
duke@435 | 590 | if (mid == hi) { |
duke@435 | 591 | jump_if_true_fork(iff_ge, mid->dest(), mid->table_index()); |
duke@435 | 592 | } else { |
kvn@4115 | 593 | Node *iftrue = _gvn.transform( new (C) IfTrueNode(iff_ge) ); |
kvn@4115 | 594 | Node *iffalse = _gvn.transform( new (C) IfFalseNode(iff_ge) ); |
duke@435 | 595 | { PreserveJVMState pjvms(this); |
duke@435 | 596 | set_control(iftrue); |
duke@435 | 597 | jump_switch_ranges(key_val, mid, hi, switch_depth+1); |
duke@435 | 598 | } |
duke@435 | 599 | set_control(iffalse); |
duke@435 | 600 | } |
duke@435 | 601 | } |
duke@435 | 602 | |
duke@435 | 603 | // in any case, process the lower range |
duke@435 | 604 | jump_switch_ranges(key_val, lo, mid-1, switch_depth+1); |
duke@435 | 605 | } |
duke@435 | 606 | |
duke@435 | 607 | // Decrease pred_count for each successor after all is done. |
duke@435 | 608 | if (switch_depth == 0) { |
duke@435 | 609 | int unique_successors = switch_block->num_successors(); |
duke@435 | 610 | for (int i = 0; i < unique_successors; i++) { |
duke@435 | 611 | Block* target = switch_block->successor_at(i); |
duke@435 | 612 | // Throw away the pre-allocated path for each unique successor. |
duke@435 | 613 | target->next_path_num(); |
duke@435 | 614 | } |
duke@435 | 615 | } |
duke@435 | 616 | |
duke@435 | 617 | #ifndef PRODUCT |
duke@435 | 618 | _max_switch_depth = MAX2(switch_depth, _max_switch_depth); |
duke@435 | 619 | if (TraceOptoParse && Verbose && WizardMode && switch_depth == 0) { |
duke@435 | 620 | SwitchRange* r; |
duke@435 | 621 | int nsing = 0; |
duke@435 | 622 | for( r = lo; r <= hi; r++ ) { |
duke@435 | 623 | if( r->is_singleton() ) nsing++; |
duke@435 | 624 | } |
duke@435 | 625 | tty->print(">>> "); |
duke@435 | 626 | _method->print_short_name(); |
duke@435 | 627 | tty->print_cr(" switch decision tree"); |
duke@435 | 628 | tty->print_cr(" %d ranges (%d singletons), max_depth=%d, est_depth=%d", |
duke@435 | 629 | hi-lo+1, nsing, _max_switch_depth, _est_switch_depth); |
duke@435 | 630 | if (_max_switch_depth > _est_switch_depth) { |
duke@435 | 631 | tty->print_cr("******** BAD SWITCH DEPTH ********"); |
duke@435 | 632 | } |
duke@435 | 633 | tty->print(" "); |
duke@435 | 634 | for( r = lo; r <= hi; r++ ) { |
duke@435 | 635 | r->print(env()); |
duke@435 | 636 | } |
duke@435 | 637 | tty->print_cr(""); |
duke@435 | 638 | } |
duke@435 | 639 | #endif |
duke@435 | 640 | } |
duke@435 | 641 | |
duke@435 | 642 | void Parse::modf() { |
duke@435 | 643 | Node *f2 = pop(); |
duke@435 | 644 | Node *f1 = pop(); |
duke@435 | 645 | Node* c = make_runtime_call(RC_LEAF, OptoRuntime::modf_Type(), |
duke@435 | 646 | CAST_FROM_FN_PTR(address, SharedRuntime::frem), |
duke@435 | 647 | "frem", NULL, //no memory effects |
duke@435 | 648 | f1, f2); |
kvn@4115 | 649 | Node* res = _gvn.transform(new (C) ProjNode(c, TypeFunc::Parms + 0)); |
duke@435 | 650 | |
duke@435 | 651 | push(res); |
duke@435 | 652 | } |
duke@435 | 653 | |
duke@435 | 654 | void Parse::modd() { |
duke@435 | 655 | Node *d2 = pop_pair(); |
duke@435 | 656 | Node *d1 = pop_pair(); |
duke@435 | 657 | Node* c = make_runtime_call(RC_LEAF, OptoRuntime::Math_DD_D_Type(), |
duke@435 | 658 | CAST_FROM_FN_PTR(address, SharedRuntime::drem), |
duke@435 | 659 | "drem", NULL, //no memory effects |
duke@435 | 660 | d1, top(), d2, top()); |
kvn@4115 | 661 | Node* res_d = _gvn.transform(new (C) ProjNode(c, TypeFunc::Parms + 0)); |
duke@435 | 662 | |
duke@435 | 663 | #ifdef ASSERT |
kvn@4115 | 664 | Node* res_top = _gvn.transform(new (C) ProjNode(c, TypeFunc::Parms + 1)); |
duke@435 | 665 | assert(res_top == top(), "second value must be top"); |
duke@435 | 666 | #endif |
duke@435 | 667 | |
duke@435 | 668 | push_pair(res_d); |
duke@435 | 669 | } |
duke@435 | 670 | |
duke@435 | 671 | void Parse::l2f() { |
duke@435 | 672 | Node* f2 = pop(); |
duke@435 | 673 | Node* f1 = pop(); |
duke@435 | 674 | Node* c = make_runtime_call(RC_LEAF, OptoRuntime::l2f_Type(), |
duke@435 | 675 | CAST_FROM_FN_PTR(address, SharedRuntime::l2f), |
duke@435 | 676 | "l2f", NULL, //no memory effects |
duke@435 | 677 | f1, f2); |
kvn@4115 | 678 | Node* res = _gvn.transform(new (C) ProjNode(c, TypeFunc::Parms + 0)); |
duke@435 | 679 | |
duke@435 | 680 | push(res); |
duke@435 | 681 | } |
duke@435 | 682 | |
duke@435 | 683 | void Parse::do_irem() { |
duke@435 | 684 | // Must keep both values on the expression-stack during null-check |
twisti@4313 | 685 | zero_check_int(peek()); |
duke@435 | 686 | // Compile-time detect of null-exception? |
duke@435 | 687 | if (stopped()) return; |
duke@435 | 688 | |
duke@435 | 689 | Node* b = pop(); |
duke@435 | 690 | Node* a = pop(); |
duke@435 | 691 | |
duke@435 | 692 | const Type *t = _gvn.type(b); |
duke@435 | 693 | if (t != Type::TOP) { |
duke@435 | 694 | const TypeInt *ti = t->is_int(); |
duke@435 | 695 | if (ti->is_con()) { |
duke@435 | 696 | int divisor = ti->get_con(); |
duke@435 | 697 | // check for positive power of 2 |
duke@435 | 698 | if (divisor > 0 && |
duke@435 | 699 | (divisor & ~(divisor-1)) == divisor) { |
duke@435 | 700 | // yes ! |
duke@435 | 701 | Node *mask = _gvn.intcon((divisor - 1)); |
duke@435 | 702 | // Sigh, must handle negative dividends |
duke@435 | 703 | Node *zero = _gvn.intcon(0); |
duke@435 | 704 | IfNode *ifff = jump_if_fork_int(a, zero, BoolTest::lt); |
kvn@4115 | 705 | Node *iff = _gvn.transform( new (C) IfFalseNode(ifff) ); |
kvn@4115 | 706 | Node *ift = _gvn.transform( new (C) IfTrueNode (ifff) ); |
duke@435 | 707 | Node *reg = jump_if_join(ift, iff); |
duke@435 | 708 | Node *phi = PhiNode::make(reg, NULL, TypeInt::INT); |
duke@435 | 709 | // Negative path; negate/and/negate |
kvn@4115 | 710 | Node *neg = _gvn.transform( new (C) SubINode(zero, a) ); |
kvn@4115 | 711 | Node *andn= _gvn.transform( new (C) AndINode(neg, mask) ); |
kvn@4115 | 712 | Node *negn= _gvn.transform( new (C) SubINode(zero, andn) ); |
duke@435 | 713 | phi->init_req(1, negn); |
duke@435 | 714 | // Fast positive case |
kvn@4115 | 715 | Node *andx = _gvn.transform( new (C) AndINode(a, mask) ); |
duke@435 | 716 | phi->init_req(2, andx); |
duke@435 | 717 | // Push the merge |
duke@435 | 718 | push( _gvn.transform(phi) ); |
duke@435 | 719 | return; |
duke@435 | 720 | } |
duke@435 | 721 | } |
duke@435 | 722 | } |
duke@435 | 723 | // Default case |
kvn@4115 | 724 | push( _gvn.transform( new (C) ModINode(control(),a,b) ) ); |
duke@435 | 725 | } |
duke@435 | 726 | |
duke@435 | 727 | // Handle jsr and jsr_w bytecode |
duke@435 | 728 | void Parse::do_jsr() { |
duke@435 | 729 | assert(bc() == Bytecodes::_jsr || bc() == Bytecodes::_jsr_w, "wrong bytecode"); |
duke@435 | 730 | |
duke@435 | 731 | // Store information about current state, tagged with new _jsr_bci |
duke@435 | 732 | int return_bci = iter().next_bci(); |
duke@435 | 733 | int jsr_bci = (bc() == Bytecodes::_jsr) ? iter().get_dest() : iter().get_far_dest(); |
duke@435 | 734 | |
duke@435 | 735 | // Update method data |
duke@435 | 736 | profile_taken_branch(jsr_bci); |
duke@435 | 737 | |
duke@435 | 738 | // The way we do things now, there is only one successor block |
duke@435 | 739 | // for the jsr, because the target code is cloned by ciTypeFlow. |
duke@435 | 740 | Block* target = successor_for_bci(jsr_bci); |
duke@435 | 741 | |
duke@435 | 742 | // What got pushed? |
duke@435 | 743 | const Type* ret_addr = target->peek(); |
duke@435 | 744 | assert(ret_addr->singleton(), "must be a constant (cloned jsr body)"); |
duke@435 | 745 | |
duke@435 | 746 | // Effect on jsr on stack |
duke@435 | 747 | push(_gvn.makecon(ret_addr)); |
duke@435 | 748 | |
duke@435 | 749 | // Flow to the jsr. |
duke@435 | 750 | merge(jsr_bci); |
duke@435 | 751 | } |
duke@435 | 752 | |
duke@435 | 753 | // Handle ret bytecode |
duke@435 | 754 | void Parse::do_ret() { |
duke@435 | 755 | // Find to whom we return. |
duke@435 | 756 | assert(block()->num_successors() == 1, "a ret can only go one place now"); |
duke@435 | 757 | Block* target = block()->successor_at(0); |
duke@435 | 758 | assert(!target->is_ready(), "our arrival must be expected"); |
duke@435 | 759 | profile_ret(target->flow()->start()); |
duke@435 | 760 | int pnum = target->next_path_num(); |
duke@435 | 761 | merge_common(target, pnum); |
duke@435 | 762 | } |
duke@435 | 763 | |
duke@435 | 764 | //--------------------------dynamic_branch_prediction-------------------------- |
duke@435 | 765 | // Try to gather dynamic branch prediction behavior. Return a probability |
duke@435 | 766 | // of the branch being taken and set the "cnt" field. Returns a -1.0 |
duke@435 | 767 | // if we need to use static prediction for some reason. |
duke@435 | 768 | float Parse::dynamic_branch_prediction(float &cnt) { |
duke@435 | 769 | ResourceMark rm; |
duke@435 | 770 | |
duke@435 | 771 | cnt = COUNT_UNKNOWN; |
duke@435 | 772 | |
duke@435 | 773 | // Use MethodData information if it is available |
duke@435 | 774 | // FIXME: free the ProfileData structure |
duke@435 | 775 | ciMethodData* methodData = method()->method_data(); |
duke@435 | 776 | if (!methodData->is_mature()) return PROB_UNKNOWN; |
duke@435 | 777 | ciProfileData* data = methodData->bci_to_data(bci()); |
duke@435 | 778 | if (!data->is_JumpData()) return PROB_UNKNOWN; |
duke@435 | 779 | |
duke@435 | 780 | // get taken and not taken values |
duke@435 | 781 | int taken = data->as_JumpData()->taken(); |
duke@435 | 782 | int not_taken = 0; |
duke@435 | 783 | if (data->is_BranchData()) { |
duke@435 | 784 | not_taken = data->as_BranchData()->not_taken(); |
duke@435 | 785 | } |
duke@435 | 786 | |
duke@435 | 787 | // scale the counts to be commensurate with invocation counts: |
duke@435 | 788 | taken = method()->scale_count(taken); |
duke@435 | 789 | not_taken = method()->scale_count(not_taken); |
duke@435 | 790 | |
iveresov@2763 | 791 | // Give up if too few (or too many, in which case the sum will overflow) counts to be meaningful. |
iveresov@2763 | 792 | // We also check that individual counters are positive first, overwise the sum can become positive. |
iveresov@2763 | 793 | if (taken < 0 || not_taken < 0 || taken + not_taken < 40) { |
duke@435 | 794 | if (C->log() != NULL) { |
duke@435 | 795 | C->log()->elem("branch target_bci='%d' taken='%d' not_taken='%d'", iter().get_dest(), taken, not_taken); |
duke@435 | 796 | } |
duke@435 | 797 | return PROB_UNKNOWN; |
duke@435 | 798 | } |
duke@435 | 799 | |
duke@435 | 800 | // Compute frequency that we arrive here |
iveresov@2763 | 801 | float sum = taken + not_taken; |
duke@435 | 802 | // Adjust, if this block is a cloned private block but the |
duke@435 | 803 | // Jump counts are shared. Taken the private counts for |
duke@435 | 804 | // just this path instead of the shared counts. |
duke@435 | 805 | if( block()->count() > 0 ) |
duke@435 | 806 | sum = block()->count(); |
iveresov@2763 | 807 | cnt = sum / FreqCountInvocations; |
duke@435 | 808 | |
duke@435 | 809 | // Pin probability to sane limits |
duke@435 | 810 | float prob; |
duke@435 | 811 | if( !taken ) |
duke@435 | 812 | prob = (0+PROB_MIN) / 2; |
duke@435 | 813 | else if( !not_taken ) |
duke@435 | 814 | prob = (1+PROB_MAX) / 2; |
duke@435 | 815 | else { // Compute probability of true path |
duke@435 | 816 | prob = (float)taken / (float)(taken + not_taken); |
duke@435 | 817 | if (prob > PROB_MAX) prob = PROB_MAX; |
duke@435 | 818 | if (prob < PROB_MIN) prob = PROB_MIN; |
duke@435 | 819 | } |
duke@435 | 820 | |
duke@435 | 821 | assert((cnt > 0.0f) && (prob > 0.0f), |
duke@435 | 822 | "Bad frequency assignment in if"); |
duke@435 | 823 | |
duke@435 | 824 | if (C->log() != NULL) { |
duke@435 | 825 | const char* prob_str = NULL; |
duke@435 | 826 | if (prob >= PROB_MAX) prob_str = (prob == PROB_MAX) ? "max" : "always"; |
duke@435 | 827 | if (prob <= PROB_MIN) prob_str = (prob == PROB_MIN) ? "min" : "never"; |
duke@435 | 828 | char prob_str_buf[30]; |
duke@435 | 829 | if (prob_str == NULL) { |
duke@435 | 830 | sprintf(prob_str_buf, "%g", prob); |
duke@435 | 831 | prob_str = prob_str_buf; |
duke@435 | 832 | } |
duke@435 | 833 | C->log()->elem("branch target_bci='%d' taken='%d' not_taken='%d' cnt='%g' prob='%s'", |
duke@435 | 834 | iter().get_dest(), taken, not_taken, cnt, prob_str); |
duke@435 | 835 | } |
duke@435 | 836 | return prob; |
duke@435 | 837 | } |
duke@435 | 838 | |
duke@435 | 839 | //-----------------------------branch_prediction------------------------------- |
duke@435 | 840 | float Parse::branch_prediction(float& cnt, |
duke@435 | 841 | BoolTest::mask btest, |
duke@435 | 842 | int target_bci) { |
duke@435 | 843 | float prob = dynamic_branch_prediction(cnt); |
duke@435 | 844 | // If prob is unknown, switch to static prediction |
duke@435 | 845 | if (prob != PROB_UNKNOWN) return prob; |
duke@435 | 846 | |
duke@435 | 847 | prob = PROB_FAIR; // Set default value |
duke@435 | 848 | if (btest == BoolTest::eq) // Exactly equal test? |
duke@435 | 849 | prob = PROB_STATIC_INFREQUENT; // Assume its relatively infrequent |
duke@435 | 850 | else if (btest == BoolTest::ne) |
duke@435 | 851 | prob = PROB_STATIC_FREQUENT; // Assume its relatively frequent |
duke@435 | 852 | |
duke@435 | 853 | // If this is a conditional test guarding a backwards branch, |
duke@435 | 854 | // assume its a loop-back edge. Make it a likely taken branch. |
duke@435 | 855 | if (target_bci < bci()) { |
duke@435 | 856 | if (is_osr_parse()) { // Could be a hot OSR'd loop; force deopt |
duke@435 | 857 | // Since it's an OSR, we probably have profile data, but since |
duke@435 | 858 | // branch_prediction returned PROB_UNKNOWN, the counts are too small. |
duke@435 | 859 | // Let's make a special check here for completely zero counts. |
duke@435 | 860 | ciMethodData* methodData = method()->method_data(); |
duke@435 | 861 | if (!methodData->is_empty()) { |
duke@435 | 862 | ciProfileData* data = methodData->bci_to_data(bci()); |
duke@435 | 863 | // Only stop for truly zero counts, which mean an unknown part |
duke@435 | 864 | // of the OSR-ed method, and we want to deopt to gather more stats. |
duke@435 | 865 | // If you have ANY counts, then this loop is simply 'cold' relative |
duke@435 | 866 | // to the OSR loop. |
duke@435 | 867 | if (data->as_BranchData()->taken() + |
duke@435 | 868 | data->as_BranchData()->not_taken() == 0 ) { |
duke@435 | 869 | // This is the only way to return PROB_UNKNOWN: |
duke@435 | 870 | return PROB_UNKNOWN; |
duke@435 | 871 | } |
duke@435 | 872 | } |
duke@435 | 873 | } |
duke@435 | 874 | prob = PROB_STATIC_FREQUENT; // Likely to take backwards branch |
duke@435 | 875 | } |
duke@435 | 876 | |
duke@435 | 877 | assert(prob != PROB_UNKNOWN, "must have some guess at this point"); |
duke@435 | 878 | return prob; |
duke@435 | 879 | } |
duke@435 | 880 | |
duke@435 | 881 | // The magic constants are chosen so as to match the output of |
duke@435 | 882 | // branch_prediction() when the profile reports a zero taken count. |
duke@435 | 883 | // It is important to distinguish zero counts unambiguously, because |
duke@435 | 884 | // some branches (e.g., _213_javac.Assembler.eliminate) validly produce |
duke@435 | 885 | // very small but nonzero probabilities, which if confused with zero |
duke@435 | 886 | // counts would keep the program recompiling indefinitely. |
duke@435 | 887 | bool Parse::seems_never_taken(float prob) { |
duke@435 | 888 | return prob < PROB_MIN; |
duke@435 | 889 | } |
duke@435 | 890 | |
jrose@2101 | 891 | // True if the comparison seems to be the kind that will not change its |
jrose@2101 | 892 | // statistics from true to false. See comments in adjust_map_after_if. |
jrose@2101 | 893 | // This question is only asked along paths which are already |
jrose@2101 | 894 | // classifed as untaken (by seems_never_taken), so really, |
jrose@2101 | 895 | // if a path is never taken, its controlling comparison is |
jrose@2101 | 896 | // already acting in a stable fashion. If the comparison |
jrose@2101 | 897 | // seems stable, we will put an expensive uncommon trap |
jrose@2101 | 898 | // on the untaken path. To be conservative, and to allow |
jrose@2101 | 899 | // partially executed counted loops to be compiled fully, |
jrose@2101 | 900 | // we will plant uncommon traps only after pointer comparisons. |
jrose@2101 | 901 | bool Parse::seems_stable_comparison(BoolTest::mask btest, Node* cmp) { |
jrose@2101 | 902 | for (int depth = 4; depth > 0; depth--) { |
jrose@2101 | 903 | // The following switch can find CmpP here over half the time for |
jrose@2101 | 904 | // dynamic language code rich with type tests. |
jrose@2101 | 905 | // Code using counted loops or array manipulations (typical |
jrose@2101 | 906 | // of benchmarks) will have many (>80%) CmpI instructions. |
jrose@2101 | 907 | switch (cmp->Opcode()) { |
jrose@2101 | 908 | case Op_CmpP: |
jrose@2101 | 909 | // A never-taken null check looks like CmpP/BoolTest::eq. |
jrose@2101 | 910 | // These certainly should be closed off as uncommon traps. |
jrose@2101 | 911 | if (btest == BoolTest::eq) |
jrose@2101 | 912 | return true; |
jrose@2101 | 913 | // A never-failed type check looks like CmpP/BoolTest::ne. |
jrose@2101 | 914 | // Let's put traps on those, too, so that we don't have to compile |
jrose@2101 | 915 | // unused paths with indeterminate dynamic type information. |
jrose@2101 | 916 | if (ProfileDynamicTypes) |
jrose@2101 | 917 | return true; |
jrose@2101 | 918 | return false; |
jrose@2101 | 919 | |
jrose@2101 | 920 | case Op_CmpI: |
jrose@2101 | 921 | // A small minority (< 10%) of CmpP are masked as CmpI, |
jrose@2101 | 922 | // as if by boolean conversion ((p == q? 1: 0) != 0). |
jrose@2101 | 923 | // Detect that here, even if it hasn't optimized away yet. |
jrose@2101 | 924 | // Specifically, this covers the 'instanceof' operator. |
jrose@2101 | 925 | if (btest == BoolTest::ne || btest == BoolTest::eq) { |
jrose@2101 | 926 | if (_gvn.type(cmp->in(2))->singleton() && |
jrose@2101 | 927 | cmp->in(1)->is_Phi()) { |
jrose@2101 | 928 | PhiNode* phi = cmp->in(1)->as_Phi(); |
jrose@2101 | 929 | int true_path = phi->is_diamond_phi(); |
jrose@2101 | 930 | if (true_path > 0 && |
jrose@2101 | 931 | _gvn.type(phi->in(1))->singleton() && |
jrose@2101 | 932 | _gvn.type(phi->in(2))->singleton()) { |
jrose@2101 | 933 | // phi->region->if_proj->ifnode->bool->cmp |
jrose@2101 | 934 | BoolNode* bol = phi->in(0)->in(1)->in(0)->in(1)->as_Bool(); |
jrose@2101 | 935 | btest = bol->_test._test; |
jrose@2101 | 936 | cmp = bol->in(1); |
jrose@2101 | 937 | continue; |
jrose@2101 | 938 | } |
jrose@2101 | 939 | } |
jrose@2101 | 940 | } |
jrose@2101 | 941 | return false; |
jrose@2101 | 942 | } |
jrose@2101 | 943 | } |
jrose@2101 | 944 | return false; |
jrose@2101 | 945 | } |
jrose@2101 | 946 | |
rasbold@681 | 947 | //-------------------------------repush_if_args-------------------------------- |
rasbold@681 | 948 | // Push arguments of an "if" bytecode back onto the stack by adjusting _sp. |
cfang@1607 | 949 | inline int Parse::repush_if_args() { |
duke@435 | 950 | #ifndef PRODUCT |
duke@435 | 951 | if (PrintOpto && WizardMode) { |
duke@435 | 952 | tty->print("defending against excessive implicit null exceptions on %s @%d in ", |
duke@435 | 953 | Bytecodes::name(iter().cur_bc()), iter().cur_bci()); |
duke@435 | 954 | method()->print_name(); tty->cr(); |
duke@435 | 955 | } |
duke@435 | 956 | #endif |
duke@435 | 957 | int bc_depth = - Bytecodes::depth(iter().cur_bc()); |
duke@435 | 958 | assert(bc_depth == 1 || bc_depth == 2, "only two kinds of branches"); |
duke@435 | 959 | DEBUG_ONLY(sync_jvms()); // argument(n) requires a synced jvms |
duke@435 | 960 | assert(argument(0) != NULL, "must exist"); |
duke@435 | 961 | assert(bc_depth == 1 || argument(1) != NULL, "two must exist"); |
twisti@4313 | 962 | inc_sp(bc_depth); |
cfang@1607 | 963 | return bc_depth; |
duke@435 | 964 | } |
duke@435 | 965 | |
duke@435 | 966 | //----------------------------------do_ifnull---------------------------------- |
rasbold@683 | 967 | void Parse::do_ifnull(BoolTest::mask btest, Node *c) { |
duke@435 | 968 | int target_bci = iter().get_dest(); |
duke@435 | 969 | |
never@452 | 970 | Block* branch_block = successor_for_bci(target_bci); |
never@452 | 971 | Block* next_block = successor_for_bci(iter().next_bci()); |
never@452 | 972 | |
duke@435 | 973 | float cnt; |
duke@435 | 974 | float prob = branch_prediction(cnt, btest, target_bci); |
duke@435 | 975 | if (prob == PROB_UNKNOWN) { |
duke@435 | 976 | // (An earlier version of do_ifnull omitted this trap for OSR methods.) |
duke@435 | 977 | #ifndef PRODUCT |
duke@435 | 978 | if (PrintOpto && Verbose) |
rasbold@683 | 979 | tty->print_cr("Never-taken edge stops compilation at bci %d",bci()); |
duke@435 | 980 | #endif |
rasbold@683 | 981 | repush_if_args(); // to gather stats on loop |
duke@435 | 982 | // We need to mark this branch as taken so that if we recompile we will |
duke@435 | 983 | // see that it is possible. In the tiered system the interpreter doesn't |
duke@435 | 984 | // do profiling and by the time we get to the lower tier from the interpreter |
duke@435 | 985 | // the path may be cold again. Make sure it doesn't look untaken |
duke@435 | 986 | profile_taken_branch(target_bci, !ProfileInterpreter); |
duke@435 | 987 | uncommon_trap(Deoptimization::Reason_unreached, |
duke@435 | 988 | Deoptimization::Action_reinterpret, |
duke@435 | 989 | NULL, "cold"); |
kvn@5110 | 990 | if (C->eliminate_boxing()) { |
never@452 | 991 | // Mark the successor blocks as parsed |
never@452 | 992 | branch_block->next_path_num(); |
never@452 | 993 | next_block->next_path_num(); |
never@452 | 994 | } |
duke@435 | 995 | return; |
duke@435 | 996 | } |
duke@435 | 997 | |
duke@435 | 998 | explicit_null_checks_inserted++; |
duke@435 | 999 | |
duke@435 | 1000 | // Generate real control flow |
kvn@4115 | 1001 | Node *tst = _gvn.transform( new (C) BoolNode( c, btest ) ); |
duke@435 | 1002 | |
duke@435 | 1003 | // Sanity check the probability value |
duke@435 | 1004 | assert(prob > 0.0f,"Bad probability in Parser"); |
duke@435 | 1005 | // Need xform to put node in hash table |
duke@435 | 1006 | IfNode *iff = create_and_xform_if( control(), tst, prob, cnt ); |
duke@435 | 1007 | assert(iff->_prob > 0.0f,"Optimizer made bad probability in parser"); |
duke@435 | 1008 | // True branch |
duke@435 | 1009 | { PreserveJVMState pjvms(this); |
kvn@4115 | 1010 | Node* iftrue = _gvn.transform( new (C) IfTrueNode (iff) ); |
duke@435 | 1011 | set_control(iftrue); |
duke@435 | 1012 | |
duke@435 | 1013 | if (stopped()) { // Path is dead? |
duke@435 | 1014 | explicit_null_checks_elided++; |
kvn@5110 | 1015 | if (C->eliminate_boxing()) { |
never@452 | 1016 | // Mark the successor block as parsed |
never@452 | 1017 | branch_block->next_path_num(); |
never@452 | 1018 | } |
duke@435 | 1019 | } else { // Path is live. |
duke@435 | 1020 | // Update method data |
duke@435 | 1021 | profile_taken_branch(target_bci); |
duke@435 | 1022 | adjust_map_after_if(btest, c, prob, branch_block, next_block); |
cfang@1607 | 1023 | if (!stopped()) { |
duke@435 | 1024 | merge(target_bci); |
cfang@1607 | 1025 | } |
duke@435 | 1026 | } |
duke@435 | 1027 | } |
duke@435 | 1028 | |
duke@435 | 1029 | // False branch |
kvn@4115 | 1030 | Node* iffalse = _gvn.transform( new (C) IfFalseNode(iff) ); |
duke@435 | 1031 | set_control(iffalse); |
duke@435 | 1032 | |
duke@435 | 1033 | if (stopped()) { // Path is dead? |
duke@435 | 1034 | explicit_null_checks_elided++; |
kvn@5110 | 1035 | if (C->eliminate_boxing()) { |
never@452 | 1036 | // Mark the successor block as parsed |
never@452 | 1037 | next_block->next_path_num(); |
never@452 | 1038 | } |
duke@435 | 1039 | } else { // Path is live. |
duke@435 | 1040 | // Update method data |
duke@435 | 1041 | profile_not_taken_branch(); |
duke@435 | 1042 | adjust_map_after_if(BoolTest(btest).negate(), c, 1.0-prob, |
duke@435 | 1043 | next_block, branch_block); |
duke@435 | 1044 | } |
duke@435 | 1045 | } |
duke@435 | 1046 | |
duke@435 | 1047 | //------------------------------------do_if------------------------------------ |
duke@435 | 1048 | void Parse::do_if(BoolTest::mask btest, Node* c) { |
duke@435 | 1049 | int target_bci = iter().get_dest(); |
duke@435 | 1050 | |
never@452 | 1051 | Block* branch_block = successor_for_bci(target_bci); |
never@452 | 1052 | Block* next_block = successor_for_bci(iter().next_bci()); |
never@452 | 1053 | |
duke@435 | 1054 | float cnt; |
duke@435 | 1055 | float prob = branch_prediction(cnt, btest, target_bci); |
duke@435 | 1056 | float untaken_prob = 1.0 - prob; |
duke@435 | 1057 | |
duke@435 | 1058 | if (prob == PROB_UNKNOWN) { |
duke@435 | 1059 | #ifndef PRODUCT |
duke@435 | 1060 | if (PrintOpto && Verbose) |
rasbold@683 | 1061 | tty->print_cr("Never-taken edge stops compilation at bci %d",bci()); |
duke@435 | 1062 | #endif |
duke@435 | 1063 | repush_if_args(); // to gather stats on loop |
duke@435 | 1064 | // We need to mark this branch as taken so that if we recompile we will |
duke@435 | 1065 | // see that it is possible. In the tiered system the interpreter doesn't |
duke@435 | 1066 | // do profiling and by the time we get to the lower tier from the interpreter |
duke@435 | 1067 | // the path may be cold again. Make sure it doesn't look untaken |
duke@435 | 1068 | profile_taken_branch(target_bci, !ProfileInterpreter); |
duke@435 | 1069 | uncommon_trap(Deoptimization::Reason_unreached, |
duke@435 | 1070 | Deoptimization::Action_reinterpret, |
duke@435 | 1071 | NULL, "cold"); |
kvn@5110 | 1072 | if (C->eliminate_boxing()) { |
never@452 | 1073 | // Mark the successor blocks as parsed |
never@452 | 1074 | branch_block->next_path_num(); |
never@452 | 1075 | next_block->next_path_num(); |
never@452 | 1076 | } |
duke@435 | 1077 | return; |
duke@435 | 1078 | } |
duke@435 | 1079 | |
duke@435 | 1080 | // Sanity check the probability value |
duke@435 | 1081 | assert(0.0f < prob && prob < 1.0f,"Bad probability in Parser"); |
duke@435 | 1082 | |
duke@435 | 1083 | bool taken_if_true = true; |
duke@435 | 1084 | // Convert BoolTest to canonical form: |
duke@435 | 1085 | if (!BoolTest(btest).is_canonical()) { |
duke@435 | 1086 | btest = BoolTest(btest).negate(); |
duke@435 | 1087 | taken_if_true = false; |
duke@435 | 1088 | // prob is NOT updated here; it remains the probability of the taken |
duke@435 | 1089 | // path (as opposed to the prob of the path guarded by an 'IfTrueNode'). |
duke@435 | 1090 | } |
duke@435 | 1091 | assert(btest != BoolTest::eq, "!= is the only canonical exact test"); |
duke@435 | 1092 | |
kvn@4115 | 1093 | Node* tst0 = new (C) BoolNode(c, btest); |
duke@435 | 1094 | Node* tst = _gvn.transform(tst0); |
duke@435 | 1095 | BoolTest::mask taken_btest = BoolTest::illegal; |
duke@435 | 1096 | BoolTest::mask untaken_btest = BoolTest::illegal; |
kvn@472 | 1097 | |
kvn@472 | 1098 | if (tst->is_Bool()) { |
kvn@472 | 1099 | // Refresh c from the transformed bool node, since it may be |
kvn@472 | 1100 | // simpler than the original c. Also re-canonicalize btest. |
kvn@472 | 1101 | // This wins when (Bool ne (Conv2B p) 0) => (Bool ne (CmpP p NULL)). |
kvn@472 | 1102 | // That can arise from statements like: if (x instanceof C) ... |
kvn@472 | 1103 | if (tst != tst0) { |
kvn@472 | 1104 | // Canonicalize one more time since transform can change it. |
kvn@472 | 1105 | btest = tst->as_Bool()->_test._test; |
kvn@472 | 1106 | if (!BoolTest(btest).is_canonical()) { |
kvn@472 | 1107 | // Reverse edges one more time... |
kvn@472 | 1108 | tst = _gvn.transform( tst->as_Bool()->negate(&_gvn) ); |
kvn@472 | 1109 | btest = tst->as_Bool()->_test._test; |
kvn@472 | 1110 | assert(BoolTest(btest).is_canonical(), "sanity"); |
kvn@472 | 1111 | taken_if_true = !taken_if_true; |
kvn@472 | 1112 | } |
kvn@472 | 1113 | c = tst->in(1); |
kvn@472 | 1114 | } |
kvn@472 | 1115 | BoolTest::mask neg_btest = BoolTest(btest).negate(); |
kvn@472 | 1116 | taken_btest = taken_if_true ? btest : neg_btest; |
kvn@472 | 1117 | untaken_btest = taken_if_true ? neg_btest : btest; |
duke@435 | 1118 | } |
duke@435 | 1119 | |
duke@435 | 1120 | // Generate real control flow |
duke@435 | 1121 | float true_prob = (taken_if_true ? prob : untaken_prob); |
duke@435 | 1122 | IfNode* iff = create_and_map_if(control(), tst, true_prob, cnt); |
duke@435 | 1123 | assert(iff->_prob > 0.0f,"Optimizer made bad probability in parser"); |
kvn@4115 | 1124 | Node* taken_branch = new (C) IfTrueNode(iff); |
kvn@4115 | 1125 | Node* untaken_branch = new (C) IfFalseNode(iff); |
duke@435 | 1126 | if (!taken_if_true) { // Finish conversion to canonical form |
duke@435 | 1127 | Node* tmp = taken_branch; |
duke@435 | 1128 | taken_branch = untaken_branch; |
duke@435 | 1129 | untaken_branch = tmp; |
duke@435 | 1130 | } |
duke@435 | 1131 | |
duke@435 | 1132 | // Branch is taken: |
duke@435 | 1133 | { PreserveJVMState pjvms(this); |
duke@435 | 1134 | taken_branch = _gvn.transform(taken_branch); |
duke@435 | 1135 | set_control(taken_branch); |
duke@435 | 1136 | |
never@452 | 1137 | if (stopped()) { |
kvn@5110 | 1138 | if (C->eliminate_boxing()) { |
never@452 | 1139 | // Mark the successor block as parsed |
never@452 | 1140 | branch_block->next_path_num(); |
never@452 | 1141 | } |
never@452 | 1142 | } else { |
duke@435 | 1143 | // Update method data |
duke@435 | 1144 | profile_taken_branch(target_bci); |
duke@435 | 1145 | adjust_map_after_if(taken_btest, c, prob, branch_block, next_block); |
cfang@1607 | 1146 | if (!stopped()) { |
duke@435 | 1147 | merge(target_bci); |
cfang@1607 | 1148 | } |
duke@435 | 1149 | } |
duke@435 | 1150 | } |
duke@435 | 1151 | |
duke@435 | 1152 | untaken_branch = _gvn.transform(untaken_branch); |
duke@435 | 1153 | set_control(untaken_branch); |
duke@435 | 1154 | |
duke@435 | 1155 | // Branch not taken. |
never@452 | 1156 | if (stopped()) { |
kvn@5110 | 1157 | if (C->eliminate_boxing()) { |
never@452 | 1158 | // Mark the successor block as parsed |
never@452 | 1159 | next_block->next_path_num(); |
never@452 | 1160 | } |
never@452 | 1161 | } else { |
duke@435 | 1162 | // Update method data |
duke@435 | 1163 | profile_not_taken_branch(); |
duke@435 | 1164 | adjust_map_after_if(untaken_btest, c, untaken_prob, |
duke@435 | 1165 | next_block, branch_block); |
duke@435 | 1166 | } |
duke@435 | 1167 | } |
duke@435 | 1168 | |
duke@435 | 1169 | //----------------------------adjust_map_after_if------------------------------ |
duke@435 | 1170 | // Adjust the JVM state to reflect the result of taking this path. |
duke@435 | 1171 | // Basically, it means inspecting the CmpNode controlling this |
duke@435 | 1172 | // branch, seeing how it constrains a tested value, and then |
duke@435 | 1173 | // deciding if it's worth our while to encode this constraint |
duke@435 | 1174 | // as graph nodes in the current abstract interpretation map. |
duke@435 | 1175 | void Parse::adjust_map_after_if(BoolTest::mask btest, Node* c, float prob, |
duke@435 | 1176 | Block* path, Block* other_path) { |
duke@435 | 1177 | if (stopped() || !c->is_Cmp() || btest == BoolTest::illegal) |
duke@435 | 1178 | return; // nothing to do |
duke@435 | 1179 | |
duke@435 | 1180 | bool is_fallthrough = (path == successor_for_bci(iter().next_bci())); |
duke@435 | 1181 | |
jrose@2101 | 1182 | if (seems_never_taken(prob) && seems_stable_comparison(btest, c)) { |
duke@435 | 1183 | // If this might possibly turn into an implicit null check, |
duke@435 | 1184 | // and the null has never yet been seen, we need to generate |
duke@435 | 1185 | // an uncommon trap, so as to recompile instead of suffering |
duke@435 | 1186 | // with very slow branches. (We'll get the slow branches if |
duke@435 | 1187 | // the program ever changes phase and starts seeing nulls here.) |
duke@435 | 1188 | // |
jrose@2101 | 1189 | // We do not inspect for a null constant, since a node may |
duke@435 | 1190 | // optimize to 'null' later on. |
jrose@2101 | 1191 | // |
jrose@2101 | 1192 | // Null checks, and other tests which expect inequality, |
jrose@2101 | 1193 | // show btest == BoolTest::eq along the non-taken branch. |
jrose@2101 | 1194 | // On the other hand, type tests, must-be-null tests, |
jrose@2101 | 1195 | // and other tests which expect pointer equality, |
jrose@2101 | 1196 | // show btest == BoolTest::ne along the non-taken branch. |
jrose@2101 | 1197 | // We prune both types of branches if they look unused. |
duke@435 | 1198 | repush_if_args(); |
duke@435 | 1199 | // We need to mark this branch as taken so that if we recompile we will |
duke@435 | 1200 | // see that it is possible. In the tiered system the interpreter doesn't |
duke@435 | 1201 | // do profiling and by the time we get to the lower tier from the interpreter |
duke@435 | 1202 | // the path may be cold again. Make sure it doesn't look untaken |
duke@435 | 1203 | if (is_fallthrough) { |
duke@435 | 1204 | profile_not_taken_branch(!ProfileInterpreter); |
duke@435 | 1205 | } else { |
duke@435 | 1206 | profile_taken_branch(iter().get_dest(), !ProfileInterpreter); |
duke@435 | 1207 | } |
duke@435 | 1208 | uncommon_trap(Deoptimization::Reason_unreached, |
duke@435 | 1209 | Deoptimization::Action_reinterpret, |
duke@435 | 1210 | NULL, |
duke@435 | 1211 | (is_fallthrough ? "taken always" : "taken never")); |
duke@435 | 1212 | return; |
duke@435 | 1213 | } |
duke@435 | 1214 | |
duke@435 | 1215 | Node* val = c->in(1); |
duke@435 | 1216 | Node* con = c->in(2); |
duke@435 | 1217 | const Type* tcon = _gvn.type(con); |
duke@435 | 1218 | const Type* tval = _gvn.type(val); |
duke@435 | 1219 | bool have_con = tcon->singleton(); |
duke@435 | 1220 | if (tval->singleton()) { |
duke@435 | 1221 | if (!have_con) { |
duke@435 | 1222 | // Swap, so constant is in con. |
duke@435 | 1223 | con = val; |
duke@435 | 1224 | tcon = tval; |
duke@435 | 1225 | val = c->in(2); |
duke@435 | 1226 | tval = _gvn.type(val); |
duke@435 | 1227 | btest = BoolTest(btest).commute(); |
duke@435 | 1228 | have_con = true; |
duke@435 | 1229 | } else { |
duke@435 | 1230 | // Do we have two constants? Then leave well enough alone. |
duke@435 | 1231 | have_con = false; |
duke@435 | 1232 | } |
duke@435 | 1233 | } |
duke@435 | 1234 | if (!have_con) // remaining adjustments need a con |
duke@435 | 1235 | return; |
duke@435 | 1236 | |
kvn@3834 | 1237 | sharpen_type_after_if(btest, con, tcon, val, tval); |
kvn@3834 | 1238 | } |
kvn@3834 | 1239 | |
kvn@3834 | 1240 | |
kvn@3834 | 1241 | static Node* extract_obj_from_klass_load(PhaseGVN* gvn, Node* n) { |
kvn@3834 | 1242 | Node* ldk; |
roland@4159 | 1243 | if (n->is_DecodeNKlass()) { |
kvn@3834 | 1244 | if (n->in(1)->Opcode() != Op_LoadNKlass) { |
kvn@3834 | 1245 | return NULL; |
kvn@3834 | 1246 | } else { |
kvn@3834 | 1247 | ldk = n->in(1); |
kvn@3834 | 1248 | } |
kvn@3834 | 1249 | } else if (n->Opcode() != Op_LoadKlass) { |
kvn@3834 | 1250 | return NULL; |
kvn@3834 | 1251 | } else { |
kvn@3834 | 1252 | ldk = n; |
kvn@3834 | 1253 | } |
kvn@3834 | 1254 | assert(ldk != NULL && ldk->is_Load(), "should have found a LoadKlass or LoadNKlass node"); |
kvn@3834 | 1255 | |
kvn@3834 | 1256 | Node* adr = ldk->in(MemNode::Address); |
kvn@3834 | 1257 | intptr_t off = 0; |
kvn@3834 | 1258 | Node* obj = AddPNode::Ideal_base_and_offset(adr, gvn, off); |
kvn@3834 | 1259 | if (obj == NULL || off != oopDesc::klass_offset_in_bytes()) // loading oopDesc::_klass? |
kvn@3834 | 1260 | return NULL; |
kvn@3834 | 1261 | const TypePtr* tp = gvn->type(obj)->is_ptr(); |
kvn@3834 | 1262 | if (tp == NULL || !(tp->isa_instptr() || tp->isa_aryptr())) // is obj a Java object ptr? |
kvn@3834 | 1263 | return NULL; |
kvn@3834 | 1264 | |
kvn@3834 | 1265 | return obj; |
kvn@3834 | 1266 | } |
kvn@3834 | 1267 | |
kvn@3834 | 1268 | void Parse::sharpen_type_after_if(BoolTest::mask btest, |
kvn@3834 | 1269 | Node* con, const Type* tcon, |
kvn@3834 | 1270 | Node* val, const Type* tval) { |
kvn@3834 | 1271 | // Look for opportunities to sharpen the type of a node |
kvn@3834 | 1272 | // whose klass is compared with a constant klass. |
kvn@3834 | 1273 | if (btest == BoolTest::eq && tcon->isa_klassptr()) { |
kvn@3834 | 1274 | Node* obj = extract_obj_from_klass_load(&_gvn, val); |
kvn@3834 | 1275 | const TypeOopPtr* con_type = tcon->isa_klassptr()->as_instance_type(); |
kvn@3834 | 1276 | if (obj != NULL && (con_type->isa_instptr() || con_type->isa_aryptr())) { |
kvn@3834 | 1277 | // Found: |
kvn@3834 | 1278 | // Bool(CmpP(LoadKlass(obj._klass), ConP(Foo.klass)), [eq]) |
kvn@3834 | 1279 | // or the narrowOop equivalent. |
kvn@3834 | 1280 | const Type* obj_type = _gvn.type(obj); |
kvn@3834 | 1281 | const TypeOopPtr* tboth = obj_type->join(con_type)->isa_oopptr(); |
kvn@3909 | 1282 | if (tboth != NULL && tboth->klass_is_exact() && tboth != obj_type && |
kvn@3909 | 1283 | tboth->higher_equal(obj_type)) { |
kvn@3834 | 1284 | // obj has to be of the exact type Foo if the CmpP succeeds. |
kvn@3834 | 1285 | int obj_in_map = map()->find_edge(obj); |
kvn@3834 | 1286 | JVMState* jvms = this->jvms(); |
kvn@3834 | 1287 | if (obj_in_map >= 0 && |
kvn@3834 | 1288 | (jvms->is_loc(obj_in_map) || jvms->is_stk(obj_in_map))) { |
kvn@4115 | 1289 | TypeNode* ccast = new (C) CheckCastPPNode(control(), obj, tboth); |
kvn@3834 | 1290 | const Type* tcc = ccast->as_Type()->type(); |
kvn@3834 | 1291 | assert(tcc != obj_type && tcc->higher_equal(obj_type), "must improve"); |
kvn@3834 | 1292 | // Delay transform() call to allow recovery of pre-cast value |
kvn@3834 | 1293 | // at the control merge. |
kvn@3834 | 1294 | _gvn.set_type_bottom(ccast); |
kvn@3834 | 1295 | record_for_igvn(ccast); |
kvn@3834 | 1296 | // Here's the payoff. |
kvn@3834 | 1297 | replace_in_map(obj, ccast); |
kvn@3834 | 1298 | } |
kvn@3834 | 1299 | } |
kvn@3834 | 1300 | } |
kvn@3834 | 1301 | } |
duke@435 | 1302 | |
duke@435 | 1303 | int val_in_map = map()->find_edge(val); |
duke@435 | 1304 | if (val_in_map < 0) return; // replace_in_map would be useless |
duke@435 | 1305 | { |
duke@435 | 1306 | JVMState* jvms = this->jvms(); |
duke@435 | 1307 | if (!(jvms->is_loc(val_in_map) || |
duke@435 | 1308 | jvms->is_stk(val_in_map))) |
duke@435 | 1309 | return; // again, it would be useless |
duke@435 | 1310 | } |
duke@435 | 1311 | |
duke@435 | 1312 | // Check for a comparison to a constant, and "know" that the compared |
duke@435 | 1313 | // value is constrained on this path. |
duke@435 | 1314 | assert(tcon->singleton(), ""); |
duke@435 | 1315 | ConstraintCastNode* ccast = NULL; |
duke@435 | 1316 | Node* cast = NULL; |
duke@435 | 1317 | |
duke@435 | 1318 | switch (btest) { |
duke@435 | 1319 | case BoolTest::eq: // Constant test? |
duke@435 | 1320 | { |
duke@435 | 1321 | const Type* tboth = tcon->join(tval); |
duke@435 | 1322 | if (tboth == tval) break; // Nothing to gain. |
duke@435 | 1323 | if (tcon->isa_int()) { |
kvn@4115 | 1324 | ccast = new (C) CastIINode(val, tboth); |
duke@435 | 1325 | } else if (tcon == TypePtr::NULL_PTR) { |
duke@435 | 1326 | // Cast to null, but keep the pointer identity temporarily live. |
kvn@4115 | 1327 | ccast = new (C) CastPPNode(val, tboth); |
duke@435 | 1328 | } else { |
duke@435 | 1329 | const TypeF* tf = tcon->isa_float_constant(); |
duke@435 | 1330 | const TypeD* td = tcon->isa_double_constant(); |
duke@435 | 1331 | // Exclude tests vs float/double 0 as these could be |
duke@435 | 1332 | // either +0 or -0. Just because you are equal to +0 |
duke@435 | 1333 | // doesn't mean you ARE +0! |
kvn@3834 | 1334 | // Note, following code also replaces Long and Oop values. |
duke@435 | 1335 | if ((!tf || tf->_f != 0.0) && |
duke@435 | 1336 | (!td || td->_d != 0.0)) |
duke@435 | 1337 | cast = con; // Replace non-constant val by con. |
duke@435 | 1338 | } |
duke@435 | 1339 | } |
duke@435 | 1340 | break; |
duke@435 | 1341 | |
duke@435 | 1342 | case BoolTest::ne: |
duke@435 | 1343 | if (tcon == TypePtr::NULL_PTR) { |
duke@435 | 1344 | cast = cast_not_null(val, false); |
duke@435 | 1345 | } |
duke@435 | 1346 | break; |
duke@435 | 1347 | |
duke@435 | 1348 | default: |
duke@435 | 1349 | // (At this point we could record int range types with CastII.) |
duke@435 | 1350 | break; |
duke@435 | 1351 | } |
duke@435 | 1352 | |
duke@435 | 1353 | if (ccast != NULL) { |
duke@435 | 1354 | const Type* tcc = ccast->as_Type()->type(); |
duke@435 | 1355 | assert(tcc != tval && tcc->higher_equal(tval), "must improve"); |
duke@435 | 1356 | // Delay transform() call to allow recovery of pre-cast value |
duke@435 | 1357 | // at the control merge. |
duke@435 | 1358 | ccast->set_req(0, control()); |
duke@435 | 1359 | _gvn.set_type_bottom(ccast); |
duke@435 | 1360 | record_for_igvn(ccast); |
duke@435 | 1361 | cast = ccast; |
duke@435 | 1362 | } |
duke@435 | 1363 | |
duke@435 | 1364 | if (cast != NULL) { // Here's the payoff. |
duke@435 | 1365 | replace_in_map(val, cast); |
duke@435 | 1366 | } |
duke@435 | 1367 | } |
duke@435 | 1368 | |
duke@435 | 1369 | |
duke@435 | 1370 | //------------------------------do_one_bytecode-------------------------------- |
duke@435 | 1371 | // Parse this bytecode, and alter the Parsers JVM->Node mapping |
duke@435 | 1372 | void Parse::do_one_bytecode() { |
duke@435 | 1373 | Node *a, *b, *c, *d; // Handy temps |
duke@435 | 1374 | BoolTest::mask btest; |
duke@435 | 1375 | int i; |
duke@435 | 1376 | |
duke@435 | 1377 | assert(!has_exceptions(), "bytecode entry state must be clear of throws"); |
duke@435 | 1378 | |
duke@435 | 1379 | if (C->check_node_count(NodeLimitFudgeFactor * 5, |
duke@435 | 1380 | "out of nodes parsing method")) { |
duke@435 | 1381 | return; |
duke@435 | 1382 | } |
duke@435 | 1383 | |
duke@435 | 1384 | #ifdef ASSERT |
duke@435 | 1385 | // for setting breakpoints |
duke@435 | 1386 | if (TraceOptoParse) { |
duke@435 | 1387 | tty->print(" @"); |
duke@435 | 1388 | dump_bci(bci()); |
bharadwaj@4862 | 1389 | tty->cr(); |
duke@435 | 1390 | } |
duke@435 | 1391 | #endif |
duke@435 | 1392 | |
duke@435 | 1393 | switch (bc()) { |
duke@435 | 1394 | case Bytecodes::_nop: |
duke@435 | 1395 | // do nothing |
duke@435 | 1396 | break; |
duke@435 | 1397 | case Bytecodes::_lconst_0: |
duke@435 | 1398 | push_pair(longcon(0)); |
duke@435 | 1399 | break; |
duke@435 | 1400 | |
duke@435 | 1401 | case Bytecodes::_lconst_1: |
duke@435 | 1402 | push_pair(longcon(1)); |
duke@435 | 1403 | break; |
duke@435 | 1404 | |
duke@435 | 1405 | case Bytecodes::_fconst_0: |
duke@435 | 1406 | push(zerocon(T_FLOAT)); |
duke@435 | 1407 | break; |
duke@435 | 1408 | |
duke@435 | 1409 | case Bytecodes::_fconst_1: |
duke@435 | 1410 | push(makecon(TypeF::ONE)); |
duke@435 | 1411 | break; |
duke@435 | 1412 | |
duke@435 | 1413 | case Bytecodes::_fconst_2: |
duke@435 | 1414 | push(makecon(TypeF::make(2.0f))); |
duke@435 | 1415 | break; |
duke@435 | 1416 | |
duke@435 | 1417 | case Bytecodes::_dconst_0: |
duke@435 | 1418 | push_pair(zerocon(T_DOUBLE)); |
duke@435 | 1419 | break; |
duke@435 | 1420 | |
duke@435 | 1421 | case Bytecodes::_dconst_1: |
duke@435 | 1422 | push_pair(makecon(TypeD::ONE)); |
duke@435 | 1423 | break; |
duke@435 | 1424 | |
duke@435 | 1425 | case Bytecodes::_iconst_m1:push(intcon(-1)); break; |
duke@435 | 1426 | case Bytecodes::_iconst_0: push(intcon( 0)); break; |
duke@435 | 1427 | case Bytecodes::_iconst_1: push(intcon( 1)); break; |
duke@435 | 1428 | case Bytecodes::_iconst_2: push(intcon( 2)); break; |
duke@435 | 1429 | case Bytecodes::_iconst_3: push(intcon( 3)); break; |
duke@435 | 1430 | case Bytecodes::_iconst_4: push(intcon( 4)); break; |
duke@435 | 1431 | case Bytecodes::_iconst_5: push(intcon( 5)); break; |
jrose@1920 | 1432 | case Bytecodes::_bipush: push(intcon(iter().get_constant_u1())); break; |
jrose@1920 | 1433 | case Bytecodes::_sipush: push(intcon(iter().get_constant_u2())); break; |
duke@435 | 1434 | case Bytecodes::_aconst_null: push(null()); break; |
duke@435 | 1435 | case Bytecodes::_ldc: |
duke@435 | 1436 | case Bytecodes::_ldc_w: |
duke@435 | 1437 | case Bytecodes::_ldc2_w: |
duke@435 | 1438 | // If the constant is unresolved, run this BC once in the interpreter. |
jrose@1957 | 1439 | { |
duke@435 | 1440 | ciConstant constant = iter().get_constant(); |
jrose@1957 | 1441 | if (constant.basic_type() == T_OBJECT && |
jrose@1957 | 1442 | !constant.as_object()->is_loaded()) { |
jrose@1957 | 1443 | int index = iter().get_constant_pool_index(); |
jrose@1957 | 1444 | constantTag tag = iter().get_constant_pool_tag(index); |
jrose@1957 | 1445 | uncommon_trap(Deoptimization::make_trap_request |
jrose@1957 | 1446 | (Deoptimization::Reason_unloaded, |
jrose@1957 | 1447 | Deoptimization::Action_reinterpret, |
jrose@1957 | 1448 | index), |
jrose@1957 | 1449 | NULL, tag.internal_name()); |
jrose@1957 | 1450 | break; |
duke@435 | 1451 | } |
coleenp@4037 | 1452 | assert(constant.basic_type() != T_OBJECT || constant.as_object()->is_instance(), |
jrose@1957 | 1453 | "must be java_mirror of klass"); |
jrose@1424 | 1454 | bool pushed = push_constant(constant, true); |
jrose@1424 | 1455 | guarantee(pushed, "must be possible to push this constant"); |
duke@435 | 1456 | } |
duke@435 | 1457 | |
duke@435 | 1458 | break; |
duke@435 | 1459 | |
duke@435 | 1460 | case Bytecodes::_aload_0: |
duke@435 | 1461 | push( local(0) ); |
duke@435 | 1462 | break; |
duke@435 | 1463 | case Bytecodes::_aload_1: |
duke@435 | 1464 | push( local(1) ); |
duke@435 | 1465 | break; |
duke@435 | 1466 | case Bytecodes::_aload_2: |
duke@435 | 1467 | push( local(2) ); |
duke@435 | 1468 | break; |
duke@435 | 1469 | case Bytecodes::_aload_3: |
duke@435 | 1470 | push( local(3) ); |
duke@435 | 1471 | break; |
duke@435 | 1472 | case Bytecodes::_aload: |
duke@435 | 1473 | push( local(iter().get_index()) ); |
duke@435 | 1474 | break; |
duke@435 | 1475 | |
duke@435 | 1476 | case Bytecodes::_fload_0: |
duke@435 | 1477 | case Bytecodes::_iload_0: |
duke@435 | 1478 | push( local(0) ); |
duke@435 | 1479 | break; |
duke@435 | 1480 | case Bytecodes::_fload_1: |
duke@435 | 1481 | case Bytecodes::_iload_1: |
duke@435 | 1482 | push( local(1) ); |
duke@435 | 1483 | break; |
duke@435 | 1484 | case Bytecodes::_fload_2: |
duke@435 | 1485 | case Bytecodes::_iload_2: |
duke@435 | 1486 | push( local(2) ); |
duke@435 | 1487 | break; |
duke@435 | 1488 | case Bytecodes::_fload_3: |
duke@435 | 1489 | case Bytecodes::_iload_3: |
duke@435 | 1490 | push( local(3) ); |
duke@435 | 1491 | break; |
duke@435 | 1492 | case Bytecodes::_fload: |
duke@435 | 1493 | case Bytecodes::_iload: |
duke@435 | 1494 | push( local(iter().get_index()) ); |
duke@435 | 1495 | break; |
duke@435 | 1496 | case Bytecodes::_lload_0: |
duke@435 | 1497 | push_pair_local( 0 ); |
duke@435 | 1498 | break; |
duke@435 | 1499 | case Bytecodes::_lload_1: |
duke@435 | 1500 | push_pair_local( 1 ); |
duke@435 | 1501 | break; |
duke@435 | 1502 | case Bytecodes::_lload_2: |
duke@435 | 1503 | push_pair_local( 2 ); |
duke@435 | 1504 | break; |
duke@435 | 1505 | case Bytecodes::_lload_3: |
duke@435 | 1506 | push_pair_local( 3 ); |
duke@435 | 1507 | break; |
duke@435 | 1508 | case Bytecodes::_lload: |
duke@435 | 1509 | push_pair_local( iter().get_index() ); |
duke@435 | 1510 | break; |
duke@435 | 1511 | |
duke@435 | 1512 | case Bytecodes::_dload_0: |
duke@435 | 1513 | push_pair_local(0); |
duke@435 | 1514 | break; |
duke@435 | 1515 | case Bytecodes::_dload_1: |
duke@435 | 1516 | push_pair_local(1); |
duke@435 | 1517 | break; |
duke@435 | 1518 | case Bytecodes::_dload_2: |
duke@435 | 1519 | push_pair_local(2); |
duke@435 | 1520 | break; |
duke@435 | 1521 | case Bytecodes::_dload_3: |
duke@435 | 1522 | push_pair_local(3); |
duke@435 | 1523 | break; |
duke@435 | 1524 | case Bytecodes::_dload: |
duke@435 | 1525 | push_pair_local(iter().get_index()); |
duke@435 | 1526 | break; |
duke@435 | 1527 | case Bytecodes::_fstore_0: |
duke@435 | 1528 | case Bytecodes::_istore_0: |
duke@435 | 1529 | case Bytecodes::_astore_0: |
duke@435 | 1530 | set_local( 0, pop() ); |
duke@435 | 1531 | break; |
duke@435 | 1532 | case Bytecodes::_fstore_1: |
duke@435 | 1533 | case Bytecodes::_istore_1: |
duke@435 | 1534 | case Bytecodes::_astore_1: |
duke@435 | 1535 | set_local( 1, pop() ); |
duke@435 | 1536 | break; |
duke@435 | 1537 | case Bytecodes::_fstore_2: |
duke@435 | 1538 | case Bytecodes::_istore_2: |
duke@435 | 1539 | case Bytecodes::_astore_2: |
duke@435 | 1540 | set_local( 2, pop() ); |
duke@435 | 1541 | break; |
duke@435 | 1542 | case Bytecodes::_fstore_3: |
duke@435 | 1543 | case Bytecodes::_istore_3: |
duke@435 | 1544 | case Bytecodes::_astore_3: |
duke@435 | 1545 | set_local( 3, pop() ); |
duke@435 | 1546 | break; |
duke@435 | 1547 | case Bytecodes::_fstore: |
duke@435 | 1548 | case Bytecodes::_istore: |
duke@435 | 1549 | case Bytecodes::_astore: |
duke@435 | 1550 | set_local( iter().get_index(), pop() ); |
duke@435 | 1551 | break; |
duke@435 | 1552 | // long stores |
duke@435 | 1553 | case Bytecodes::_lstore_0: |
duke@435 | 1554 | set_pair_local( 0, pop_pair() ); |
duke@435 | 1555 | break; |
duke@435 | 1556 | case Bytecodes::_lstore_1: |
duke@435 | 1557 | set_pair_local( 1, pop_pair() ); |
duke@435 | 1558 | break; |
duke@435 | 1559 | case Bytecodes::_lstore_2: |
duke@435 | 1560 | set_pair_local( 2, pop_pair() ); |
duke@435 | 1561 | break; |
duke@435 | 1562 | case Bytecodes::_lstore_3: |
duke@435 | 1563 | set_pair_local( 3, pop_pair() ); |
duke@435 | 1564 | break; |
duke@435 | 1565 | case Bytecodes::_lstore: |
duke@435 | 1566 | set_pair_local( iter().get_index(), pop_pair() ); |
duke@435 | 1567 | break; |
duke@435 | 1568 | |
duke@435 | 1569 | // double stores |
duke@435 | 1570 | case Bytecodes::_dstore_0: |
duke@435 | 1571 | set_pair_local( 0, dstore_rounding(pop_pair()) ); |
duke@435 | 1572 | break; |
duke@435 | 1573 | case Bytecodes::_dstore_1: |
duke@435 | 1574 | set_pair_local( 1, dstore_rounding(pop_pair()) ); |
duke@435 | 1575 | break; |
duke@435 | 1576 | case Bytecodes::_dstore_2: |
duke@435 | 1577 | set_pair_local( 2, dstore_rounding(pop_pair()) ); |
duke@435 | 1578 | break; |
duke@435 | 1579 | case Bytecodes::_dstore_3: |
duke@435 | 1580 | set_pair_local( 3, dstore_rounding(pop_pair()) ); |
duke@435 | 1581 | break; |
duke@435 | 1582 | case Bytecodes::_dstore: |
duke@435 | 1583 | set_pair_local( iter().get_index(), dstore_rounding(pop_pair()) ); |
duke@435 | 1584 | break; |
duke@435 | 1585 | |
twisti@4313 | 1586 | case Bytecodes::_pop: dec_sp(1); break; |
twisti@4313 | 1587 | case Bytecodes::_pop2: dec_sp(2); break; |
duke@435 | 1588 | case Bytecodes::_swap: |
duke@435 | 1589 | a = pop(); |
duke@435 | 1590 | b = pop(); |
duke@435 | 1591 | push(a); |
duke@435 | 1592 | push(b); |
duke@435 | 1593 | break; |
duke@435 | 1594 | case Bytecodes::_dup: |
duke@435 | 1595 | a = pop(); |
duke@435 | 1596 | push(a); |
duke@435 | 1597 | push(a); |
duke@435 | 1598 | break; |
duke@435 | 1599 | case Bytecodes::_dup_x1: |
duke@435 | 1600 | a = pop(); |
duke@435 | 1601 | b = pop(); |
duke@435 | 1602 | push( a ); |
duke@435 | 1603 | push( b ); |
duke@435 | 1604 | push( a ); |
duke@435 | 1605 | break; |
duke@435 | 1606 | case Bytecodes::_dup_x2: |
duke@435 | 1607 | a = pop(); |
duke@435 | 1608 | b = pop(); |
duke@435 | 1609 | c = pop(); |
duke@435 | 1610 | push( a ); |
duke@435 | 1611 | push( c ); |
duke@435 | 1612 | push( b ); |
duke@435 | 1613 | push( a ); |
duke@435 | 1614 | break; |
duke@435 | 1615 | case Bytecodes::_dup2: |
duke@435 | 1616 | a = pop(); |
duke@435 | 1617 | b = pop(); |
duke@435 | 1618 | push( b ); |
duke@435 | 1619 | push( a ); |
duke@435 | 1620 | push( b ); |
duke@435 | 1621 | push( a ); |
duke@435 | 1622 | break; |
duke@435 | 1623 | |
duke@435 | 1624 | case Bytecodes::_dup2_x1: |
duke@435 | 1625 | // before: .. c, b, a |
duke@435 | 1626 | // after: .. b, a, c, b, a |
duke@435 | 1627 | // not tested |
duke@435 | 1628 | a = pop(); |
duke@435 | 1629 | b = pop(); |
duke@435 | 1630 | c = pop(); |
duke@435 | 1631 | push( b ); |
duke@435 | 1632 | push( a ); |
duke@435 | 1633 | push( c ); |
duke@435 | 1634 | push( b ); |
duke@435 | 1635 | push( a ); |
duke@435 | 1636 | break; |
duke@435 | 1637 | case Bytecodes::_dup2_x2: |
duke@435 | 1638 | // before: .. d, c, b, a |
duke@435 | 1639 | // after: .. b, a, d, c, b, a |
duke@435 | 1640 | // not tested |
duke@435 | 1641 | a = pop(); |
duke@435 | 1642 | b = pop(); |
duke@435 | 1643 | c = pop(); |
duke@435 | 1644 | d = pop(); |
duke@435 | 1645 | push( b ); |
duke@435 | 1646 | push( a ); |
duke@435 | 1647 | push( d ); |
duke@435 | 1648 | push( c ); |
duke@435 | 1649 | push( b ); |
duke@435 | 1650 | push( a ); |
duke@435 | 1651 | break; |
duke@435 | 1652 | |
duke@435 | 1653 | case Bytecodes::_arraylength: { |
duke@435 | 1654 | // Must do null-check with value on expression stack |
twisti@4313 | 1655 | Node *ary = null_check(peek(), T_ARRAY); |
duke@435 | 1656 | // Compile-time detect of null-exception? |
duke@435 | 1657 | if (stopped()) return; |
duke@435 | 1658 | a = pop(); |
duke@435 | 1659 | push(load_array_length(a)); |
duke@435 | 1660 | break; |
duke@435 | 1661 | } |
duke@435 | 1662 | |
duke@435 | 1663 | case Bytecodes::_baload: array_load(T_BYTE); break; |
duke@435 | 1664 | case Bytecodes::_caload: array_load(T_CHAR); break; |
duke@435 | 1665 | case Bytecodes::_iaload: array_load(T_INT); break; |
duke@435 | 1666 | case Bytecodes::_saload: array_load(T_SHORT); break; |
duke@435 | 1667 | case Bytecodes::_faload: array_load(T_FLOAT); break; |
duke@435 | 1668 | case Bytecodes::_aaload: array_load(T_OBJECT); break; |
duke@435 | 1669 | case Bytecodes::_laload: { |
duke@435 | 1670 | a = array_addressing(T_LONG, 0); |
twisti@1040 | 1671 | if (stopped()) return; // guaranteed null or range check |
twisti@4313 | 1672 | dec_sp(2); // Pop array and index |
twisti@4313 | 1673 | push_pair(make_load(control(), a, TypeLong::LONG, T_LONG, TypeAryPtr::LONGS)); |
duke@435 | 1674 | break; |
duke@435 | 1675 | } |
duke@435 | 1676 | case Bytecodes::_daload: { |
duke@435 | 1677 | a = array_addressing(T_DOUBLE, 0); |
twisti@1040 | 1678 | if (stopped()) return; // guaranteed null or range check |
twisti@4313 | 1679 | dec_sp(2); // Pop array and index |
twisti@4313 | 1680 | push_pair(make_load(control(), a, Type::DOUBLE, T_DOUBLE, TypeAryPtr::DOUBLES)); |
duke@435 | 1681 | break; |
duke@435 | 1682 | } |
duke@435 | 1683 | case Bytecodes::_bastore: array_store(T_BYTE); break; |
duke@435 | 1684 | case Bytecodes::_castore: array_store(T_CHAR); break; |
duke@435 | 1685 | case Bytecodes::_iastore: array_store(T_INT); break; |
duke@435 | 1686 | case Bytecodes::_sastore: array_store(T_SHORT); break; |
duke@435 | 1687 | case Bytecodes::_fastore: array_store(T_FLOAT); break; |
duke@435 | 1688 | case Bytecodes::_aastore: { |
duke@435 | 1689 | d = array_addressing(T_OBJECT, 1); |
twisti@1040 | 1690 | if (stopped()) return; // guaranteed null or range check |
duke@435 | 1691 | array_store_check(); |
duke@435 | 1692 | c = pop(); // Oop to store |
duke@435 | 1693 | b = pop(); // index (already used) |
duke@435 | 1694 | a = pop(); // the array itself |
never@1262 | 1695 | const TypeOopPtr* elemtype = _gvn.type(a)->is_aryptr()->elem()->make_oopptr(); |
duke@435 | 1696 | const TypeAryPtr* adr_type = TypeAryPtr::OOPS; |
duke@435 | 1697 | Node* store = store_oop_to_array(control(), a, d, adr_type, c, elemtype, T_OBJECT); |
duke@435 | 1698 | break; |
duke@435 | 1699 | } |
duke@435 | 1700 | case Bytecodes::_lastore: { |
duke@435 | 1701 | a = array_addressing(T_LONG, 2); |
twisti@1040 | 1702 | if (stopped()) return; // guaranteed null or range check |
duke@435 | 1703 | c = pop_pair(); |
twisti@4313 | 1704 | dec_sp(2); // Pop array and index |
duke@435 | 1705 | store_to_memory(control(), a, c, T_LONG, TypeAryPtr::LONGS); |
duke@435 | 1706 | break; |
duke@435 | 1707 | } |
duke@435 | 1708 | case Bytecodes::_dastore: { |
duke@435 | 1709 | a = array_addressing(T_DOUBLE, 2); |
twisti@1040 | 1710 | if (stopped()) return; // guaranteed null or range check |
duke@435 | 1711 | c = pop_pair(); |
twisti@4313 | 1712 | dec_sp(2); // Pop array and index |
duke@435 | 1713 | c = dstore_rounding(c); |
duke@435 | 1714 | store_to_memory(control(), a, c, T_DOUBLE, TypeAryPtr::DOUBLES); |
duke@435 | 1715 | break; |
duke@435 | 1716 | } |
duke@435 | 1717 | case Bytecodes::_getfield: |
duke@435 | 1718 | do_getfield(); |
duke@435 | 1719 | break; |
duke@435 | 1720 | |
duke@435 | 1721 | case Bytecodes::_getstatic: |
duke@435 | 1722 | do_getstatic(); |
duke@435 | 1723 | break; |
duke@435 | 1724 | |
duke@435 | 1725 | case Bytecodes::_putfield: |
duke@435 | 1726 | do_putfield(); |
duke@435 | 1727 | break; |
duke@435 | 1728 | |
duke@435 | 1729 | case Bytecodes::_putstatic: |
duke@435 | 1730 | do_putstatic(); |
duke@435 | 1731 | break; |
duke@435 | 1732 | |
duke@435 | 1733 | case Bytecodes::_irem: |
duke@435 | 1734 | do_irem(); |
duke@435 | 1735 | break; |
duke@435 | 1736 | case Bytecodes::_idiv: |
duke@435 | 1737 | // Must keep both values on the expression-stack during null-check |
twisti@4313 | 1738 | zero_check_int(peek()); |
duke@435 | 1739 | // Compile-time detect of null-exception? |
duke@435 | 1740 | if (stopped()) return; |
duke@435 | 1741 | b = pop(); |
duke@435 | 1742 | a = pop(); |
kvn@4115 | 1743 | push( _gvn.transform( new (C) DivINode(control(),a,b) ) ); |
duke@435 | 1744 | break; |
duke@435 | 1745 | case Bytecodes::_imul: |
duke@435 | 1746 | b = pop(); a = pop(); |
kvn@4115 | 1747 | push( _gvn.transform( new (C) MulINode(a,b) ) ); |
duke@435 | 1748 | break; |
duke@435 | 1749 | case Bytecodes::_iadd: |
duke@435 | 1750 | b = pop(); a = pop(); |
kvn@4115 | 1751 | push( _gvn.transform( new (C) AddINode(a,b) ) ); |
duke@435 | 1752 | break; |
duke@435 | 1753 | case Bytecodes::_ineg: |
duke@435 | 1754 | a = pop(); |
kvn@4115 | 1755 | push( _gvn.transform( new (C) SubINode(_gvn.intcon(0),a)) ); |
duke@435 | 1756 | break; |
duke@435 | 1757 | case Bytecodes::_isub: |
duke@435 | 1758 | b = pop(); a = pop(); |
kvn@4115 | 1759 | push( _gvn.transform( new (C) SubINode(a,b) ) ); |
duke@435 | 1760 | break; |
duke@435 | 1761 | case Bytecodes::_iand: |
duke@435 | 1762 | b = pop(); a = pop(); |
kvn@4115 | 1763 | push( _gvn.transform( new (C) AndINode(a,b) ) ); |
duke@435 | 1764 | break; |
duke@435 | 1765 | case Bytecodes::_ior: |
duke@435 | 1766 | b = pop(); a = pop(); |
kvn@4115 | 1767 | push( _gvn.transform( new (C) OrINode(a,b) ) ); |
duke@435 | 1768 | break; |
duke@435 | 1769 | case Bytecodes::_ixor: |
duke@435 | 1770 | b = pop(); a = pop(); |
kvn@4115 | 1771 | push( _gvn.transform( new (C) XorINode(a,b) ) ); |
duke@435 | 1772 | break; |
duke@435 | 1773 | case Bytecodes::_ishl: |
duke@435 | 1774 | b = pop(); a = pop(); |
kvn@4115 | 1775 | push( _gvn.transform( new (C) LShiftINode(a,b) ) ); |
duke@435 | 1776 | break; |
duke@435 | 1777 | case Bytecodes::_ishr: |
duke@435 | 1778 | b = pop(); a = pop(); |
kvn@4115 | 1779 | push( _gvn.transform( new (C) RShiftINode(a,b) ) ); |
duke@435 | 1780 | break; |
duke@435 | 1781 | case Bytecodes::_iushr: |
duke@435 | 1782 | b = pop(); a = pop(); |
kvn@4115 | 1783 | push( _gvn.transform( new (C) URShiftINode(a,b) ) ); |
duke@435 | 1784 | break; |
duke@435 | 1785 | |
duke@435 | 1786 | case Bytecodes::_fneg: |
duke@435 | 1787 | a = pop(); |
kvn@4115 | 1788 | b = _gvn.transform(new (C) NegFNode (a)); |
duke@435 | 1789 | push(b); |
duke@435 | 1790 | break; |
duke@435 | 1791 | |
duke@435 | 1792 | case Bytecodes::_fsub: |
duke@435 | 1793 | b = pop(); |
duke@435 | 1794 | a = pop(); |
kvn@4115 | 1795 | c = _gvn.transform( new (C) SubFNode(a,b) ); |
duke@435 | 1796 | d = precision_rounding(c); |
duke@435 | 1797 | push( d ); |
duke@435 | 1798 | break; |
duke@435 | 1799 | |
duke@435 | 1800 | case Bytecodes::_fadd: |
duke@435 | 1801 | b = pop(); |
duke@435 | 1802 | a = pop(); |
kvn@4115 | 1803 | c = _gvn.transform( new (C) AddFNode(a,b) ); |
duke@435 | 1804 | d = precision_rounding(c); |
duke@435 | 1805 | push( d ); |
duke@435 | 1806 | break; |
duke@435 | 1807 | |
duke@435 | 1808 | case Bytecodes::_fmul: |
duke@435 | 1809 | b = pop(); |
duke@435 | 1810 | a = pop(); |
kvn@4115 | 1811 | c = _gvn.transform( new (C) MulFNode(a,b) ); |
duke@435 | 1812 | d = precision_rounding(c); |
duke@435 | 1813 | push( d ); |
duke@435 | 1814 | break; |
duke@435 | 1815 | |
duke@435 | 1816 | case Bytecodes::_fdiv: |
duke@435 | 1817 | b = pop(); |
duke@435 | 1818 | a = pop(); |
kvn@4115 | 1819 | c = _gvn.transform( new (C) DivFNode(0,a,b) ); |
duke@435 | 1820 | d = precision_rounding(c); |
duke@435 | 1821 | push( d ); |
duke@435 | 1822 | break; |
duke@435 | 1823 | |
duke@435 | 1824 | case Bytecodes::_frem: |
duke@435 | 1825 | if (Matcher::has_match_rule(Op_ModF)) { |
duke@435 | 1826 | // Generate a ModF node. |
duke@435 | 1827 | b = pop(); |
duke@435 | 1828 | a = pop(); |
kvn@4115 | 1829 | c = _gvn.transform( new (C) ModFNode(0,a,b) ); |
duke@435 | 1830 | d = precision_rounding(c); |
duke@435 | 1831 | push( d ); |
duke@435 | 1832 | } |
duke@435 | 1833 | else { |
duke@435 | 1834 | // Generate a call. |
duke@435 | 1835 | modf(); |
duke@435 | 1836 | } |
duke@435 | 1837 | break; |
duke@435 | 1838 | |
duke@435 | 1839 | case Bytecodes::_fcmpl: |
duke@435 | 1840 | b = pop(); |
duke@435 | 1841 | a = pop(); |
kvn@4115 | 1842 | c = _gvn.transform( new (C) CmpF3Node( a, b)); |
duke@435 | 1843 | push(c); |
duke@435 | 1844 | break; |
duke@435 | 1845 | case Bytecodes::_fcmpg: |
duke@435 | 1846 | b = pop(); |
duke@435 | 1847 | a = pop(); |
duke@435 | 1848 | |
duke@435 | 1849 | // Same as fcmpl but need to flip the unordered case. Swap the inputs, |
duke@435 | 1850 | // which negates the result sign except for unordered. Flip the unordered |
duke@435 | 1851 | // as well by using CmpF3 which implements unordered-lesser instead of |
duke@435 | 1852 | // unordered-greater semantics. Finally, commute the result bits. Result |
duke@435 | 1853 | // is same as using a CmpF3Greater except we did it with CmpF3 alone. |
kvn@4115 | 1854 | c = _gvn.transform( new (C) CmpF3Node( b, a)); |
kvn@4115 | 1855 | c = _gvn.transform( new (C) SubINode(_gvn.intcon(0),c) ); |
duke@435 | 1856 | push(c); |
duke@435 | 1857 | break; |
duke@435 | 1858 | |
duke@435 | 1859 | case Bytecodes::_f2i: |
duke@435 | 1860 | a = pop(); |
kvn@4115 | 1861 | push(_gvn.transform(new (C) ConvF2INode(a))); |
duke@435 | 1862 | break; |
duke@435 | 1863 | |
duke@435 | 1864 | case Bytecodes::_d2i: |
duke@435 | 1865 | a = pop_pair(); |
kvn@4115 | 1866 | b = _gvn.transform(new (C) ConvD2INode(a)); |
duke@435 | 1867 | push( b ); |
duke@435 | 1868 | break; |
duke@435 | 1869 | |
duke@435 | 1870 | case Bytecodes::_f2d: |
duke@435 | 1871 | a = pop(); |
kvn@4115 | 1872 | b = _gvn.transform( new (C) ConvF2DNode(a)); |
duke@435 | 1873 | push_pair( b ); |
duke@435 | 1874 | break; |
duke@435 | 1875 | |
duke@435 | 1876 | case Bytecodes::_d2f: |
duke@435 | 1877 | a = pop_pair(); |
kvn@4115 | 1878 | b = _gvn.transform( new (C) ConvD2FNode(a)); |
duke@435 | 1879 | // This breaks _227_mtrt (speed & correctness) and _222_mpegaudio (speed) |
kvn@4115 | 1880 | //b = _gvn.transform(new (C) RoundFloatNode(0, b) ); |
duke@435 | 1881 | push( b ); |
duke@435 | 1882 | break; |
duke@435 | 1883 | |
duke@435 | 1884 | case Bytecodes::_l2f: |
duke@435 | 1885 | if (Matcher::convL2FSupported()) { |
duke@435 | 1886 | a = pop_pair(); |
kvn@4115 | 1887 | b = _gvn.transform( new (C) ConvL2FNode(a)); |
duke@435 | 1888 | // For i486.ad, FILD doesn't restrict precision to 24 or 53 bits. |
duke@435 | 1889 | // Rather than storing the result into an FP register then pushing |
duke@435 | 1890 | // out to memory to round, the machine instruction that implements |
duke@435 | 1891 | // ConvL2D is responsible for rounding. |
duke@435 | 1892 | // c = precision_rounding(b); |
duke@435 | 1893 | c = _gvn.transform(b); |
duke@435 | 1894 | push(c); |
duke@435 | 1895 | } else { |
duke@435 | 1896 | l2f(); |
duke@435 | 1897 | } |
duke@435 | 1898 | break; |
duke@435 | 1899 | |
duke@435 | 1900 | case Bytecodes::_l2d: |
duke@435 | 1901 | a = pop_pair(); |
kvn@4115 | 1902 | b = _gvn.transform( new (C) ConvL2DNode(a)); |
duke@435 | 1903 | // For i486.ad, rounding is always necessary (see _l2f above). |
duke@435 | 1904 | // c = dprecision_rounding(b); |
duke@435 | 1905 | c = _gvn.transform(b); |
duke@435 | 1906 | push_pair(c); |
duke@435 | 1907 | break; |
duke@435 | 1908 | |
duke@435 | 1909 | case Bytecodes::_f2l: |
duke@435 | 1910 | a = pop(); |
kvn@4115 | 1911 | b = _gvn.transform( new (C) ConvF2LNode(a)); |
duke@435 | 1912 | push_pair(b); |
duke@435 | 1913 | break; |
duke@435 | 1914 | |
duke@435 | 1915 | case Bytecodes::_d2l: |
duke@435 | 1916 | a = pop_pair(); |
kvn@4115 | 1917 | b = _gvn.transform( new (C) ConvD2LNode(a)); |
duke@435 | 1918 | push_pair(b); |
duke@435 | 1919 | break; |
duke@435 | 1920 | |
duke@435 | 1921 | case Bytecodes::_dsub: |
duke@435 | 1922 | b = pop_pair(); |
duke@435 | 1923 | a = pop_pair(); |
kvn@4115 | 1924 | c = _gvn.transform( new (C) SubDNode(a,b) ); |
duke@435 | 1925 | d = dprecision_rounding(c); |
duke@435 | 1926 | push_pair( d ); |
duke@435 | 1927 | break; |
duke@435 | 1928 | |
duke@435 | 1929 | case Bytecodes::_dadd: |
duke@435 | 1930 | b = pop_pair(); |
duke@435 | 1931 | a = pop_pair(); |
kvn@4115 | 1932 | c = _gvn.transform( new (C) AddDNode(a,b) ); |
duke@435 | 1933 | d = dprecision_rounding(c); |
duke@435 | 1934 | push_pair( d ); |
duke@435 | 1935 | break; |
duke@435 | 1936 | |
duke@435 | 1937 | case Bytecodes::_dmul: |
duke@435 | 1938 | b = pop_pair(); |
duke@435 | 1939 | a = pop_pair(); |
kvn@4115 | 1940 | c = _gvn.transform( new (C) MulDNode(a,b) ); |
duke@435 | 1941 | d = dprecision_rounding(c); |
duke@435 | 1942 | push_pair( d ); |
duke@435 | 1943 | break; |
duke@435 | 1944 | |
duke@435 | 1945 | case Bytecodes::_ddiv: |
duke@435 | 1946 | b = pop_pair(); |
duke@435 | 1947 | a = pop_pair(); |
kvn@4115 | 1948 | c = _gvn.transform( new (C) DivDNode(0,a,b) ); |
duke@435 | 1949 | d = dprecision_rounding(c); |
duke@435 | 1950 | push_pair( d ); |
duke@435 | 1951 | break; |
duke@435 | 1952 | |
duke@435 | 1953 | case Bytecodes::_dneg: |
duke@435 | 1954 | a = pop_pair(); |
kvn@4115 | 1955 | b = _gvn.transform(new (C) NegDNode (a)); |
duke@435 | 1956 | push_pair(b); |
duke@435 | 1957 | break; |
duke@435 | 1958 | |
duke@435 | 1959 | case Bytecodes::_drem: |
duke@435 | 1960 | if (Matcher::has_match_rule(Op_ModD)) { |
duke@435 | 1961 | // Generate a ModD node. |
duke@435 | 1962 | b = pop_pair(); |
duke@435 | 1963 | a = pop_pair(); |
duke@435 | 1964 | // a % b |
duke@435 | 1965 | |
kvn@4115 | 1966 | c = _gvn.transform( new (C) ModDNode(0,a,b) ); |
duke@435 | 1967 | d = dprecision_rounding(c); |
duke@435 | 1968 | push_pair( d ); |
duke@435 | 1969 | } |
duke@435 | 1970 | else { |
duke@435 | 1971 | // Generate a call. |
duke@435 | 1972 | modd(); |
duke@435 | 1973 | } |
duke@435 | 1974 | break; |
duke@435 | 1975 | |
duke@435 | 1976 | case Bytecodes::_dcmpl: |
duke@435 | 1977 | b = pop_pair(); |
duke@435 | 1978 | a = pop_pair(); |
kvn@4115 | 1979 | c = _gvn.transform( new (C) CmpD3Node( a, b)); |
duke@435 | 1980 | push(c); |
duke@435 | 1981 | break; |
duke@435 | 1982 | |
duke@435 | 1983 | case Bytecodes::_dcmpg: |
duke@435 | 1984 | b = pop_pair(); |
duke@435 | 1985 | a = pop_pair(); |
duke@435 | 1986 | // Same as dcmpl but need to flip the unordered case. |
duke@435 | 1987 | // Commute the inputs, which negates the result sign except for unordered. |
duke@435 | 1988 | // Flip the unordered as well by using CmpD3 which implements |
duke@435 | 1989 | // unordered-lesser instead of unordered-greater semantics. |
duke@435 | 1990 | // Finally, negate the result bits. Result is same as using a |
duke@435 | 1991 | // CmpD3Greater except we did it with CmpD3 alone. |
kvn@4115 | 1992 | c = _gvn.transform( new (C) CmpD3Node( b, a)); |
kvn@4115 | 1993 | c = _gvn.transform( new (C) SubINode(_gvn.intcon(0),c) ); |
duke@435 | 1994 | push(c); |
duke@435 | 1995 | break; |
duke@435 | 1996 | |
duke@435 | 1997 | |
duke@435 | 1998 | // Note for longs -> lo word is on TOS, hi word is on TOS - 1 |
duke@435 | 1999 | case Bytecodes::_land: |
duke@435 | 2000 | b = pop_pair(); |
duke@435 | 2001 | a = pop_pair(); |
kvn@4115 | 2002 | c = _gvn.transform( new (C) AndLNode(a,b) ); |
duke@435 | 2003 | push_pair(c); |
duke@435 | 2004 | break; |
duke@435 | 2005 | case Bytecodes::_lor: |
duke@435 | 2006 | b = pop_pair(); |
duke@435 | 2007 | a = pop_pair(); |
kvn@4115 | 2008 | c = _gvn.transform( new (C) OrLNode(a,b) ); |
duke@435 | 2009 | push_pair(c); |
duke@435 | 2010 | break; |
duke@435 | 2011 | case Bytecodes::_lxor: |
duke@435 | 2012 | b = pop_pair(); |
duke@435 | 2013 | a = pop_pair(); |
kvn@4115 | 2014 | c = _gvn.transform( new (C) XorLNode(a,b) ); |
duke@435 | 2015 | push_pair(c); |
duke@435 | 2016 | break; |
duke@435 | 2017 | |
duke@435 | 2018 | case Bytecodes::_lshl: |
duke@435 | 2019 | b = pop(); // the shift count |
duke@435 | 2020 | a = pop_pair(); // value to be shifted |
kvn@4115 | 2021 | c = _gvn.transform( new (C) LShiftLNode(a,b) ); |
duke@435 | 2022 | push_pair(c); |
duke@435 | 2023 | break; |
duke@435 | 2024 | case Bytecodes::_lshr: |
duke@435 | 2025 | b = pop(); // the shift count |
duke@435 | 2026 | a = pop_pair(); // value to be shifted |
kvn@4115 | 2027 | c = _gvn.transform( new (C) RShiftLNode(a,b) ); |
duke@435 | 2028 | push_pair(c); |
duke@435 | 2029 | break; |
duke@435 | 2030 | case Bytecodes::_lushr: |
duke@435 | 2031 | b = pop(); // the shift count |
duke@435 | 2032 | a = pop_pair(); // value to be shifted |
kvn@4115 | 2033 | c = _gvn.transform( new (C) URShiftLNode(a,b) ); |
duke@435 | 2034 | push_pair(c); |
duke@435 | 2035 | break; |
duke@435 | 2036 | case Bytecodes::_lmul: |
duke@435 | 2037 | b = pop_pair(); |
duke@435 | 2038 | a = pop_pair(); |
kvn@4115 | 2039 | c = _gvn.transform( new (C) MulLNode(a,b) ); |
duke@435 | 2040 | push_pair(c); |
duke@435 | 2041 | break; |
duke@435 | 2042 | |
duke@435 | 2043 | case Bytecodes::_lrem: |
duke@435 | 2044 | // Must keep both values on the expression-stack during null-check |
duke@435 | 2045 | assert(peek(0) == top(), "long word order"); |
twisti@4313 | 2046 | zero_check_long(peek(1)); |
duke@435 | 2047 | // Compile-time detect of null-exception? |
duke@435 | 2048 | if (stopped()) return; |
duke@435 | 2049 | b = pop_pair(); |
duke@435 | 2050 | a = pop_pair(); |
kvn@4115 | 2051 | c = _gvn.transform( new (C) ModLNode(control(),a,b) ); |
duke@435 | 2052 | push_pair(c); |
duke@435 | 2053 | break; |
duke@435 | 2054 | |
duke@435 | 2055 | case Bytecodes::_ldiv: |
duke@435 | 2056 | // Must keep both values on the expression-stack during null-check |
duke@435 | 2057 | assert(peek(0) == top(), "long word order"); |
twisti@4313 | 2058 | zero_check_long(peek(1)); |
duke@435 | 2059 | // Compile-time detect of null-exception? |
duke@435 | 2060 | if (stopped()) return; |
duke@435 | 2061 | b = pop_pair(); |
duke@435 | 2062 | a = pop_pair(); |
kvn@4115 | 2063 | c = _gvn.transform( new (C) DivLNode(control(),a,b) ); |
duke@435 | 2064 | push_pair(c); |
duke@435 | 2065 | break; |
duke@435 | 2066 | |
duke@435 | 2067 | case Bytecodes::_ladd: |
duke@435 | 2068 | b = pop_pair(); |
duke@435 | 2069 | a = pop_pair(); |
kvn@4115 | 2070 | c = _gvn.transform( new (C) AddLNode(a,b) ); |
duke@435 | 2071 | push_pair(c); |
duke@435 | 2072 | break; |
duke@435 | 2073 | case Bytecodes::_lsub: |
duke@435 | 2074 | b = pop_pair(); |
duke@435 | 2075 | a = pop_pair(); |
kvn@4115 | 2076 | c = _gvn.transform( new (C) SubLNode(a,b) ); |
duke@435 | 2077 | push_pair(c); |
duke@435 | 2078 | break; |
duke@435 | 2079 | case Bytecodes::_lcmp: |
duke@435 | 2080 | // Safepoints are now inserted _before_ branches. The long-compare |
duke@435 | 2081 | // bytecode painfully produces a 3-way value (-1,0,+1) which requires a |
duke@435 | 2082 | // slew of control flow. These are usually followed by a CmpI vs zero and |
duke@435 | 2083 | // a branch; this pattern then optimizes to the obvious long-compare and |
duke@435 | 2084 | // branch. However, if the branch is backwards there's a Safepoint |
duke@435 | 2085 | // inserted. The inserted Safepoint captures the JVM state at the |
duke@435 | 2086 | // pre-branch point, i.e. it captures the 3-way value. Thus if a |
duke@435 | 2087 | // long-compare is used to control a loop the debug info will force |
duke@435 | 2088 | // computation of the 3-way value, even though the generated code uses a |
duke@435 | 2089 | // long-compare and branch. We try to rectify the situation by inserting |
duke@435 | 2090 | // a SafePoint here and have it dominate and kill the safepoint added at a |
duke@435 | 2091 | // following backwards branch. At this point the JVM state merely holds 2 |
duke@435 | 2092 | // longs but not the 3-way value. |
duke@435 | 2093 | if( UseLoopSafepoints ) { |
duke@435 | 2094 | switch( iter().next_bc() ) { |
duke@435 | 2095 | case Bytecodes::_ifgt: |
duke@435 | 2096 | case Bytecodes::_iflt: |
duke@435 | 2097 | case Bytecodes::_ifge: |
duke@435 | 2098 | case Bytecodes::_ifle: |
duke@435 | 2099 | case Bytecodes::_ifne: |
duke@435 | 2100 | case Bytecodes::_ifeq: |
duke@435 | 2101 | // If this is a backwards branch in the bytecodes, add Safepoint |
duke@435 | 2102 | maybe_add_safepoint(iter().next_get_dest()); |
duke@435 | 2103 | } |
duke@435 | 2104 | } |
duke@435 | 2105 | b = pop_pair(); |
duke@435 | 2106 | a = pop_pair(); |
kvn@4115 | 2107 | c = _gvn.transform( new (C) CmpL3Node( a, b )); |
duke@435 | 2108 | push(c); |
duke@435 | 2109 | break; |
duke@435 | 2110 | |
duke@435 | 2111 | case Bytecodes::_lneg: |
duke@435 | 2112 | a = pop_pair(); |
kvn@4115 | 2113 | b = _gvn.transform( new (C) SubLNode(longcon(0),a)); |
duke@435 | 2114 | push_pair(b); |
duke@435 | 2115 | break; |
duke@435 | 2116 | case Bytecodes::_l2i: |
duke@435 | 2117 | a = pop_pair(); |
kvn@4115 | 2118 | push( _gvn.transform( new (C) ConvL2INode(a))); |
duke@435 | 2119 | break; |
duke@435 | 2120 | case Bytecodes::_i2l: |
duke@435 | 2121 | a = pop(); |
kvn@4115 | 2122 | b = _gvn.transform( new (C) ConvI2LNode(a)); |
duke@435 | 2123 | push_pair(b); |
duke@435 | 2124 | break; |
duke@435 | 2125 | case Bytecodes::_i2b: |
duke@435 | 2126 | // Sign extend |
duke@435 | 2127 | a = pop(); |
kvn@4115 | 2128 | a = _gvn.transform( new (C) LShiftINode(a,_gvn.intcon(24)) ); |
kvn@4115 | 2129 | a = _gvn.transform( new (C) RShiftINode(a,_gvn.intcon(24)) ); |
duke@435 | 2130 | push( a ); |
duke@435 | 2131 | break; |
duke@435 | 2132 | case Bytecodes::_i2s: |
duke@435 | 2133 | a = pop(); |
kvn@4115 | 2134 | a = _gvn.transform( new (C) LShiftINode(a,_gvn.intcon(16)) ); |
kvn@4115 | 2135 | a = _gvn.transform( new (C) RShiftINode(a,_gvn.intcon(16)) ); |
duke@435 | 2136 | push( a ); |
duke@435 | 2137 | break; |
duke@435 | 2138 | case Bytecodes::_i2c: |
duke@435 | 2139 | a = pop(); |
kvn@4115 | 2140 | push( _gvn.transform( new (C) AndINode(a,_gvn.intcon(0xFFFF)) ) ); |
duke@435 | 2141 | break; |
duke@435 | 2142 | |
duke@435 | 2143 | case Bytecodes::_i2f: |
duke@435 | 2144 | a = pop(); |
kvn@4115 | 2145 | b = _gvn.transform( new (C) ConvI2FNode(a) ) ; |
duke@435 | 2146 | c = precision_rounding(b); |
duke@435 | 2147 | push (b); |
duke@435 | 2148 | break; |
duke@435 | 2149 | |
duke@435 | 2150 | case Bytecodes::_i2d: |
duke@435 | 2151 | a = pop(); |
kvn@4115 | 2152 | b = _gvn.transform( new (C) ConvI2DNode(a)); |
duke@435 | 2153 | push_pair(b); |
duke@435 | 2154 | break; |
duke@435 | 2155 | |
duke@435 | 2156 | case Bytecodes::_iinc: // Increment local |
duke@435 | 2157 | i = iter().get_index(); // Get local index |
kvn@4115 | 2158 | set_local( i, _gvn.transform( new (C) AddINode( _gvn.intcon(iter().get_iinc_con()), local(i) ) ) ); |
duke@435 | 2159 | break; |
duke@435 | 2160 | |
duke@435 | 2161 | // Exit points of synchronized methods must have an unlock node |
duke@435 | 2162 | case Bytecodes::_return: |
duke@435 | 2163 | return_current(NULL); |
duke@435 | 2164 | break; |
duke@435 | 2165 | |
duke@435 | 2166 | case Bytecodes::_ireturn: |
duke@435 | 2167 | case Bytecodes::_areturn: |
duke@435 | 2168 | case Bytecodes::_freturn: |
duke@435 | 2169 | return_current(pop()); |
duke@435 | 2170 | break; |
duke@435 | 2171 | case Bytecodes::_lreturn: |
duke@435 | 2172 | return_current(pop_pair()); |
duke@435 | 2173 | break; |
duke@435 | 2174 | case Bytecodes::_dreturn: |
duke@435 | 2175 | return_current(pop_pair()); |
duke@435 | 2176 | break; |
duke@435 | 2177 | |
duke@435 | 2178 | case Bytecodes::_athrow: |
duke@435 | 2179 | // null exception oop throws NULL pointer exception |
twisti@4313 | 2180 | null_check(peek()); |
duke@435 | 2181 | if (stopped()) return; |
duke@435 | 2182 | // Hook the thrown exception directly to subsequent handlers. |
duke@435 | 2183 | if (BailoutToInterpreterForThrows) { |
duke@435 | 2184 | // Keep method interpreted from now on. |
duke@435 | 2185 | uncommon_trap(Deoptimization::Reason_unhandled, |
duke@435 | 2186 | Deoptimization::Action_make_not_compilable); |
duke@435 | 2187 | return; |
duke@435 | 2188 | } |
dcubed@1648 | 2189 | if (env()->jvmti_can_post_on_exceptions()) { |
dcubed@1648 | 2190 | // check if we must post exception events, take uncommon trap if so (with must_throw = false) |
dcubed@1648 | 2191 | uncommon_trap_if_should_post_on_exceptions(Deoptimization::Reason_unhandled, false); |
dcubed@1648 | 2192 | } |
dcubed@1648 | 2193 | // Here if either can_post_on_exceptions or should_post_on_exceptions is false |
duke@435 | 2194 | add_exception_state(make_exception_state(peek())); |
duke@435 | 2195 | break; |
duke@435 | 2196 | |
duke@435 | 2197 | case Bytecodes::_goto: // fall through |
duke@435 | 2198 | case Bytecodes::_goto_w: { |
duke@435 | 2199 | int target_bci = (bc() == Bytecodes::_goto) ? iter().get_dest() : iter().get_far_dest(); |
duke@435 | 2200 | |
duke@435 | 2201 | // If this is a backwards branch in the bytecodes, add Safepoint |
duke@435 | 2202 | maybe_add_safepoint(target_bci); |
duke@435 | 2203 | |
duke@435 | 2204 | // Update method data |
duke@435 | 2205 | profile_taken_branch(target_bci); |
duke@435 | 2206 | |
duke@435 | 2207 | // Merge the current control into the target basic block |
duke@435 | 2208 | merge(target_bci); |
duke@435 | 2209 | |
duke@435 | 2210 | // See if we can get some profile data and hand it off to the next block |
duke@435 | 2211 | Block *target_block = block()->successor_for_bci(target_bci); |
duke@435 | 2212 | if (target_block->pred_count() != 1) break; |
duke@435 | 2213 | ciMethodData* methodData = method()->method_data(); |
duke@435 | 2214 | if (!methodData->is_mature()) break; |
duke@435 | 2215 | ciProfileData* data = methodData->bci_to_data(bci()); |
duke@435 | 2216 | assert( data->is_JumpData(), "" ); |
duke@435 | 2217 | int taken = ((ciJumpData*)data)->taken(); |
duke@435 | 2218 | taken = method()->scale_count(taken); |
duke@435 | 2219 | target_block->set_count(taken); |
duke@435 | 2220 | break; |
duke@435 | 2221 | } |
duke@435 | 2222 | |
rasbold@683 | 2223 | case Bytecodes::_ifnull: btest = BoolTest::eq; goto handle_if_null; |
rasbold@683 | 2224 | case Bytecodes::_ifnonnull: btest = BoolTest::ne; goto handle_if_null; |
rasbold@683 | 2225 | handle_if_null: |
rasbold@689 | 2226 | // If this is a backwards branch in the bytecodes, add Safepoint |
rasbold@689 | 2227 | maybe_add_safepoint(iter().get_dest()); |
rasbold@683 | 2228 | a = null(); |
rasbold@683 | 2229 | b = pop(); |
kvn@4115 | 2230 | c = _gvn.transform( new (C) CmpPNode(b, a) ); |
rasbold@683 | 2231 | do_ifnull(btest, c); |
duke@435 | 2232 | break; |
duke@435 | 2233 | |
duke@435 | 2234 | case Bytecodes::_if_acmpeq: btest = BoolTest::eq; goto handle_if_acmp; |
duke@435 | 2235 | case Bytecodes::_if_acmpne: btest = BoolTest::ne; goto handle_if_acmp; |
duke@435 | 2236 | handle_if_acmp: |
rasbold@689 | 2237 | // If this is a backwards branch in the bytecodes, add Safepoint |
rasbold@689 | 2238 | maybe_add_safepoint(iter().get_dest()); |
duke@435 | 2239 | a = pop(); |
duke@435 | 2240 | b = pop(); |
kvn@4115 | 2241 | c = _gvn.transform( new (C) CmpPNode(b, a) ); |
duke@435 | 2242 | do_if(btest, c); |
duke@435 | 2243 | break; |
duke@435 | 2244 | |
duke@435 | 2245 | case Bytecodes::_ifeq: btest = BoolTest::eq; goto handle_ifxx; |
duke@435 | 2246 | case Bytecodes::_ifne: btest = BoolTest::ne; goto handle_ifxx; |
duke@435 | 2247 | case Bytecodes::_iflt: btest = BoolTest::lt; goto handle_ifxx; |
duke@435 | 2248 | case Bytecodes::_ifle: btest = BoolTest::le; goto handle_ifxx; |
duke@435 | 2249 | case Bytecodes::_ifgt: btest = BoolTest::gt; goto handle_ifxx; |
duke@435 | 2250 | case Bytecodes::_ifge: btest = BoolTest::ge; goto handle_ifxx; |
duke@435 | 2251 | handle_ifxx: |
rasbold@689 | 2252 | // If this is a backwards branch in the bytecodes, add Safepoint |
rasbold@689 | 2253 | maybe_add_safepoint(iter().get_dest()); |
duke@435 | 2254 | a = _gvn.intcon(0); |
duke@435 | 2255 | b = pop(); |
kvn@4115 | 2256 | c = _gvn.transform( new (C) CmpINode(b, a) ); |
duke@435 | 2257 | do_if(btest, c); |
duke@435 | 2258 | break; |
duke@435 | 2259 | |
duke@435 | 2260 | case Bytecodes::_if_icmpeq: btest = BoolTest::eq; goto handle_if_icmp; |
duke@435 | 2261 | case Bytecodes::_if_icmpne: btest = BoolTest::ne; goto handle_if_icmp; |
duke@435 | 2262 | case Bytecodes::_if_icmplt: btest = BoolTest::lt; goto handle_if_icmp; |
duke@435 | 2263 | case Bytecodes::_if_icmple: btest = BoolTest::le; goto handle_if_icmp; |
duke@435 | 2264 | case Bytecodes::_if_icmpgt: btest = BoolTest::gt; goto handle_if_icmp; |
duke@435 | 2265 | case Bytecodes::_if_icmpge: btest = BoolTest::ge; goto handle_if_icmp; |
duke@435 | 2266 | handle_if_icmp: |
rasbold@689 | 2267 | // If this is a backwards branch in the bytecodes, add Safepoint |
rasbold@689 | 2268 | maybe_add_safepoint(iter().get_dest()); |
duke@435 | 2269 | a = pop(); |
duke@435 | 2270 | b = pop(); |
kvn@4115 | 2271 | c = _gvn.transform( new (C) CmpINode( b, a ) ); |
duke@435 | 2272 | do_if(btest, c); |
duke@435 | 2273 | break; |
duke@435 | 2274 | |
duke@435 | 2275 | case Bytecodes::_tableswitch: |
duke@435 | 2276 | do_tableswitch(); |
duke@435 | 2277 | break; |
duke@435 | 2278 | |
duke@435 | 2279 | case Bytecodes::_lookupswitch: |
duke@435 | 2280 | do_lookupswitch(); |
duke@435 | 2281 | break; |
duke@435 | 2282 | |
duke@435 | 2283 | case Bytecodes::_invokestatic: |
jrose@1161 | 2284 | case Bytecodes::_invokedynamic: |
duke@435 | 2285 | case Bytecodes::_invokespecial: |
duke@435 | 2286 | case Bytecodes::_invokevirtual: |
duke@435 | 2287 | case Bytecodes::_invokeinterface: |
duke@435 | 2288 | do_call(); |
duke@435 | 2289 | break; |
duke@435 | 2290 | case Bytecodes::_checkcast: |
duke@435 | 2291 | do_checkcast(); |
duke@435 | 2292 | break; |
duke@435 | 2293 | case Bytecodes::_instanceof: |
duke@435 | 2294 | do_instanceof(); |
duke@435 | 2295 | break; |
duke@435 | 2296 | case Bytecodes::_anewarray: |
duke@435 | 2297 | do_anewarray(); |
duke@435 | 2298 | break; |
duke@435 | 2299 | case Bytecodes::_newarray: |
duke@435 | 2300 | do_newarray((BasicType)iter().get_index()); |
duke@435 | 2301 | break; |
duke@435 | 2302 | case Bytecodes::_multianewarray: |
duke@435 | 2303 | do_multianewarray(); |
duke@435 | 2304 | break; |
duke@435 | 2305 | case Bytecodes::_new: |
duke@435 | 2306 | do_new(); |
duke@435 | 2307 | break; |
duke@435 | 2308 | |
duke@435 | 2309 | case Bytecodes::_jsr: |
duke@435 | 2310 | case Bytecodes::_jsr_w: |
duke@435 | 2311 | do_jsr(); |
duke@435 | 2312 | break; |
duke@435 | 2313 | |
duke@435 | 2314 | case Bytecodes::_ret: |
duke@435 | 2315 | do_ret(); |
duke@435 | 2316 | break; |
duke@435 | 2317 | |
duke@435 | 2318 | |
duke@435 | 2319 | case Bytecodes::_monitorenter: |
duke@435 | 2320 | do_monitor_enter(); |
duke@435 | 2321 | break; |
duke@435 | 2322 | |
duke@435 | 2323 | case Bytecodes::_monitorexit: |
duke@435 | 2324 | do_monitor_exit(); |
duke@435 | 2325 | break; |
duke@435 | 2326 | |
duke@435 | 2327 | case Bytecodes::_breakpoint: |
duke@435 | 2328 | // Breakpoint set concurrently to compile |
duke@435 | 2329 | // %%% use an uncommon trap? |
duke@435 | 2330 | C->record_failure("breakpoint in method"); |
duke@435 | 2331 | return; |
duke@435 | 2332 | |
duke@435 | 2333 | default: |
duke@435 | 2334 | #ifndef PRODUCT |
duke@435 | 2335 | map()->dump(99); |
duke@435 | 2336 | #endif |
duke@435 | 2337 | tty->print("\nUnhandled bytecode %s\n", Bytecodes::name(bc()) ); |
duke@435 | 2338 | ShouldNotReachHere(); |
duke@435 | 2339 | } |
duke@435 | 2340 | |
duke@435 | 2341 | #ifndef PRODUCT |
duke@435 | 2342 | IdealGraphPrinter *printer = IdealGraphPrinter::printer(); |
duke@435 | 2343 | if(printer) { |
duke@435 | 2344 | char buffer[256]; |
duke@435 | 2345 | sprintf(buffer, "Bytecode %d: %s", bci(), Bytecodes::name(bc())); |
duke@435 | 2346 | bool old = printer->traverse_outs(); |
duke@435 | 2347 | printer->set_traverse_outs(true); |
never@657 | 2348 | printer->print_method(C, buffer, 4); |
duke@435 | 2349 | printer->set_traverse_outs(old); |
duke@435 | 2350 | } |
duke@435 | 2351 | #endif |
duke@435 | 2352 | } |