src/share/vm/opto/parse1.cpp

Thu, 24 May 2018 19:26:50 +0800

author
aoqi
date
Thu, 24 May 2018 19:26:50 +0800
changeset 8862
fd13a567f179
parent 8856
ac27a9c85bea
permissions
-rw-r--r--

#7046 C2 supports long branch
Contributed-by: fujie

aoqi@0 1 /*
kevinw@8368 2 * Copyright (c) 1997, 2016, Oracle and/or its affiliates. All rights reserved.
aoqi@0 3 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
aoqi@0 4 *
aoqi@0 5 * This code is free software; you can redistribute it and/or modify it
aoqi@0 6 * under the terms of the GNU General Public License version 2 only, as
aoqi@0 7 * published by the Free Software Foundation.
aoqi@0 8 *
aoqi@0 9 * This code is distributed in the hope that it will be useful, but WITHOUT
aoqi@0 10 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
aoqi@0 11 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
aoqi@0 12 * version 2 for more details (a copy is included in the LICENSE file that
aoqi@0 13 * accompanied this code).
aoqi@0 14 *
aoqi@0 15 * You should have received a copy of the GNU General Public License version
aoqi@0 16 * 2 along with this work; if not, write to the Free Software Foundation,
aoqi@0 17 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
aoqi@0 18 *
aoqi@0 19 * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
aoqi@0 20 * or visit www.oracle.com if you need additional information or have any
aoqi@0 21 * questions.
aoqi@0 22 *
aoqi@0 23 */
aoqi@0 24
aoqi@0 25 #include "precompiled.hpp"
aoqi@0 26 #include "compiler/compileLog.hpp"
aoqi@0 27 #include "interpreter/linkResolver.hpp"
aoqi@0 28 #include "oops/method.hpp"
aoqi@0 29 #include "opto/addnode.hpp"
shshahma@8421 30 #include "opto/c2compiler.hpp"
aoqi@0 31 #include "opto/idealGraphPrinter.hpp"
aoqi@0 32 #include "opto/locknode.hpp"
aoqi@0 33 #include "opto/memnode.hpp"
aoqi@0 34 #include "opto/parse.hpp"
aoqi@0 35 #include "opto/rootnode.hpp"
aoqi@0 36 #include "opto/runtime.hpp"
aoqi@0 37 #include "runtime/arguments.hpp"
aoqi@0 38 #include "runtime/handles.inline.hpp"
aoqi@0 39 #include "runtime/sharedRuntime.hpp"
aoqi@0 40 #include "utilities/copy.hpp"
aoqi@0 41
// Parser statistics counters.
// These are deliberately non-static globals: some of them are needed in
// bytecodeInfo.cpp. Eventually they should be encapsulated in a proper
// class (gri 8/18/98).

// Totals reported by Parse::print_statistics().
int nodes_created  = 0;
int methods_parsed = 0;
int methods_seen   = 0;
int blocks_parsed  = 0;
int blocks_seen    = 0;

// Null-check bookkeeping, also reported by Parse::print_statistics().
int explicit_null_checks_inserted = 0;
int explicit_null_checks_elided   = 0;
int all_null_checks_found         = 0;
int implicit_null_checks          = 0;
int implicit_null_throws          = 0;

// Reclaim counters (not referenced in this part of the file).
int reclaim_idx  = 0;
int reclaim_in   = 0;
int reclaim_node = 0;
aoqi@0 60
aoqi@0 61 #ifndef PRODUCT
aoqi@0 62 bool Parse::BytecodeParseHistogram::_initialized = false;
aoqi@0 63 uint Parse::BytecodeParseHistogram::_bytecodes_parsed [Bytecodes::number_of_codes];
aoqi@0 64 uint Parse::BytecodeParseHistogram::_nodes_constructed[Bytecodes::number_of_codes];
aoqi@0 65 uint Parse::BytecodeParseHistogram::_nodes_transformed[Bytecodes::number_of_codes];
aoqi@0 66 uint Parse::BytecodeParseHistogram::_new_values [Bytecodes::number_of_codes];
aoqi@0 67 #endif
aoqi@0 68
aoqi@0 69 //------------------------------print_statistics-------------------------------
aoqi@0 70 #ifndef PRODUCT
aoqi@0 71 void Parse::print_statistics() {
aoqi@0 72 tty->print_cr("--- Compiler Statistics ---");
aoqi@0 73 tty->print("Methods seen: %d Methods parsed: %d", methods_seen, methods_parsed);
aoqi@0 74 tty->print(" Nodes created: %d", nodes_created);
aoqi@0 75 tty->cr();
aoqi@0 76 if (methods_seen != methods_parsed)
aoqi@0 77 tty->print_cr("Reasons for parse failures (NOT cumulative):");
aoqi@0 78 tty->print_cr("Blocks parsed: %d Blocks seen: %d", blocks_parsed, blocks_seen);
aoqi@0 79
aoqi@0 80 if( explicit_null_checks_inserted )
aoqi@0 81 tty->print_cr("%d original NULL checks - %d elided (%2d%%); optimizer leaves %d,", explicit_null_checks_inserted, explicit_null_checks_elided, (100*explicit_null_checks_elided)/explicit_null_checks_inserted, all_null_checks_found);
aoqi@0 82 if( all_null_checks_found )
aoqi@0 83 tty->print_cr("%d made implicit (%2d%%)", implicit_null_checks,
aoqi@0 84 (100*implicit_null_checks)/all_null_checks_found);
aoqi@0 85 if( implicit_null_throws )
aoqi@0 86 tty->print_cr("%d implicit null exceptions at runtime",
aoqi@0 87 implicit_null_throws);
aoqi@0 88
aoqi@0 89 if( PrintParseStatistics && BytecodeParseHistogram::initialized() ) {
aoqi@0 90 BytecodeParseHistogram::print();
aoqi@0 91 }
aoqi@0 92 }
aoqi@0 93 #endif
aoqi@0 94
aoqi@0 95 //------------------------------ON STACK REPLACEMENT---------------------------
aoqi@0 96
aoqi@0 97 // Construct a node which can be used to get incoming state for
aoqi@0 98 // on stack replacement.
aoqi@0 99 Node *Parse::fetch_interpreter_state(int index,
aoqi@0 100 BasicType bt,
aoqi@0 101 Node *local_addrs,
aoqi@0 102 Node *local_addrs_base) {
aoqi@0 103 Node *mem = memory(Compile::AliasIdxRaw);
aoqi@0 104 Node *adr = basic_plus_adr( local_addrs_base, local_addrs, -index*wordSize );
aoqi@0 105 Node *ctl = control();
aoqi@0 106
aoqi@0 107 // Very similar to LoadNode::make, except we handle un-aligned longs and
aoqi@0 108 // doubles on Sparc. Intel can handle them just fine directly.
csahu@8316 109 Node *l = NULL;
aoqi@0 110 switch (bt) { // Signature is flattened
aoqi@0 111 case T_INT: l = new (C) LoadINode(ctl, mem, adr, TypeRawPtr::BOTTOM, TypeInt::INT, MemNode::unordered); break;
aoqi@0 112 case T_FLOAT: l = new (C) LoadFNode(ctl, mem, adr, TypeRawPtr::BOTTOM, Type::FLOAT, MemNode::unordered); break;
aoqi@0 113 case T_ADDRESS: l = new (C) LoadPNode(ctl, mem, adr, TypeRawPtr::BOTTOM, TypeRawPtr::BOTTOM, MemNode::unordered); break;
aoqi@0 114 case T_OBJECT: l = new (C) LoadPNode(ctl, mem, adr, TypeRawPtr::BOTTOM, TypeInstPtr::BOTTOM, MemNode::unordered); break;
aoqi@0 115 case T_LONG:
aoqi@0 116 case T_DOUBLE: {
aoqi@0 117 // Since arguments are in reverse order, the argument address 'adr'
aoqi@0 118 // refers to the back half of the long/double. Recompute adr.
aoqi@0 119 adr = basic_plus_adr(local_addrs_base, local_addrs, -(index+1)*wordSize);
aoqi@0 120 if (Matcher::misaligned_doubles_ok) {
aoqi@0 121 l = (bt == T_DOUBLE)
aoqi@0 122 ? (Node*)new (C) LoadDNode(ctl, mem, adr, TypeRawPtr::BOTTOM, Type::DOUBLE, MemNode::unordered)
aoqi@0 123 : (Node*)new (C) LoadLNode(ctl, mem, adr, TypeRawPtr::BOTTOM, TypeLong::LONG, MemNode::unordered);
aoqi@0 124 } else {
aoqi@0 125 l = (bt == T_DOUBLE)
aoqi@0 126 ? (Node*)new (C) LoadD_unalignedNode(ctl, mem, adr, TypeRawPtr::BOTTOM, MemNode::unordered)
aoqi@0 127 : (Node*)new (C) LoadL_unalignedNode(ctl, mem, adr, TypeRawPtr::BOTTOM, MemNode::unordered);
aoqi@0 128 }
aoqi@0 129 break;
aoqi@0 130 }
aoqi@0 131 default: ShouldNotReachHere();
aoqi@0 132 }
aoqi@0 133 return _gvn.transform(l);
aoqi@0 134 }
aoqi@0 135
aoqi@0 136 // Helper routine to prevent the interpreter from handing
aoqi@0 137 // unexpected typestate to an OSR method.
aoqi@0 138 // The Node l is a value newly dug out of the interpreter frame.
aoqi@0 139 // The type is the type predicted by ciTypeFlow. Note that it is
aoqi@0 140 // not a general type, but can only come from Type::get_typeflow_type.
aoqi@0 141 // The safepoint is a map which will feed an uncommon trap.
aoqi@0 142 Node* Parse::check_interpreter_type(Node* l, const Type* type,
aoqi@0 143 SafePointNode* &bad_type_exit) {
aoqi@0 144
aoqi@0 145 const TypeOopPtr* tp = type->isa_oopptr();
aoqi@0 146
aoqi@0 147 // TypeFlow may assert null-ness if a type appears unloaded.
aoqi@0 148 if (type == TypePtr::NULL_PTR ||
aoqi@0 149 (tp != NULL && !tp->klass()->is_loaded())) {
aoqi@0 150 // Value must be null, not a real oop.
aoqi@0 151 Node* chk = _gvn.transform( new (C) CmpPNode(l, null()) );
aoqi@0 152 Node* tst = _gvn.transform( new (C) BoolNode(chk, BoolTest::eq) );
aoqi@0 153 IfNode* iff = create_and_map_if(control(), tst, PROB_MAX, COUNT_UNKNOWN);
aoqi@0 154 set_control(_gvn.transform( new (C) IfTrueNode(iff) ));
aoqi@0 155 Node* bad_type = _gvn.transform( new (C) IfFalseNode(iff) );
aoqi@0 156 bad_type_exit->control()->add_req(bad_type);
aoqi@0 157 l = null();
aoqi@0 158 }
aoqi@0 159
aoqi@0 160 // Typeflow can also cut off paths from the CFG, based on
aoqi@0 161 // types which appear unloaded, or call sites which appear unlinked.
aoqi@0 162 // When paths are cut off, values at later merge points can rise
aoqi@0 163 // toward more specific classes. Make sure these specific classes
aoqi@0 164 // are still in effect.
aoqi@0 165 if (tp != NULL && tp->klass() != C->env()->Object_klass()) {
aoqi@0 166 // TypeFlow asserted a specific object type. Value must have that type.
aoqi@0 167 Node* bad_type_ctrl = NULL;
aoqi@0 168 l = gen_checkcast(l, makecon(TypeKlassPtr::make(tp->klass())), &bad_type_ctrl);
aoqi@0 169 bad_type_exit->control()->add_req(bad_type_ctrl);
aoqi@0 170 }
aoqi@0 171
aoqi@0 172 BasicType bt_l = _gvn.type(l)->basic_type();
aoqi@0 173 BasicType bt_t = type->basic_type();
aoqi@0 174 assert(_gvn.type(l)->higher_equal(type), "must constrain OSR typestate");
aoqi@0 175 return l;
aoqi@0 176 }
aoqi@0 177
aoqi@0 178 // Helper routine which sets up elements of the initial parser map when
aoqi@0 179 // performing a parse for on stack replacement. Add values into map.
aoqi@0 180 // The only parameter contains the address of the interpreter arguments.
//
// Steps, in order:
//  1. Sanity-check that the JVMS layout matches the method and the map.
//  2. Position the parser at the OSR block; bail out (method recorded as not
//     compilable) if the entry stack is non-empty or the block traps at its
//     first bci.
//  3. Rebuild one BoxLock/FastLock pair per monitor held at the OSR block.
//  4. Load every live local from the OSR buffer into the map.
//  5. Emit the leaf runtime call to SharedRuntime::OSR_migration_end.
//  6. Type-check the loaded values against the ciTypeFlow types; failing
//     checks are collected in a region that feeds an uncommon trap.
aoqi@0 181 void Parse::load_interpreter_state(Node* osr_buf) {
aoqi@0 182 int index;
aoqi@0 183 int max_locals = jvms()->loc_size();
aoqi@0 184 int max_stack = jvms()->stk_size();
aoqi@0 185
aoqi@0 186
aoqi@0 187 // Mismatch between method and jvms can occur since map briefly held
aoqi@0 188 // an OSR entry state (which takes up one RawPtr word).
aoqi@0 189 assert(max_locals == method()->max_locals(), "sanity");
aoqi@0 190 assert(max_stack >= method()->max_stack(), "sanity");
aoqi@0 191 assert((int)jvms()->endoff() == TypeFunc::Parms + max_locals + max_stack, "sanity");
aoqi@0 192 assert((int)jvms()->endoff() == (int)map()->req(), "sanity");
aoqi@0 193
aoqi@0 194 // Find the start block.
aoqi@0 195 Block* osr_block = start_block();
aoqi@0 196 assert(osr_block->start() == osr_bci(), "sanity");
aoqi@0 197
aoqi@0 198 // Set initial BCI.
aoqi@0 199 set_parse_bci(osr_block->start());
aoqi@0 200
aoqi@0 201 // Set initial stack depth.
aoqi@0 202 set_sp(osr_block->start_sp());
aoqi@0 203
aoqi@0 204 // Check bailouts. We currently do not perform on stack replacement
aoqi@0 205 // of loops in catch blocks or loops which branch with a non-empty stack.
aoqi@0 206 if (sp() != 0) {
aoqi@0 207 C->record_method_not_compilable("OSR starts with non-empty stack");
aoqi@0 208 return;
aoqi@0 209 }
aoqi@0 210 // Do not OSR inside finally clauses:
aoqi@0 211 if (osr_block->has_trap_at(osr_block->start())) {
aoqi@0 212 C->record_method_not_compilable("OSR starts with an immediate trap");
aoqi@0 213 return;
aoqi@0 214 }
aoqi@0 215
aoqi@0 216 // Commute monitors from interpreter frame to compiler frame.
aoqi@0 217 assert(jvms()->monitor_depth() == 0, "should be no active locks at beginning of osr");
aoqi@0 218 int mcnt = osr_block->flow()->monitor_count();
// Monitor slots are addressed downward from this address: slot k is read at
// monitors_addr - k*wordSize (see fetch_interpreter_state).
aoqi@0 219 Node *monitors_addr = basic_plus_adr(osr_buf, osr_buf, (max_locals+mcnt*2-1)*wordSize);
aoqi@0 220 for (index = 0; index < mcnt; index++) {
aoqi@0 221 // Make a BoxLockNode for the monitor.
aoqi@0 222 Node *box = _gvn.transform(new (C) BoxLockNode(next_monitor()));
aoqi@0 223
aoqi@0 224
aoqi@0 225 // Displaced headers and locked objects are interleaved in the
aoqi@0 226 // temp OSR buffer. We only copy the locked objects out here.
aoqi@0 227 // Fetch the locked object from the OSR temp buffer and copy to our fastlock node.
// Slot index*2 is read as the locked object, slot index*2+1 as the displaced header.
aoqi@0 228 Node *lock_object = fetch_interpreter_state(index*2, T_OBJECT, monitors_addr, osr_buf);
aoqi@0 229 // Try and copy the displaced header to the BoxNode
aoqi@0 230 Node *displaced_hdr = fetch_interpreter_state((index*2) + 1, T_ADDRESS, monitors_addr, osr_buf);
aoqi@0 231
aoqi@0 232
aoqi@0 233 store_to_memory(control(), box, displaced_hdr, T_ADDRESS, Compile::AliasIdxRaw, MemNode::unordered);
aoqi@0 234
aoqi@0 235 // Build a bogus FastLockNode (no code will be generated) and push the
aoqi@0 236 // monitor into our debug info.
aoqi@0 237 const FastLockNode *flock = _gvn.transform(new (C) FastLockNode( 0, lock_object, box ))->as_FastLock();
aoqi@0 238 map()->push_monitor(flock);
aoqi@0 239
aoqi@0 240 // If the lock is our method synchronization lock, tuck it away in
aoqi@0 241 // _synch_lock for return and rethrow exit paths.
aoqi@0 242 if (index == 0 && method()->is_synchronized()) {
aoqi@0 243 _synch_lock = flock;
aoqi@0 244 }
aoqi@0 245 }
aoqi@0 246
aoqi@0 247 // Use the raw liveness computation to make sure that unexpected
aoqi@0 248 // values don't propagate into the OSR frame.
aoqi@0 249 MethodLivenessResult live_locals = method()->liveness_at_bci(osr_bci());
aoqi@0 250 if (!live_locals.is_valid()) {
aoqi@0 251 // Degenerate or breakpointed method.
aoqi@0 252 C->record_method_not_compilable("OSR in empty or breakpointed method");
aoqi@0 253 return;
aoqi@0 254 }
aoqi@0 255
aoqi@0 256 // Extract the needed locals from the interpreter frame.
// Local i is read at locals_addr - i*wordSize (see fetch_interpreter_state).
aoqi@0 257 Node *locals_addr = basic_plus_adr(osr_buf, osr_buf, (max_locals-1)*wordSize);
aoqi@0 258
aoqi@0 259 // find all the locals that the interpreter thinks contain live oops
aoqi@0 260 const BitMap live_oops = method()->live_local_oops_at_bci(osr_bci());
aoqi@0 261 for (index = 0; index < max_locals; index++) {
aoqi@0 262
aoqi@0 263 if (!live_locals.at(index)) {
aoqi@0 264 continue;
aoqi@0 265 }
aoqi@0 266
aoqi@0 267 const Type *type = osr_block->local_type_at(index);
aoqi@0 268
aoqi@0 269 if (type->isa_oopptr() != NULL) {
aoqi@0 270
aoqi@0 271 // 6403625: Verify that the interpreter oopMap thinks that the oop is live
aoqi@0 272 // else we might load a stale oop if the MethodLiveness disagrees with the
aoqi@0 273 // result of the interpreter. If the interpreter says it is dead we agree
aoqi@0 274 // by making the value go to top.
aoqi@0 275 //
// NOTE(review): the comment above says "top", but the code below stores
// null() into the local -- confirm which is intended.
aoqi@0 276
aoqi@0 277 if (!live_oops.at(index)) {
aoqi@0 278 if (C->log() != NULL) {
aoqi@0 279 C->log()->elem("OSR_mismatch local_index='%d'",index);
aoqi@0 280 }
aoqi@0 281 set_local(index, null());
aoqi@0 282 // and ignore it for the loads
aoqi@0 283 continue;
aoqi@0 284 }
aoqi@0 285 }
aoqi@0 286
aoqi@0 287 // Filter out TOP, HALF, and BOTTOM. (Cf. ensure_phi.)
aoqi@0 288 if (type == Type::TOP || type == Type::HALF) {
aoqi@0 289 continue;
aoqi@0 290 }
aoqi@0 291 // If the type falls to bottom, then this must be a local that
aoqi@0 292 // is mixing ints and oops or some such. Forcing it to top
aoqi@0 293 // makes it go dead.
aoqi@0 294 if (type == Type::BOTTOM) {
aoqi@0 295 continue;
aoqi@0 296 }
aoqi@0 297 // Construct code to access the appropriate local.
aoqi@0 298 BasicType bt = type->basic_type();
aoqi@0 299 if (type == TypePtr::NULL_PTR) {
aoqi@0 300 // Ptr types are mixed together with T_ADDRESS but NULL is
aoqi@0 301 // really for T_OBJECT types so correct it.
aoqi@0 302 bt = T_OBJECT;
aoqi@0 303 }
aoqi@0 304 Node *value = fetch_interpreter_state(index, bt, locals_addr, osr_buf);
aoqi@0 305 set_local(index, value);
aoqi@0 306 }
aoqi@0 307
aoqi@0 308 // Extract the needed stack entries from the interpreter frame.
// sp() was checked to be 0 above, so this loop is presumably a guard that
// is not expected to execute its body.
aoqi@0 309 for (index = 0; index < sp(); index++) {
aoqi@0 310 const Type *type = osr_block->stack_type_at(index);
aoqi@0 311 if (type != Type::TOP) {
aoqi@0 312 // Currently the compiler bails out when attempting to on stack replace
aoqi@0 313 // at a bci with a non-empty stack. We should not reach here.
aoqi@0 314 ShouldNotReachHere();
aoqi@0 315 }
aoqi@0 316 }
aoqi@0 317
aoqi@0 318 // End the OSR migration
aoqi@0 319 make_runtime_call(RC_LEAF, OptoRuntime::osr_end_Type(),
aoqi@0 320 CAST_FROM_FN_PTR(address, SharedRuntime::OSR_migration_end),
aoqi@0 321 "OSR_migration_end", TypeRawPtr::BOTTOM,
aoqi@0 322 osr_buf);
aoqi@0 323
aoqi@0 324 // Now that the interpreter state is loaded, make sure it will match
aoqi@0 325 // at execution time what the compiler is expecting now:
// bad_type_exit is a clone of the current map whose control is a fresh
// region; check_interpreter_type adds one input per failing check.
aoqi@0 326 SafePointNode* bad_type_exit = clone_map();
aoqi@0 327 bad_type_exit->set_control(new (C) RegionNode(1));
aoqi@0 328
aoqi@0 329 assert(osr_block->flow()->jsrs()->size() == 0, "should be no jsrs live at osr point");
aoqi@0 330 for (index = 0; index < max_locals; index++) {
aoqi@0 331 if (stopped()) break;
aoqi@0 332 Node* l = local(index);
aoqi@0 333 if (l->is_top()) continue; // nothing here
aoqi@0 334 const Type *type = osr_block->local_type_at(index);
aoqi@0 335 if (type->isa_oopptr() != NULL) {
aoqi@0 336 if (!live_oops.at(index)) {
aoqi@0 337 // skip type check for dead oops
aoqi@0 338 continue;
aoqi@0 339 }
aoqi@0 340 }
aoqi@0 341 if (osr_block->flow()->local_type_at(index)->is_return_address()) {
aoqi@0 342 // In our current system it's illegal for jsr addresses to be
aoqi@0 343 // live into an OSR entry point because the compiler performs
aoqi@0 344 // inlining of jsrs. ciTypeFlow has a bailout that detects this
aoqi@0 345 // case and aborts the compile if addresses are live into an OSR
aoqi@0 346 // entry point. Because of that we can assume that any address
aoqi@0 347 // locals at the OSR entry point are dead. Method liveness
aoqi@0 348 // isn't precise enough to figure out that they are dead in all
aoqi@0 349 // cases so simply skip checking address locals
aoqi@0 350 // altogether. Any type check is guaranteed to fail since the
aoqi@0 351 // interpreter type is the result of a load which might have any
aoqi@0 352 // value and the expected type is a constant.
aoqi@0 353 continue;
aoqi@0 354 }
aoqi@0 355 set_local(index, check_interpreter_type(l, type, bad_type_exit));
aoqi@0 356 }
aoqi@0 357
aoqi@0 358 for (index = 0; index < sp(); index++) {
aoqi@0 359 if (stopped()) break;
aoqi@0 360 Node* l = stack(index);
aoqi@0 361 if (l->is_top()) continue; // nothing here
aoqi@0 362 const Type *type = osr_block->stack_type_at(index);
aoqi@0 363 set_stack(index, check_interpreter_type(l, type, bad_type_exit));
aoqi@0 364 }
aoqi@0 365
// req() > 1 means at least one check added a failure input to the region.
aoqi@0 366 if (bad_type_exit->control()->req() > 1) {
aoqi@0 367 // Build an uncommon trap here, if any inputs can be unexpected.
aoqi@0 368 bad_type_exit->set_control(_gvn.transform( bad_type_exit->control() ));
aoqi@0 369 record_for_igvn(bad_type_exit->control());
// Temporarily switch to the failure map to emit the trap, then switch back.
aoqi@0 370 SafePointNode* types_are_good = map();
aoqi@0 371 set_map(bad_type_exit);
aoqi@0 372 // The unexpected type happens because a new edge is active
aoqi@0 373 // in the CFG, which typeflow had previously ignored.
aoqi@0 374 // E.g., Object x = coldAtFirst() && notReached()? "str": new Integer(123).
aoqi@0 375 // This x will be typed as Integer if notReached is not yet linked.
aoqi@0 376 // It could also happen due to a problem in ciTypeFlow analysis.
aoqi@0 377 uncommon_trap(Deoptimization::Reason_constraint,
aoqi@0 378 Deoptimization::Action_reinterpret);
aoqi@0 379 set_map(types_are_good);
aoqi@0 380 }
aoqi@0 381 }
aoqi@0 382
aoqi@0 383 //------------------------------Parse------------------------------------------
aoqi@0 384 // Main parser constructor.
//
//   caller        - JVM state of the caller; also used to initialize _exits.
//   parse_method  - the method to parse.
//   expected_uses - expected number of uses; values <= 0 leave the profile
//                   scale factor (_prof_factor) at 1.
//
// The constructor performs the whole parse: it initializes the parser
// fields, fetches the type-flow analysis, accumulates trap/decompile counts,
// builds the entry map (OSR or normal entry), parses all blocks and finally
// fixes up the exits. On any bailout (failing()) it closes the "parse" log
// element, if logging, and returns early.
roland@7041 385 Parse::Parse(JVMState* caller, ciMethod* parse_method, float expected_uses)
roland@7041 386 : _exits(caller)
aoqi@0 387 {
aoqi@0 388 // Init some variables
aoqi@0 389 _caller = caller;
aoqi@0 390 _method = parse_method;
aoqi@0 391 _expected_uses = expected_uses;
aoqi@0 392 _depth = 1 + (caller->has_method() ? caller->depth() : 0);
aoqi@0 393 _wrote_final = false;
aoqi@0 394 _wrote_volatile = false;
aoqi@0 395 _alloc_with_final = NULL;
aoqi@0 396 _entry_bci = InvocationEntryBci;
aoqi@0 397 _tf = NULL;
aoqi@0 398 _block = NULL;
roland@7041 399 _first_return = true;
roland@7041 400 _replaced_nodes_for_exceptions = false;
roland@7041 401 _new_idx = C->unique();
aoqi@0 402 debug_only(_block_count = -1);
aoqi@0 403 debug_only(_blocks = (Block*)-1);
aoqi@0 404 #ifndef PRODUCT
aoqi@0 405 if (PrintCompilation || PrintOpto) {
aoqi@0 406 // Make sure I have an inline tree, so I can print messages about it.
aoqi@0 407 JVMState* ilt_caller = is_osr_parse() ? caller->caller() : caller;
aoqi@0 408 InlineTree::find_subtree_from_root(C->ilt(), ilt_caller, parse_method);
aoqi@0 409 }
aoqi@0 410 _max_switch_depth = 0;
aoqi@0 411 _est_switch_depth = 0;
aoqi@0 412 #endif
aoqi@0 413
aoqi@0 414 _tf = TypeFunc::make(method());
aoqi@0 415 _iter.reset_to_method(method());
aoqi@0 416 _flow = method()->get_flow_analysis();
aoqi@0 417 if (_flow->failing()) {
aoqi@0 418 C->record_method_not_compilable_all_tiers(_flow->failure_reason());
aoqi@0 419 }
aoqi@0 420
aoqi@0 421 #ifndef PRODUCT
aoqi@0 422 if (_flow->has_irreducible_entry()) {
aoqi@0 423 C->set_parsed_irreducible_loop(true);
aoqi@0 424 }
aoqi@0 425 #endif
aoqi@0 426
// Compute _prof_factor: 1 when expected uses are unknown (<= 0) or not
// smaller than the interpreter invocation count, otherwise the ratio
// _expected_uses / prof_total.
aoqi@0 427 if (_expected_uses <= 0) {
aoqi@0 428 _prof_factor = 1;
aoqi@0 429 } else {
aoqi@0 430 float prof_total = parse_method->interpreter_invocation_count();
aoqi@0 431 if (prof_total <= _expected_uses) {
aoqi@0 432 _prof_factor = 1;
aoqi@0 433 } else {
aoqi@0 434 _prof_factor = _expected_uses / prof_total;
aoqi@0 435 }
aoqi@0 436 }
aoqi@0 437
// Open the "parse" log element; it is closed by one of the log->done("parse...")
// calls below.
aoqi@0 438 CompileLog* log = C->log();
aoqi@0 439 if (log != NULL) {
aoqi@0 440 log->begin_head("parse method='%d' uses='%g'",
aoqi@0 441 log->identify(parse_method), expected_uses);
aoqi@0 442 if (depth() == 1 && C->is_osr_compilation()) {
aoqi@0 443 log->print(" osr_bci='%d'", C->entry_bci());
aoqi@0 444 }
aoqi@0 445 log->stamp();
aoqi@0 446 log->end_head();
aoqi@0 447 }
aoqi@0 448
aoqi@0 449 // Accumulate deoptimization counts.
aoqi@0 450 // (The range_check and store_check counts are checked elsewhere.)
aoqi@0 451 ciMethodData* md = method()->method_data();
aoqi@0 452 for (uint reason = 0; reason < md->trap_reason_limit(); reason++) {
aoqi@0 453 uint md_count = md->trap_count(reason);
aoqi@0 454 if (md_count != 0) {
// A per-reason count equal to trap_count_limit() additionally gets the
// method data's overflow_trap_count() added.
aoqi@0 455 if (md_count == md->trap_count_limit())
aoqi@0 456 md_count += md->overflow_trap_count();
aoqi@0 457 uint total_count = C->trap_count(reason);
aoqi@0 458 uint old_count = total_count;
aoqi@0 459 total_count += md_count;
aoqi@0 460 // Saturate the add if it overflows.
aoqi@0 461 if (total_count < old_count || total_count < md_count)
aoqi@0 462 total_count = (uint)-1;
aoqi@0 463 C->set_trap_count(reason, total_count);
aoqi@0 464 if (log != NULL)
aoqi@0 465 log->elem("observe trap='%s' count='%d' total='%d'",
aoqi@0 466 Deoptimization::trap_reason_name(reason),
aoqi@0 467 md_count, total_count);
aoqi@0 468 }
aoqi@0 469 }
aoqi@0 470 // Accumulate total sum of decompilations, also.
aoqi@0 471 C->set_decompile_count(C->decompile_count() + md->decompile_count());
aoqi@0 472
aoqi@0 473 _count_invocations = C->do_count_invocations();
aoqi@0 474 _method_data_update = C->do_method_data_update();
aoqi@0 475
aoqi@0 476 if (log != NULL && method()->has_exception_handlers()) {
aoqi@0 477 log->elem("observe that='has_exception_handlers'");
aoqi@0 478 }
aoqi@0 479
aoqi@0 480 assert(method()->can_be_compiled(), "Can not parse this method, cutout earlier");
aoqi@0 481 assert(method()->has_balanced_monitors(), "Can not parse unbalanced monitors, cutout earlier");
aoqi@0 482
aoqi@0 483 // Always register dependence if JVMTI is enabled, because
aoqi@0 484 // either breakpoint setting or hotswapping of methods may
aoqi@0 485 // cause deoptimization.
aoqi@0 486 if (C->env()->jvmti_can_hotswap_or_post_breakpoint()) {
aoqi@0 487 C->dependencies()->assert_evol_method(method());
aoqi@0 488 }
aoqi@0 489
aoqi@0 490 methods_seen++;
aoqi@0 491
aoqi@0 492 // Do some special top-level things.
// For a top-level OSR compile, replace the entry bci, the flow analysis and
// the TypeFunc with their OSR variants.
aoqi@0 493 if (depth() == 1 && C->is_osr_compilation()) {
aoqi@0 494 _entry_bci = C->entry_bci();
aoqi@0 495 _flow = method()->get_osr_flow_analysis(osr_bci());
aoqi@0 496 if (_flow->failing()) {
aoqi@0 497 C->record_method_not_compilable(_flow->failure_reason());
aoqi@0 498 #ifndef PRODUCT
aoqi@0 499 if (PrintOpto && (Verbose || WizardMode)) {
aoqi@0 500 tty->print_cr("OSR @%d type flow bailout: %s", _entry_bci, _flow->failure_reason());
aoqi@0 501 if (Verbose) {
aoqi@0 502 method()->print();
aoqi@0 503 method()->print_codes();
aoqi@0 504 _flow->print();
aoqi@0 505 }
aoqi@0 506 }
aoqi@0 507 #endif
aoqi@0 508 }
aoqi@0 509 _tf = C->tf(); // the OSR entry type is different
aoqi@0 510 }
aoqi@0 511
aoqi@0 512 #ifdef ASSERT
aoqi@0 513 if (depth() == 1) {
aoqi@0 514 assert(C->is_osr_compilation() == this->is_osr_parse(), "OSR in sync");
aoqi@0 515 if (C->tf() != tf()) {
aoqi@0 516 MutexLockerEx ml(Compile_lock, Mutex::_no_safepoint_check_flag);
aoqi@0 517 assert(C->env()->system_dictionary_modification_counter_changed(),
aoqi@0 518 "Must invalidate if TypeFuncs differ");
aoqi@0 519 }
aoqi@0 520 } else {
aoqi@0 521 assert(!this->is_osr_parse(), "no recursive OSR");
aoqi@0 522 }
aoqi@0 523 #endif
aoqi@0 524
// Note: methods_parsed is incremented before the failing() check below.
aoqi@0 525 methods_parsed++;
aoqi@0 526 #ifndef PRODUCT
aoqi@0 527 // add method size here to guarantee that inlined methods are added too
aoqi@0 528 if (TimeCompiler)
aoqi@0 529 _total_bytes_compiled += method()->code_size();
aoqi@0 530
aoqi@0 531 show_parse_info();
aoqi@0 532 #endif
aoqi@0 533
// Bail out if anything above (e.g. a failing flow analysis) marked the
// compilation as failing.
aoqi@0 534 if (failing()) {
aoqi@0 535 if (log) log->done("parse");
aoqi@0 536 return;
aoqi@0 537 }
aoqi@0 538
aoqi@0 539 gvn().set_type(root(), root()->bottom_type());
aoqi@0 540 gvn().transform(top());
aoqi@0 541
aoqi@0 542 // Import the results of the ciTypeFlow.
aoqi@0 543 init_blocks();
aoqi@0 544
aoqi@0 545 // Merge point for all normal exits
aoqi@0 546 build_exits();
aoqi@0 547
aoqi@0 548 // Setup the initial JVM state map.
aoqi@0 549 SafePointNode* entry_map = create_entry_map();
aoqi@0 550
aoqi@0 551 // Check for bailouts during map initialization
aoqi@0 552 if (failing() || entry_map == NULL) {
aoqi@0 553 if (log) log->done("parse");
aoqi@0 554 return;
aoqi@0 555 }
aoqi@0 556
// Remember the caller's default node notes; they are restored on the
// bailout path below and after do_all_blocks().
aoqi@0 557 Node_Notes* caller_nn = C->default_node_notes();
aoqi@0 558 // Collect debug info for inlined calls unless -XX:-DebugInlinedCalls.
aoqi@0 559 if (DebugInlinedCalls || depth() == 1) {
aoqi@0 560 C->set_default_node_notes(make_node_notes(caller_nn));
aoqi@0 561 }
aoqi@0 562
aoqi@0 563 if (is_osr_parse()) {
// The first parameter slot of the OSR entry map holds the OSR buffer; take
// it out of the map (replace with top) before loading interpreter state.
aoqi@0 564 Node* osr_buf = entry_map->in(TypeFunc::Parms+0);
aoqi@0 565 entry_map->set_req(TypeFunc::Parms+0, top());
aoqi@0 566 set_map(entry_map);
aoqi@0 567 load_interpreter_state(osr_buf);
aoqi@0 568 } else {
aoqi@0 569 set_map(entry_map);
aoqi@0 570 do_method_entry();
aoqi@0 571 }
fzhinkin@6997 572
fzhinkin@6997 573 if (depth() == 1 && !failing()) {
aoqi@0 574 // Add check to deoptimize the nmethod if RTM state was changed
aoqi@0 575 rtm_deopt();
aoqi@0 576 }
aoqi@0 577
fzhinkin@6997 578 // Check for bailouts during method entry or RTM state check setup.
aoqi@0 579 if (failing()) {
aoqi@0 580 if (log) log->done("parse");
aoqi@0 581 C->set_default_node_notes(caller_nn);
aoqi@0 582 return;
aoqi@0 583 }
aoqi@0 584
aoqi@0 585 entry_map = map(); // capture any changes performed by method setup code
aoqi@0 586 assert(jvms()->endoff() == map()->req(), "map matches JVMS layout");
aoqi@0 587
aoqi@0 588 // We begin parsing as if we have just encountered a jump to the
aoqi@0 589 // method entry.
aoqi@0 590 Block* entry_block = start_block();
aoqi@0 591 assert(entry_block->start() == (is_osr_parse() ? osr_bci() : 0), "");
aoqi@0 592 set_map_clone(entry_map);
aoqi@0 593 merge_common(entry_block, entry_block->next_path_num());
aoqi@0 594
aoqi@0 595 #ifndef PRODUCT
aoqi@0 596 BytecodeParseHistogram *parse_histogram_obj = new (C->env()->arena()) BytecodeParseHistogram(this, C);
aoqi@0 597 set_parse_histogram( parse_histogram_obj );
aoqi@0 598 #endif
aoqi@0 599
aoqi@0 600 // Parse all the basic blocks.
aoqi@0 601 do_all_blocks();
aoqi@0 602
aoqi@0 603 C->set_default_node_notes(caller_nn);
aoqi@0 604
aoqi@0 605 // Check for bailouts during conversion to graph
aoqi@0 606 if (failing()) {
aoqi@0 607 if (log) log->done("parse");
aoqi@0 608 return;
aoqi@0 609 }
aoqi@0 610
aoqi@0 611 // Fix up all exiting control flow.
aoqi@0 612 set_map(entry_map);
aoqi@0 613 do_exits();
aoqi@0 614
// Successful parse: close the log element with node and memory statistics.
aoqi@0 615 if (log) log->done("parse nodes='%d' live='%d' memory='" SIZE_FORMAT "'",
aoqi@0 616 C->unique(), C->live_nodes(), C->node_arena()->used());
aoqi@0 617 }
aoqi@0 618
aoqi@0 619 //---------------------------do_all_blocks-------------------------------------
aoqi@0 620 void Parse::do_all_blocks() {
aoqi@0 621 bool has_irreducible = flow()->has_irreducible_entry();
aoqi@0 622
aoqi@0 623 // Walk over all blocks in Reverse Post-Order.
aoqi@0 624 while (true) {
aoqi@0 625 bool progress = false;
aoqi@0 626 for (int rpo = 0; rpo < block_count(); rpo++) {
aoqi@0 627 Block* block = rpo_at(rpo);
aoqi@0 628
aoqi@0 629 if (block->is_parsed()) continue;
aoqi@0 630
aoqi@0 631 if (!block->is_merged()) {
aoqi@0 632 // Dead block, no state reaches this block
aoqi@0 633 continue;
aoqi@0 634 }
aoqi@0 635
aoqi@0 636 // Prepare to parse this block.
aoqi@0 637 load_state_from(block);
aoqi@0 638
aoqi@0 639 if (stopped()) {
aoqi@0 640 // Block is dead.
aoqi@0 641 continue;
aoqi@0 642 }
aoqi@0 643
aoqi@0 644 blocks_parsed++;
aoqi@0 645
aoqi@0 646 progress = true;
aoqi@0 647 if (block->is_loop_head() || block->is_handler() || has_irreducible && !block->is_ready()) {
aoqi@0 648 // Not all preds have been parsed. We must build phis everywhere.
aoqi@0 649 // (Note that dead locals do not get phis built, ever.)
aoqi@0 650 ensure_phis_everywhere();
aoqi@0 651
aoqi@0 652 if (block->is_SEL_head() &&
aoqi@0 653 (UseLoopPredicate || LoopLimitCheck)) {
aoqi@0 654 // Add predicate to single entry (not irreducible) loop head.
aoqi@0 655 assert(!block->has_merged_backedge(), "only entry paths should be merged for now");
aoqi@0 656 // Need correct bci for predicate.
aoqi@0 657 // It is fine to set it here since do_one_block() will set it anyway.
aoqi@0 658 set_parse_bci(block->start());
aoqi@0 659 add_predicate();
aoqi@0 660 // Add new region for back branches.
aoqi@0 661 int edges = block->pred_count() - block->preds_parsed() + 1; // +1 for original region
aoqi@0 662 RegionNode *r = new (C) RegionNode(edges+1);
aoqi@0 663 _gvn.set_type(r, Type::CONTROL);
aoqi@0 664 record_for_igvn(r);
aoqi@0 665 r->init_req(edges, control());
aoqi@0 666 set_control(r);
aoqi@0 667 // Add new phis.
aoqi@0 668 ensure_phis_everywhere();
aoqi@0 669 }
aoqi@0 670
aoqi@0 671 // Leave behind an undisturbed copy of the map, for future merges.
aoqi@0 672 set_map(clone_map());
aoqi@0 673 }
aoqi@0 674
aoqi@0 675 if (control()->is_Region() && !block->is_loop_head() && !has_irreducible && !block->is_handler()) {
aoqi@0 676 // In the absence of irreducible loops, the Region and Phis
aoqi@0 677 // associated with a merge that doesn't involve a backedge can
aoqi@0 678 // be simplified now since the RPO parsing order guarantees
aoqi@0 679 // that any path which was supposed to reach here has already
aoqi@0 680 // been parsed or must be dead.
aoqi@0 681 Node* c = control();
aoqi@0 682 Node* result = _gvn.transform_no_reclaim(control());
aoqi@0 683 if (c != result && TraceOptoParse) {
aoqi@0 684 tty->print_cr("Block #%d replace %d with %d", block->rpo(), c->_idx, result->_idx);
aoqi@0 685 }
aoqi@0 686 if (result != top()) {
aoqi@0 687 record_for_igvn(result);
aoqi@0 688 }
aoqi@0 689 }
aoqi@0 690
aoqi@0 691 // Parse the block.
aoqi@0 692 do_one_block();
aoqi@0 693
aoqi@0 694 // Check for bailouts.
aoqi@0 695 if (failing()) return;
aoqi@0 696 }
aoqi@0 697
aoqi@0 698 // with irreducible loops multiple passes might be necessary to parse everything
aoqi@0 699 if (!has_irreducible || !progress) {
aoqi@0 700 break;
aoqi@0 701 }
aoqi@0 702 }
aoqi@0 703
aoqi@0 704 blocks_seen += block_count();
aoqi@0 705
aoqi@0 706 #ifndef PRODUCT
aoqi@0 707 // Make sure there are no half-processed blocks remaining.
aoqi@0 708 // Every remaining unprocessed block is dead and may be ignored now.
aoqi@0 709 for (int rpo = 0; rpo < block_count(); rpo++) {
aoqi@0 710 Block* block = rpo_at(rpo);
aoqi@0 711 if (!block->is_parsed()) {
aoqi@0 712 if (TraceOptoParse) {
aoqi@0 713 tty->print_cr("Skipped dead block %d at bci:%d", rpo, block->start());
aoqi@0 714 }
aoqi@0 715 assert(!block->is_merged(), "no half-processed blocks");
aoqi@0 716 }
aoqi@0 717 }
aoqi@0 718 #endif
aoqi@0 719 }
aoqi@0 720
kevinw@8368 721 static Node* mask_int_value(Node* v, BasicType bt, PhaseGVN* gvn) {
kevinw@8368 722 Compile* C = gvn->C;
kevinw@8368 723 switch (bt) {
kevinw@8368 724 case T_BYTE:
kevinw@8368 725 v = gvn->transform(new (C) LShiftINode(v, gvn->intcon(24)));
kevinw@8368 726 v = gvn->transform(new (C) RShiftINode(v, gvn->intcon(24)));
kevinw@8368 727 break;
kevinw@8368 728 case T_SHORT:
kevinw@8368 729 v = gvn->transform(new (C) LShiftINode(v, gvn->intcon(16)));
kevinw@8368 730 v = gvn->transform(new (C) RShiftINode(v, gvn->intcon(16)));
kevinw@8368 731 break;
kevinw@8368 732 case T_CHAR:
kevinw@8368 733 v = gvn->transform(new (C) AndINode(v, gvn->intcon(0xFFFF)));
kevinw@8368 734 break;
kevinw@8368 735 case T_BOOLEAN:
kevinw@8368 736 v = gvn->transform(new (C) AndINode(v, gvn->intcon(0x1)));
kevinw@8368 737 break;
kevinw@8368 738 }
kevinw@8368 739 return v;
kevinw@8368 740 }
kevinw@8368 741
aoqi@0 742 //-------------------------------build_exits----------------------------------
aoqi@0 743 // Build normal and exceptional exit merge points.
aoqi@0 744 void Parse::build_exits() {
aoqi@0 745 // make a clone of caller to prevent sharing of side-effects
aoqi@0 746 _exits.set_map(_exits.clone_map());
aoqi@0 747 _exits.clean_stack(_exits.sp());
aoqi@0 748 _exits.sync_jvms();
aoqi@0 749
aoqi@0 750 RegionNode* region = new (C) RegionNode(1);
aoqi@0 751 record_for_igvn(region);
aoqi@0 752 gvn().set_type_bottom(region);
aoqi@0 753 _exits.set_control(region);
aoqi@0 754
aoqi@0 755 // Note: iophi and memphi are not transformed until do_exits.
aoqi@0 756 Node* iophi = new (C) PhiNode(region, Type::ABIO);
aoqi@0 757 Node* memphi = new (C) PhiNode(region, Type::MEMORY, TypePtr::BOTTOM);
aoqi@0 758 gvn().set_type_bottom(iophi);
aoqi@0 759 gvn().set_type_bottom(memphi);
aoqi@0 760 _exits.set_i_o(iophi);
aoqi@0 761 _exits.set_all_memory(memphi);
aoqi@0 762
aoqi@0 763 // Add a return value to the exit state. (Do not push it yet.)
aoqi@0 764 if (tf()->range()->cnt() > TypeFunc::Parms) {
aoqi@0 765 const Type* ret_type = tf()->range()->field_at(TypeFunc::Parms);
kevinw@8368 766 if (ret_type->isa_int()) {
kevinw@8368 767 BasicType ret_bt = method()->return_type()->basic_type();
kevinw@8368 768 if (ret_bt == T_BOOLEAN ||
kevinw@8368 769 ret_bt == T_CHAR ||
kevinw@8368 770 ret_bt == T_BYTE ||
kevinw@8368 771 ret_bt == T_SHORT) {
kevinw@8368 772 ret_type = TypeInt::INT;
kevinw@8368 773 }
kevinw@8368 774 }
kevinw@8368 775
aoqi@0 776 // Don't "bind" an unloaded return klass to the ret_phi. If the klass
aoqi@0 777 // becomes loaded during the subsequent parsing, the loaded and unloaded
aoqi@0 778 // types will not join when we transform and push in do_exits().
aoqi@0 779 const TypeOopPtr* ret_oop_type = ret_type->isa_oopptr();
aoqi@0 780 if (ret_oop_type && !ret_oop_type->klass()->is_loaded()) {
aoqi@0 781 ret_type = TypeOopPtr::BOTTOM;
aoqi@0 782 }
aoqi@0 783 int ret_size = type2size[ret_type->basic_type()];
aoqi@0 784 Node* ret_phi = new (C) PhiNode(region, ret_type);
aoqi@0 785 gvn().set_type_bottom(ret_phi);
aoqi@0 786 _exits.ensure_stack(ret_size);
aoqi@0 787 assert((int)(tf()->range()->cnt() - TypeFunc::Parms) == ret_size, "good tf range");
aoqi@0 788 assert(method()->return_type()->size() == ret_size, "tf agrees w/ method");
aoqi@0 789 _exits.set_argument(0, ret_phi); // here is where the parser finds it
aoqi@0 790 // Note: ret_phi is not yet pushed, until do_exits.
aoqi@0 791 }
aoqi@0 792 }
aoqi@0 793
aoqi@0 794
aoqi@0 795 //----------------------------build_start_state-------------------------------
aoqi@0 796 // Construct a state which contains only the incoming arguments from an
aoqi@0 797 // unknown caller. The method & bci will be NULL & InvocationEntryBci.
aoqi@0 798 JVMState* Compile::build_start_state(StartNode* start, const TypeFunc* tf) {
aoqi@0 799 int arg_size = tf->domain()->cnt();
aoqi@0 800 int max_size = MAX2(arg_size, (int)tf->range()->cnt());
aoqi@0 801 JVMState* jvms = new (this) JVMState(max_size - TypeFunc::Parms);
aoqi@0 802 SafePointNode* map = new (this) SafePointNode(max_size, NULL);
aoqi@0 803 record_for_igvn(map);
aoqi@0 804 assert(arg_size == TypeFunc::Parms + (is_osr_compilation() ? 1 : method()->arg_size()), "correct arg_size");
aoqi@0 805 Node_Notes* old_nn = default_node_notes();
aoqi@0 806 if (old_nn != NULL && has_method()) {
aoqi@0 807 Node_Notes* entry_nn = old_nn->clone(this);
aoqi@0 808 JVMState* entry_jvms = new(this) JVMState(method(), old_nn->jvms());
aoqi@0 809 entry_jvms->set_offsets(0);
aoqi@0 810 entry_jvms->set_bci(entry_bci());
aoqi@0 811 entry_nn->set_jvms(entry_jvms);
aoqi@0 812 set_default_node_notes(entry_nn);
aoqi@0 813 }
aoqi@0 814 uint i;
aoqi@0 815 for (i = 0; i < (uint)arg_size; i++) {
aoqi@0 816 Node* parm = initial_gvn()->transform(new (this) ParmNode(start, i));
aoqi@0 817 map->init_req(i, parm);
aoqi@0 818 // Record all these guys for later GVN.
aoqi@0 819 record_for_igvn(parm);
aoqi@0 820 }
aoqi@0 821 for (; i < map->req(); i++) {
aoqi@0 822 map->init_req(i, top());
aoqi@0 823 }
aoqi@0 824 assert(jvms->argoff() == TypeFunc::Parms, "parser gets arguments here");
aoqi@0 825 set_default_node_notes(old_nn);
aoqi@0 826 map->set_jvms(jvms);
aoqi@0 827 jvms->set_map(map);
aoqi@0 828 return jvms;
aoqi@0 829 }
aoqi@0 830
aoqi@0 831 //-----------------------------make_node_notes---------------------------------
aoqi@0 832 Node_Notes* Parse::make_node_notes(Node_Notes* caller_nn) {
aoqi@0 833 if (caller_nn == NULL) return NULL;
aoqi@0 834 Node_Notes* nn = caller_nn->clone(C);
aoqi@0 835 JVMState* caller_jvms = nn->jvms();
aoqi@0 836 JVMState* jvms = new (C) JVMState(method(), caller_jvms);
aoqi@0 837 jvms->set_offsets(0);
aoqi@0 838 jvms->set_bci(_entry_bci);
aoqi@0 839 nn->set_jvms(jvms);
aoqi@0 840 return nn;
aoqi@0 841 }
aoqi@0 842
aoqi@0 843
aoqi@0 844 //--------------------------return_values--------------------------------------
aoqi@0 845 void Compile::return_values(JVMState* jvms) {
aoqi@0 846 GraphKit kit(jvms);
aoqi@0 847 Node* ret = new (this) ReturnNode(TypeFunc::Parms,
aoqi@0 848 kit.control(),
aoqi@0 849 kit.i_o(),
aoqi@0 850 kit.reset_memory(),
aoqi@0 851 kit.frameptr(),
aoqi@0 852 kit.returnadr());
aoqi@0 853 // Add zero or 1 return values
aoqi@0 854 int ret_size = tf()->range()->cnt() - TypeFunc::Parms;
aoqi@0 855 if (ret_size > 0) {
aoqi@0 856 kit.inc_sp(-ret_size); // pop the return value(s)
aoqi@0 857 kit.sync_jvms();
aoqi@0 858 ret->add_req(kit.argument(0));
aoqi@0 859 // Note: The second dummy edge is not needed by a ReturnNode.
aoqi@0 860 }
aoqi@0 861 // bind it to root
aoqi@0 862 root()->add_req(ret);
aoqi@0 863 record_for_igvn(ret);
aoqi@0 864 initial_gvn()->transform_no_reclaim(ret);
aoqi@0 865 }
aoqi@0 866
aoqi@0 867 //------------------------rethrow_exceptions-----------------------------------
aoqi@0 868 // Bind all exception states in the list into a single RethrowNode.
aoqi@0 869 void Compile::rethrow_exceptions(JVMState* jvms) {
aoqi@0 870 GraphKit kit(jvms);
aoqi@0 871 if (!kit.has_exceptions()) return; // nothing to generate
aoqi@0 872 // Load my combined exception state into the kit, with all phis transformed:
aoqi@0 873 SafePointNode* ex_map = kit.combine_and_pop_all_exception_states();
aoqi@0 874 Node* ex_oop = kit.use_exception_state(ex_map);
aoqi@0 875 RethrowNode* exit = new (this) RethrowNode(kit.control(),
aoqi@0 876 kit.i_o(), kit.reset_memory(),
aoqi@0 877 kit.frameptr(), kit.returnadr(),
aoqi@0 878 // like a return but with exception input
aoqi@0 879 ex_oop);
aoqi@0 880 // bind to root
aoqi@0 881 root()->add_req(exit);
aoqi@0 882 record_for_igvn(exit);
aoqi@0 883 initial_gvn()->transform_no_reclaim(exit);
aoqi@0 884 }
aoqi@0 885
aoqi@0 886 //---------------------------do_exceptions-------------------------------------
aoqi@0 887 // Process exceptions arising from the current bytecode.
aoqi@0 888 // Send caught exceptions to the proper handler within this method.
aoqi@0 889 // Unhandled exceptions feed into _exit.
aoqi@0 890 void Parse::do_exceptions() {
aoqi@0 891 if (!has_exceptions()) return;
aoqi@0 892
aoqi@0 893 if (failing()) {
aoqi@0 894 // Pop them all off and throw them away.
aoqi@0 895 while (pop_exception_state() != NULL) ;
aoqi@0 896 return;
aoqi@0 897 }
aoqi@0 898
aoqi@0 899 PreserveJVMState pjvms(this, false);
aoqi@0 900
aoqi@0 901 SafePointNode* ex_map;
aoqi@0 902 while ((ex_map = pop_exception_state()) != NULL) {
aoqi@0 903 if (!method()->has_exception_handlers()) {
aoqi@0 904 // Common case: Transfer control outward.
aoqi@0 905 // Doing it this early allows the exceptions to common up
aoqi@0 906 // even between adjacent method calls.
aoqi@0 907 throw_to_exit(ex_map);
aoqi@0 908 } else {
aoqi@0 909 // Have to look at the exception first.
aoqi@0 910 assert(stopped(), "catch_inline_exceptions trashes the map");
aoqi@0 911 catch_inline_exceptions(ex_map);
aoqi@0 912 stop_and_kill_map(); // we used up this exception state; kill it
aoqi@0 913 }
aoqi@0 914 }
aoqi@0 915
aoqi@0 916 // We now return to our regularly scheduled program:
aoqi@0 917 }
aoqi@0 918
aoqi@0 919 //---------------------------throw_to_exit-------------------------------------
aoqi@0 920 // Merge the given map into an exception exit from this method.
aoqi@0 921 // The exception exit will handle any unlocking of receiver.
aoqi@0 922 // The ex_oop must be saved within the ex_map, unlike merge_exception.
aoqi@0 923 void Parse::throw_to_exit(SafePointNode* ex_map) {
aoqi@0 924 // Pop the JVMS to (a copy of) the caller.
aoqi@0 925 GraphKit caller;
aoqi@0 926 caller.set_map_clone(_caller->map());
aoqi@0 927 caller.set_bci(_caller->bci());
aoqi@0 928 caller.set_sp(_caller->sp());
aoqi@0 929 // Copy out the standard machine state:
aoqi@0 930 for (uint i = 0; i < TypeFunc::Parms; i++) {
aoqi@0 931 caller.map()->set_req(i, ex_map->in(i));
aoqi@0 932 }
roland@7041 933 if (ex_map->has_replaced_nodes()) {
roland@7041 934 _replaced_nodes_for_exceptions = true;
roland@7041 935 }
roland@7041 936 caller.map()->transfer_replaced_nodes_from(ex_map, _new_idx);
aoqi@0 937 // ...and the exception:
aoqi@0 938 Node* ex_oop = saved_ex_oop(ex_map);
aoqi@0 939 SafePointNode* caller_ex_map = caller.make_exception_state(ex_oop);
aoqi@0 940 // Finally, collect the new exception state in my exits:
aoqi@0 941 _exits.add_exception_state(caller_ex_map);
aoqi@0 942 }
aoqi@0 943
aoqi@0 944 //------------------------------do_exits---------------------------------------
aoqi@0 945 void Parse::do_exits() {
aoqi@0 946 set_parse_bci(InvocationEntryBci);
aoqi@0 947
aoqi@0 948 // Now peephole on the return bits
aoqi@0 949 Node* region = _exits.control();
aoqi@0 950 _exits.set_control(gvn().transform(region));
aoqi@0 951
aoqi@0 952 Node* iophi = _exits.i_o();
aoqi@0 953 _exits.set_i_o(gvn().transform(iophi));
aoqi@0 954
aoqi@0 955 // On PPC64, also add MemBarRelease for constructors which write
aoqi@0 956 // volatile fields. As support_IRIW_for_not_multiple_copy_atomic_cpu
aoqi@0 957 // is set on PPC64, no sync instruction is issued after volatile
aoqi@0 958 // stores. We want to quarantee the same behaviour as on platforms
aoqi@0 959 // with total store order, although this is not required by the Java
aoqi@0 960 // memory model. So as with finals, we add a barrier here.
aoqi@0 961 if (wrote_final() PPC64_ONLY(|| (wrote_volatile() && method()->is_initializer()))) {
aoqi@0 962 // This method (which must be a constructor by the rules of Java)
aoqi@0 963 // wrote a final. The effects of all initializations must be
aoqi@0 964 // committed to memory before any code after the constructor
aoqi@0 965 // publishes the reference to the newly constructor object.
aoqi@0 966 // Rather than wait for the publication, we simply block the
aoqi@0 967 // writes here. Rather than put a barrier on only those writes
aoqi@0 968 // which are required to complete, we force all writes to complete.
aoqi@0 969 //
aoqi@0 970 // "All bets are off" unless the first publication occurs after a
aoqi@0 971 // normal return from the constructor. We do not attempt to detect
aoqi@0 972 // such unusual early publications. But no barrier is needed on
aoqi@0 973 // exceptional returns, since they cannot publish normally.
aoqi@0 974 //
aoqi@0 975 _exits.insert_mem_bar(Op_MemBarRelease, alloc_with_final());
aoqi@0 976 #ifndef PRODUCT
aoqi@0 977 if (PrintOpto && (Verbose || WizardMode)) {
aoqi@0 978 method()->print_name();
aoqi@0 979 tty->print_cr(" writes finals and needs a memory barrier");
aoqi@0 980 }
aoqi@0 981 #endif
aoqi@0 982 }
aoqi@0 983
aoqi@0 984 for (MergeMemStream mms(_exits.merged_memory()); mms.next_non_empty(); ) {
aoqi@0 985 // transform each slice of the original memphi:
aoqi@0 986 mms.set_memory(_gvn.transform(mms.memory()));
aoqi@0 987 }
aoqi@0 988
aoqi@0 989 if (tf()->range()->cnt() > TypeFunc::Parms) {
aoqi@0 990 const Type* ret_type = tf()->range()->field_at(TypeFunc::Parms);
aoqi@0 991 Node* ret_phi = _gvn.transform( _exits.argument(0) );
shshahma@8421 992 if (!_exits.control()->is_top() && _gvn.type(ret_phi)->empty()) {
shshahma@8421 993 // In case of concurrent class loading, the type we set for the
shshahma@8421 994 // ret_phi in build_exits() may have been too optimistic and the
shshahma@8421 995 // ret_phi may be top now.
shshahma@8422 996 // Otherwise, we've encountered an error and have to mark the method as
shshahma@8422 997 // not compilable. Just using an assertion instead would be dangerous
shshahma@8422 998 // as this could lead to an infinite compile loop in non-debug builds.
shshahma@8421 999 {
shshahma@8421 1000 MutexLockerEx ml(Compile_lock, Mutex::_no_safepoint_check_flag);
shshahma@8422 1001 if (C->env()->system_dictionary_modification_counter_changed()) {
shshahma@8422 1002 C->record_failure(C2Compiler::retry_class_loading_during_parsing());
shshahma@8422 1003 } else {
shshahma@8422 1004 C->record_method_not_compilable("Can't determine return type.");
shshahma@8422 1005 }
shshahma@8421 1006 }
shshahma@8422 1007 return;
shshahma@8421 1008 }
kevinw@8368 1009 if (ret_type->isa_int()) {
kevinw@8368 1010 BasicType ret_bt = method()->return_type()->basic_type();
kevinw@8368 1011 ret_phi = mask_int_value(ret_phi, ret_bt, &_gvn);
kevinw@8368 1012 }
aoqi@0 1013 _exits.push_node(ret_type->basic_type(), ret_phi);
aoqi@0 1014 }
aoqi@0 1015
aoqi@0 1016 // Note: Logic for creating and optimizing the ReturnNode is in Compile.
aoqi@0 1017
aoqi@0 1018 // Unlock along the exceptional paths.
aoqi@0 1019 // This is done late so that we can common up equivalent exceptions
aoqi@0 1020 // (e.g., null checks) arising from multiple points within this method.
aoqi@0 1021 // See GraphKit::add_exception_state, which performs the commoning.
aoqi@0 1022 bool do_synch = method()->is_synchronized() && GenerateSynchronizationCode;
aoqi@0 1023
aoqi@0 1024 // record exit from a method if compiled while Dtrace is turned on.
roland@7041 1025 if (do_synch || C->env()->dtrace_method_probes() || _replaced_nodes_for_exceptions) {
aoqi@0 1026 // First move the exception list out of _exits:
aoqi@0 1027 GraphKit kit(_exits.transfer_exceptions_into_jvms());
aoqi@0 1028 SafePointNode* normal_map = kit.map(); // keep this guy safe
aoqi@0 1029 // Now re-collect the exceptions into _exits:
aoqi@0 1030 SafePointNode* ex_map;
aoqi@0 1031 while ((ex_map = kit.pop_exception_state()) != NULL) {
aoqi@0 1032 Node* ex_oop = kit.use_exception_state(ex_map);
aoqi@0 1033 // Force the exiting JVM state to have this method at InvocationEntryBci.
aoqi@0 1034 // The exiting JVM state is otherwise a copy of the calling JVMS.
aoqi@0 1035 JVMState* caller = kit.jvms();
aoqi@0 1036 JVMState* ex_jvms = caller->clone_shallow(C);
aoqi@0 1037 ex_jvms->set_map(kit.clone_map());
aoqi@0 1038 ex_jvms->map()->set_jvms(ex_jvms);
aoqi@0 1039 ex_jvms->set_bci( InvocationEntryBci);
aoqi@0 1040 kit.set_jvms(ex_jvms);
aoqi@0 1041 if (do_synch) {
aoqi@0 1042 // Add on the synchronized-method box/object combo
aoqi@0 1043 kit.map()->push_monitor(_synch_lock);
aoqi@0 1044 // Unlock!
aoqi@0 1045 kit.shared_unlock(_synch_lock->box_node(), _synch_lock->obj_node());
aoqi@0 1046 }
aoqi@0 1047 if (C->env()->dtrace_method_probes()) {
aoqi@0 1048 kit.make_dtrace_method_exit(method());
aoqi@0 1049 }
roland@7041 1050 if (_replaced_nodes_for_exceptions) {
roland@8723 1051 kit.map()->apply_replaced_nodes(_new_idx);
roland@7041 1052 }
aoqi@0 1053 // Done with exception-path processing.
aoqi@0 1054 ex_map = kit.make_exception_state(ex_oop);
aoqi@0 1055 assert(ex_jvms->same_calls_as(ex_map->jvms()), "sanity");
aoqi@0 1056 // Pop the last vestige of this method:
aoqi@0 1057 ex_map->set_jvms(caller->clone_shallow(C));
aoqi@0 1058 ex_map->jvms()->set_map(ex_map);
aoqi@0 1059 _exits.push_exception_state(ex_map);
aoqi@0 1060 }
aoqi@0 1061 assert(_exits.map() == normal_map, "keep the same return state");
aoqi@0 1062 }
aoqi@0 1063
aoqi@0 1064 {
aoqi@0 1065 // Capture very early exceptions (receiver null checks) from caller JVMS
aoqi@0 1066 GraphKit caller(_caller);
aoqi@0 1067 SafePointNode* ex_map;
aoqi@0 1068 while ((ex_map = caller.pop_exception_state()) != NULL) {
aoqi@0 1069 _exits.add_exception_state(ex_map);
aoqi@0 1070 }
aoqi@0 1071 }
roland@8723 1072 _exits.map()->apply_replaced_nodes(_new_idx);
aoqi@0 1073 }
aoqi@0 1074
aoqi@0 1075 //-----------------------------create_entry_map-------------------------------
aoqi@0 1076 // Initialize our parser map to contain the types at method entry.
aoqi@0 1077 // For OSR, the map contains a single RawPtr parameter.
aoqi@0 1078 // Initial monitor locking for sync. methods is performed by do_method_entry.
aoqi@0 1079 SafePointNode* Parse::create_entry_map() {
aoqi@0 1080 // Check for really stupid bail-out cases.
aoqi@0 1081 uint len = TypeFunc::Parms + method()->max_locals() + method()->max_stack();
aoqi@0 1082 if (len >= 32760) {
aoqi@0 1083 C->record_method_not_compilable_all_tiers("too many local variables");
aoqi@0 1084 return NULL;
aoqi@0 1085 }
aoqi@0 1086
roland@7041 1087 // clear current replaced nodes that are of no use from here on (map was cloned in build_exits).
roland@7041 1088 _caller->map()->delete_replaced_nodes();
roland@7041 1089
aoqi@0 1090 // If this is an inlined method, we may have to do a receiver null check.
aoqi@0 1091 if (_caller->has_method() && is_normal_parse() && !method()->is_static()) {
aoqi@0 1092 GraphKit kit(_caller);
aoqi@0 1093 kit.null_check_receiver_before_call(method());
aoqi@0 1094 _caller = kit.transfer_exceptions_into_jvms();
aoqi@0 1095 if (kit.stopped()) {
aoqi@0 1096 _exits.add_exception_states_from(_caller);
aoqi@0 1097 _exits.set_jvms(_caller);
aoqi@0 1098 return NULL;
aoqi@0 1099 }
aoqi@0 1100 }
aoqi@0 1101
aoqi@0 1102 assert(method() != NULL, "parser must have a method");
aoqi@0 1103
aoqi@0 1104 // Create an initial safepoint to hold JVM state during parsing
aoqi@0 1105 JVMState* jvms = new (C) JVMState(method(), _caller->has_method() ? _caller : NULL);
aoqi@0 1106 set_map(new (C) SafePointNode(len, jvms));
aoqi@0 1107 jvms->set_map(map());
aoqi@0 1108 record_for_igvn(map());
aoqi@0 1109 assert(jvms->endoff() == len, "correct jvms sizing");
aoqi@0 1110
aoqi@0 1111 SafePointNode* inmap = _caller->map();
aoqi@0 1112 assert(inmap != NULL, "must have inmap");
roland@7041 1113 // In case of null check on receiver above
roland@7041 1114 map()->transfer_replaced_nodes_from(inmap, _new_idx);
aoqi@0 1115
aoqi@0 1116 uint i;
aoqi@0 1117
aoqi@0 1118 // Pass thru the predefined input parameters.
aoqi@0 1119 for (i = 0; i < TypeFunc::Parms; i++) {
aoqi@0 1120 map()->init_req(i, inmap->in(i));
aoqi@0 1121 }
aoqi@0 1122
aoqi@0 1123 if (depth() == 1) {
aoqi@0 1124 assert(map()->memory()->Opcode() == Op_Parm, "");
aoqi@0 1125 // Insert the memory aliasing node
aoqi@0 1126 set_all_memory(reset_memory());
aoqi@0 1127 }
aoqi@0 1128 assert(merged_memory(), "");
aoqi@0 1129
aoqi@0 1130 // Now add the locals which are initially bound to arguments:
aoqi@0 1131 uint arg_size = tf()->domain()->cnt();
aoqi@0 1132 ensure_stack(arg_size - TypeFunc::Parms); // OSR methods have funny args
aoqi@0 1133 for (i = TypeFunc::Parms; i < arg_size; i++) {
aoqi@0 1134 map()->init_req(i, inmap->argument(_caller, i - TypeFunc::Parms));
aoqi@0 1135 }
aoqi@0 1136
aoqi@0 1137 // Clear out the rest of the map (locals and stack)
aoqi@0 1138 for (i = arg_size; i < len; i++) {
aoqi@0 1139 map()->init_req(i, top());
aoqi@0 1140 }
aoqi@0 1141
aoqi@0 1142 SafePointNode* entry_map = stop();
aoqi@0 1143 return entry_map;
aoqi@0 1144 }
aoqi@0 1145
aoqi@0 1146 //-----------------------------do_method_entry--------------------------------
aoqi@0 1147 // Emit any code needed in the pseudo-block before BCI zero.
aoqi@0 1148 // The main thing to do is lock the receiver of a synchronized method.
aoqi@0 1149 void Parse::do_method_entry() {
aoqi@0 1150 set_parse_bci(InvocationEntryBci); // Pseudo-BCP
aoqi@0 1151 set_sp(0); // Java Stack Pointer
aoqi@0 1152
aoqi@0 1153 NOT_PRODUCT( count_compiled_calls(true/*at_method_entry*/, false/*is_inline*/); )
aoqi@0 1154
aoqi@0 1155 if (C->env()->dtrace_method_probes()) {
aoqi@0 1156 make_dtrace_method_entry(method());
aoqi@0 1157 }
aoqi@0 1158
aoqi@0 1159 // If the method is synchronized, we need to construct a lock node, attach
aoqi@0 1160 // it to the Start node, and pin it there.
aoqi@0 1161 if (method()->is_synchronized()) {
aoqi@0 1162 // Insert a FastLockNode right after the Start which takes as arguments
aoqi@0 1163 // the current thread pointer, the "this" pointer & the address of the
aoqi@0 1164 // stack slot pair used for the lock. The "this" pointer is a projection
aoqi@0 1165 // off the start node, but the locking spot has to be constructed by
aoqi@0 1166 // creating a ConLNode of 0, and boxing it with a BoxLockNode. The BoxLockNode
aoqi@0 1167 // becomes the second argument to the FastLockNode call. The
aoqi@0 1168 // FastLockNode becomes the new control parent to pin it to the start.
aoqi@0 1169
aoqi@0 1170 // Setup Object Pointer
aoqi@0 1171 Node *lock_obj = NULL;
aoqi@0 1172 if(method()->is_static()) {
aoqi@0 1173 ciInstance* mirror = _method->holder()->java_mirror();
aoqi@0 1174 const TypeInstPtr *t_lock = TypeInstPtr::make(mirror);
aoqi@0 1175 lock_obj = makecon(t_lock);
aoqi@0 1176 } else { // Else pass the "this" pointer,
aoqi@0 1177 lock_obj = local(0); // which is Parm0 from StartNode
aoqi@0 1178 }
aoqi@0 1179 // Clear out dead values from the debug info.
aoqi@0 1180 kill_dead_locals();
aoqi@0 1181 // Build the FastLockNode
aoqi@0 1182 _synch_lock = shared_lock(lock_obj);
aoqi@0 1183 }
aoqi@0 1184
aoqi@0 1185 // Feed profiling data for parameters to the type system so it can
aoqi@0 1186 // propagate it as speculative types
aoqi@0 1187 record_profiled_parameters_for_speculation();
aoqi@0 1188
aoqi@0 1189 if (depth() == 1) {
aoqi@0 1190 increment_and_test_invocation_counter(Tier2CompileThreshold);
aoqi@0 1191 }
aoqi@0 1192 }
aoqi@0 1193
aoqi@0 1194 //------------------------------init_blocks------------------------------------
aoqi@0 1195 // Initialize our parser map to contain the types/monitors at method entry.
aoqi@0 1196 void Parse::init_blocks() {
aoqi@0 1197 // Create the blocks.
aoqi@0 1198 _block_count = flow()->block_count();
aoqi@0 1199 _blocks = NEW_RESOURCE_ARRAY(Block, _block_count);
aoqi@0 1200 Copy::zero_to_bytes(_blocks, sizeof(Block)*_block_count);
aoqi@0 1201
aoqi@0 1202 int rpo;
aoqi@0 1203
aoqi@0 1204 // Initialize the structs.
aoqi@0 1205 for (rpo = 0; rpo < block_count(); rpo++) {
aoqi@0 1206 Block* block = rpo_at(rpo);
aoqi@0 1207 block->init_node(this, rpo);
aoqi@0 1208 }
aoqi@0 1209
aoqi@0 1210 // Collect predecessor and successor information.
aoqi@0 1211 for (rpo = 0; rpo < block_count(); rpo++) {
aoqi@0 1212 Block* block = rpo_at(rpo);
aoqi@0 1213 block->init_graph(this);
aoqi@0 1214 }
aoqi@0 1215 }
aoqi@0 1216
aoqi@0 1217 //-------------------------------init_node-------------------------------------
aoqi@0 1218 void Parse::Block::init_node(Parse* outer, int rpo) {
aoqi@0 1219 _flow = outer->flow()->rpo_at(rpo);
aoqi@0 1220 _pred_count = 0;
aoqi@0 1221 _preds_parsed = 0;
aoqi@0 1222 _count = 0;
aoqi@0 1223 assert(pred_count() == 0 && preds_parsed() == 0, "sanity");
aoqi@0 1224 assert(!(is_merged() || is_parsed() || is_handler() || has_merged_backedge()), "sanity");
aoqi@0 1225 assert(_live_locals.size() == 0, "sanity");
aoqi@0 1226
aoqi@0 1227 // entry point has additional predecessor
aoqi@0 1228 if (flow()->is_start()) _pred_count++;
aoqi@0 1229 assert(flow()->is_start() == (this == outer->start_block()), "");
aoqi@0 1230 }
aoqi@0 1231
aoqi@0 1232 //-------------------------------init_graph------------------------------------
aoqi@0 1233 void Parse::Block::init_graph(Parse* outer) {
aoqi@0 1234 // Create the successor list for this parser block.
aoqi@0 1235 GrowableArray<ciTypeFlow::Block*>* tfs = flow()->successors();
aoqi@0 1236 GrowableArray<ciTypeFlow::Block*>* tfe = flow()->exceptions();
aoqi@0 1237 int ns = tfs->length();
aoqi@0 1238 int ne = tfe->length();
aoqi@0 1239 _num_successors = ns;
aoqi@0 1240 _all_successors = ns+ne;
aoqi@0 1241 _successors = (ns+ne == 0) ? NULL : NEW_RESOURCE_ARRAY(Block*, ns+ne);
aoqi@0 1242 int p = 0;
aoqi@0 1243 for (int i = 0; i < ns+ne; i++) {
aoqi@0 1244 ciTypeFlow::Block* tf2 = (i < ns) ? tfs->at(i) : tfe->at(i-ns);
aoqi@0 1245 Block* block2 = outer->rpo_at(tf2->rpo());
aoqi@0 1246 _successors[i] = block2;
aoqi@0 1247
aoqi@0 1248 // Accumulate pred info for the other block, too.
aoqi@0 1249 if (i < ns) {
aoqi@0 1250 block2->_pred_count++;
aoqi@0 1251 } else {
aoqi@0 1252 block2->_is_handler = true;
aoqi@0 1253 }
aoqi@0 1254
aoqi@0 1255 #ifdef ASSERT
aoqi@0 1256 // A block's successors must be distinguishable by BCI.
aoqi@0 1257 // That is, no bytecode is allowed to branch to two different
aoqi@0 1258 // clones of the same code location.
aoqi@0 1259 for (int j = 0; j < i; j++) {
aoqi@0 1260 Block* block1 = _successors[j];
aoqi@0 1261 if (block1 == block2) continue; // duplicates are OK
aoqi@0 1262 assert(block1->start() != block2->start(), "successors have unique bcis");
aoqi@0 1263 }
aoqi@0 1264 #endif
aoqi@0 1265 }
aoqi@0 1266
aoqi@0 1267 // Note: We never call next_path_num along exception paths, so they
aoqi@0 1268 // never get processed as "ready". Also, the input phis of exception
aoqi@0 1269 // handlers get specially processed, so that
aoqi@0 1270 }
aoqi@0 1271
aoqi@0 1272 //---------------------------successor_for_bci---------------------------------
aoqi@0 1273 Parse::Block* Parse::Block::successor_for_bci(int bci) {
aoqi@0 1274 for (int i = 0; i < all_successors(); i++) {
aoqi@0 1275 Block* block2 = successor_at(i);
aoqi@0 1276 if (block2->start() == bci) return block2;
aoqi@0 1277 }
aoqi@0 1278 // We can actually reach here if ciTypeFlow traps out a block
aoqi@0 1279 // due to an unloaded class, and concurrently with compilation the
aoqi@0 1280 // class is then loaded, so that a later phase of the parser is
aoqi@0 1281 // able to see more of the bytecode CFG. Or, the flow pass and
aoqi@0 1282 // the parser can have a minor difference of opinion about executability
aoqi@0 1283 // of bytecodes. For example, "obj.field = null" is executable even
aoqi@0 1284 // if the field's type is an unloaded class; the flow pass used to
aoqi@0 1285 // make a trap for such code.
aoqi@0 1286 return NULL;
aoqi@0 1287 }
aoqi@0 1288
aoqi@0 1289
aoqi@0 1290 //-----------------------------stack_type_at-----------------------------------
aoqi@0 1291 const Type* Parse::Block::stack_type_at(int i) const {
aoqi@0 1292 return get_type(flow()->stack_type_at(i));
aoqi@0 1293 }
aoqi@0 1294
aoqi@0 1295
aoqi@0 1296 //-----------------------------local_type_at-----------------------------------
aoqi@0 1297 const Type* Parse::Block::local_type_at(int i) const {
aoqi@0 1298 // Make dead locals fall to bottom.
aoqi@0 1299 if (_live_locals.size() == 0) {
aoqi@0 1300 MethodLivenessResult live_locals = flow()->outer()->method()->liveness_at_bci(start());
aoqi@0 1301 // This bitmap can be zero length if we saw a breakpoint.
aoqi@0 1302 // In such cases, pretend they are all live.
aoqi@0 1303 ((Block*)this)->_live_locals = live_locals;
aoqi@0 1304 }
aoqi@0 1305 if (_live_locals.size() > 0 && !_live_locals.at(i))
aoqi@0 1306 return Type::BOTTOM;
aoqi@0 1307
aoqi@0 1308 return get_type(flow()->local_type_at(i));
aoqi@0 1309 }
aoqi@0 1310
aoqi@0 1311
aoqi@0 1312 #ifndef PRODUCT
aoqi@0 1313
aoqi@0 1314 //----------------------------name_for_bc--------------------------------------
aoqi@0 1315 // helper method for BytecodeParseHistogram
aoqi@0 1316 static const char* name_for_bc(int i) {
aoqi@0 1317 return Bytecodes::is_defined(i) ? Bytecodes::name(Bytecodes::cast(i)) : "xxxunusedxxx";
aoqi@0 1318 }
aoqi@0 1319
aoqi@0 1320 //----------------------------BytecodeParseHistogram------------------------------------
aoqi@0 1321 Parse::BytecodeParseHistogram::BytecodeParseHistogram(Parse *p, Compile *c) {
aoqi@0 1322 _parser = p;
aoqi@0 1323 _compiler = c;
aoqi@0 1324 if( ! _initialized ) { _initialized = true; reset(); }
aoqi@0 1325 }
aoqi@0 1326
aoqi@0 1327 //----------------------------current_count------------------------------------
aoqi@0 1328 int Parse::BytecodeParseHistogram::current_count(BPHType bph_type) {
aoqi@0 1329 switch( bph_type ) {
aoqi@0 1330 case BPH_transforms: { return _parser->gvn().made_progress(); }
aoqi@0 1331 case BPH_values: { return _parser->gvn().made_new_values(); }
aoqi@0 1332 default: { ShouldNotReachHere(); return 0; }
aoqi@0 1333 }
aoqi@0 1334 }
aoqi@0 1335
aoqi@0 1336 //----------------------------initialized--------------------------------------
aoqi@0 1337 bool Parse::BytecodeParseHistogram::initialized() { return _initialized; }
aoqi@0 1338
aoqi@0 1339 //----------------------------reset--------------------------------------------
aoqi@0 1340 void Parse::BytecodeParseHistogram::reset() {
aoqi@0 1341 int i = Bytecodes::number_of_codes;
aoqi@0 1342 while (i-- > 0) { _bytecodes_parsed[i] = 0; _nodes_constructed[i] = 0; _nodes_transformed[i] = 0; _new_values[i] = 0; }
aoqi@0 1343 }
aoqi@0 1344
aoqi@0 1345 //----------------------------set_initial_state--------------------------------
aoqi@0 1346 // Record info when starting to parse one bytecode
aoqi@0 1347 void Parse::BytecodeParseHistogram::set_initial_state( Bytecodes::Code bc ) {
aoqi@0 1348 if( PrintParseStatistics && !_parser->is_osr_parse() ) {
aoqi@0 1349 _initial_bytecode = bc;
aoqi@0 1350 _initial_node_count = _compiler->unique();
aoqi@0 1351 _initial_transforms = current_count(BPH_transforms);
aoqi@0 1352 _initial_values = current_count(BPH_values);
aoqi@0 1353 }
aoqi@0 1354 }
aoqi@0 1355
aoqi@0 1356 //----------------------------record_change--------------------------------
aoqi@0 1357 // Record results of parsing one bytecode
aoqi@0 1358 void Parse::BytecodeParseHistogram::record_change() {
aoqi@0 1359 if( PrintParseStatistics && !_parser->is_osr_parse() ) {
aoqi@0 1360 ++_bytecodes_parsed[_initial_bytecode];
aoqi@0 1361 _nodes_constructed [_initial_bytecode] += (_compiler->unique() - _initial_node_count);
aoqi@0 1362 _nodes_transformed [_initial_bytecode] += (current_count(BPH_transforms) - _initial_transforms);
aoqi@0 1363 _new_values [_initial_bytecode] += (current_count(BPH_values) - _initial_values);
aoqi@0 1364 }
aoqi@0 1365 }
aoqi@0 1366
aoqi@0 1367
aoqi@0 1368 //----------------------------print--------------------------------------------
aoqi@0 1369 void Parse::BytecodeParseHistogram::print(float cutoff) {
aoqi@0 1370 ResourceMark rm;
aoqi@0 1371 // print profile
aoqi@0 1372 int total = 0;
aoqi@0 1373 int i = 0;
aoqi@0 1374 for( i = 0; i < Bytecodes::number_of_codes; ++i ) { total += _bytecodes_parsed[i]; }
aoqi@0 1375 int abs_sum = 0;
aoqi@0 1376 tty->cr(); //0123456789012345678901234567890123456789012345678901234567890123456789
aoqi@0 1377 tty->print_cr("Histogram of %d parsed bytecodes:", total);
aoqi@0 1378 if( total == 0 ) { return; }
aoqi@0 1379 tty->cr();
aoqi@0 1380 tty->print_cr("absolute: count of compiled bytecodes of this type");
aoqi@0 1381 tty->print_cr("relative: percentage contribution to compiled nodes");
aoqi@0 1382 tty->print_cr("nodes : Average number of nodes constructed per bytecode");
aoqi@0 1383 tty->print_cr("rnodes : Significance towards total nodes constructed, (nodes*relative)");
aoqi@0 1384 tty->print_cr("transforms: Average amount of tranform progress per bytecode compiled");
aoqi@0 1385 tty->print_cr("values : Average number of node values improved per bytecode");
aoqi@0 1386 tty->print_cr("name : Bytecode name");
aoqi@0 1387 tty->cr();
aoqi@0 1388 tty->print_cr(" absolute relative nodes rnodes transforms values name");
aoqi@0 1389 tty->print_cr("----------------------------------------------------------------------");
aoqi@0 1390 while (--i > 0) {
aoqi@0 1391 int abs = _bytecodes_parsed[i];
aoqi@0 1392 float rel = abs * 100.0F / total;
aoqi@0 1393 float nodes = _bytecodes_parsed[i] == 0 ? 0 : (1.0F * _nodes_constructed[i])/_bytecodes_parsed[i];
aoqi@0 1394 float rnodes = _bytecodes_parsed[i] == 0 ? 0 : rel * nodes;
aoqi@0 1395 float xforms = _bytecodes_parsed[i] == 0 ? 0 : (1.0F * _nodes_transformed[i])/_bytecodes_parsed[i];
aoqi@0 1396 float values = _bytecodes_parsed[i] == 0 ? 0 : (1.0F * _new_values [i])/_bytecodes_parsed[i];
aoqi@0 1397 if (cutoff <= rel) {
aoqi@0 1398 tty->print_cr("%10d %7.2f%% %6.1f %6.2f %6.1f %6.1f %s", abs, rel, nodes, rnodes, xforms, values, name_for_bc(i));
aoqi@0 1399 abs_sum += abs;
aoqi@0 1400 }
aoqi@0 1401 }
aoqi@0 1402 tty->print_cr("----------------------------------------------------------------------");
aoqi@0 1403 float rel_sum = abs_sum * 100.0F / total;
aoqi@0 1404 tty->print_cr("%10d %7.2f%% (cutoff = %.2f%%)", abs_sum, rel_sum, cutoff);
aoqi@0 1405 tty->print_cr("----------------------------------------------------------------------");
aoqi@0 1406 tty->cr();
aoqi@0 1407 }
aoqi@0 1408 #endif
aoqi@0 1409
aoqi@0 1410 //----------------------------load_state_from----------------------------------
aoqi@0 1411 // Load block/map/sp. But not do not touch iter/bci.
aoqi@0 1412 void Parse::load_state_from(Block* block) {
aoqi@0 1413 set_block(block);
aoqi@0 1414 // load the block's JVM state:
aoqi@0 1415 set_map(block->start_map());
aoqi@0 1416 set_sp( block->start_sp());
aoqi@0 1417 }
aoqi@0 1418
aoqi@0 1419
aoqi@0 1420 //-----------------------------record_state------------------------------------
aoqi@0 1421 void Parse::Block::record_state(Parse* p) {
aoqi@0 1422 assert(!is_merged(), "can only record state once, on 1st inflow");
aoqi@0 1423 assert(start_sp() == p->sp(), "stack pointer must agree with ciTypeFlow");
aoqi@0 1424 set_start_map(p->stop());
aoqi@0 1425 }
aoqi@0 1426
aoqi@0 1427
aoqi@0 1428 //------------------------------do_one_block-----------------------------------
// Parse the bytecodes of the current block (block()), one at a time, starting
// at block()->start().
//
// The loop ends when any of these happens:
//  - the parser is stopped or the compilation is failing,
//  - the iterator reaches block()->limit(); the current state is then merged
//    into the block starting at that bci,
//  - the block has a trap at the current bci; an uncommon trap is emitted.
aoqi@0 1429 void Parse::do_one_block() {
aoqi@0 1430 if (TraceOptoParse) {
// Trace only: print this block's rpo number, bci range and successors.
// Successors at index >= num_successors() are printed with an "(e)" suffix.
aoqi@0 1431 Block *b = block();
aoqi@0 1432 int ns = b->num_successors();
aoqi@0 1433 int nt = b->all_successors();
aoqi@0 1434
aoqi@0 1435 tty->print("Parsing block #%d at bci [%d,%d), successors: ",
aoqi@0 1436 block()->rpo(), block()->start(), block()->limit());
aoqi@0 1437 for (int i = 0; i < nt; i++) {
aoqi@0 1438 tty->print((( i < ns) ? " %d" : " %d(e)"), b->successor_at(i)->rpo());
aoqi@0 1439 }
aoqi@0 1440 if (b->is_loop_head()) tty->print(" lphd");
aoqi@0 1441 tty->cr();
aoqi@0 1442 }
aoqi@0 1443
aoqi@0 1444 assert(block()->is_merged(), "must be merged before being parsed");
aoqi@0 1445 block()->mark_parsed();
aoqi@0 1446 ++_blocks_parsed;
aoqi@0 1447
aoqi@0 1448 // Set iterator to start of block.
aoqi@0 1449 iter().reset_to_bci(block()->start());
aoqi@0 1450
aoqi@0 1451 CompileLog* log = C->log();
aoqi@0 1452
aoqi@0 1453 // Parse bytecodes
aoqi@0 1454 while (!stopped() && !failing()) {
aoqi@0 1455 iter().next();
aoqi@0 1456
aoqi@0 1457 // Learn the current bci from the iterator:
aoqi@0 1458 set_parse_bci(iter().cur_bci());
aoqi@0 1459
aoqi@0 1460 if (bci() == block()->limit()) {
aoqi@0 1461 // Do not walk into the next block until directed by do_all_blocks.
aoqi@0 1462 merge(bci());
aoqi@0 1463 break;
aoqi@0 1464 }
aoqi@0 1465 assert(bci() < block()->limit(), "bci still in block");
aoqi@0 1466
aoqi@0 1467 if (log != NULL) {
aoqi@0 1468 // Output an optional context marker, to help place actions
aoqi@0 1469 // that occur during parsing of this BC. If there is no log
aoqi@0 1470 // output until the next context string, this context string
aoqi@0 1471 // will be silently ignored.
aoqi@0 1472 log->set_context("bc code='%d' bci='%d'", (int)bc(), bci());
aoqi@0 1473 }
aoqi@0 1474
aoqi@0 1475 if (block()->has_trap_at(bci())) {
aoqi@0 1476 // We must respect the flow pass's traps, because it will refuse
aoqi@0 1477 // to produce successors for trapping blocks.
aoqi@0 1478 int trap_index = block()->flow()->trap_index();
aoqi@0 1479 assert(trap_index != 0, "trap index must be valid");
aoqi@0 1480 uncommon_trap(trap_index);
aoqi@0 1481 break;
aoqi@0 1482 }
aoqi@0 1483
// Histogram bookkeeping is compiled in for non-product builds only.
aoqi@0 1484 NOT_PRODUCT( parse_histogram()->set_initial_state(bc()); );
aoqi@0 1485
aoqi@0 1486 #ifdef ASSERT
// Remember the stack depth before the bytecode and, when available, its
// predicted stack effect, so the prediction can be checked afterwards.
aoqi@0 1487 int pre_bc_sp = sp();
aoqi@0 1488 int inputs, depth;
aoqi@0 1489 bool have_se = !stopped() && compute_stack_effects(inputs, depth);
aoqi@0 1490 assert(!have_se || pre_bc_sp >= inputs, err_msg_res("have enough stack to execute this BC: pre_bc_sp=%d, inputs=%d", pre_bc_sp, inputs));
aoqi@0 1491 #endif //ASSERT
aoqi@0 1492
aoqi@0 1493 do_one_bytecode();
aoqi@0 1494
// NOTE(review): this assert uses locals declared only under ASSERT above;
// presumably assert() expands to nothing in non-ASSERT builds -- confirm.
aoqi@0 1495 assert(!have_se || stopped() || failing() || (sp() - pre_bc_sp) == depth,
aoqi@0 1496 err_msg_res("incorrect depth prediction: sp=%d, pre_bc_sp=%d, depth=%d", sp(), pre_bc_sp, depth));
aoqi@0 1497
aoqi@0 1498 do_exceptions();
aoqi@0 1499
aoqi@0 1500 NOT_PRODUCT( parse_histogram()->record_change(); );
aoqi@0 1501
aoqi@0 1502 if (log != NULL)
aoqi@0 1503 log->clear_context(); // skip marker if nothing was printed
aoqi@0 1504
aoqi@0 1505 // Fall into next bytecode. Each bytecode normally has 1 sequential
aoqi@0 1506 // successor which is typically made ready by visiting this bytecode.
aoqi@0 1507 // If the successor has several predecessors, then it is a merge
aoqi@0 1508 // point, starts a new basic block, and is handled like other basic blocks.
aoqi@0 1509 }
aoqi@0 1510 }
aoqi@0 1511
aoqi@0 1512
aoqi@0 1513 //------------------------------merge------------------------------------------
aoqi@0 1514 void Parse::set_parse_bci(int bci) {
aoqi@0 1515 set_bci(bci);
aoqi@0 1516 Node_Notes* nn = C->default_node_notes();
aoqi@0 1517 if (nn == NULL) return;
aoqi@0 1518
aoqi@0 1519 // Collect debug info for inlined calls unless -XX:-DebugInlinedCalls.
aoqi@0 1520 if (!DebugInlinedCalls && depth() > 1) {
aoqi@0 1521 return;
aoqi@0 1522 }
aoqi@0 1523
aoqi@0 1524 // Update the JVMS annotation, if present.
aoqi@0 1525 JVMState* jvms = nn->jvms();
aoqi@0 1526 if (jvms != NULL && jvms->bci() != bci) {
aoqi@0 1527 // Update the JVMS.
aoqi@0 1528 jvms = jvms->clone_shallow(C);
aoqi@0 1529 jvms->set_bci(bci);
aoqi@0 1530 nn->set_jvms(jvms);
aoqi@0 1531 }
aoqi@0 1532 }
aoqi@0 1533
aoqi@0 1534 //------------------------------merge------------------------------------------
aoqi@0 1535 // Merge the current mapping into the basic block starting at bci
aoqi@0 1536 void Parse::merge(int target_bci) {
aoqi@0 1537 Block* target = successor_for_bci(target_bci);
aoqi@0 1538 if (target == NULL) { handle_missing_successor(target_bci); return; }
aoqi@0 1539 assert(!target->is_ready(), "our arrival must be expected");
aoqi@0 1540 int pnum = target->next_path_num();
aoqi@0 1541 merge_common(target, pnum);
aoqi@0 1542 }
aoqi@0 1543
aoqi@0 1544 //-------------------------merge_new_path--------------------------------------
aoqi@0 1545 // Merge the current mapping into the basic block, using a new path
aoqi@0 1546 void Parse::merge_new_path(int target_bci) {
aoqi@0 1547 Block* target = successor_for_bci(target_bci);
aoqi@0 1548 if (target == NULL) { handle_missing_successor(target_bci); return; }
aoqi@0 1549 assert(!target->is_ready(), "new path into frozen graph");
aoqi@0 1550 int pnum = target->add_new_path();
aoqi@0 1551 merge_common(target, pnum);
aoqi@0 1552 }
aoqi@0 1553
aoqi@0 1554 //-------------------------merge_exception-------------------------------------
aoqi@0 1555 // Merge the current mapping into the basic block starting at bci
aoqi@0 1556 // The ex_oop must be pushed on the stack, unlike throw_to_exit.
aoqi@0 1557 void Parse::merge_exception(int target_bci) {
aoqi@0 1558 assert(sp() == 1, "must have only the throw exception on the stack");
aoqi@0 1559 Block* target = successor_for_bci(target_bci);
aoqi@0 1560 if (target == NULL) { handle_missing_successor(target_bci); return; }
aoqi@0 1561 assert(target->is_handler(), "exceptions are handled by special blocks");
aoqi@0 1562 int pnum = target->add_new_path();
aoqi@0 1563 merge_common(target, pnum);
aoqi@0 1564 }
aoqi@0 1565
aoqi@0 1566 //--------------------handle_missing_successor---------------------------------
aoqi@0 1567 void Parse::handle_missing_successor(int target_bci) {
aoqi@0 1568 #ifndef PRODUCT
aoqi@0 1569 Block* b = block();
aoqi@0 1570 int trap_bci = b->flow()->has_trap()? b->flow()->trap_bci(): -1;
aoqi@0 1571 tty->print_cr("### Missing successor at bci:%d for block #%d (trap_bci:%d)", target_bci, b->rpo(), trap_bci);
aoqi@0 1572 #endif
aoqi@0 1573 ShouldNotReachHere();
aoqi@0 1574 }
aoqi@0 1575
aoqi@0 1576 //--------------------------merge_common---------------------------------------
// Merge the parser's current state into 'target' as incoming path 'pnum'.
//
// Two cases:
//  - target has no recorded state yet: the current state becomes target's
//    start state (unless this path is dead), optionally behind a fresh
//    RegionNode;
//  - target already has a state: the incoming control is wired into target's
//    Region at input 'pnum', and values that differ are merged through Phis
//    (memory goes through merge_memory_edges()).
//
// The closing assert expects the parser to be stopped on every path out.
aoqi@0 1577 void Parse::merge_common(Parse::Block* target, int pnum) {
aoqi@0 1578 if (TraceOptoParse) {
aoqi@0 1579 tty->print("Merging state at block #%d bci:%d", target->rpo(), target->start());
aoqi@0 1580 }
aoqi@0 1581
aoqi@0 1582 // Zap extra stack slots to top
aoqi@0 1583 assert(sp() == target->start_sp(), "");
aoqi@0 1584 clean_stack(sp());
aoqi@0 1585
aoqi@0 1586 if (!target->is_merged()) { // No prior mapping at this bci
aoqi@0 1587 if (TraceOptoParse) { tty->print(" with empty state"); }
aoqi@0 1588
aoqi@0 1589 // If this path is dead, do not bother capturing it as a merge.
aoqi@0 1590 // It is "as if" we had 1 fewer predecessors from the beginning.
aoqi@0 1591 if (stopped()) {
aoqi@0 1592 if (TraceOptoParse) tty->print_cr(", but path is dead and doesn't count");
aoqi@0 1593 return;
aoqi@0 1594 }
aoqi@0 1595
aoqi@0 1596 // Record that a new block has been merged.
aoqi@0 1597 ++_blocks_merged;
aoqi@0 1598
aoqi@0 1599 // Make a region if we know there are multiple or unpredictable inputs.
aoqi@0 1600 // (Also, if this is a plain fall-through, we might see another region,
aoqi@0 1601 // which must not be allowed into this block's map.)
aoqi@0 1602 if (pnum > PhiNode::Input // Known multiple inputs.
aoqi@0 1603 || target->is_handler() // These have unpredictable inputs.
aoqi@0 1604 || target->is_loop_head() // Known multiple inputs
aoqi@0 1605 || control()->is_Region()) { // We must hide this guy.
aoqi@0 1606
// The bci is temporarily switched to the target's start while the predicate
// and the Region are created, and restored afterwards.
aoqi@0 1607 int current_bci = bci();
aoqi@0 1608 set_parse_bci(target->start()); // Set target bci
aoqi@0 1609 if (target->is_SEL_head()) {
aoqi@0 1610 DEBUG_ONLY( target->mark_merged_backedge(block()); )
aoqi@0 1611 if (target->start() == 0) {
aoqi@0 1612 // Add loop predicate for the special case when
aoqi@0 1613 // there are backbranches to the method entry.
aoqi@0 1614 add_predicate();
aoqi@0 1615 }
aoqi@0 1616 }
aoqi@0 1617 // Add a Region to start the new basic block. Phis will be added
aoqi@0 1618 // later lazily.
aoqi@0 1619 int edges = target->pred_count();
aoqi@0 1620 if (edges < pnum) edges = pnum; // might be a new path!
aoqi@0 1621 RegionNode *r = new (C) RegionNode(edges+1);
aoqi@0 1622 gvn().set_type(r, Type::CONTROL);
aoqi@0 1623 record_for_igvn(r);
aoqi@0 1624 // zap all inputs to NULL for debugging (done in Node(uint) constructor)
aoqi@0 1625 // for (int j = 1; j < edges+1; j++) { r->init_req(j, NULL); }
aoqi@0 1626 r->init_req(pnum, control());
aoqi@0 1627 set_control(r);
aoqi@0 1628 set_parse_bci(current_bci); // Restore bci
aoqi@0 1629 }
aoqi@0 1630
aoqi@0 1631 // Convert the existing Parser mapping into a mapping at this bci.
aoqi@0 1632 store_state_to(target);
aoqi@0 1633 assert(target->is_merged(), "do not come here twice");
aoqi@0 1634
aoqi@0 1635 } else { // Prior mapping at this bci
aoqi@0 1636 if (TraceOptoParse) { tty->print(" with previous state"); }
aoqi@0 1637 #ifdef ASSERT
aoqi@0 1638 if (target->is_SEL_head()) {
aoqi@0 1639 target->mark_merged_backedge(block());
aoqi@0 1640 }
aoqi@0 1641 #endif
aoqi@0 1642 // We must not manufacture more phis if the target is already parsed.
aoqi@0 1643 bool nophi = target->is_parsed();
aoqi@0 1644
aoqi@0 1645 SafePointNode* newin = map();// Hang on to incoming mapping
aoqi@0 1646 Block* save_block = block(); // Hang on to incoming block
aoqi@0 1647 load_state_from(target); // Get prior mapping
aoqi@0 1648
// From here on map()/jvms()/control() refer to the target's recorded state;
// 'newin' is the state arriving over path 'pnum'.
aoqi@0 1649 assert(newin->jvms()->locoff() == jvms()->locoff(), "JVMS layouts agree");
aoqi@0 1650 assert(newin->jvms()->stkoff() == jvms()->stkoff(), "JVMS layouts agree");
aoqi@0 1651 assert(newin->jvms()->monoff() == jvms()->monoff(), "JVMS layouts agree");
aoqi@0 1652 assert(newin->jvms()->endoff() == jvms()->endoff(), "JVMS layouts agree");
aoqi@0 1653
aoqi@0 1654 // Iterate over my current mapping and the old mapping.
aoqi@0 1655 // Where different, insert Phi functions.
aoqi@0 1656 // Use any existing Phi functions.
aoqi@0 1657 assert(control()->is_Region(), "must be merging to a region");
aoqi@0 1658 RegionNode* r = control()->as_Region();
aoqi@0 1659
aoqi@0 1660 // Compute where to merge into
aoqi@0 1661 // Merge incoming control path
aoqi@0 1662 r->init_req(pnum, newin->control());
aoqi@0 1663
aoqi@0 1664 if (pnum == 1) { // Last merge for this Region?
aoqi@0 1665 if (!block()->flow()->is_irreducible_entry()) {
aoqi@0 1666 Node* result = _gvn.transform_no_reclaim(r);
aoqi@0 1667 if (r != result && TraceOptoParse) {
aoqi@0 1668 tty->print_cr("Block #%d replace %d with %d", block()->rpo(), r->_idx, result->_idx);
aoqi@0 1669 }
aoqi@0 1670 }
aoqi@0 1671 record_for_igvn(r);
aoqi@0 1672 }
aoqi@0 1673
aoqi@0 1674 // Update all the non-control inputs to map:
aoqi@0 1675 assert(TypeFunc::Parms == newin->jvms()->locoff(), "parser map should contain only youngest jvms");
aoqi@0 1676 bool check_elide_phi = target->is_SEL_backedge(save_block);
aoqi@0 1677 for (uint j = 1; j < newin->req(); j++) {
aoqi@0 1678 Node* m = map()->in(j); // Current state of target.
aoqi@0 1679 Node* n = newin->in(j); // Incoming change to target state.
// 'phi' is the Phi already merging slot j at region r, or NULL if none.
aoqi@0 1680 PhiNode* phi;
aoqi@0 1681 if (m->is_Phi() && m->as_Phi()->region() == r)
aoqi@0 1682 phi = m->as_Phi();
aoqi@0 1683 else
aoqi@0 1684 phi = NULL;
aoqi@0 1685 if (m != n) { // Different; must merge
aoqi@0 1686 switch (j) {
aoqi@0 1687 // Frame pointer and Return Address never changes
aoqi@0 1688 case TypeFunc::FramePtr:// Drop m, use the original value
aoqi@0 1689 case TypeFunc::ReturnAdr:
aoqi@0 1690 break;
aoqi@0 1691 case TypeFunc::Memory: // Merge inputs to the MergeMem node
aoqi@0 1692 assert(phi == NULL, "the merge contains phis, not vice versa");
aoqi@0 1693 merge_memory_edges(n->as_MergeMem(), pnum, nophi);
// Memory is fully handled by merge_memory_edges(); skip the Phi update below.
aoqi@0 1694 continue;
aoqi@0 1695 default: // All normal stuff
aoqi@0 1696 if (phi == NULL) {
aoqi@0 1697 const JVMState* jvms = map()->jvms();
aoqi@0 1698 if (EliminateNestedLocks &&
aoqi@0 1699 jvms->is_mon(j) && jvms->is_monitor_box(j)) {
aoqi@0 1700 // BoxLock nodes are not commoning.
aoqi@0 1701 // Use old BoxLock node as merged box.
aoqi@0 1702 assert(newin->jvms()->is_monitor_box(j), "sanity");
aoqi@0 1703 // This assert also tests that nodes are BoxLock.
aoqi@0 1704 assert(BoxLockNode::same_slot(n, m), "sanity");
aoqi@0 1705 C->gvn_replace_by(n, m);
aoqi@0 1706 } else if (!check_elide_phi || !target->can_elide_SEL_phi(j)) {
aoqi@0 1707 phi = ensure_phi(j, nophi);
aoqi@0 1708 }
aoqi@0 1709 }
aoqi@0 1710 break;
aoqi@0 1711 }
aoqi@0 1712 }
aoqi@0 1713 // At this point, n might be top if:
aoqi@0 1714 // - there is no phi (because TypeFlow detected a conflict), or
aoqi@0 1715 // - the corresponding control edges is top (a dead incoming path)
aoqi@0 1716 // It is a bug if we create a phi which sees a garbage value on a live path.
aoqi@0 1717
aoqi@0 1718 if (phi != NULL) {
aoqi@0 1719 assert(n != top() || r->in(pnum) == top(), "live value must not be garbage");
aoqi@0 1720 assert(phi->region() == r, "");
aoqi@0 1721 phi->set_req(pnum, n); // Then add 'n' to the merge
aoqi@0 1722 if (pnum == PhiNode::Input) {
aoqi@0 1723 // Last merge for this Phi.
aoqi@0 1724 // So far, Phis have had a reasonable type from ciTypeFlow.
aoqi@0 1725 // Now _gvn will join that with the meet of current inputs.
aoqi@0 1726 // BOTTOM is never permissible here, 'cause pessimistically
aoqi@0 1727 // Phis of pointers cannot lose the basic pointer type.
aoqi@0 1728 debug_only(const Type* bt1 = phi->bottom_type());
aoqi@0 1729 assert(bt1 != Type::BOTTOM, "should not be building conflict phis");
aoqi@0 1730 map()->set_req(j, _gvn.transform_no_reclaim(phi));
aoqi@0 1731 debug_only(const Type* bt2 = phi->bottom_type());
aoqi@0 1732 assert(bt2->higher_equal_speculative(bt1), "must be consistent with type-flow");
aoqi@0 1733 record_for_igvn(phi);
aoqi@0 1734 }
aoqi@0 1735 }
aoqi@0 1736 } // End of for all values to be merged
aoqi@0 1737
aoqi@0 1738 if (pnum == PhiNode::Input &&
aoqi@0 1739 !r->in(0)) { // The occasional useless Region
aoqi@0 1740 assert(control() == r, "");
aoqi@0 1741 set_control(r->nonnull_req());
aoqi@0 1742 }
aoqi@0 1743
roland@7041 1744 map()->merge_replaced_nodes_with(newin);
roland@7041 1745
aoqi@0 1746 // newin has been subsumed into the lazy merge, and is now dead.
aoqi@0 1747 set_block(save_block);
aoqi@0 1748
aoqi@0 1749 stop(); // done with this guy, for now
aoqi@0 1750 }
aoqi@0 1751
aoqi@0 1752 if (TraceOptoParse) {
aoqi@0 1753 tty->print_cr(" on path %d", pnum);
aoqi@0 1754 }
aoqi@0 1755
aoqi@0 1756 // Done with this parser state.
aoqi@0 1757 assert(stopped(), "");
aoqi@0 1758 }
aoqi@0 1759
aoqi@0 1760
aoqi@0 1761 //--------------------------merge_memory_edges---------------------------------
// Merge the memory state 'n' arriving over path 'pnum' into the parser's
// current merged memory, slice by slice.
//
//  n     - incoming MergeMem (must not be NULL)
//  pnum  - input index on the current Region (and its Phis) for this path
//  nophi - true if no new Phis may be created here; slices that would need a
//          new split are then collected in a MergeMem hung on the base
//          memory Phi's input 'pnum'
//
// control() must be a Region.
aoqi@0 1762 void Parse::merge_memory_edges(MergeMemNode* n, int pnum, bool nophi) {
aoqi@0 1763 // (nophi means we must not create phis, because we already parsed here)
aoqi@0 1764 assert(n != NULL, "");
aoqi@0 1765 // Merge the inputs to the MergeMems
aoqi@0 1766 MergeMemNode* m = merged_memory();
aoqi@0 1767
aoqi@0 1768 assert(control()->is_Region(), "must be merging to a region");
aoqi@0 1769 RegionNode* r = control()->as_Region();
aoqi@0 1770
// base:    Phi for the base memory slice, once seen; transformed last.
// remerge: created on demand in the nophi case described above.
aoqi@0 1771 PhiNode* base = NULL;
aoqi@0 1772 MergeMemNode* remerge = NULL;
aoqi@0 1773 for (MergeMemStream mms(m, n); mms.next_non_empty2(); ) {
// p: this slice in the current merged memory; q: this slice in incoming 'n'.
aoqi@0 1774 Node *p = mms.force_memory();
aoqi@0 1775 Node *q = mms.memory2();
aoqi@0 1776 if (mms.is_empty() && nophi) {
aoqi@0 1777 // Trouble: No new splits allowed after a loop body is parsed.
aoqi@0 1778 // Instead, wire the new split into a MergeMem on the backedge.
aoqi@0 1779 // The optimizer will sort it out, slicing the phi.
aoqi@0 1780 if (remerge == NULL) {
aoqi@0 1781 assert(base != NULL, "");
aoqi@0 1782 assert(base->in(0) != NULL, "should not be xformed away");
aoqi@0 1783 remerge = MergeMemNode::make(C, base->in(pnum));
aoqi@0 1784 gvn().set_type(remerge, Type::MEMORY);
aoqi@0 1785 base->set_req(pnum, remerge);
aoqi@0 1786 }
aoqi@0 1787 remerge->set_memory_at(mms.alias_idx(), q);
aoqi@0 1788 continue;
aoqi@0 1789 }
aoqi@0 1790 assert(!q->is_MergeMem(), "");
// Pick the Phi to merge into: a (possibly new) memory Phi when the slices
// differ, otherwise an existing Phi at r if p already is one, else none.
aoqi@0 1791 PhiNode* phi;
aoqi@0 1792 if (p != q) {
aoqi@0 1793 phi = ensure_memory_phi(mms.alias_idx(), nophi);
aoqi@0 1794 } else {
aoqi@0 1795 if (p->is_Phi() && p->as_Phi()->region() == r)
aoqi@0 1796 phi = p->as_Phi();
aoqi@0 1797 else
aoqi@0 1798 phi = NULL;
aoqi@0 1799 }
aoqi@0 1800 // Insert q into local phi
aoqi@0 1801 if (phi != NULL) {
aoqi@0 1802 assert(phi->region() == r, "");
aoqi@0 1803 p = phi;
aoqi@0 1804 phi->set_req(pnum, q);
aoqi@0 1805 if (mms.at_base_memory()) {
aoqi@0 1806 base = phi; // delay transforming it
aoqi@0 1807 } else if (pnum == 1) {
// Path 1: transform the slice Phi now (base is handled after the loop).
aoqi@0 1808 record_for_igvn(phi);
aoqi@0 1809 p = _gvn.transform_no_reclaim(phi);
aoqi@0 1810 }
aoqi@0 1811 mms.set_memory(p);// store back through the iterator
aoqi@0 1812 }
aoqi@0 1813 }
aoqi@0 1814 // Transform base last, in case we must fiddle with remerging.
aoqi@0 1815 if (base != NULL && pnum == 1) {
aoqi@0 1816 record_for_igvn(base);
aoqi@0 1817 m->set_base_memory( _gvn.transform_no_reclaim(base) );
aoqi@0 1818 }
aoqi@0 1819 }
aoqi@0 1820
aoqi@0 1821
aoqi@0 1822 //------------------------ensure_phis_everywhere-------------------------------
aoqi@0 1823 void Parse::ensure_phis_everywhere() {
aoqi@0 1824 ensure_phi(TypeFunc::I_O);
aoqi@0 1825
aoqi@0 1826 // Ensure a phi on all currently known memories.
aoqi@0 1827 for (MergeMemStream mms(merged_memory()); mms.next_non_empty(); ) {
aoqi@0 1828 ensure_memory_phi(mms.alias_idx());
aoqi@0 1829 debug_only(mms.set_memory()); // keep the iterator happy
aoqi@0 1830 }
aoqi@0 1831
aoqi@0 1832 // Note: This is our only chance to create phis for memory slices.
aoqi@0 1833 // If we miss a slice that crops up later, it will have to be
aoqi@0 1834 // merged into the base-memory phi that we are building here.
aoqi@0 1835 // Later, the optimizer will comb out the knot, and build separate
aoqi@0 1836 // phi-loops for each memory slice that matters.
aoqi@0 1837
aoqi@0 1838 // Monitors must nest nicely and not get confused amongst themselves.
aoqi@0 1839 // Phi-ify everything up to the monitors, though.
aoqi@0 1840 uint monoff = map()->jvms()->monoff();
aoqi@0 1841 uint nof_monitors = map()->jvms()->nof_monitors();
aoqi@0 1842
aoqi@0 1843 assert(TypeFunc::Parms == map()->jvms()->locoff(), "parser map should contain only youngest jvms");
aoqi@0 1844 bool check_elide_phi = block()->is_SEL_head();
aoqi@0 1845 for (uint i = TypeFunc::Parms; i < monoff; i++) {
aoqi@0 1846 if (!check_elide_phi || !block()->can_elide_SEL_phi(i)) {
aoqi@0 1847 ensure_phi(i);
aoqi@0 1848 }
aoqi@0 1849 }
aoqi@0 1850
aoqi@0 1851 // Even monitors need Phis, though they are well-structured.
aoqi@0 1852 // This is true for OSR methods, and also for the rare cases where
aoqi@0 1853 // a monitor object is the subject of a replace_in_map operation.
aoqi@0 1854 // See bugs 4426707 and 5043395.
aoqi@0 1855 for (uint m = 0; m < nof_monitors; m++) {
aoqi@0 1856 ensure_phi(map()->jvms()->monitor_obj_offset(m));
aoqi@0 1857 }
aoqi@0 1858 }
aoqi@0 1859
aoqi@0 1860
aoqi@0 1861 //-----------------------------add_new_path------------------------------------
aoqi@0 1862 // Add a previously unaccounted predecessor to this block.
aoqi@0 1863 int Parse::Block::add_new_path() {
aoqi@0 1864 // If there is no map, return the lowest unused path number.
aoqi@0 1865 if (!is_merged()) return pred_count()+1; // there will be a map shortly
aoqi@0 1866
aoqi@0 1867 SafePointNode* map = start_map();
aoqi@0 1868 if (!map->control()->is_Region())
aoqi@0 1869 return pred_count()+1; // there may be a region some day
aoqi@0 1870 RegionNode* r = map->control()->as_Region();
aoqi@0 1871
aoqi@0 1872 // Add new path to the region.
aoqi@0 1873 uint pnum = r->req();
aoqi@0 1874 r->add_req(NULL);
aoqi@0 1875
aoqi@0 1876 for (uint i = 1; i < map->req(); i++) {
aoqi@0 1877 Node* n = map->in(i);
aoqi@0 1878 if (i == TypeFunc::Memory) {
aoqi@0 1879 // Ensure a phi on all currently known memories.
aoqi@0 1880 for (MergeMemStream mms(n->as_MergeMem()); mms.next_non_empty(); ) {
aoqi@0 1881 Node* phi = mms.memory();
aoqi@0 1882 if (phi->is_Phi() && phi->as_Phi()->region() == r) {
aoqi@0 1883 assert(phi->req() == pnum, "must be same size as region");
aoqi@0 1884 phi->add_req(NULL);
aoqi@0 1885 }
aoqi@0 1886 }
aoqi@0 1887 } else {
aoqi@0 1888 if (n->is_Phi() && n->as_Phi()->region() == r) {
aoqi@0 1889 assert(n->req() == pnum, "must be same size as region");
aoqi@0 1890 n->add_req(NULL);
aoqi@0 1891 }
aoqi@0 1892 }
aoqi@0 1893 }
aoqi@0 1894
aoqi@0 1895 return pnum;
aoqi@0 1896 }
aoqi@0 1897
aoqi@0 1898 //------------------------------ensure_phi-------------------------------------
aoqi@0 1899 // Turn the idx'th entry of the current map into a Phi
aoqi@0 1900 PhiNode *Parse::ensure_phi(int idx, bool nocreate) {
aoqi@0 1901 SafePointNode* map = this->map();
aoqi@0 1902 Node* region = map->control();
aoqi@0 1903 assert(region->is_Region(), "");
aoqi@0 1904
aoqi@0 1905 Node* o = map->in(idx);
aoqi@0 1906 assert(o != NULL, "");
aoqi@0 1907
aoqi@0 1908 if (o == top()) return NULL; // TOP always merges into TOP
aoqi@0 1909
aoqi@0 1910 if (o->is_Phi() && o->as_Phi()->region() == region) {
aoqi@0 1911 return o->as_Phi();
aoqi@0 1912 }
aoqi@0 1913
aoqi@0 1914 // Now use a Phi here for merging
aoqi@0 1915 assert(!nocreate, "Cannot build a phi for a block already parsed.");
aoqi@0 1916 const JVMState* jvms = map->jvms();
csahu@8316 1917 const Type* t = NULL;
aoqi@0 1918 if (jvms->is_loc(idx)) {
aoqi@0 1919 t = block()->local_type_at(idx - jvms->locoff());
aoqi@0 1920 } else if (jvms->is_stk(idx)) {
aoqi@0 1921 t = block()->stack_type_at(idx - jvms->stkoff());
aoqi@0 1922 } else if (jvms->is_mon(idx)) {
aoqi@0 1923 assert(!jvms->is_monitor_box(idx), "no phis for boxes");
aoqi@0 1924 t = TypeInstPtr::BOTTOM; // this is sufficient for a lock object
aoqi@0 1925 } else if ((uint)idx < TypeFunc::Parms) {
aoqi@0 1926 t = o->bottom_type(); // Type::RETURN_ADDRESS or such-like.
aoqi@0 1927 } else {
aoqi@0 1928 assert(false, "no type information for this phi");
aoqi@0 1929 }
aoqi@0 1930
aoqi@0 1931 // If the type falls to bottom, then this must be a local that
aoqi@0 1932 // is mixing ints and oops or some such. Forcing it to top
aoqi@0 1933 // makes it go dead.
aoqi@0 1934 if (t == Type::BOTTOM) {
aoqi@0 1935 map->set_req(idx, top());
aoqi@0 1936 return NULL;
aoqi@0 1937 }
aoqi@0 1938
aoqi@0 1939 // Do not create phis for top either.
aoqi@0 1940 // A top on a non-null control flow must be an unused even after the.phi.
aoqi@0 1941 if (t == Type::TOP || t == Type::HALF) {
aoqi@0 1942 map->set_req(idx, top());
aoqi@0 1943 return NULL;
aoqi@0 1944 }
aoqi@0 1945
aoqi@0 1946 PhiNode* phi = PhiNode::make(region, o, t);
aoqi@0 1947 gvn().set_type(phi, t);
aoqi@0 1948 if (C->do_escape_analysis()) record_for_igvn(phi);
aoqi@0 1949 map->set_req(idx, phi);
aoqi@0 1950 return phi;
aoqi@0 1951 }
aoqi@0 1952
aoqi@0 1953 //--------------------------ensure_memory_phi----------------------------------
aoqi@0 1954 // Turn the idx'th slice of the current memory into a Phi
aoqi@0 1955 PhiNode *Parse::ensure_memory_phi(int idx, bool nocreate) {
aoqi@0 1956 MergeMemNode* mem = merged_memory();
aoqi@0 1957 Node* region = control();
aoqi@0 1958 assert(region->is_Region(), "");
aoqi@0 1959
aoqi@0 1960 Node *o = (idx == Compile::AliasIdxBot)? mem->base_memory(): mem->memory_at(idx);
aoqi@0 1961 assert(o != NULL && o != top(), "");
aoqi@0 1962
aoqi@0 1963 PhiNode* phi;
aoqi@0 1964 if (o->is_Phi() && o->as_Phi()->region() == region) {
aoqi@0 1965 phi = o->as_Phi();
aoqi@0 1966 if (phi == mem->base_memory() && idx >= Compile::AliasIdxRaw) {
aoqi@0 1967 // clone the shared base memory phi to make a new memory split
aoqi@0 1968 assert(!nocreate, "Cannot build a phi for a block already parsed.");
aoqi@0 1969 const Type* t = phi->bottom_type();
aoqi@0 1970 const TypePtr* adr_type = C->get_adr_type(idx);
aoqi@0 1971 phi = phi->slice_memory(adr_type);
aoqi@0 1972 gvn().set_type(phi, t);
aoqi@0 1973 }
aoqi@0 1974 return phi;
aoqi@0 1975 }
aoqi@0 1976
aoqi@0 1977 // Now use a Phi here for merging
aoqi@0 1978 assert(!nocreate, "Cannot build a phi for a block already parsed.");
aoqi@0 1979 const Type* t = o->bottom_type();
aoqi@0 1980 const TypePtr* adr_type = C->get_adr_type(idx);
aoqi@0 1981 phi = PhiNode::make(region, o, t, adr_type);
aoqi@0 1982 gvn().set_type(phi, t);
aoqi@0 1983 if (idx == Compile::AliasIdxBot)
aoqi@0 1984 mem->set_base_memory(phi);
aoqi@0 1985 else
aoqi@0 1986 mem->set_memory_at(idx, phi);
aoqi@0 1987 return phi;
aoqi@0 1988 }
aoqi@0 1989
aoqi@0 1990 //------------------------------call_register_finalizer-----------------------
aoqi@0 1991 // Check the klass of the receiver and call register_finalizer if the
aoqi@0 1992 // class needs finalization.
// The receiver is local 0. When the receiver's class is loaded, not known
// exactly, and has no finalizable subclass, a dependency is recorded and no
// code is emitted. Otherwise a test of JVM_ACC_HAS_FINALIZER in the klass's
// access flags guards a runtime call to register_finalizer, and the two
// paths are joined by a Region with I/O and memory Phis.
aoqi@0 1993 void Parse::call_register_finalizer() {
aoqi@0 1994 Node* receiver = local(0);
aoqi@0 1995 assert(receiver != NULL && receiver->bottom_type()->isa_instptr() != NULL,
aoqi@0 1996 "must have non-null instance type");
aoqi@0 1997
aoqi@0 1998 const TypeInstPtr *tinst = receiver->bottom_type()->isa_instptr();
aoqi@0 1999 if (tinst != NULL && tinst->klass()->is_loaded() && !tinst->klass_is_exact()) {
aoqi@0 2000 // The type isn't known exactly so see if CHA tells us anything.
aoqi@0 2001 ciInstanceKlass* ik = tinst->klass()->as_instance_klass();
aoqi@0 2002 if (!Dependencies::has_finalizable_subclass(ik)) {
aoqi@0 2003 // No finalizable subclasses so skip the dynamic check.
aoqi@0 2004 C->dependencies()->assert_has_no_finalizable_subclasses(ik);
aoqi@0 2005 return;
aoqi@0 2006 }
aoqi@0 2007 }
aoqi@0 2008
aoqi@0 2009 // Insert a dynamic test for whether the instance needs
aoqi@0 2010 // finalization. In general this will fold up since the concrete
aoqi@0 2011 // class is often visible so the access flags are constant.
aoqi@0 2012 Node* klass_addr = basic_plus_adr( receiver, receiver, oopDesc::klass_offset_in_bytes() );
zmajo@7341 2013 Node* klass = _gvn.transform(LoadKlassNode::make(_gvn, NULL, immutable_memory(), klass_addr, TypeInstPtr::KLASS));
aoqi@0 2014
aoqi@0 2015 Node* access_flags_addr = basic_plus_adr(klass, klass, in_bytes(Klass::access_flags_offset()));
aoqi@0 2016 Node* access_flags = make_load(NULL, access_flags_addr, TypeInt::INT, T_INT, MemNode::unordered);
aoqi@0 2017
// test is true when (access_flags & JVM_ACC_HAS_FINALIZER) != 0.
aoqi@0 2018 Node* mask = _gvn.transform(new (C) AndINode(access_flags, intcon(JVM_ACC_HAS_FINALIZER)));
aoqi@0 2019 Node* check = _gvn.transform(new (C) CmpINode(mask, intcon(0)));
aoqi@0 2020 Node* test = _gvn.transform(new (C) BoolNode(check, BoolTest::ne));
aoqi@0 2021
aoqi@0 2022 IfNode* iff = create_and_map_if(control(), test, PROB_MAX, COUNT_UNKNOWN);
aoqi@0 2023
// Region input 1: flag clear (no registration); input 2: after the call.
aoqi@0 2024 RegionNode* result_rgn = new (C) RegionNode(3);
aoqi@0 2025 record_for_igvn(result_rgn);
aoqi@0 2026
aoqi@0 2027 Node *skip_register = _gvn.transform(new (C) IfFalseNode(iff));
aoqi@0 2028 result_rgn->init_req(1, skip_register);
aoqi@0 2029
aoqi@0 2030 Node *needs_register = _gvn.transform(new (C) IfTrueNode(iff));
aoqi@0 2031 set_control(needs_register);
aoqi@0 2032 if (stopped()) {
aoqi@0 2033 // There is no slow path.
aoqi@0 2034 result_rgn->init_req(2, top());
aoqi@0 2035 } else {
aoqi@0 2036 Node *call = make_runtime_call(RC_NO_LEAF,
aoqi@0 2037 OptoRuntime::register_finalizer_Type(),
aoqi@0 2038 OptoRuntime::register_finalizer_Java(),
aoqi@0 2039 NULL, TypePtr::BOTTOM,
aoqi@0 2040 receiver);
aoqi@0 2041 make_slow_call_ex(call, env()->Throwable_klass(), true);
aoqi@0 2042
// The call's own I/O and memory inputs are the state from before the call,
// i.e. the state on the path that skips registration.
aoqi@0 2043 Node* fast_io = call->in(TypeFunc::I_O);
aoqi@0 2044 Node* fast_mem = call->in(TypeFunc::Memory);
aoqi@0 2045 // These two phis are pre-filled with copies of the fast IO and Memory
aoqi@0 2046 Node* io_phi = PhiNode::make(result_rgn, fast_io, Type::ABIO);
aoqi@0 2047 Node* mem_phi = PhiNode::make(result_rgn, fast_mem, Type::MEMORY, TypePtr::BOTTOM);
aoqi@0 2048
// Input 2 of the region and both phis takes the state after the call.
aoqi@0 2049 result_rgn->init_req(2, control());
aoqi@0 2050 io_phi ->init_req(2, i_o());
aoqi@0 2051 mem_phi ->init_req(2, reset_memory());
aoqi@0 2052
aoqi@0 2053 set_all_memory( _gvn.transform(mem_phi) );
aoqi@0 2054 set_i_o( _gvn.transform(io_phi) );
aoqi@0 2055 }
aoqi@0 2056
aoqi@0 2057 set_control( _gvn.transform(result_rgn) );
aoqi@0 2058 }
aoqi@0 2059
aoqi@0 2060 // Add check to deoptimize if RTM state is not ProfileRTM
// Compiled to an empty body unless INCLUDE_RTM_OPT is set; emits nothing
// unless C->profile_rtm() is true. The check loads rtm_state from the
// method's MethodData and takes an uncommon trap
// (Reason_rtm_state_change / Action_make_not_entrant) when it is not
// ProfileRTM.
aoqi@0 2061 void Parse::rtm_deopt() {
aoqi@0 2062 #if INCLUDE_RTM_OPT
aoqi@0 2063 if (C->profile_rtm()) {
aoqi@0 2064 assert(C->method() != NULL, "only for normal compilations");
aoqi@0 2065 assert(!C->method()->method_data()->is_empty(), "MDO is needed to record RTM state");
aoqi@0 2066 assert(depth() == 1, "generate check only for main compiled method");
aoqi@0 2067
aoqi@0 2068 // Set starting bci for uncommon trap.
aoqi@0 2069 set_parse_bci(is_osr_parse() ? osr_bci() : 0);
aoqi@0 2070
aoqi@0 2071 // Load the rtm_state from the MethodData.
aoqi@0 2072 const TypePtr* adr_type = TypeMetadataPtr::make(C->method()->method_data());
aoqi@0 2073 Node* mdo = makecon(adr_type);
aoqi@0 2074 int offset = MethodData::rtm_state_offset_in_bytes();
aoqi@0 2075 Node* adr_node = basic_plus_adr(mdo, mdo, offset);
aoqi@0 2076 Node* rtm_state = make_load(control(), adr_node, TypeInt::INT, T_INT, adr_type, MemNode::unordered);
aoqi@0 2077
aoqi@0 2078 // Separate Load from Cmp by Opaque.
aoqi@0 2079 // In expand_macro_nodes() it will be replaced either
aoqi@0 2080 // with this load when there are locks in the code
aoqi@0 2081 // or with ProfileRTM (cmp->in(2)) otherwise so that
aoqi@0 2082 // the check will fold.
aoqi@0 2083 Node* profile_state = makecon(TypeInt::make(ProfileRTM));
aoqi@0 2084 Node* opq = _gvn.transform( new (C) Opaque3Node(C, rtm_state, Opaque3Node::RTM_OPT) );
aoqi@0 2085 Node* chk = _gvn.transform( new (C) CmpINode(opq, profile_state) );
aoqi@0 2086 Node* tst = _gvn.transform( new (C) BoolNode(chk, BoolTest::eq) );
aoqi@0 2087 // Branch to failure if state was changed
aoqi@0 2088 { BuildCutout unless(this, tst, PROB_ALWAYS);
aoqi@0 2089 uncommon_trap(Deoptimization::Reason_rtm_state_change,
aoqi@0 2090 Deoptimization::Action_make_not_entrant);
aoqi@0 2091 }
aoqi@0 2092 }
aoqi@0 2093 #endif
aoqi@0 2094 }
aoqi@0 2095
aoqi@0 2096 //------------------------------return_current---------------------------------
aoqi@0 2097 // Append current _map to _exit_return
// Merges the state of the current path (control, i_o, memory and, when
// 'value' is non-NULL, the returned value) into the nodes held by _exits,
// then ends the current path with stop_and_kill_map().
//
// value: node producing the returned value, or NULL when there is nothing to
//        append to the result phi.
aoqi@0 2098 void Parse::return_current(Node* value) {
// When RegisterFinalizersAtInit is set and the method being parsed is the
// Object.<init> intrinsic, emit the finalizer registration before returning.
aoqi@0 2099 if (RegisterFinalizersAtInit &&
aoqi@0 2100 method()->intrinsic_id() == vmIntrinsics::_Object_init) {
aoqi@0 2101 call_register_finalizer();
aoqi@0 2102 }
aoqi@0 2103
aoqi@0 2104 // Do not set_parse_bci, so that return goo is credited to the return insn.
aoqi@0 2105 set_bci(InvocationEntryBci);
// Emit the unlock for a synchronized method, using the box and object nodes
// recorded in _synch_lock.
aoqi@0 2106 if (method()->is_synchronized() && GenerateSynchronizationCode) {
aoqi@0 2107 shared_unlock(_synch_lock->box_node(), _synch_lock->obj_node());
aoqi@0 2108 }
aoqi@0 2109 if (C->env()->dtrace_method_probes()) {
aoqi@0 2110 make_dtrace_method_exit(method());
aoqi@0 2111 }
// Append this path's control and i_o as new inputs of the nodes found at the
// Control and I_O inputs of the exit map.
aoqi@0 2112 SafePointNode* exit_return = _exits.map();
aoqi@0 2113 exit_return->in( TypeFunc::Control )->add_req( control() );
aoqi@0 2114 exit_return->in( TypeFunc::I_O )->add_req( i_o () );
aoqi@0 2115 Node *mem = exit_return->in( TypeFunc::Memory );
// Walk the exit MergeMem together with the current merged memory and append
// this path's slice (memory2) to the corresponding exit-side memory node.
aoqi@0 2116 for (MergeMemStream mms(mem->as_MergeMem(), merged_memory()); mms.next_non_empty2(); ) {
aoqi@0 2117 if (mms.is_empty()) {
aoqi@0 2118 // get a copy of the base memory, and patch just this one input
aoqi@0 2119 const TypePtr* adr_type = mms.adr_type(C);
aoqi@0 2120 Node* phi = mms.force_memory()->as_Phi()->slice_memory(adr_type);
aoqi@0 2121 assert(phi->as_Phi()->region() == mms.base_memory()->in(0), "");
aoqi@0 2122 gvn().set_type_bottom(phi);
aoqi@0 2123 phi->del_req(phi->req()-1); // prepare to re-patch
aoqi@0 2124 mms.set_memory(phi);
aoqi@0 2125 }
aoqi@0 2126 mms.memory()->add_req(mms.memory2());
aoqi@0 2127 }
aoqi@0 2128
aoqi@0 2129 // frame pointer is always same, already captured
aoqi@0 2130 if (value != NULL) {
aoqi@0 2131 // If returning oops to an interface-return, there is a silent free
aoqi@0 2132 // cast from oop to interface allowed by the Verifier. Make it explicit
aoqi@0 2133 // here.
// 'phi' is argument 0 of _exits; the (possibly cast) value is appended to it
// at the end of this branch.
aoqi@0 2134 Node* phi = _exits.argument(0);
aoqi@0 2135 const TypeInstPtr *tr = phi->bottom_type()->isa_instptr();
shshahma@8422 2136 if (tr && tr->klass()->is_loaded() &&
shshahma@8422 2137 tr->klass()->is_interface()) {
// The result type is a loaded interface: cast only when the returned value's
// type is a loaded non-interface instance type.
aoqi@0 2138 const TypeInstPtr *tp = value->bottom_type()->isa_instptr();
aoqi@0 2139 if (tp && tp->klass()->is_loaded() &&
aoqi@0 2140 !tp->klass()->is_interface()) {
aoqi@0 2141 // sharpen the type eagerly; this eases certain assert checking
aoqi@0 2142 if (tp->higher_equal(TypeInstPtr::NOTNULL))
aoqi@0 2143 tr = tr->join_speculative(TypeInstPtr::NOTNULL)->is_instptr();
shshahma@8422 2144 value = _gvn.transform(new (C) CheckCastPPNode(0, value, tr));
shshahma@8422 2145 }
shshahma@8422 2146 } else {
shshahma@8422 2147 // Also handle returns of oop-arrays to an arrays-of-interface return
// phi_tip / val_tip are filled in by get_arrays_base_elements(); the cast to
// the phi's type is added only when both are non-NULL and loaded, the phi
// side is an interface and the value side is not.
shshahma@8422 2148 const TypeInstPtr* phi_tip;
shshahma@8422 2149 const TypeInstPtr* val_tip;
shshahma@8422 2150 Type::get_arrays_base_elements(phi->bottom_type(), value->bottom_type(), &phi_tip, &val_tip);
shshahma@8422 2151 if (phi_tip != NULL && phi_tip->is_loaded() && phi_tip->klass()->is_interface() &&
shshahma@8422 2152 val_tip != NULL && val_tip->is_loaded() && !val_tip->klass()->is_interface()) {
shshahma@8422 2153 value = _gvn.transform(new (C) CheckCastPPNode(0, value, phi->bottom_type()));
aoqi@0 2154 }
aoqi@0 2155 }
aoqi@0 2156 phi->add_req(value);
aoqi@0 2157 }
aoqi@0 2158
// The first return seen transfers the current map's replaced nodes to the exit
// map and clears _first_return; every later return merges them instead.
roland@7041 2159 if (_first_return) {
roland@7041 2160 _exits.map()->transfer_replaced_nodes_from(map(), _new_idx);
roland@7041 2161 _first_return = false;
roland@7041 2162 } else {
roland@7041 2163 _exits.map()->merge_replaced_nodes_with(map());
roland@7041 2164 }
roland@7041 2165
aoqi@0 2166 stop_and_kill_map(); // This CFG path dies here
aoqi@0 2167 }
aoqi@0 2168
aoqi@0 2169
aoqi@0 2170 //------------------------------add_safepoint----------------------------------
// Insert a SafePointNode on the current control path unless the current
// control already comes from a call that is a guaranteed safepoint or from
// another safepoint. On return, control() is the transformed safepoint node
// (or unchanged when the safepoint was elided).
aoqi@0 2171 void Parse::add_safepoint() {
aoqi@0 2172 // See if we can avoid this safepoint. No need for a SafePoint immediately
aoqi@0 2173 // after a Call (except Leaf Call) or another SafePoint.
aoqi@0 2174 Node *proj = control();
// 'parms' is the number of inputs the new node is created with: one extra
// slot is reserved when the platform wants the polling address as an input.
aoqi@0 2175 bool add_poll_param = SafePointNode::needs_polling_address_input();
aoqi@0 2176 uint parms = add_poll_param ? TypeFunc::Parms+1 : TypeFunc::Parms;
aoqi@0 2177 if( proj->is_Proj() ) {
aoqi@0 2178 Node *n0 = proj->in(0);
// When the projection hangs off a Catch, step two control inputs further up;
// the assert documents that a call is expected there.
aoqi@0 2179 if( n0->is_Catch() ) {
aoqi@0 2180 n0 = n0->in(0)->in(0);
aoqi@0 2181 assert( n0->is_Call(), "expect a call here" );
aoqi@0 2182 }
aoqi@0 2183 if( n0->is_Call() ) {
aoqi@0 2184 if( n0->as_Call()->guaranteed_safepoint() )
aoqi@0 2185 return;
aoqi@0 2186 } else if( n0->is_SafePoint() && n0->req() >= parms ) {
aoqi@0 2187 return;
aoqi@0 2188 }
aoqi@0 2189 }
aoqi@0 2190
aoqi@0 2191 // Clear out dead values from the debug info.
aoqi@0 2192 kill_dead_locals();
aoqi@0 2193
aoqi@0 2194 // Clone the JVM State
aoqi@0 2195 SafePointNode *sfpnt = new (C) SafePointNode(parms, NULL);
aoqi@0 2196
aoqi@0 2197 // Capture memory state BEFORE a SafePoint. Since we can block at a
aoqi@0 2198 // SafePoint we need our GC state to be safe; i.e. we need all our current
aoqi@0 2199 // write barriers (card marks) to not float down after the SafePoint so we
aoqi@0 2200 // must read raw memory. Likewise we need all oop stores to match the card
aoqi@0 2201 // marks. If deopt can happen, we need ALL stores (we need the correct JVM
aoqi@0 2202 // state on a deopt).
aoqi@0 2203
aoqi@0 2204 // We do not need to WRITE the memory state after a SafePoint. The control
aoqi@0 2205 // edge will keep card-marks and oop-stores from floating up from below a
aoqi@0 2206 // SafePoint and our true dependency added here will keep them from floating
aoqi@0 2207 // down below a SafePoint.
aoqi@0 2208
aoqi@0 2209 // Clone the current memory state
aoqi@0 2210 Node* mem = MergeMemNode::make(C, map()->memory());
aoqi@0 2211
aoqi@0 2212 mem = _gvn.transform(mem);
aoqi@0 2213
aoqi@0 2214 // Pass control through the safepoint
aoqi@0 2215 sfpnt->init_req(TypeFunc::Control , control());
aoqi@0 2216 // Fix edges normally used by a call
// Only Control and Memory carry real inputs; I_O, ReturnAdr and FramePtr are
// set to top().
aoqi@0 2217 sfpnt->init_req(TypeFunc::I_O , top() );
aoqi@0 2218 sfpnt->init_req(TypeFunc::Memory , mem );
aoqi@0 2219 sfpnt->init_req(TypeFunc::ReturnAdr, top() );
aoqi@0 2220 sfpnt->init_req(TypeFunc::FramePtr , top() );
aoqi@0 2221
aoqi@0 2222 // Create a node for the polling address
// The address comes from os::get_polling_page() and fills the extra input
// slot reserved through 'parms' above.
aoqi@0 2223 if( add_poll_param ) {
aoqi@0 2224 Node *polladr = ConPNode::make(C, (address)os::get_polling_page());
aoqi@0 2225 sfpnt->init_req(TypeFunc::Parms+0, _gvn.transform(polladr));
aoqi@0 2226 }
aoqi@0 2227
aoqi@0 2228 // Fix up the JVM State edges
aoqi@0 2229 add_safepoint_edges(sfpnt);
// The transform result is re-checked with is_SafePoint() below before it is
// attached to the root.
aoqi@0 2230 Node *transformed_sfpnt = _gvn.transform(sfpnt);
aoqi@0 2231 set_control(transformed_sfpnt);
aoqi@0 2232
aoqi@0 2233 // Provide an edge from root to safepoint. This makes the safepoint
aoqi@0 2234 // appear useful until the parse has completed.
aoqi@0 2235 if( OptoRemoveUseless && transformed_sfpnt->is_SafePoint() ) {
aoqi@0 2236 assert(C->root() != NULL, "Expect parse is still valid");
aoqi@0 2237 C->root()->add_prec(transformed_sfpnt);
aoqi@0 2238 }
aoqi@0 2239 }
aoqi@0 2240
aoqi@0 2241 #ifndef PRODUCT
aoqi@0 2242 //------------------------show_parse_info--------------------------------------
aoqi@0 2243 void Parse::show_parse_info() {
aoqi@0 2244 InlineTree* ilt = NULL;
aoqi@0 2245 if (C->ilt() != NULL) {
aoqi@0 2246 JVMState* caller_jvms = is_osr_parse() ? caller()->caller() : caller();
aoqi@0 2247 ilt = InlineTree::find_subtree_from_root(C->ilt(), caller_jvms, method());
aoqi@0 2248 }
aoqi@0 2249 if (PrintCompilation && Verbose) {
aoqi@0 2250 if (depth() == 1) {
aoqi@0 2251 if( ilt->count_inlines() ) {
aoqi@0 2252 tty->print(" __inlined %d (%d bytes)", ilt->count_inlines(),
aoqi@0 2253 ilt->count_inline_bcs());
aoqi@0 2254 tty->cr();
aoqi@0 2255 }
aoqi@0 2256 } else {
aoqi@0 2257 if (method()->is_synchronized()) tty->print("s");
aoqi@0 2258 if (method()->has_exception_handlers()) tty->print("!");
aoqi@0 2259 // Check this is not the final compiled version
aoqi@0 2260 if (C->trap_can_recompile()) {
aoqi@0 2261 tty->print("-");
aoqi@0 2262 } else {
aoqi@0 2263 tty->print(" ");
aoqi@0 2264 }
aoqi@0 2265 method()->print_short_name();
aoqi@0 2266 if (is_osr_parse()) {
aoqi@0 2267 tty->print(" @ %d", osr_bci());
aoqi@0 2268 }
aoqi@0 2269 tty->print(" (%d bytes)",method()->code_size());
aoqi@0 2270 if (ilt->count_inlines()) {
aoqi@0 2271 tty->print(" __inlined %d (%d bytes)", ilt->count_inlines(),
aoqi@0 2272 ilt->count_inline_bcs());
aoqi@0 2273 }
aoqi@0 2274 tty->cr();
aoqi@0 2275 }
aoqi@0 2276 }
aoqi@0 2277 if (PrintOpto && (depth() == 1 || PrintOptoInlining)) {
aoqi@0 2278 // Print that we succeeded; suppress this message on the first osr parse.
aoqi@0 2279
aoqi@0 2280 if (method()->is_synchronized()) tty->print("s");
aoqi@0 2281 if (method()->has_exception_handlers()) tty->print("!");
aoqi@0 2282 // Check this is not the final compiled version
aoqi@0 2283 if (C->trap_can_recompile() && depth() == 1) {
aoqi@0 2284 tty->print("-");
aoqi@0 2285 } else {
aoqi@0 2286 tty->print(" ");
aoqi@0 2287 }
aoqi@0 2288 if( depth() != 1 ) { tty->print(" "); } // missing compile count
aoqi@0 2289 for (int i = 1; i < depth(); ++i) { tty->print(" "); }
aoqi@0 2290 method()->print_short_name();
aoqi@0 2291 if (is_osr_parse()) {
aoqi@0 2292 tty->print(" @ %d", osr_bci());
aoqi@0 2293 }
aoqi@0 2294 if (ilt->caller_bci() != -1) {
aoqi@0 2295 tty->print(" @ %d", ilt->caller_bci());
aoqi@0 2296 }
aoqi@0 2297 tty->print(" (%d bytes)",method()->code_size());
aoqi@0 2298 if (ilt->count_inlines()) {
aoqi@0 2299 tty->print(" __inlined %d (%d bytes)", ilt->count_inlines(),
aoqi@0 2300 ilt->count_inline_bcs());
aoqi@0 2301 }
aoqi@0 2302 tty->cr();
aoqi@0 2303 }
aoqi@0 2304 }
aoqi@0 2305
aoqi@0 2306
aoqi@0 2307 //------------------------------dump-------------------------------------------
aoqi@0 2308 // Dump information associated with the bytecodes of current _method
aoqi@0 2309 void Parse::dump() {
aoqi@0 2310 if( method() != NULL ) {
aoqi@0 2311 // Iterate over bytecodes
aoqi@0 2312 ciBytecodeStream iter(method());
aoqi@0 2313 for( Bytecodes::Code bc = iter.next(); bc != ciBytecodeStream::EOBC() ; bc = iter.next() ) {
aoqi@0 2314 dump_bci( iter.cur_bci() );
aoqi@0 2315 tty->cr();
aoqi@0 2316 }
aoqi@0 2317 }
aoqi@0 2318 }
aoqi@0 2319
aoqi@0 2320 // Dump information associated with a byte code index, 'bci'
aoqi@0 2321 void Parse::dump_bci(int bci) {
aoqi@0 2322 // Output info on merge-points, cloning, and within _jsr..._ret
aoqi@0 2323 // NYI
aoqi@0 2324 tty->print(" bci:%d", bci);
aoqi@0 2325 }
aoqi@0 2326
aoqi@0 2327 #endif

mercurial