New src/share/vm/opto/callnode.cpp

   1 /*
   2  * Copyright 1997-2008 Sun Microsystems, Inc.  All Rights Reserved.
   3  * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
   4  *
   5  * This code is free software; you can redistribute it and/or modify it
   6  * under the terms of the GNU General Public License version 2 only, as
   7  * published by the Free Software Foundation.
   8  *
   9  * This code is distributed in the hope that it will be useful, but WITHOUT
  10  * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
  11  * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
  12  * version 2 for more details (a copy is included in the LICENSE file that
  13  * accompanied this code).
  14  *
  15  * You should have received a copy of the GNU General Public License version
  16  * 2 along with this work; if not, write to the Free Software Foundation,
  17  * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
  18  *
  19  * Please contact Sun Microsystems, Inc., 4150 Network Circle, Santa Clara,
  20  * CA 95054 USA or visit www.sun.com if you need additional information or
  21  * have any questions.
  22  *
  23  */
  24 
  25 // Portions of code courtesy of Clifford Click
  26 
  27 // Optimization - Graph Style
  28 
  29 #include "incls/_precompiled.incl"
  30 #include "incls/_callnode.cpp.incl"
  31 
  32 //=============================================================================
  33 uint StartNode::size_of() const { return sizeof(*this); }
  34 uint StartNode::cmp( const Node &n ) const
  35 { return _domain == ((StartNode&)n)._domain; }
  36 const Type *StartNode::bottom_type() const { return _domain; }
  37 const Type *StartNode::Value(PhaseTransform *phase) const { return _domain; }
  38 #ifndef PRODUCT
  39 void StartNode::dump_spec(outputStream *st) const { st->print(" #"); _domain->dump_on(st);}
  40 #endif
  41 
  42 //------------------------------Ideal------------------------------------------
  43 Node *StartNode::Ideal(PhaseGVN *phase, bool can_reshape){
  44   return remove_dead_region(phase, can_reshape) ? this : NULL;
  45 }
  46 
  47 //------------------------------calling_convention-----------------------------
  48 void StartNode::calling_convention( BasicType* sig_bt, VMRegPair *parm_regs, uint argcnt ) const {
  49   Matcher::calling_convention( sig_bt, parm_regs, argcnt, false );
  50 }
  51 
  52 //------------------------------Registers--------------------------------------
  53 const RegMask &StartNode::in_RegMask(uint) const {
  54   return RegMask::Empty;
  55 }
  56 
  57 //------------------------------match------------------------------------------
  58 // Construct projections for incoming parameters, and their RegMask info
  59 Node *StartNode::match( const ProjNode *proj, const Matcher *match ) {
  60   switch (proj->_con) {
  61   case TypeFunc::Control:
  62   case TypeFunc::I_O:
  63   case TypeFunc::Memory:
  64     return new (match->C, 1) MachProjNode(this,proj->_con,RegMask::Empty,MachProjNode::unmatched_proj);
  65   case TypeFunc::FramePtr:
  66     return new (match->C, 1) MachProjNode(this,proj->_con,Matcher::c_frame_ptr_mask, Op_RegP);
  67   case TypeFunc::ReturnAdr:
  68     return new (match->C, 1) MachProjNode(this,proj->_con,match->_return_addr_mask,Op_RegP);
  69   case TypeFunc::Parms:
  70   default: {
  71       uint parm_num = proj->_con - TypeFunc::Parms;
  72       const Type *t = _domain->field_at(proj->_con);
  73       if (t->base() == Type::Half)  // 2nd half of Longs and Doubles
  74         return new (match->C, 1) ConNode(Type::TOP);
  75       uint ideal_reg = Matcher::base2reg[t->base()];
  76       RegMask &rm = match->_calling_convention_mask[parm_num];
  77       return new (match->C, 1) MachProjNode(this,proj->_con,rm,ideal_reg);
  78     }
  79   }
  80   return NULL;
  81 }
  82 
  83 //------------------------------StartOSRNode----------------------------------
  84 // The method start node for an on stack replacement adapter
  85 
  86 //------------------------------osr_domain-----------------------------
  87 const TypeTuple *StartOSRNode::osr_domain() {
  88   const Type **fields = TypeTuple::fields(2);
  89   fields[TypeFunc::Parms+0] = TypeRawPtr::BOTTOM;  // address of osr buffer
  90 
  91   return TypeTuple::make(TypeFunc::Parms+1, fields);
  92 }
  93 
  94 //=============================================================================
  95 const char * const ParmNode::names[TypeFunc::Parms+1] = {
  96   "Control", "I_O", "Memory", "FramePtr", "ReturnAdr", "Parms"
  97 };
  98 
  99 #ifndef PRODUCT
 100 void ParmNode::dump_spec(outputStream *st) const {
 101   if( _con < TypeFunc::Parms ) {
 102     st->print(names[_con]);
 103   } else {
 104     st->print("Parm%d: ",_con-TypeFunc::Parms);
 105     // Verbose and WizardMode dump bottom_type for all nodes
 106     if( !Verbose && !WizardMode )   bottom_type()->dump_on(st);
 107   }
 108 }
 109 #endif
 110 
 111 uint ParmNode::ideal_reg() const {
 112   switch( _con ) {
 113   case TypeFunc::Control  : // fall through
 114   case TypeFunc::I_O      : // fall through
 115   case TypeFunc::Memory   : return 0;
 116   case TypeFunc::FramePtr : // fall through
 117   case TypeFunc::ReturnAdr: return Op_RegP;
 118   default                 : assert( _con > TypeFunc::Parms, "" );
 119     // fall through
 120   case TypeFunc::Parms    : {
 121     // Type of argument being passed
 122     const Type *t = in(0)->as_Start()->_domain->field_at(_con);
 123     return Matcher::base2reg[t->base()];
 124   }
 125   }
 126   ShouldNotReachHere();
 127   return 0;
 128 }
 129 
 130 //=============================================================================
 131 ReturnNode::ReturnNode(uint edges, Node *cntrl, Node *i_o, Node *memory, Node *frameptr, Node *retadr ) : Node(edges) {
 132   init_req(TypeFunc::Control,cntrl);
 133   init_req(TypeFunc::I_O,i_o);
 134   init_req(TypeFunc::Memory,memory);
 135   init_req(TypeFunc::FramePtr,frameptr);
 136   init_req(TypeFunc::ReturnAdr,retadr);
 137 }
 138 
 139 Node *ReturnNode::Ideal(PhaseGVN *phase, bool can_reshape){
 140   return remove_dead_region(phase, can_reshape) ? this : NULL;
 141 }
 142 
 143 const Type *ReturnNode::Value( PhaseTransform *phase ) const {
 144   return ( phase->type(in(TypeFunc::Control)) == Type::TOP)
 145     ? Type::TOP
 146     : Type::BOTTOM;
 147 }
 148 
 149 // Do we Match on this edge index or not?  No edges on return nodes
 150 uint ReturnNode::match_edge(uint idx) const {
 151   return 0;
 152 }
 153 
 154 
 155 #ifndef PRODUCT
 156 void ReturnNode::dump_req() const {
 157   // Dump the required inputs, enclosed in '(' and ')'
 158   uint i;                       // Exit value of loop
 159   for( i=0; i<req(); i++ ) {    // For all required inputs
 160     if( i == TypeFunc::Parms ) tty->print("returns");
 161     if( in(i) ) tty->print("%c%d ", Compile::current()->node_arena()->contains(in(i)) ? ' ' : 'o', in(i)->_idx);
 162     else tty->print("_ ");
 163   }
 164 }
 165 #endif
 166 
 167 //=============================================================================
 168 RethrowNode::RethrowNode(
 169   Node* cntrl,
 170   Node* i_o,
 171   Node* memory,
 172   Node* frameptr,
 173   Node* ret_adr,
 174   Node* exception
 175 ) : Node(TypeFunc::Parms + 1) {
 176   init_req(TypeFunc::Control  , cntrl    );
 177   init_req(TypeFunc::I_O      , i_o      );
 178   init_req(TypeFunc::Memory   , memory   );
 179   init_req(TypeFunc::FramePtr , frameptr );
 180   init_req(TypeFunc::ReturnAdr, ret_adr);
 181   init_req(TypeFunc::Parms    , exception);
 182 }
 183 
 184 Node *RethrowNode::Ideal(PhaseGVN *phase, bool can_reshape){
 185   return remove_dead_region(phase, can_reshape) ? this : NULL;
 186 }
 187 
 188 const Type *RethrowNode::Value( PhaseTransform *phase ) const {
 189   return (phase->type(in(TypeFunc::Control)) == Type::TOP)
 190     ? Type::TOP
 191     : Type::BOTTOM;
 192 }
 193 
 194 uint RethrowNode::match_edge(uint idx) const {
 195   return 0;
 196 }
 197 
 198 #ifndef PRODUCT
 199 void RethrowNode::dump_req() const {
 200   // Dump the required inputs, enclosed in '(' and ')'
 201   uint i;                       // Exit value of loop
 202   for( i=0; i<req(); i++ ) {    // For all required inputs
 203     if( i == TypeFunc::Parms ) tty->print("exception");
 204     if( in(i) ) tty->print("%c%d ", Compile::current()->node_arena()->contains(in(i)) ? ' ' : 'o', in(i)->_idx);
 205     else tty->print("_ ");
 206   }
 207 }
 208 #endif
 209 
 210 //=============================================================================
 211 // Do we Match on this edge index or not?  Match only target address & method
 212 uint TailCallNode::match_edge(uint idx) const {
 213   return TypeFunc::Parms <= idx  &&  idx <= TypeFunc::Parms+1;
 214 }
 215 
 216 //=============================================================================
 217 // Do we Match on this edge index or not?  Match only target address & oop
 218 uint TailJumpNode::match_edge(uint idx) const {
 219   return TypeFunc::Parms <= idx  &&  idx <= TypeFunc::Parms+1;
 220 }
 221 
 222 //=============================================================================
 223 JVMState::JVMState(ciMethod* method, JVMState* caller) {
 224   assert(method != NULL, "must be valid call site");
 225   _method = method;
 226   _reexecute = Reexecute_Undefined;
 227   debug_only(_bci = -99);  // random garbage value
 228   debug_only(_map = (SafePointNode*)-1);
 229   _caller = caller;
 230   _depth  = 1 + (caller == NULL ? 0 : caller->depth());
 231   _locoff = TypeFunc::Parms;
 232   _stkoff = _locoff + _method->max_locals();
 233   _monoff = _stkoff + _method->max_stack();
 234   _scloff = _monoff;
 235   _endoff = _monoff;
 236   _sp = 0;
 237 }
 238 JVMState::JVMState(int stack_size) {
 239   _method = NULL;
 240   _bci = InvocationEntryBci;
 241   _reexecute = Reexecute_Undefined;
 242   debug_only(_map = (SafePointNode*)-1);
 243   _caller = NULL;
 244   _depth  = 1;
 245   _locoff = TypeFunc::Parms;
 246   _stkoff = _locoff;
 247   _monoff = _stkoff + stack_size;
 248   _scloff = _monoff;
 249   _endoff = _monoff;
 250   _sp = 0;
 251 }
 252 
 253 //--------------------------------of_depth-------------------------------------
 254 JVMState* JVMState::of_depth(int d) const {
 255   const JVMState* jvmp = this;
 256   assert(0 < d && (uint)d <= depth(), "oob");
 257   for (int skip = depth() - d; skip > 0; skip--) {
 258     jvmp = jvmp->caller();
 259   }
 260   assert(jvmp->depth() == (uint)d, "found the right one");
 261   return (JVMState*)jvmp;
 262 }
 263 
 264 //-----------------------------same_calls_as-----------------------------------
 265 bool JVMState::same_calls_as(const JVMState* that) const {
 266   if (this == that)                    return true;
 267   if (this->depth() != that->depth())  return false;
 268   const JVMState* p = this;
 269   const JVMState* q = that;
 270   for (;;) {
 271     if (p->_method != q->_method)    return false;
 272     if (p->_method == NULL)          return true;   // bci is irrelevant
 273     if (p->_bci    != q->_bci)       return false;
 274     if (p->_reexecute != q->_reexecute)  return false;
 275     p = p->caller();
 276     q = q->caller();
 277     if (p == q)                      return true;
 278     assert(p != NULL && q != NULL, "depth check ensures we don't run off end");
 279   }
 280 }
 281 
 282 //------------------------------debug_start------------------------------------
 283 uint JVMState::debug_start()  const {
 284   debug_only(JVMState* jvmroot = of_depth(1));
 285   assert(jvmroot->locoff() <= this->locoff(), "youngest JVMState must be last");
 286   return of_depth(1)->locoff();
 287 }
 288 
 289 //-------------------------------debug_end-------------------------------------
 290 uint JVMState::debug_end() const {
 291   debug_only(JVMState* jvmroot = of_depth(1));
 292   assert(jvmroot->endoff() <= this->endoff(), "youngest JVMState must be last");
 293   return endoff();
 294 }
 295 
 296 //------------------------------debug_depth------------------------------------
 297 uint JVMState::debug_depth() const {
 298   uint total = 0;
 299   for (const JVMState* jvmp = this; jvmp != NULL; jvmp = jvmp->caller()) {
 300     total += jvmp->debug_size();
 301   }
 302   return total;
 303 }
 304 
 305 #ifndef PRODUCT
 306 
 307 //------------------------------format_helper----------------------------------
 308 // Given an allocation (a Chaitin object) and a Node decide if the Node carries
 309 // any defined value or not.  If it does, print out the register or constant.
 310 static void format_helper( PhaseRegAlloc *regalloc, outputStream* st, Node *n, const char *msg, uint i, GrowableArray<SafePointScalarObjectNode*> *scobjs ) {
 311   if (n == NULL) { st->print(" NULL"); return; }
 312   if (n->is_SafePointScalarObject()) {
 313     // Scalar replacement.
 314     SafePointScalarObjectNode* spobj = n->as_SafePointScalarObject();
 315     scobjs->append_if_missing(spobj);
 316     int sco_n = scobjs->find(spobj);
 317     assert(sco_n >= 0, "");
 318     st->print(" %s%d]=#ScObj" INT32_FORMAT, msg, i, sco_n);
 319     return;
 320   }
 321   if( OptoReg::is_valid(regalloc->get_reg_first(n))) { // Check for undefined
 322     char buf[50];
 323     regalloc->dump_register(n,buf);
 324     st->print(" %s%d]=%s",msg,i,buf);
 325   } else {                      // No register, but might be constant
 326     const Type *t = n->bottom_type();
 327     switch (t->base()) {
 328     case Type::Int:
 329       st->print(" %s%d]=#"INT32_FORMAT,msg,i,t->is_int()->get_con());
 330       break;
 331     case Type::AnyPtr:
 332       assert( t == TypePtr::NULL_PTR, "" );
 333       st->print(" %s%d]=#NULL",msg,i);
 334       break;
 335     case Type::AryPtr:
 336     case Type::KlassPtr:
 337     case Type::InstPtr:
 338       st->print(" %s%d]=#Ptr" INTPTR_FORMAT,msg,i,t->isa_oopptr()->const_oop());
 339       break;
 340     case Type::NarrowOop:
 341       st->print(" %s%d]=#Ptr" INTPTR_FORMAT,msg,i,t->make_ptr()->isa_oopptr()->const_oop());
 342       break;
 343     case Type::RawPtr:
 344       st->print(" %s%d]=#Raw" INTPTR_FORMAT,msg,i,t->is_rawptr());
 345       break;
 346     case Type::DoubleCon:
 347       st->print(" %s%d]=#%fD",msg,i,t->is_double_constant()->_d);
 348       break;
 349     case Type::FloatCon:
 350       st->print(" %s%d]=#%fF",msg,i,t->is_float_constant()->_f);
 351       break;
 352     case Type::Long:
 353       st->print(" %s%d]=#"INT64_FORMAT,msg,i,t->is_long()->get_con());
 354       break;
 355     case Type::Half:
 356     case Type::Top:
 357       st->print(" %s%d]=_",msg,i);
 358       break;
 359     default: ShouldNotReachHere();
 360     }
 361   }
 362 }
 363 
 364 //------------------------------format-----------------------------------------
 365 void JVMState::format(PhaseRegAlloc *regalloc, const Node *n, outputStream* st) const {
 366   st->print("        #");
 367   if( _method ) {
 368     _method->print_short_name(st);
 369     st->print(" @ bci:%d ",_bci);
 370   } else {
 371     st->print_cr(" runtime stub ");
 372     return;
 373   }
 374   if (n->is_MachSafePoint()) {
 375     GrowableArray<SafePointScalarObjectNode*> scobjs;
 376     MachSafePointNode *mcall = n->as_MachSafePoint();
 377     uint i;
 378     // Print locals
 379     for( i = 0; i < (uint)loc_size(); i++ )
 380       format_helper( regalloc, st, mcall->local(this, i), "L[", i, &scobjs );
 381     // Print stack
 382     for (i = 0; i < (uint)stk_size(); i++) {
 383       if ((uint)(_stkoff + i) >= mcall->len())
 384         st->print(" oob ");
 385       else
 386        format_helper( regalloc, st, mcall->stack(this, i), "STK[", i, &scobjs );
 387     }
 388     for (i = 0; (int)i < nof_monitors(); i++) {
 389       Node *box = mcall->monitor_box(this, i);
 390       Node *obj = mcall->monitor_obj(this, i);
 391       if ( OptoReg::is_valid(regalloc->get_reg_first(box)) ) {
 392         while( !box->is_BoxLock() )  box = box->in(1);
 393         format_helper( regalloc, st, box, "MON-BOX[", i, &scobjs );
 394       } else {
 395         OptoReg::Name box_reg = BoxLockNode::stack_slot(box);
 396         st->print(" MON-BOX%d=%s+%d",
 397                    i,
 398                    OptoReg::regname(OptoReg::c_frame_pointer),
 399                    regalloc->reg2offset(box_reg));
 400       }
 401       const char* obj_msg = "MON-OBJ[";
 402       if (EliminateLocks) {
 403         while( !box->is_BoxLock() )  box = box->in(1);
 404         if (box->as_BoxLock()->is_eliminated())
 405           obj_msg = "MON-OBJ(LOCK ELIMINATED)[";
 406       }
 407       format_helper( regalloc, st, obj, obj_msg, i, &scobjs );
 408     }
 409 
 410     for (i = 0; i < (uint)scobjs.length(); i++) {
 411       // Scalar replaced objects.
 412       st->print_cr("");
 413       st->print("        # ScObj" INT32_FORMAT " ", i);
 414       SafePointScalarObjectNode* spobj = scobjs.at(i);
 415       ciKlass* cik = spobj->bottom_type()->is_oopptr()->klass();
 416       assert(cik->is_instance_klass() ||
 417              cik->is_array_klass(), "Not supported allocation.");
 418       ciInstanceKlass *iklass = NULL;
 419       if (cik->is_instance_klass()) {
 420         cik->print_name_on(st);
 421         iklass = cik->as_instance_klass();
 422       } else if (cik->is_type_array_klass()) {
 423         cik->as_array_klass()->base_element_type()->print_name_on(st);
 424         st->print("[%d]=", spobj->n_fields());
 425       } else if (cik->is_obj_array_klass()) {
 426         ciType* cie = cik->as_array_klass()->base_element_type();
 427         int ndim = 1;
 428         while (cie->is_obj_array_klass()) {
 429           ndim += 1;
 430           cie = cie->as_array_klass()->base_element_type();
 431         }
 432         cie->print_name_on(st);
 433         while (ndim-- > 0) {
 434           st->print("[]");
 435         }
 436         st->print("[%d]=", spobj->n_fields());
 437       }
 438       st->print("{");
 439       uint nf = spobj->n_fields();
 440       if (nf > 0) {
 441         uint first_ind = spobj->first_index();
 442         Node* fld_node = mcall->in(first_ind);
 443         ciField* cifield;
 444         if (iklass != NULL) {
 445           st->print(" [");
 446           cifield = iklass->nonstatic_field_at(0);
 447           cifield->print_name_on(st);
 448           format_helper( regalloc, st, fld_node, ":", 0, &scobjs );
 449         } else {
 450           format_helper( regalloc, st, fld_node, "[", 0, &scobjs );
 451         }
 452         for (uint j = 1; j < nf; j++) {
 453           fld_node = mcall->in(first_ind+j);
 454           if (iklass != NULL) {
 455             st->print(", [");
 456             cifield = iklass->nonstatic_field_at(j);
 457             cifield->print_name_on(st);
 458             format_helper( regalloc, st, fld_node, ":", j, &scobjs );
 459           } else {
 460             format_helper( regalloc, st, fld_node, ", [", j, &scobjs );
 461           }
 462         }
 463       }
 464       st->print(" }");
 465     }
 466   }
 467   st->print_cr("");
 468   if (caller() != NULL)  caller()->format(regalloc, n, st);
 469 }
 470 
 471 
 472 void JVMState::dump_spec(outputStream *st) const {
 473   if (_method != NULL) {
 474     bool printed = false;
 475     if (!Verbose) {
 476       // The JVMS dumps make really, really long lines.
 477       // Take out the most boring parts, which are the package prefixes.
 478       char buf[500];
 479       stringStream namest(buf, sizeof(buf));
 480       _method->print_short_name(&namest);
 481       if (namest.count() < sizeof(buf)) {
 482         const char* name = namest.base();
 483         if (name[0] == ' ')  ++name;
 484         const char* endcn = strchr(name, ':');  // end of class name
 485         if (endcn == NULL)  endcn = strchr(name, '(');
 486         if (endcn == NULL)  endcn = name + strlen(name);
 487         while (endcn > name && endcn[-1] != '.' && endcn[-1] != '/')
 488           --endcn;
 489         st->print(" %s", endcn);
 490         printed = true;
 491       }
 492     }
 493     if (!printed)
 494       _method->print_short_name(st);
 495     st->print(" @ bci:%d",_bci);
 496     st->print(" reexecute:%s", _reexecute==Reexecute_True?"true":"false");
 497   } else {
 498     st->print(" runtime stub");
 499   }
 500   if (caller() != NULL)  caller()->dump_spec(st);
 501 }
 502 
 503 
 504 void JVMState::dump_on(outputStream* st) const {
 505   if (_map && !((uintptr_t)_map & 1)) {
 506     if (_map->len() > _map->req()) {  // _map->has_exceptions()
 507       Node* ex = _map->in(_map->req());  // _map->next_exception()
 508       // skip the first one; it's already being printed
 509       while (ex != NULL && ex->len() > ex->req()) {
 510         ex = ex->in(ex->req());  // ex->next_exception()
 511         ex->dump(1);
 512       }
 513     }
 514     _map->dump(2);
 515   }
 516   st->print("JVMS depth=%d loc=%d stk=%d mon=%d scalar=%d end=%d mondepth=%d sp=%d bci=%d reexecute=%s method=",
 517              depth(), locoff(), stkoff(), monoff(), scloff(), endoff(), monitor_depth(), sp(), bci(), should_reexecute()?"true":"false");
 518   if (_method == NULL) {
 519     st->print_cr("(none)");
 520   } else {
 521     _method->print_name(st);
 522     st->cr();
 523     if (bci() >= 0 && bci() < _method->code_size()) {
 524       st->print("    bc: ");
 525       _method->print_codes_on(bci(), bci()+1, st);
 526     }
 527   }
 528   if (caller() != NULL) {
 529     caller()->dump_on(st);
 530   }
 531 }
 532 
 533 // Extra way to dump a jvms from the debugger,
 534 // to avoid a bug with C++ member function calls.
 535 void dump_jvms(JVMState* jvms) {
 536   jvms->dump();
 537 }
 538 #endif
 539 
 540 //--------------------------clone_shallow--------------------------------------
 541 JVMState* JVMState::clone_shallow(Compile* C) const {
 542   JVMState* n = has_method() ? new (C) JVMState(_method, _caller) : new (C) JVMState(0);
 543   n->set_bci(_bci);
 544   n->_reexecute = _reexecute;
 545   n->set_locoff(_locoff);
 546   n->set_stkoff(_stkoff);
 547   n->set_monoff(_monoff);
 548   n->set_scloff(_scloff);
 549   n->set_endoff(_endoff);
 550   n->set_sp(_sp);
 551   n->set_map(_map);
 552   return n;
 553 }
 554 
 555 //---------------------------clone_deep----------------------------------------
 556 JVMState* JVMState::clone_deep(Compile* C) const {
 557   JVMState* n = clone_shallow(C);
 558   for (JVMState* p = n; p->_caller != NULL; p = p->_caller) {
 559     p->_caller = p->_caller->clone_shallow(C);
 560   }
 561   assert(n->depth() == depth(), "sanity");
 562   assert(n->debug_depth() == debug_depth(), "sanity");
 563   return n;
 564 }
 565 
 566 //=============================================================================
 567 uint CallNode::cmp( const Node &n ) const
 568 { return _tf == ((CallNode&)n)._tf && _jvms == ((CallNode&)n)._jvms; }
 569 #ifndef PRODUCT
 570 void CallNode::dump_req() const {
 571   // Dump the required inputs, enclosed in '(' and ')'
 572   uint i;                       // Exit value of loop
 573   for( i=0; i<req(); i++ ) {    // For all required inputs
 574     if( i == TypeFunc::Parms ) tty->print("(");
 575     if( in(i) ) tty->print("%c%d ", Compile::current()->node_arena()->contains(in(i)) ? ' ' : 'o', in(i)->_idx);
 576     else tty->print("_ ");
 577   }
 578   tty->print(")");
 579 }
 580 
 581 void CallNode::dump_spec(outputStream *st) const {
 582   st->print(" ");
 583   tf()->dump_on(st);
 584   if (_cnt != COUNT_UNKNOWN)  st->print(" C=%f",_cnt);
 585   if (jvms() != NULL)  jvms()->dump_spec(st);
 586 }
 587 #endif
 588 
 589 const Type *CallNode::bottom_type() const { return tf()->range(); }
 590 const Type *CallNode::Value(PhaseTransform *phase) const {
 591   if (phase->type(in(0)) == Type::TOP)  return Type::TOP;
 592   return tf()->range();
 593 }
 594 
 595 //------------------------------calling_convention-----------------------------
 596 void CallNode::calling_convention( BasicType* sig_bt, VMRegPair *parm_regs, uint argcnt ) const {
 597   // Use the standard compiler calling convention
 598   Matcher::calling_convention( sig_bt, parm_regs, argcnt, true );
 599 }
 600 
 601 
 602 //------------------------------match------------------------------------------
 603 // Construct projections for control, I/O, memory-fields, ..., and
 604 // return result(s) along with their RegMask info
 605 Node *CallNode::match( const ProjNode *proj, const Matcher *match ) {
 606   switch (proj->_con) {
 607   case TypeFunc::Control:
 608   case TypeFunc::I_O:
 609   case TypeFunc::Memory:
 610     return new (match->C, 1) MachProjNode(this,proj->_con,RegMask::Empty,MachProjNode::unmatched_proj);
 611 
 612   case TypeFunc::Parms+1:       // For LONG & DOUBLE returns
 613     assert(tf()->_range->field_at(TypeFunc::Parms+1) == Type::HALF, "");
 614     // 2nd half of doubles and longs
 615     return new (match->C, 1) MachProjNode(this,proj->_con, RegMask::Empty, (uint)OptoReg::Bad);
 616 
 617   case TypeFunc::Parms: {       // Normal returns
 618     uint ideal_reg = Matcher::base2reg[tf()->range()->field_at(TypeFunc::Parms)->base()];
 619     OptoRegPair regs = is_CallRuntime()
 620       ? match->c_return_value(ideal_reg,true)  // Calls into C runtime
 621       : match->  return_value(ideal_reg,true); // Calls into compiled Java code
 622     RegMask rm = RegMask(regs.first());
 623     if( OptoReg::is_valid(regs.second()) )
 624       rm.Insert( regs.second() );
 625     return new (match->C, 1) MachProjNode(this,proj->_con,rm,ideal_reg);
 626   }
 627 
 628   case TypeFunc::ReturnAdr:
 629   case TypeFunc::FramePtr:
 630   default:
 631     ShouldNotReachHere();
 632   }
 633   return NULL;
 634 }
 635 
 636 // Do we Match on this edge index or not?  Match no edges
 637 uint CallNode::match_edge(uint idx) const {
 638   return 0;
 639 }
 640 
 641 //
 642 // Determine whether the call could modify the field of the specified
 643 // instance at the specified offset.
 644 //
 645 bool CallNode::may_modify(const TypePtr *addr_t, PhaseTransform *phase) {
 646   const TypeOopPtr *adrInst_t  = addr_t->isa_oopptr();
 647 
 648   // If not an OopPtr or not an instance type, assume the worst.
 649   // Note: currently this method is called only for instance types.
 650   if (adrInst_t == NULL || !adrInst_t->is_known_instance()) {
 651     return true;
 652   }
 653   // The instance_id is set only for scalar-replaceable allocations which
 654   // are not passed as arguments according to Escape Analysis.
 655   return false;
 656 }
 657 
 658 // Does this call have a direct reference to n other than debug information?
 659 bool CallNode::has_non_debug_use(Node *n) {
 660   const TypeTuple * d = tf()->domain();
 661   for (uint i = TypeFunc::Parms; i < d->cnt(); i++) {
 662     Node *arg = in(i);
 663     if (arg == n) {
 664       return true;
 665     }
 666   }
 667   return false;
 668 }
 669 
 670 // Returns the unique CheckCastPP of a call
 671 // or 'this' if there are several CheckCastPP
 672 // or returns NULL if there is no one.
 673 Node *CallNode::result_cast() {
 674   Node *cast = NULL;
 675 
 676   Node *p = proj_out(TypeFunc::Parms);
 677   if (p == NULL)
 678     return NULL;
 679 
 680   for (DUIterator_Fast imax, i = p->fast_outs(imax); i < imax; i++) {
 681     Node *use = p->fast_out(i);
 682     if (use->is_CheckCastPP()) {
 683       if (cast != NULL) {
 684         return this;  // more than 1 CheckCastPP
 685       }
 686       cast = use;
 687     }
 688   }
 689   return cast;
 690 }
 691 
 692 
 693 //=============================================================================
 694 uint CallJavaNode::size_of() const { return sizeof(*this); }
 695 uint CallJavaNode::cmp( const Node &n ) const {
 696   CallJavaNode &call = (CallJavaNode&)n;
 697   return CallNode::cmp(call) && _method == call._method;
 698 }
 699 #ifndef PRODUCT
 700 void CallJavaNode::dump_spec(outputStream *st) const {
 701   if( _method ) _method->print_short_name(st);
 702   CallNode::dump_spec(st);
 703 }
 704 #endif
 705 
 706 //=============================================================================
 707 uint CallStaticJavaNode::size_of() const { return sizeof(*this); }
 708 uint CallStaticJavaNode::cmp( const Node &n ) const {
 709   CallStaticJavaNode &call = (CallStaticJavaNode&)n;
 710   return CallJavaNode::cmp(call);
 711 }
 712 
 713 //----------------------------uncommon_trap_request----------------------------
 714 // If this is an uncommon trap, return the request code, else zero.
 715 int CallStaticJavaNode::uncommon_trap_request() const {
 716   if (_name != NULL && !strcmp(_name, "uncommon_trap")) {
 717     return extract_uncommon_trap_request(this);
 718   }
 719   return 0;
 720 }
 721 int CallStaticJavaNode::extract_uncommon_trap_request(const Node* call) {
 722 #ifndef PRODUCT
 723   if (!(call->req() > TypeFunc::Parms &&
 724         call->in(TypeFunc::Parms) != NULL &&
 725         call->in(TypeFunc::Parms)->is_Con())) {
 726     assert(_in_dump_cnt != 0, "OK if dumping");
 727     tty->print("[bad uncommon trap]");
 728     return 0;
 729   }
 730 #endif
 731   return call->in(TypeFunc::Parms)->bottom_type()->is_int()->get_con();
 732 }
 733 
 734 #ifndef PRODUCT
 735 void CallStaticJavaNode::dump_spec(outputStream *st) const {
 736   st->print("# Static ");
 737   if (_name != NULL) {
 738     st->print("%s", _name);
 739     int trap_req = uncommon_trap_request();
 740     if (trap_req != 0) {
 741       char buf[100];
 742       st->print("(%s)",
 743                  Deoptimization::format_trap_request(buf, sizeof(buf),
 744                                                      trap_req));
 745     }
 746     st->print(" ");
 747   }
 748   CallJavaNode::dump_spec(st);
 749 }
 750 #endif
 751 
 752 //=============================================================================
 753 uint CallDynamicJavaNode::size_of() const { return sizeof(*this); }
 754 uint CallDynamicJavaNode::cmp( const Node &n ) const {
 755   CallDynamicJavaNode &call = (CallDynamicJavaNode&)n;
 756   return CallJavaNode::cmp(call);
 757 }
 758 #ifndef PRODUCT
 759 void CallDynamicJavaNode::dump_spec(outputStream *st) const {
 760   st->print("# Dynamic ");
 761   CallJavaNode::dump_spec(st);
 762 }
 763 #endif
 764 
 765 //=============================================================================
 766 uint CallRuntimeNode::size_of() const { return sizeof(*this); }
 767 uint CallRuntimeNode::cmp( const Node &n ) const {
 768   CallRuntimeNode &call = (CallRuntimeNode&)n;
 769   return CallNode::cmp(call) && !strcmp(_name,call._name);
 770 }
 771 #ifndef PRODUCT
 772 void CallRuntimeNode::dump_spec(outputStream *st) const {
 773   st->print("# ");
 774   st->print(_name);
 775   CallNode::dump_spec(st);
 776 }
 777 #endif
 778 
 779 //------------------------------calling_convention-----------------------------
 780 void CallRuntimeNode::calling_convention( BasicType* sig_bt, VMRegPair *parm_regs, uint argcnt ) const {
 781   Matcher::c_calling_convention( sig_bt, parm_regs, argcnt );
 782 }
 783 
 784 //=============================================================================
 785 //------------------------------calling_convention-----------------------------
 786 
 787 
 788 //=============================================================================
 789 #ifndef PRODUCT
 790 void CallLeafNode::dump_spec(outputStream *st) const {
 791   st->print("# ");
 792   st->print(_name);
 793   CallNode::dump_spec(st);
 794 }
 795 #endif
 796 
 797 //=============================================================================
 798 
 799 void SafePointNode::set_local(JVMState* jvms, uint idx, Node *c) {
 800   assert(verify_jvms(jvms), "jvms must match");
 801   int loc = jvms->locoff() + idx;
 802   if (in(loc)->is_top() && idx > 0 && !c->is_top() ) {
 803     // If current local idx is top then local idx - 1 could
 804     // be a long/double that needs to be killed since top could
 805     // represent the 2nd half ofthe long/double.
 806     uint ideal = in(loc -1)->ideal_reg();
 807     if (ideal == Op_RegD || ideal == Op_RegL) {
 808       // set other (low index) half to top
 809       set_req(loc - 1, in(loc));
 810     }
 811   }
 812   set_req(loc, c);
 813 }
 814 
 815 uint SafePointNode::size_of() const { return sizeof(*this); }
 816 uint SafePointNode::cmp( const Node &n ) const {
 817   return (&n == this);          // Always fail except on self
 818 }
 819 
 820 //-------------------------set_next_exception----------------------------------
 821 void SafePointNode::set_next_exception(SafePointNode* n) {
 822   assert(n == NULL || n->Opcode() == Op_SafePoint, "correct value for next_exception");
 823   if (len() == req()) {
 824     if (n != NULL)  add_prec(n);
 825   } else {
 826     set_prec(req(), n);
 827   }
 828 }
 829 
 830 
 831 //----------------------------next_exception-----------------------------------
 832 SafePointNode* SafePointNode::next_exception() const {
 833   if (len() == req()) {
 834     return NULL;
 835   } else {
 836     Node* n = in(req());
 837     assert(n == NULL || n->Opcode() == Op_SafePoint, "no other uses of prec edges");
 838     return (SafePointNode*) n;
 839   }
 840 }
 841 
 842 
 843 //------------------------------Ideal------------------------------------------
 844 // Skip over any collapsed Regions
 845 Node *SafePointNode::Ideal(PhaseGVN *phase, bool can_reshape) {
 846   return remove_dead_region(phase, can_reshape) ? this : NULL;
 847 }
 848 
 849 //------------------------------Identity---------------------------------------
 850 // Remove obviously duplicate safepoints
 851 Node *SafePointNode::Identity( PhaseTransform *phase ) {
 852 
 853   // If you have back to back safepoints, remove one
 854   if( in(TypeFunc::Control)->is_SafePoint() )
 855     return in(TypeFunc::Control);
 856 
 857   if( in(0)->is_Proj() ) {
 858     Node *n0 = in(0)->in(0);
 859     // Check if he is a call projection (except Leaf Call)
 860     if( n0->is_Catch() ) {
 861       n0 = n0->in(0)->in(0);
 862       assert( n0->is_Call(), "expect a call here" );
 863     }
 864     if( n0->is_Call() && n0->as_Call()->guaranteed_safepoint() ) {
 865       // Useless Safepoint, so remove it
 866       return in(TypeFunc::Control);
 867     }
 868   }
 869 
 870   return this;
 871 }
 872 
 873 //------------------------------Value------------------------------------------
 874 const Type *SafePointNode::Value( PhaseTransform *phase ) const {
 875   if( phase->type(in(0)) == Type::TOP ) return Type::TOP;
 876   if( phase->eqv( in(0), this ) ) return Type::TOP; // Dead infinite loop
 877   return Type::CONTROL;
 878 }
 879 
 880 #ifndef PRODUCT
 881 void SafePointNode::dump_spec(outputStream *st) const {
 882   st->print(" SafePoint ");
 883 }
 884 #endif
 885 
 886 const RegMask &SafePointNode::in_RegMask(uint idx) const {
 887   if( idx < TypeFunc::Parms ) return RegMask::Empty;
 888   // Values outside the domain represent debug info
 889   return *(Compile::current()->matcher()->idealreg2debugmask[in(idx)->ideal_reg()]);
 890 }
 891 const RegMask &SafePointNode::out_RegMask() const {
 892   return RegMask::Empty;
 893 }
 894 
 895 
 896 void SafePointNode::grow_stack(JVMState* jvms, uint grow_by) {
 897   assert((int)grow_by > 0, "sanity");
 898   int monoff = jvms->monoff();
 899   int scloff = jvms->scloff();
 900   int endoff = jvms->endoff();
 901   assert(endoff == (int)req(), "no other states or debug info after me");
 902   Node* top = Compile::current()->top();
 903   for (uint i = 0; i < grow_by; i++) {
 904     ins_req(monoff, top);
 905   }
 906   jvms->set_monoff(monoff + grow_by);
 907   jvms->set_scloff(scloff + grow_by);
 908   jvms->set_endoff(endoff + grow_by);
 909 }
 910 
 911 void SafePointNode::push_monitor(const FastLockNode *lock) {
 912   // Add a LockNode, which points to both the original BoxLockNode (the
 913   // stack space for the monitor) and the Object being locked.
 914   const int MonitorEdges = 2;
 915   assert(JVMState::logMonitorEdges == exact_log2(MonitorEdges), "correct MonitorEdges");
 916   assert(req() == jvms()->endoff(), "correct sizing");
 917   int nextmon = jvms()->scloff();
 918   if (GenerateSynchronizationCode) {
 919     add_req(lock->box_node());
 920     add_req(lock->obj_node());
 921   } else {
 922     Node* top = Compile::current()->top();
 923     add_req(top);
 924     add_req(top);
 925   }
 926   jvms()->set_scloff(nextmon+MonitorEdges);
 927   jvms()->set_endoff(req());
 928 }
 929 
 930 void SafePointNode::pop_monitor() {
 931   // Delete last monitor from debug info
 932   debug_only(int num_before_pop = jvms()->nof_monitors());
 933   const int MonitorEdges = (1<<JVMState::logMonitorEdges);
 934   int scloff = jvms()->scloff();
 935   int endoff = jvms()->endoff();
 936   int new_scloff = scloff - MonitorEdges;
 937   int new_endoff = endoff - MonitorEdges;
 938   jvms()->set_scloff(new_scloff);
 939   jvms()->set_endoff(new_endoff);
 940   while (scloff > new_scloff)  del_req(--scloff);
 941   assert(jvms()->nof_monitors() == num_before_pop-1, "");
 942 }
 943 
 944 Node *SafePointNode::peek_monitor_box() const {
 945   int mon = jvms()->nof_monitors() - 1;
 946   assert(mon >= 0, "most have a monitor");
 947   return monitor_box(jvms(), mon);
 948 }
 949 
 950 Node *SafePointNode::peek_monitor_obj() const {
 951   int mon = jvms()->nof_monitors() - 1;
 952   assert(mon >= 0, "most have a monitor");
 953   return monitor_obj(jvms(), mon);
 954 }
 955 
 956 // Do we Match on this edge index or not?  Match no edges
 957 uint SafePointNode::match_edge(uint idx) const {
 958   if( !needs_polling_address_input() )
 959     return 0;
 960 
 961   return (TypeFunc::Parms == idx);
 962 }
 963 
 964 //==============  SafePointScalarObjectNode  ==============
 965 
 966 SafePointScalarObjectNode::SafePointScalarObjectNode(const TypeOopPtr* tp,
 967 #ifdef ASSERT
 968                                                      AllocateNode* alloc,
 969 #endif
 970                                                      uint first_index,
 971                                                      uint n_fields) :
 972   TypeNode(tp, 1), // 1 control input -- seems required.  Get from root.
 973 #ifdef ASSERT
 974   _alloc(alloc),
 975 #endif
 976   _first_index(first_index),
 977   _n_fields(n_fields)
 978 {
 979   init_class_id(Class_SafePointScalarObject);
 980 }
 981 
 982 bool SafePointScalarObjectNode::pinned() const { return true; }
 983 bool SafePointScalarObjectNode::depends_only_on_test() const { return false; }
 984 
 985 uint SafePointScalarObjectNode::ideal_reg() const {
 986   return 0; // No matching to machine instruction
 987 }
 988 
 989 const RegMask &SafePointScalarObjectNode::in_RegMask(uint idx) const {
 990   return *(Compile::current()->matcher()->idealreg2debugmask[in(idx)->ideal_reg()]);
 991 }
 992 
 993 const RegMask &SafePointScalarObjectNode::out_RegMask() const {
 994   return RegMask::Empty;
 995 }
 996 
 997 uint SafePointScalarObjectNode::match_edge(uint idx) const {
 998   return 0;
 999 }
1000 
1001 SafePointScalarObjectNode*
1002 SafePointScalarObjectNode::clone(int jvms_adj, Dict* sosn_map) const {
1003   void* cached = (*sosn_map)[(void*)this];
1004   if (cached != NULL) {
1005     return (SafePointScalarObjectNode*)cached;
1006   }
1007   Compile* C = Compile::current();
1008   SafePointScalarObjectNode* res = (SafePointScalarObjectNode*)Node::clone();
1009   res->_first_index += jvms_adj;
1010   sosn_map->Insert((void*)this, (void*)res);
1011   return res;
1012 }
1013 
1014 
1015 #ifndef PRODUCT
1016 void SafePointScalarObjectNode::dump_spec(outputStream *st) const {
1017   st->print(" # fields@[%d..%d]", first_index(),
1018              first_index() + n_fields() - 1);
1019 }
1020 
1021 #endif
1022 
1023 //=============================================================================
1024 uint AllocateNode::size_of() const { return sizeof(*this); }
1025 
1026 AllocateNode::AllocateNode(Compile* C, const TypeFunc *atype,
1027                            Node *ctrl, Node *mem, Node *abio,
1028                            Node *size, Node *klass_node, Node *initial_test)
1029   : CallNode(atype, NULL, TypeRawPtr::BOTTOM)
1030 {
1031   init_class_id(Class_Allocate);
1032   init_flags(Flag_is_macro);
1033   _is_scalar_replaceable = false;
1034   Node *topnode = C->top();
1035 
1036   init_req( TypeFunc::Control  , ctrl );
1037   init_req( TypeFunc::I_O      , abio );
1038   init_req( TypeFunc::Memory   , mem );
1039   init_req( TypeFunc::ReturnAdr, topnode );
1040   init_req( TypeFunc::FramePtr , topnode );
1041   init_req( AllocSize          , size);
1042   init_req( KlassNode          , klass_node);
1043   init_req( InitialTest        , initial_test);
1044   init_req( ALength            , topnode);
1045   C->add_macro_node(this);
1046 }
1047 
1048 //=============================================================================
1049 uint AllocateArrayNode::size_of() const { return sizeof(*this); }
1050 
1051 Node* AllocateArrayNode::Ideal(PhaseGVN *phase, bool can_reshape) {
1052   if (remove_dead_region(phase, can_reshape))  return this;
1053 
1054   const Type* type = phase->type(Ideal_length());
1055   if (type->isa_int() && type->is_int()->_hi < 0) {
1056     if (can_reshape) {
1057       PhaseIterGVN *igvn = phase->is_IterGVN();
1058       // Unreachable fall through path (negative array length),
1059       // the allocation can only throw so disconnect it.
1060       Node* proj = proj_out(TypeFunc::Control);
1061       Node* catchproj = NULL;
1062       if (proj != NULL) {
1063         for (DUIterator_Fast imax, i = proj->fast_outs(imax); i < imax; i++) {
1064           Node *cn = proj->fast_out(i);
1065           if (cn->is_Catch()) {
1066             catchproj = cn->as_Multi()->proj_out(CatchProjNode::fall_through_index);
1067             break;
1068           }
1069         }
1070       }
1071       if (catchproj != NULL && catchproj->outcnt() > 0 &&
1072           (catchproj->outcnt() > 1 ||
1073            catchproj->unique_out()->Opcode() != Op_Halt)) {
1074         assert(catchproj->is_CatchProj(), "must be a CatchProjNode");
1075         Node* nproj = catchproj->clone();
1076         igvn->register_new_node_with_optimizer(nproj);
1077 
1078         Node *frame = new (phase->C, 1) ParmNode( phase->C->start(), TypeFunc::FramePtr );
1079         frame = phase->transform(frame);
1080         // Halt & Catch Fire
1081         Node *halt = new (phase->C, TypeFunc::Parms) HaltNode( nproj, frame );
1082         phase->C->root()->add_req(halt);
1083         phase->transform(halt);
1084 
1085         igvn->replace_node(catchproj, phase->C->top());
1086         return this;
1087       }
1088     } else {
1089       // Can't correct it during regular GVN so register for IGVN
1090       phase->C->record_for_igvn(this);
1091     }
1092   }
1093   return NULL;
1094 }
1095 
1096 // Retrieve the length from the AllocateArrayNode. Narrow the type with a
1097 // CastII, if appropriate.  If we are not allowed to create new nodes, and
1098 // a CastII is appropriate, return NULL.
1099 Node *AllocateArrayNode::make_ideal_length(const TypeOopPtr* oop_type, PhaseTransform *phase, bool allow_new_nodes) {
1100   Node *length = in(AllocateNode::ALength);
1101   assert(length != NULL, "length is not null");
1102 
1103   const TypeInt* length_type = phase->find_int_type(length);
1104   const TypeAryPtr* ary_type = oop_type->isa_aryptr();
1105 
1106   if (ary_type != NULL && length_type != NULL) {
1107     const TypeInt* narrow_length_type = ary_type->narrow_size_type(length_type);
1108     if (narrow_length_type != length_type) {
1109       // Assert one of:
1110       //   - the narrow_length is 0
1111       //   - the narrow_length is not wider than length
1112       assert(narrow_length_type == TypeInt::ZERO ||
1113              (narrow_length_type->_hi <= length_type->_hi &&
1114               narrow_length_type->_lo >= length_type->_lo),
1115              "narrow type must be narrower than length type");
1116 
1117       // Return NULL if new nodes are not allowed
1118       if (!allow_new_nodes) return NULL;
1119       // Create a cast which is control dependent on the initialization to
1120       // propagate the fact that the array length must be positive.
1121       length = new (phase->C, 2) CastIINode(length, narrow_length_type);
1122       length->set_req(0, initialization()->proj_out(0));
1123     }
1124   }
1125 
1126   return length;
1127 }
1128 
1129 //=============================================================================
1130 uint LockNode::size_of() const { return sizeof(*this); }
1131 
1132 // Redundant lock elimination
1133 //
1134 // There are various patterns of locking where we release and
1135 // immediately reacquire a lock in a piece of code where no operations
1136 // occur in between that would be observable.  In those cases we can
1137 // skip releasing and reacquiring the lock without violating any
1138 // fairness requirements.  Doing this around a loop could cause a lock
1139 // to be held for a very long time so we concentrate on non-looping
1140 // control flow.  We also require that the operations are fully
1141 // redundant meaning that we don't introduce new lock operations on
1142 // some paths so to be able to eliminate it on others ala PRE.  This
1143 // would probably require some more extensive graph manipulation to
1144 // guarantee that the memory edges were all handled correctly.
1145 //
1146 // Assuming p is a simple predicate which can't trap in any way and s
1147 // is a synchronized method consider this code:
1148 //
1149 //   s();
1150 //   if (p)
1151 //     s();
1152 //   else
1153 //     s();
1154 //   s();
1155 //
1156 // 1. The unlocks of the first call to s can be eliminated if the
1157 // locks inside the then and else branches are eliminated.
1158 //
1159 // 2. The unlocks of the then and else branches can be eliminated if
1160 // the lock of the final call to s is eliminated.
1161 //
1162 // Either of these cases subsumes the simple case of sequential control flow
1163 //
1164 // Addtionally we can eliminate versions without the else case:
1165 //
1166 //   s();
1167 //   if (p)
1168 //     s();
1169 //   s();
1170 //
1171 // 3. In this case we eliminate the unlock of the first s, the lock
1172 // and unlock in the then case and the lock in the final s.
1173 //
1174 // Note also that in all these cases the then/else pieces don't have
1175 // to be trivial as long as they begin and end with synchronization
1176 // operations.
1177 //
1178 //   s();
1179 //   if (p)
1180 //     s();
1181 //     f();
1182 //     s();
1183 //   s();
1184 //
1185 // The code will work properly for this case, leaving in the unlock
1186 // before the call to f and the relock after it.
1187 //
1188 // A potentially interesting case which isn't handled here is when the
1189 // locking is partially redundant.
1190 //
1191 //   s();
1192 //   if (p)
1193 //     s();
1194 //
1195 // This could be eliminated putting unlocking on the else case and
1196 // eliminating the first unlock and the lock in the then side.
1197 // Alternatively the unlock could be moved out of the then side so it
1198 // was after the merge and the first unlock and second lock
1199 // eliminated.  This might require less manipulation of the memory
1200 // state to get correct.
1201 //
1202 // Additionally we might allow work between a unlock and lock before
1203 // giving up eliminating the locks.  The current code disallows any
1204 // conditional control flow between these operations.  A formulation
1205 // similar to partial redundancy elimination computing the
1206 // availability of unlocking and the anticipatability of locking at a
1207 // program point would allow detection of fully redundant locking with
1208 // some amount of work in between.  I'm not sure how often I really
1209 // think that would occur though.  Most of the cases I've seen
1210 // indicate it's likely non-trivial work would occur in between.
1211 // There may be other more complicated constructs where we could
1212 // eliminate locking but I haven't seen any others appear as hot or
1213 // interesting.
1214 //
1215 // Locking and unlocking have a canonical form in ideal that looks
1216 // roughly like this:
1217 //
1218 //              <obj>
1219 //                | \\------+
1220 //                |  \       \
1221 //                | BoxLock   \
1222 //                |  |   |     \
1223 //                |  |    \     \
1224 //                |  |   FastLock
1225 //                |  |   /
1226 //                |  |  /
1227 //                |  |  |
1228 //
1229 //               Lock
1230 //                |
1231 //            Proj #0
1232 //                |
1233 //            MembarAcquire
1234 //                |
1235 //            Proj #0
1236 //
1237 //            MembarRelease
1238 //                |
1239 //            Proj #0
1240 //                |
1241 //              Unlock
1242 //                |
1243 //            Proj #0
1244 //
1245 //
1246 // This code proceeds by processing Lock nodes during PhaseIterGVN
1247 // and searching back through its control for the proper code
1248 // patterns.  Once it finds a set of lock and unlock operations to
1249 // eliminate they are marked as eliminatable which causes the
1250 // expansion of the Lock and Unlock macro nodes to make the operation a NOP
1251 //
1252 //=============================================================================
1253 
1254 //
1255 // Utility function to skip over uninteresting control nodes.  Nodes skipped are:
1256 //   - copy regions.  (These may not have been optimized away yet.)
1257 //   - eliminated locking nodes
1258 //
1259 static Node *next_control(Node *ctrl) {
1260   if (ctrl == NULL)
1261     return NULL;
1262   while (1) {
1263     if (ctrl->is_Region()) {
1264       RegionNode *r = ctrl->as_Region();
1265       Node *n = r->is_copy();
1266       if (n == NULL)
1267         break;  // hit a region, return it
1268       else
1269         ctrl = n;
1270     } else if (ctrl->is_Proj()) {
1271       Node *in0 = ctrl->in(0);
1272       if (in0->is_AbstractLock() && in0->as_AbstractLock()->is_eliminated()) {
1273         ctrl = in0->in(0);
1274       } else {
1275         break;
1276       }
1277     } else {
1278       break; // found an interesting control
1279     }
1280   }
1281   return ctrl;
1282 }
1283 //
1284 // Given a control, see if it's the control projection of an Unlock which
1285 // operating on the same object as lock.
1286 //
1287 bool AbstractLockNode::find_matching_unlock(const Node* ctrl, LockNode* lock,
1288                                             GrowableArray<AbstractLockNode*> &lock_ops) {
1289   ProjNode *ctrl_proj = (ctrl->is_Proj()) ? ctrl->as_Proj() : NULL;
1290   if (ctrl_proj != NULL && ctrl_proj->_con == TypeFunc::Control) {
1291     Node *n = ctrl_proj->in(0);
1292     if (n != NULL && n->is_Unlock()) {
1293       UnlockNode *unlock = n->as_Unlock();
1294       if ((lock->obj_node() == unlock->obj_node()) &&
1295           (lock->box_node() == unlock->box_node()) && !unlock->is_eliminated()) {
1296         lock_ops.append(unlock);
1297         return true;
1298       }
1299     }
1300   }
1301   return false;
1302 }
1303 
1304 //
1305 // Find the lock matching an unlock.  Returns null if a safepoint
1306 // or complicated control is encountered first.
1307 LockNode *AbstractLockNode::find_matching_lock(UnlockNode* unlock) {
1308   LockNode *lock_result = NULL;
1309   // find the matching lock, or an intervening safepoint
1310   Node *ctrl = next_control(unlock->in(0));
1311   while (1) {
1312     assert(ctrl != NULL, "invalid control graph");
1313     assert(!ctrl->is_Start(), "missing lock for unlock");
1314     if (ctrl->is_top()) break;  // dead control path
1315     if (ctrl->is_Proj()) ctrl = ctrl->in(0);
1316     if (ctrl->is_SafePoint()) {
1317         break;  // found a safepoint (may be the lock we are searching for)
1318     } else if (ctrl->is_Region()) {
1319       // Check for a simple diamond pattern.  Punt on anything more complicated
1320       if (ctrl->req() == 3 && ctrl->in(1) != NULL && ctrl->in(2) != NULL) {
1321         Node *in1 = next_control(ctrl->in(1));
1322         Node *in2 = next_control(ctrl->in(2));
1323         if (((in1->is_IfTrue() && in2->is_IfFalse()) ||
1324              (in2->is_IfTrue() && in1->is_IfFalse())) && (in1->in(0) == in2->in(0))) {
1325           ctrl = next_control(in1->in(0)->in(0));
1326         } else {
1327           break;
1328         }
1329       } else {
1330         break;
1331       }
1332     } else {
1333       ctrl = next_control(ctrl->in(0));  // keep searching
1334     }
1335   }
1336   if (ctrl->is_Lock()) {
1337     LockNode *lock = ctrl->as_Lock();
1338     if ((lock->obj_node() == unlock->obj_node()) &&
1339             (lock->box_node() == unlock->box_node())) {
1340       lock_result = lock;
1341     }
1342   }
1343   return lock_result;
1344 }
1345 
1346 // This code corresponds to case 3 above.
1347 
1348 bool AbstractLockNode::find_lock_and_unlock_through_if(Node* node, LockNode* lock,
1349                                                        GrowableArray<AbstractLockNode*> &lock_ops) {
1350   Node* if_node = node->in(0);
1351   bool  if_true = node->is_IfTrue();
1352 
1353   if (if_node->is_If() && if_node->outcnt() == 2 && (if_true || node->is_IfFalse())) {
1354     Node *lock_ctrl = next_control(if_node->in(0));
1355     if (find_matching_unlock(lock_ctrl, lock, lock_ops)) {
1356       Node* lock1_node = NULL;
1357       ProjNode* proj = if_node->as_If()->proj_out(!if_true);
1358       if (if_true) {
1359         if (proj->is_IfFalse() && proj->outcnt() == 1) {
1360           lock1_node = proj->unique_out();
1361         }
1362       } else {
1363         if (proj->is_IfTrue() && proj->outcnt() == 1) {
1364           lock1_node = proj->unique_out();
1365         }
1366       }
1367       if (lock1_node != NULL && lock1_node->is_Lock()) {
1368         LockNode *lock1 = lock1_node->as_Lock();
1369         if ((lock->obj_node() == lock1->obj_node()) &&
1370             (lock->box_node() == lock1->box_node()) && !lock1->is_eliminated()) {
1371           lock_ops.append(lock1);
1372           return true;
1373         }
1374       }
1375     }
1376   }
1377 
1378   lock_ops.trunc_to(0);
1379   return false;
1380 }
1381 
1382 bool AbstractLockNode::find_unlocks_for_region(const RegionNode* region, LockNode* lock,
1383                                GrowableArray<AbstractLockNode*> &lock_ops) {
1384   // check each control merging at this point for a matching unlock.
1385   // in(0) should be self edge so skip it.
1386   for (int i = 1; i < (int)region->req(); i++) {
1387     Node *in_node = next_control(region->in(i));
1388     if (in_node != NULL) {
1389       if (find_matching_unlock(in_node, lock, lock_ops)) {
1390         // found a match so keep on checking.
1391         continue;
1392       } else if (find_lock_and_unlock_through_if(in_node, lock, lock_ops)) {
1393         continue;
1394       }
1395 
1396       // If we fall through to here then it was some kind of node we
1397       // don't understand or there wasn't a matching unlock, so give
1398       // up trying to merge locks.
1399       lock_ops.trunc_to(0);
1400       return false;
1401     }
1402   }
1403   return true;
1404 
1405 }
1406 
1407 #ifndef PRODUCT
1408 //
1409 // Create a counter which counts the number of times this lock is acquired
1410 //
1411 void AbstractLockNode::create_lock_counter(JVMState* state) {
1412   _counter = OptoRuntime::new_named_counter(state, NamedCounter::LockCounter);
1413 }
1414 #endif
1415 
1416 void AbstractLockNode::set_eliminated() {
1417   _eliminate = true;
1418 #ifndef PRODUCT
1419   if (_counter) {
1420     // Update the counter to indicate that this lock was eliminated.
1421     // The counter update code will stay around even though the
1422     // optimizer will eliminate the lock operation itself.
1423     _counter->set_tag(NamedCounter::EliminatedLockCounter);
1424   }
1425 #endif
1426 }
1427 
1428 //=============================================================================
1429 Node *LockNode::Ideal(PhaseGVN *phase, bool can_reshape) {
1430 
1431   // perform any generic optimizations first (returns 'this' or NULL)
1432   Node *result = SafePointNode::Ideal(phase, can_reshape);
1433 
1434   // Now see if we can optimize away this lock.  We don't actually
1435   // remove the locking here, we simply set the _eliminate flag which
1436   // prevents macro expansion from expanding the lock.  Since we don't
1437   // modify the graph, the value returned from this function is the
1438   // one computed above.
1439   if (result == NULL && can_reshape && EliminateLocks && !is_eliminated()) {
1440     //
1441     // If we are locking an unescaped object, the lock/unlock is unnecessary
1442     //
1443     ConnectionGraph *cgr = phase->C->congraph();
1444     PointsToNode::EscapeState es = PointsToNode::GlobalEscape;
1445     if (cgr != NULL)
1446       es = cgr->escape_state(obj_node(), phase);
1447     if (es != PointsToNode::UnknownEscape && es != PointsToNode::GlobalEscape) {
1448       // Mark it eliminated to update any counters
1449       this->set_eliminated();
1450       return result;
1451     }
1452 
1453     //
1454     // Try lock coarsening
1455     //
1456     PhaseIterGVN* iter = phase->is_IterGVN();
1457     if (iter != NULL) {
1458 
1459       GrowableArray<AbstractLockNode*>   lock_ops;
1460 
1461       Node *ctrl = next_control(in(0));
1462 
1463       // now search back for a matching Unlock
1464       if (find_matching_unlock(ctrl, this, lock_ops)) {
1465         // found an unlock directly preceding this lock.  This is the
1466         // case of single unlock directly control dependent on a
1467         // single lock which is the trivial version of case 1 or 2.
1468       } else if (ctrl->is_Region() ) {
1469         if (find_unlocks_for_region(ctrl->as_Region(), this, lock_ops)) {
1470         // found lock preceded by multiple unlocks along all paths
1471         // joining at this point which is case 3 in description above.
1472         }
1473       } else {
1474         // see if this lock comes from either half of an if and the
1475         // predecessors merges unlocks and the other half of the if
1476         // performs a lock.
1477         if (find_lock_and_unlock_through_if(ctrl, this, lock_ops)) {
1478           // found unlock splitting to an if with locks on both branches.
1479         }
1480       }
1481 
1482       if (lock_ops.length() > 0) {
1483         // add ourselves to the list of locks to be eliminated.
1484         lock_ops.append(this);
1485 
1486   #ifndef PRODUCT
1487         if (PrintEliminateLocks) {
1488           int locks = 0;
1489           int unlocks = 0;
1490           for (int i = 0; i < lock_ops.length(); i++) {
1491             AbstractLockNode* lock = lock_ops.at(i);
1492             if (lock->Opcode() == Op_Lock)
1493               locks++;
1494             else
1495               unlocks++;
1496             if (Verbose) {
1497               lock->dump(1);
1498             }
1499           }
1500           tty->print_cr("***Eliminated %d unlocks and %d locks", unlocks, locks);
1501         }
1502   #endif
1503 
1504         // for each of the identified locks, mark them
1505         // as eliminatable
1506         for (int i = 0; i < lock_ops.length(); i++) {
1507           AbstractLockNode* lock = lock_ops.at(i);
1508 
1509           // Mark it eliminated to update any counters
1510           lock->set_eliminated();
1511           lock->set_coarsened();
1512         }
1513       } else if (result != NULL && ctrl->is_Region() &&
1514                  iter->_worklist.member(ctrl)) {
1515         // We weren't able to find any opportunities but the region this
1516         // lock is control dependent on hasn't been processed yet so put
1517         // this lock back on the worklist so we can check again once any
1518         // region simplification has occurred.
1519         iter->_worklist.push(this);
1520       }
1521     }
1522   }
1523 
1524   return result;
1525 }
1526 
1527 //=============================================================================
1528 uint UnlockNode::size_of() const { return sizeof(*this); }
1529 
1530 //=============================================================================
1531 Node *UnlockNode::Ideal(PhaseGVN *phase, bool can_reshape) {
1532 
1533   // perform any generic optimizations first (returns 'this' or NULL)
1534   Node * result = SafePointNode::Ideal(phase, can_reshape);
1535 
1536   // Now see if we can optimize away this unlock.  We don't actually
1537   // remove the unlocking here, we simply set the _eliminate flag which
1538   // prevents macro expansion from expanding the unlock.  Since we don't
1539   // modify the graph, the value returned from this function is the
1540   // one computed above.
1541   // Escape state is defined after Parse phase.
1542   if (result == NULL && can_reshape && EliminateLocks && !is_eliminated()) {
1543     //
1544     // If we are unlocking an unescaped object, the lock/unlock is unnecessary.
1545     //
1546     ConnectionGraph *cgr = phase->C->congraph();
1547     PointsToNode::EscapeState es = PointsToNode::GlobalEscape;
1548     if (cgr != NULL)
1549       es = cgr->escape_state(obj_node(), phase);
1550     if (es != PointsToNode::UnknownEscape && es != PointsToNode::GlobalEscape) {
1551       // Mark it eliminated to update any counters
1552       this->set_eliminated();
1553     }
1554   }
1555   return result;
1556 }