1 /*
   2  * Copyright (c) 2015, 2018, Oracle and/or its affiliates. All rights reserved.
   3  * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
   4  *
   5  * This code is free software; you can redistribute it and/or modify it
   6  * under the terms of the GNU General Public License version 2 only, as
   7  * published by the Free Software Foundation.
   8  *
   9  * This code is distributed in the hope that it will be useful, but WITHOUT
  10  * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
  11  * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
  12  * version 2 for more details (a copy is included in the LICENSE file that
  13  * accompanied this code).
  14  *
  15  * You should have received a copy of the GNU General Public License version
  16  * 2 along with this work; if not, write to the Free Software Foundation,
  17  * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
  18  *
  19  * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
  20  * or visit www.oracle.com if you need additional information or have any
  21  * questions.
  22  */
  23 
  24 #include "precompiled.hpp"
  25 #include "opto/compile.hpp"
  26 #include "opto/castnode.hpp"
  27 #include "opto/graphKit.hpp"
  28 #include "opto/idealKit.hpp"
  29 #include "opto/loopnode.hpp"
  30 #include "opto/macro.hpp"
  31 #include "opto/node.hpp"
  32 #include "opto/type.hpp"
  33 #include "utilities/macros.hpp"
  34 #include "gc/z/c2/zBarrierSetC2.hpp"
  35 #include "gc/z/zThreadLocalData.hpp"
  36 #include "gc/z/zBarrierSetRuntime.hpp"
  37 
  38 ZBarrierSetC2State::ZBarrierSetC2State(Arena* comp_arena)
  39   : _load_barrier_nodes(new (comp_arena) GrowableArray<LoadBarrierNode*>(comp_arena, 8,  0, NULL)) {}
  40 
  41 int ZBarrierSetC2State::load_barrier_count() const {
  42   return _load_barrier_nodes->length();
  43 }
  44 
  45 void ZBarrierSetC2State::add_load_barrier_node(LoadBarrierNode * n) {
  46   assert(!_load_barrier_nodes->contains(n), "duplicate entry in expand list");
  47   _load_barrier_nodes->append(n);
  48 }
  49 
  50 void ZBarrierSetC2State::remove_load_barrier_node(LoadBarrierNode * n) {
  51   // This function may be called twice for a node, so check
  52   // that the node is in the array before attempting to remove it.
  53   if (_load_barrier_nodes->contains(n)) {
  54     _load_barrier_nodes->remove(n);
  55   }
  56 }
  57 
  58 LoadBarrierNode* ZBarrierSetC2State::load_barrier_node(int idx) const {
  59   return _load_barrier_nodes->at(idx);
  60 }
  61 
  62 void* ZBarrierSetC2::create_barrier_state(Arena* comp_arena) const {
  63   return new(comp_arena) ZBarrierSetC2State(comp_arena);
  64 }
  65 
  66 ZBarrierSetC2State* ZBarrierSetC2::state() const {
  67   return reinterpret_cast<ZBarrierSetC2State*>(Compile::current()->barrier_set_state());
  68 }
  69 
  70 bool ZBarrierSetC2::is_gc_barrier_node(Node* node) const {
  71   return node->is_LoadBarrier();
  72 }
  73 
  74 void ZBarrierSetC2::register_potential_barrier_node(Node* node) const {
  75   if (node->is_LoadBarrier()) {
  76     state()->add_load_barrier_node(node->as_LoadBarrier());
  77   }
  78 }
  79 
  80 void ZBarrierSetC2::unregister_potential_barrier_node(Node* node) const {
  81   if (node->is_LoadBarrier()) {
  82     state()->remove_load_barrier_node(node->as_LoadBarrier());
  83   }
  84 }
  85 
  86 void ZBarrierSetC2::eliminate_useless_gc_barriers(Unique_Node_List &useful) const {
  87   // Remove useless LoadBarrier nodes
  88   ZBarrierSetC2State* s = state();
  89   for (int i = s->load_barrier_count()-1; i >= 0; i--) {
  90     LoadBarrierNode* n = s->load_barrier_node(i);
  91     if (!useful.member(n)) {
  92       unregister_potential_barrier_node(n);
  93     }
  94   }
  95 }
  96 
  97 void ZBarrierSetC2::enqueue_useful_gc_barrier(Unique_Node_List &worklist, Node* node) const {
  98   if (node->is_LoadBarrier() && !node->as_LoadBarrier()->has_true_uses()) {
  99     worklist.push(node);
 100   }
 101 }
 102 
 103 void ZBarrierSetC2::find_dominating_barriers(PhaseIterGVN& igvn) {
 104   // Look for dominating barriers on the same address only once all
 105   // other loop opts are over: loop opts may cause a safepoint to be
 106   // inserted between a barrier and its dominating barrier.
 107   Compile* C = Compile::current();
 108   ZBarrierSetC2* bs = (ZBarrierSetC2*)BarrierSet::barrier_set()->barrier_set_c2();
 109   ZBarrierSetC2State* s = bs->state();
 110   if (s->load_barrier_count() >= 2) {
 111     Compile::TracePhase tp("idealLoop", &C->timers[Phase::_t_idealLoop]);
 112     PhaseIdealLoop ideal_loop(igvn, true, false, true);
 113     if (C->major_progress()) C->print_method(PHASE_PHASEIDEALLOOP_ITERATIONS, 2);
 114   }
 115 }
 116 
 117 void ZBarrierSetC2::add_users_to_worklist(Unique_Node_List* worklist) const {
 118   // Permanent temporary workaround
 119   // Load barriers may have non-obvious dead uses keeping them alive during parsing. The use is
 120   // removed by RemoveUseless (after parsing, before optimize), but the barriers won't be added to
 121   // the worklist. Unless we add them explicitly, they are not guaranteed to end up there.
 122   ZBarrierSetC2State* s = state();
 123 
 124   for (int i = 0; i < s->load_barrier_count(); i++) {
 125     LoadBarrierNode* n = s->load_barrier_node(i);
 126     worklist->push(n);
 127   }
 128 }
 129 
 130 const TypeFunc* ZBarrierSetC2::load_barrier_Type() const {
 131   const Type** fields;
 132 
 133   // Create input types (domain)
 134   fields = TypeTuple::fields(2);
 135   fields[TypeFunc::Parms+0] = TypeInstPtr::NOTNULL;
 136   fields[TypeFunc::Parms+1] = TypeOopPtr::BOTTOM;
 137   const TypeTuple *domain = TypeTuple::make(TypeFunc::Parms+2, fields);
 138 
 139   // Create result type (range)
 140   fields = TypeTuple::fields(1);
 141   fields[TypeFunc::Parms+0] = TypeInstPtr::BOTTOM;
 142   const TypeTuple *range = TypeTuple::make(TypeFunc::Parms+1, fields);
 143 
 144   return TypeFunc::make(domain, range);
 145 }
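
// For reference, the TypeFunc built above models the C calling convention of the
// barrier slow path used by the expanded barriers further down (see
// expand_loadbarrier_basic()): one oop argument (the just-loaded value), one
// address argument (the field, may be null), and an oop result (the healed
// value). A sketch of the corresponding runtime entry point, assuming the usual
// shape of the ZBarrierSetRuntime preloaded-field routines:
//
//   // oopDesc* ZBarrierSetRuntime::load_barrier_on_oop_field_preloaded(oopDesc* o, oop* p);
//   //   o - the potentially stale oop that was just loaded
//   //   p - the field address used to write back the healed oop (null: no writeback)
//   //   returns the healed (good) oop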
 146 
 147 // == LoadBarrierNode ==
 148 
 149 LoadBarrierNode::LoadBarrierNode(Compile* C,
 150                                  Node* c,
 151                                  Node* mem,
 152                                  Node* val,
 153                                  Node* adr,
 154                                  bool weak,
 155                                  bool writeback,
 156                                  bool oop_reload_allowed) :
 157     MultiNode(Number_of_Inputs),
 158     _weak(weak),
 159     _writeback(writeback),
 160     _oop_reload_allowed(oop_reload_allowed) {
 161   init_req(Control, c);
 162   init_req(Memory, mem);
 163   init_req(Oop, val);
 164   init_req(Address, adr);
 165   init_req(Similar, C->top());
 166 
 167   init_class_id(Class_LoadBarrier);
 168   BarrierSetC2* bs = BarrierSet::barrier_set()->barrier_set_c2();
 169   bs->register_potential_barrier_node(this);
 170 }
 171 
 172 const Type *LoadBarrierNode::bottom_type() const {
 173   const Type** floadbarrier = (const Type **)(Compile::current()->type_arena()->Amalloc_4((Number_of_Outputs)*sizeof(Type*)));
 174   Node* in_oop = in(Oop);
 175   floadbarrier[Control] = Type::CONTROL;
 176   floadbarrier[Memory] = Type::MEMORY;
 177   floadbarrier[Oop] = in_oop == NULL ? Type::TOP : in_oop->bottom_type();
 178   return TypeTuple::make(Number_of_Outputs, floadbarrier);
 179 }
 180 
 181 const Type *LoadBarrierNode::Value(PhaseGVN *phase) const {
 182   const Type** floadbarrier = (const Type **)(phase->C->type_arena()->Amalloc_4((Number_of_Outputs)*sizeof(Type*)));
 183   const Type* val_t = phase->type(in(Oop));
 184   floadbarrier[Control] = Type::CONTROL;
 185   floadbarrier[Memory] = Type::MEMORY;
 186   floadbarrier[Oop] = val_t;
 187   return TypeTuple::make(Number_of_Outputs, floadbarrier);
 188 }
 189 
 190 bool LoadBarrierNode::is_dominator(PhaseIdealLoop* phase, bool linear_only, Node *d, Node *n) {
 191   if (phase != NULL) {
 192     return phase->is_dominator(d, n);
 193   }
 194 
 195   for (int i = 0; i < 10 && n != NULL; i++) {
 196     n = IfNode::up_one_dom(n, linear_only);
 197     if (n == d) {
 198       return true;
 199     }
 200   }
 201 
 202   return false;
 203 }
 204 
 205 LoadBarrierNode* LoadBarrierNode::has_dominating_barrier(PhaseIdealLoop* phase, bool linear_only, bool look_for_similar) {
 206   Node* val = in(LoadBarrierNode::Oop);
 207   if (in(Similar)->is_Proj() && in(Similar)->in(0)->is_LoadBarrier()) {
 208     LoadBarrierNode* lb = in(Similar)->in(0)->as_LoadBarrier();
 209     assert(lb->in(Address) == in(Address), "");
 210     // The load barrier on the Similar edge dominates, so if it now has the same Oop input it can replace this barrier.
 211     if (lb->in(Oop) == in(Oop)) {
 212       return lb;
 213     }
 214     // Follow the chain of load barriers through Similar edges
 215     while (!lb->in(Similar)->is_top()) {
 216       lb = lb->in(Similar)->in(0)->as_LoadBarrier();
 217       assert(lb->in(Address) == in(Address), "");
 218     }
 219     if (lb != in(Similar)->in(0)) {
 220       return lb;
 221     }
 222   }
 223   for (DUIterator_Fast imax, i = val->fast_outs(imax); i < imax; i++) {
 224     Node* u = val->fast_out(i);
 225     if (u != this && u->is_LoadBarrier() && u->in(Oop) == val && u->as_LoadBarrier()->has_true_uses()) {
 226       Node* this_ctrl = in(LoadBarrierNode::Control);
 227       Node* other_ctrl = u->in(LoadBarrierNode::Control);
 228       if (is_dominator(phase, linear_only, other_ctrl, this_ctrl)) {
 229         return u->as_LoadBarrier();
 230       }
 231     }
 232   }
 233 
 234   if (ZVerifyLoadBarriers || can_be_eliminated()) {
 235     return NULL;
 236   }
 237 
 238   if (!look_for_similar) {
 239     return NULL;
 240   }
 241 
 242   Node* addr = in(LoadBarrierNode::Address);
 243   for (DUIterator_Fast imax, i = addr->fast_outs(imax); i < imax; i++) {
 244     Node* u = addr->fast_out(i);
 245     if (u != this && u->is_LoadBarrier() && u->as_LoadBarrier()->has_true_uses()) {
 246       Node* this_ctrl = in(LoadBarrierNode::Control);
 247       Node* other_ctrl = u->in(LoadBarrierNode::Control);
 248       if (is_dominator(phase, linear_only, other_ctrl, this_ctrl)) {
 249         ResourceMark rm;
 250         Unique_Node_List wq;
 251         wq.push(in(LoadBarrierNode::Control));
 252         bool ok = true;
 253         bool dom_found = false;
 254         for (uint next = 0; next < wq.size(); ++next) {
 255           Node *n = wq.at(next);
 256           if (n->is_top()) {
 257             return NULL;
 258           }
 259           assert(n->is_CFG(), "");
 260           if (n->is_SafePoint()) {
 261             ok = false;
 262             break;
 263           }
 264           if (n == u) {
 265             dom_found = true;
 266             continue;
 267           }
 268           if (n->is_Region()) {
 269             for (uint i = 1; i < n->req(); i++) {
 270               Node* m = n->in(i);
 271               if (m != NULL) {
 272                 wq.push(m);
 273               }
 274             }
 275           } else {
 276             Node* m = n->in(0);
 277             if (m != NULL) {
 278               wq.push(m);
 279             }
 280           }
 281         }
 282         if (ok) {
 283           assert(dom_found, "");
 284           return u->as_LoadBarrier();
 285         }
 286         break;
 287       }
 288     }
 289   }
 290 
 291   return NULL;
 292 }
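
// A sketch (pseudocode only, not executable) of the acceptance condition checked
// by the CFG walk above when matching on the Address input: the candidate
// barrier u may stand in for this one only if no safepoint can be crossed
// between the two, since a safepoint would allow the GC phase - and thus which
// oop colors are considered bad - to change:
//
//   // for each CFG node n reachable from in(Control) up to (and including) u:
//   //   if (n->is_top())       return NULL;   // dead path
//   //   if (n->is_SafePoint()) return NULL;   // phase may shift, cannot reuse u
//   // return u;                               // safe to treat u as dominating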
 293 
 294 void LoadBarrierNode::push_dominated_barriers(PhaseIterGVN* igvn) const {
 295   // A change to this barrier may affect a dominated barrier, so re-push those.
 296   Node* val = in(LoadBarrierNode::Oop);
 297 
 298   for (DUIterator_Fast imax, i = val->fast_outs(imax); i < imax; i++) {
 299     Node* u = val->fast_out(i);
 300     if (u != this && u->is_LoadBarrier() && u->in(Oop) == val) {
 301       Node* this_ctrl = in(Control);
 302       Node* other_ctrl = u->in(Control);
 303       if (is_dominator(NULL, false, this_ctrl, other_ctrl)) {
 304         igvn->_worklist.push(u);
 305       }
 306     }
 307 
 308     Node* addr = in(LoadBarrierNode::Address);
 309     for (DUIterator_Fast imax, i = addr->fast_outs(imax); i < imax; i++) {
 310       Node* u = addr->fast_out(i);
 311       if (u != this && u->is_LoadBarrier() && u->in(Similar)->is_top()) {
 312         Node* this_ctrl = in(Control);
 313         Node* other_ctrl = u->in(Control);
 314         if (is_dominator(NULL, false, this_ctrl, other_ctrl)) {
 315           igvn->_worklist.push(u);
 316         }
 317       }
 318     }
 319   }
 320 }
 321 
 322 Node *LoadBarrierNode::Identity(PhaseGVN *phase) {
 323   if (!phase->C->directive()->ZOptimizeLoadBarriersOption) {
 324     return this;
 325   }
 326 
 328   LoadBarrierNode* dominating_barrier = has_dominating_barrier(NULL, true, false);
 329   if (dominating_barrier != NULL) {
 330     assert(dominating_barrier->in(Oop) == in(Oop), "");
 331     return dominating_barrier;
 332   }
 333 
 334   return this;
 335 }
 336 
 337 Node *LoadBarrierNode::Ideal(PhaseGVN *phase, bool can_reshape) {
 338   if (remove_dead_region(phase, can_reshape)) {
 339     return this;
 340   }
 341 
 342   Node* val = in(Oop);
 343   Node* mem = in(Memory);
 344   Node* ctrl = in(Control);
 345   Node* adr = in(Address);
 346   assert(val->Opcode() != Op_LoadN, "");
 347 
 348   if (mem->is_MergeMem()) {
 349     Node* new_mem = mem->as_MergeMem()->memory_at(Compile::AliasIdxRaw);
 350     set_req(Memory, new_mem);
 351     if (mem->outcnt() == 0 && can_reshape) {
 352       phase->is_IterGVN()->_worklist.push(mem);
 353     }
 354 
 355     return this;
 356   }
 357 
 358   bool optimizeLoadBarriers = phase->C->directive()->ZOptimizeLoadBarriersOption;
 359   LoadBarrierNode* dominating_barrier = optimizeLoadBarriers ? has_dominating_barrier(NULL, !can_reshape, !phase->C->major_progress()) : NULL;
 360   if (dominating_barrier != NULL && dominating_barrier->in(Oop) != in(Oop)) {
 361     assert(in(Address) == dominating_barrier->in(Address), "");
 362     set_req(Similar, dominating_barrier->proj_out(Oop));
 363     return this;
 364   }
 365 
 366   bool eliminate = (optimizeLoadBarriers && !(val->is_Phi() || val->Opcode() == Op_LoadP || val->Opcode() == Op_GetAndSetP || val->is_DecodeN())) ||
 367                    (can_reshape && (dominating_barrier != NULL || !has_true_uses()));
 368 
 369   if (eliminate) {
 370     if (can_reshape) {
 371       PhaseIterGVN* igvn = phase->is_IterGVN();
 372       Node* out_ctrl = proj_out_or_null(Control);
 373       Node* out_res = proj_out_or_null(Oop);
 374 
 375       if (out_ctrl != NULL) {
 376         igvn->replace_node(out_ctrl, ctrl);
 377       }
 378 
 379       // That transformation may cause the Similar edge on the load barrier to be invalid
 380       fix_similar_in_uses(igvn);
 381       if (out_res != NULL) {
 382         if (dominating_barrier != NULL) {
 383           igvn->replace_node(out_res, dominating_barrier->proj_out(Oop));
 384         } else {
 385           igvn->replace_node(out_res, val);
 386         }
 387       }
 388     }
 389 
 390     return new ConINode(TypeInt::ZERO);
 391   }
 392 
 393   // If the Similar edge is no longer a load barrier, clear it
 394   Node* similar = in(Similar);
 395   if (!similar->is_top() && !(similar->is_Proj() && similar->in(0)->is_LoadBarrier())) {
 396     set_req(Similar, phase->C->top());
 397     return this;
 398   }
 399 
 400   if (can_reshape) {
 401     // If this barrier is linked through the Similar edge by a
 402     // dominated barrier and both barriers have the same Oop field,
 403     // the dominated barrier can go away, so push it for reprocessing.
 404     // We also want to avoid having a barrier depend on another dominating
 405     // barrier through its Similar edge when that barrier itself depends on
 406     // yet another barrier through its Similar edge; instead, the first
 407     // should depend directly on the third.
 408     PhaseIterGVN* igvn = phase->is_IterGVN();
 409     Node* out_res = proj_out(Oop);
 410     for (DUIterator_Fast imax, i = out_res->fast_outs(imax); i < imax; i++) {
 411       Node* u = out_res->fast_out(i);
 412       if (u->is_LoadBarrier() && u->in(Similar) == out_res &&
 413           (u->in(Oop) == val || !u->in(Similar)->is_top())) {
 414         igvn->_worklist.push(u);
 415       }
 416     }
 417 
 418     push_dominated_barriers(igvn);
 419   }
 420 
 421   return NULL;
 422 }
 423 
 424 void LoadBarrierNode::fix_similar_in_uses(PhaseIterGVN* igvn) {
 425   Node* out_res = proj_out_or_null(Oop);
 426   if (out_res == NULL) {
 427     return;
 428   }
 429 
 430   for (DUIterator_Fast imax, i = out_res->fast_outs(imax); i < imax; i++) {
 431     Node* u = out_res->fast_out(i);
 432     if (u->is_LoadBarrier() && u->in(Similar) == out_res) {
 433       igvn->replace_input_of(u, Similar, igvn->C->top());
 434       --i;
 435       --imax;
 436     }
 437   }
 438 }
 439 
 440 bool LoadBarrierNode::has_true_uses() const {
 441   Node* out_res = proj_out_or_null(Oop);
 442   if (out_res == NULL) {
 443     return false;
 444   }
 445 
 446   for (DUIterator_Fast imax, i = out_res->fast_outs(imax); i < imax; i++) {
 447     Node* u = out_res->fast_out(i);
 448     if (!u->is_LoadBarrier() || u->in(Similar) != out_res) {
 449       return true;
 450     }
 451   }
 452 
 453   return false;
 454 }
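
// Example of the distinction made above (a sketch, not real IR): uses of the Oop
// projection that are merely Similar back-references from other barriers do not
// count, so
//
//   LoadBarrier#1.Oop --> LoadBarrier#2.in(Similar)   // not a true use
//   LoadBarrier#1.Oop --> StoreP.in(ValueIn)          // a true use
//
// A barrier whose projection only feeds Similar edges produces no program-visible
// value and is a candidate for elimination.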
 455 
 456 // == Accesses ==
 457 
 458 Node* ZBarrierSetC2::make_cas_loadbarrier(C2AtomicAccess& access) const {
 459   assert(!UseCompressedOops, "Not allowed");
 460   CompareAndSwapNode* cas = (CompareAndSwapNode*)access.raw_access();
 461   PhaseGVN& gvn = access.kit()->gvn();
 462   Compile* C = Compile::current();
 463   GraphKit* kit = access.kit();
 464 
 465   Node* in_ctrl     = cas->in(MemNode::Control);
 466   Node* in_mem      = cas->in(MemNode::Memory);
 467   Node* in_adr      = cas->in(MemNode::Address);
 468   Node* in_val      = cas->in(MemNode::ValueIn);
 469   Node* in_expected = cas->in(LoadStoreConditionalNode::ExpectedIn);
 470 
 471   float likely                   = PROB_LIKELY(0.999);
 472 
 473   const TypePtr *adr_type        = gvn.type(in_adr)->isa_ptr();
 474   Compile::AliasType* alias_type = C->alias_type(adr_type);
 475   int alias_idx                  = C->get_alias_index(adr_type);
 476 
 477   // Outer check - true: continue, false: load and check
 478   Node* region   = new RegionNode(3);
 479   Node* phi      = new PhiNode(region, TypeInt::BOOL);
 480   Node* phi_mem  = new PhiNode(region, Type::MEMORY, adr_type);
 481 
 482   // Inner check - is the healed ref equal to the expected value?
 483   Node* region2  = new RegionNode(3);
 484   Node* phi2     = new PhiNode(region2, TypeInt::BOOL);
 485   Node* phi_mem2 = new PhiNode(region2, Type::MEMORY, adr_type);
 486 
 487   // CAS node returns 0 or 1
 488   Node* cmp     = gvn.transform(new CmpINode(cas, kit->intcon(0)));
 489   Node* bol     = gvn.transform(new BoolNode(cmp, BoolTest::ne))->as_Bool();
 490   IfNode* iff   = gvn.transform(new IfNode(in_ctrl, bol, likely, COUNT_UNKNOWN))->as_If();
 491   Node* then    = gvn.transform(new IfTrueNode(iff));
 492   Node* elsen   = gvn.transform(new IfFalseNode(iff));
 493 
 494   Node* scmemproj1   = gvn.transform(new SCMemProjNode(cas));
 495 
 496   kit->set_memory(scmemproj1, alias_idx);
 497   phi_mem->init_req(1, scmemproj1);
 498   phi_mem2->init_req(2, scmemproj1);
 499 
 500   // CAS fail - reload and heal oop
 501   Node* reload      = kit->make_load(elsen, in_adr, TypeOopPtr::BOTTOM, T_OBJECT, MemNode::unordered);
 502   Node* barrier     = gvn.transform(new LoadBarrierNode(C, elsen, scmemproj1, reload, in_adr, false, true, false));
 503   Node* barrierctrl = gvn.transform(new ProjNode(barrier, LoadBarrierNode::Control));
 504   Node* barrierdata = gvn.transform(new ProjNode(barrier, LoadBarrierNode::Oop));
 505 
 506   // Check load
 507   Node* tmpX    = gvn.transform(new CastP2XNode(NULL, barrierdata));
 508   Node* in_expX = gvn.transform(new CastP2XNode(NULL, in_expected));
 509   Node* cmp2    = gvn.transform(new CmpXNode(tmpX, in_expX));
 510   Node *bol2    = gvn.transform(new BoolNode(cmp2, BoolTest::ne))->as_Bool();
 511   IfNode* iff2  = gvn.transform(new IfNode(barrierctrl, bol2, likely, COUNT_UNKNOWN))->as_If();
 512   Node* then2   = gvn.transform(new IfTrueNode(iff2));
 513   Node* elsen2  = gvn.transform(new IfFalseNode(iff2));
 514 
 515   // redo CAS
 516   Node* cas2       = gvn.transform(new CompareAndSwapPNode(elsen2, kit->memory(alias_idx), in_adr, in_val, in_expected, cas->order()));
 517   Node* scmemproj2 = gvn.transform(new SCMemProjNode(cas2));
 518   kit->set_control(elsen2);
 519   kit->set_memory(scmemproj2, alias_idx);
 520 
 521   // Merge inner flow - check if the healed oop was equal to the expected value.
 522   region2->set_req(1, kit->control());
 523   region2->set_req(2, then2);
 524   phi2->set_req(1, cas2);
 525   phi2->set_req(2, kit->intcon(0));
 526   phi_mem2->init_req(1, scmemproj2);
 527   kit->set_memory(phi_mem2, alias_idx);
 528 
 529   // Merge outer flow - then check if the first CAS succeeded
 530   region->set_req(1, then);
 531   region->set_req(2, region2);
 532   phi->set_req(1, kit->intcon(1));
 533   phi->set_req(2, phi2);
 534   phi_mem->init_req(2, phi_mem2);
 535   kit->set_memory(phi_mem, alias_idx);
 536 
 537   gvn.transform(region2);
 538   gvn.transform(phi2);
 539   gvn.transform(phi_mem2);
 540   gvn.transform(region);
 541   gvn.transform(phi);
 542   gvn.transform(phi_mem);
 543 
 544   kit->set_control(region);
 545   kit->insert_mem_bar(Op_MemBarCPUOrder);
 546 
 547   return phi;
 548 }
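
// The graph built above corresponds roughly to the following control flow, where
// heal() stands for the expanded load barrier (a sketch, not the emitted IR):
//
//   bool cas_bool(oop* adr, oop expected, oop new_val) {
//     if (CAS(adr, expected, new_val)) {        // first attempt
//       return true;
//     }
//     oop witness = heal(*adr, adr);            // CAS failed: reload and heal
//     if (witness != expected) {
//       return false;                           // genuine failure
//     }
//     return CAS(adr, expected, new_val);       // only the color differed: retry
//   }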
 549 
 550 Node* ZBarrierSetC2::make_cmpx_loadbarrier(C2AtomicAccess& access) const {
 551   CompareAndExchangePNode* cmpx = (CompareAndExchangePNode*)access.raw_access();
 552   GraphKit* kit = access.kit();
 553   PhaseGVN& gvn = kit->gvn();
 554   Compile* C = Compile::current();
 555 
 556   Node* in_ctrl     = cmpx->in(MemNode::Control);
 557   Node* in_mem      = cmpx->in(MemNode::Memory);
 558   Node* in_adr      = cmpx->in(MemNode::Address);
 559   Node* in_val      = cmpx->in(MemNode::ValueIn);
 560   Node* in_expected = cmpx->in(LoadStoreConditionalNode::ExpectedIn);
 561 
 562   float likely                   = PROB_LIKELY(0.999);
 563 
 564   const TypePtr *adr_type        = cmpx->get_ptr_type();
 565   Compile::AliasType* alias_type = C->alias_type(adr_type);
 566   int alias_idx                  = C->get_alias_index(adr_type);
 567 
 568   // Outer check - true: continue, false: load and check
 569   Node* region  = new RegionNode(3);
 570   Node* phi     = new PhiNode(region, adr_type);
 571 
 572   // Inner check - is the healed ref equal to the expected value?
 573   Node* region2 = new RegionNode(3);
 574   Node* phi2    = new PhiNode(region2, adr_type);
 575 
 576   // Check if the cmpx succeeded
 577   Node* cmp     = gvn.transform(new CmpPNode(cmpx, in_expected));
 578   Node* bol     = gvn.transform(new BoolNode(cmp, BoolTest::eq))->as_Bool();
 579   IfNode* iff   = gvn.transform(new IfNode(in_ctrl, bol, likely, COUNT_UNKNOWN))->as_If();
 580   Node* then    = gvn.transform(new IfTrueNode(iff));
 581   Node* elsen   = gvn.transform(new IfFalseNode(iff));
 582 
 583   Node* scmemproj1  = gvn.transform(new SCMemProjNode(cmpx));
 584   kit->set_memory(scmemproj1, alias_idx);
 585 
 586   // CAS fail - reload and heal oop
 587   Node* reload      = kit->make_load(elsen, in_adr, TypeOopPtr::BOTTOM, T_OBJECT, MemNode::unordered);
 588   Node* barrier     = gvn.transform(new LoadBarrierNode(C, elsen, scmemproj1, reload, in_adr, false, true, false));
 589   Node* barrierctrl = gvn.transform(new ProjNode(barrier, LoadBarrierNode::Control));
 590   Node* barrierdata = gvn.transform(new ProjNode(barrier, LoadBarrierNode::Oop));
 591 
 592   // Check load
 593   Node* tmpX    = gvn.transform(new CastP2XNode(NULL, barrierdata));
 594   Node* in_expX = gvn.transform(new CastP2XNode(NULL, in_expected));
 595   Node* cmp2    = gvn.transform(new CmpXNode(tmpX, in_expX));
 596   Node *bol2    = gvn.transform(new BoolNode(cmp2, BoolTest::ne))->as_Bool();
 597   IfNode* iff2  = gvn.transform(new IfNode(barrierctrl, bol2, likely, COUNT_UNKNOWN))->as_If();
 598   Node* then2   = gvn.transform(new IfTrueNode(iff2));
 599   Node* elsen2  = gvn.transform(new IfFalseNode(iff2));
 600 
 601   // Redo CAS
 602   Node* cmpx2      = gvn.transform(new CompareAndExchangePNode(elsen2, kit->memory(alias_idx), in_adr, in_val, in_expected, adr_type, cmpx->get_ptr_type(), cmpx->order()));
 603   Node* scmemproj2 = gvn.transform(new SCMemProjNode(cmpx2));
 604   kit->set_control(elsen2);
 605   kit->set_memory(scmemproj2, alias_idx);
 606 
 607   // Merge inner flow - check if the healed oop was equal to the expected value.
 608   region2->set_req(1, kit->control());
 609   region2->set_req(2, then2);
 610   phi2->set_req(1, cmpx2);
 611   phi2->set_req(2, barrierdata);
 612 
 613   // Merge outer flow - then check if the first CAS succeeded
 614   region->set_req(1, then);
 615   region->set_req(2, region2);
 616   phi->set_req(1, cmpx);
 617   phi->set_req(2, phi2);
 618 
 619   gvn.transform(region2);
 620   gvn.transform(phi2);
 621   gvn.transform(region);
 622   gvn.transform(phi);
 623 
 624   kit->set_control(region);
 625   kit->set_memory(in_mem, alias_idx);
 626   kit->insert_mem_bar(Op_MemBarCPUOrder);
 627 
 628   return phi;
 629 }
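
// Same idea as make_cas_loadbarrier() above, but the oop value itself is merged
// instead of a boolean (a sketch, with heal() again standing for the expanded
// load barrier):
//
//   oop cas_val(oop* adr, oop expected, oop new_val) {
//     oop prev = CMPX(adr, expected, new_val);
//     if (prev == expected) {
//       return prev;                            // success
//     }
//     oop witness = heal(*adr, adr);            // reload and heal
//     if (witness != expected) {
//       return witness;                         // genuine failure
//     }
//     return CMPX(adr, expected, new_val);      // only the color differed: retry
//   }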
 630 
 631 Node* ZBarrierSetC2::load_barrier(GraphKit* kit, Node* val, Node* adr, bool weak, bool writeback, bool oop_reload_allowed) const {
 632   PhaseGVN& gvn = kit->gvn();
 633   Node* barrier = new LoadBarrierNode(Compile::current(), kit->control(), kit->memory(TypeRawPtr::BOTTOM), val, adr, weak, writeback, oop_reload_allowed);
 634   Node* transformed_barrier = gvn.transform(barrier);
 635 
 636   if (transformed_barrier->is_LoadBarrier()) {
 637     if (barrier == transformed_barrier) {
 638       kit->set_control(gvn.transform(new ProjNode(barrier, LoadBarrierNode::Control)));
 639     }
 640     return gvn.transform(new ProjNode(transformed_barrier, LoadBarrierNode::Oop));
 641   } else {
 642     return val;
 643   }
 644 }
 645 
 646 static bool barrier_needed(C2Access access) {
 647   return ZBarrierSet::barrier_needed(access.decorators(), access.type());
 648 }
 649 
 650 Node* ZBarrierSetC2::load_at_resolved(C2Access& access, const Type* val_type) const {
 651   Node* p = BarrierSetC2::load_at_resolved(access, val_type);
 652   if (!barrier_needed(access)) {
 653     return p;
 654   }
 655 
 656   bool conc_root = (access.decorators() & IN_CONCURRENT_ROOT) != 0;
 657   bool weak = (access.decorators() & ON_WEAK_OOP_REF) != 0;
 658 
 659   GraphKit* kit = access.kit();
 660   PhaseGVN& gvn = kit->gvn();
 661   Node* adr = access.addr().node();
 662   Node* heap_base_oop = access.base();
 663   bool unsafe = (access.decorators() & C2_UNSAFE_ACCESS) != 0;
 664   if (unsafe) {
 665     if (!ZVerifyLoadBarriers) {
 666       p = load_barrier(kit, p, adr);
 667     } else {
 668       if (!TypePtr::NULL_PTR->higher_equal(gvn.type(heap_base_oop))) {
 669         p = load_barrier(kit, p, adr);
 670       } else {
 671         IdealKit ideal(kit);
 672         IdealVariable res(ideal);
 673 #define __ ideal.
 674         __ declarations_done();
 675         __ set(res, p);
 676         __ if_then(heap_base_oop, BoolTest::ne, kit->null(), PROB_UNLIKELY(0.999)); {
 677           kit->sync_kit(ideal);
 678           p = load_barrier(kit, p, adr);
 679           __ set(res, p);
 680           __ sync_kit(kit);
 681         } __ end_if();
 682         kit->final_sync(ideal);
 683         p = __ value(res);
 684 #undef __
 685       }
 686     }
 687     return p;
 688   } else {
 689     return load_barrier(access.kit(), p, access.addr().node(), weak, true, true);
 690   }
 691 }
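
// The IdealKit block above is only reached with ZVerifyLoadBarriers: for an
// unsafe access whose base might be null (i.e. possibly an off-heap access), the
// barrier is applied only when the base is a real object at runtime. Roughly (a
// sketch of the emitted shape, not literal code):
//
//   oop p = <raw load>;
//   if (heap_base_oop != NULL) {   // only heap oops can carry a bad color
//     p = load_barrier(p, adr);
//   }
//   return p;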
 692 
 693 Node* ZBarrierSetC2::atomic_cmpxchg_val_at_resolved(C2AtomicAccess& access, Node* expected_val,
 694                                                     Node* new_val, const Type* val_type) const {
 695   Node* result = BarrierSetC2::atomic_cmpxchg_val_at_resolved(access, expected_val, new_val, val_type);
 696   if (!barrier_needed(access)) {
 697     return result;
 698   }
 699 
 700   access.set_needs_pinning(false);
 701   return make_cmpx_loadbarrier(access);
 702 }
 703 
 704 Node* ZBarrierSetC2::atomic_cmpxchg_bool_at_resolved(C2AtomicAccess& access, Node* expected_val,
 705                                                      Node* new_val, const Type* value_type) const {
 706   Node* result = BarrierSetC2::atomic_cmpxchg_bool_at_resolved(access, expected_val, new_val, value_type);
 707   if (!barrier_needed(access)) {
 708     return result;
 709   }
 710 
 711   Node* load_store = access.raw_access();
 712   bool weak_cas = (access.decorators() & C2_WEAK_CMPXCHG) != 0;
 713   bool expected_is_null = (expected_val->get_ptr_type() == TypePtr::NULL_PTR);
 714 
 715   if (!expected_is_null) {
 716     if (weak_cas) {
 717       access.set_needs_pinning(false);
 718       load_store = make_cas_loadbarrier(access);
 719     } else {
 720       access.set_needs_pinning(false);
 721       load_store = make_cas_loadbarrier(access);
 722     }
 723   }
 724 
 725   return load_store;
 726 }
 727 
 728 Node* ZBarrierSetC2::atomic_xchg_at_resolved(C2AtomicAccess& access, Node* new_val, const Type* val_type) const {
 729   Node* result = BarrierSetC2::atomic_xchg_at_resolved(access, new_val, val_type);
 730   if (!barrier_needed(access)) {
 731     return result;
 732   }
 733 
 734   Node* load_store = access.raw_access();
 735   Node* adr = access.addr().node();
 736 
 737   return load_barrier(access.kit(), load_store, adr, false, false, false);
 738 }
 739 
 740 // == Macro Expansion ==
 741 
 742 void ZBarrierSetC2::expand_loadbarrier_node(PhaseMacroExpand* phase, LoadBarrierNode* barrier) const {
 743   Node* in_ctrl = barrier->in(LoadBarrierNode::Control);
 744   Node* in_mem  = barrier->in(LoadBarrierNode::Memory);
 745   Node* in_val  = barrier->in(LoadBarrierNode::Oop);
 746   Node* in_adr  = barrier->in(LoadBarrierNode::Address);
 747 
 748   Node* out_ctrl = barrier->proj_out(LoadBarrierNode::Control);
 749   Node* out_res  = barrier->proj_out(LoadBarrierNode::Oop);
 750 
 751   PhaseIterGVN &igvn = phase->igvn();
 752 
 753   if (ZVerifyLoadBarriers) {
 754     igvn.replace_node(out_res, in_val);
 755     igvn.replace_node(out_ctrl, in_ctrl);
 756     return;
 757   }
 758 
 759   if (barrier->can_be_eliminated()) {
 760     // Clone and pin the load for this barrier below the dominating
 761     // barrier: the load cannot be allowed to float above the
 762     // dominating barrier
 763     Node* load = in_val;
 764     Node* decode = NULL;
 765     if (load->is_DecodeN()) {
 766       decode = load;
 767       load = load->in(1);
 768     }
 769     if (load->is_Load()) {
 770       Node* new_load = load->clone();
 771       Node* addp = new_load->in(MemNode::Address);
 772       assert(addp->is_AddP() || addp->is_Phi(), "bad address");
 773       Node* cast = new CastPPNode(addp, igvn.type(addp), true);
 774       Node* ctrl = NULL;
 775       Node* similar = barrier->in(LoadBarrierNode::Similar);
 776       if (similar->is_Phi()) {
 777         // already expanded
 778         ctrl = similar->in(0);
 779       } else {
 780         assert(similar->is_Proj() && similar->in(0)->is_LoadBarrier(), "unexpected graph shape");
 781         ctrl = similar->in(0)->as_LoadBarrier()->proj_out(LoadBarrierNode::Control);
 782       }
 783       assert(ctrl != NULL, "bad control");
 784       cast->set_req(0, ctrl);
 785       igvn.transform(cast);
 786       new_load->set_req(MemNode::Address, cast);
 787       igvn.transform(new_load);
 788 
 789       Node* new_in_val = new_load;
 790       if (decode != NULL) {
 791         new_in_val = decode->clone();
 792         new_in_val->set_req(1, new_load);
 793         igvn.transform(new_in_val);
 794       }
 795 
 796       igvn.replace_node(out_res, new_in_val);
 797       igvn.replace_node(out_ctrl, in_ctrl);
 798       return;
 799     }
 800     // cannot eliminate
 801   }
 802 
 803   // There are two cases that require the basic load barrier
 804   // 1) When the writeback of a healed oop must be avoided (swap)
 805   // 2) When we must guarantee that no reload is done (swap, cas, cmpx)
 806   if (!barrier->is_writeback()) {
 807     assert(!barrier->oop_reload_allowed(), "non-writeback barriers must not allow oop reload");
 808   }
 809 
 810   if (!barrier->oop_reload_allowed()) {
 811     expand_loadbarrier_basic(phase, barrier);
 812   } else {
 813     expand_loadbarrier_optimized(phase, barrier);
 814   }
 815 }
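
// Summary of the choice made above (informal):
//
//   oop_reload_allowed   expansion
//   ------------------   -----------------------------------------------------
//   false                expand_loadbarrier_basic():     test + leaf call, the
//                        slow path never re-reads the field (swap/cas/cmpx)
//   true                 expand_loadbarrier_optimized(): test + register-
//                        specialized stub, the slow path may reload the oop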
 816 
 817 // Basic load barrier using conventional argument passing
 818 void ZBarrierSetC2::expand_loadbarrier_basic(PhaseMacroExpand* phase, LoadBarrierNode *barrier) const {
 819   PhaseIterGVN &igvn = phase->igvn();
 820 
 821   Node* in_ctrl = barrier->in(LoadBarrierNode::Control);
 822   Node* in_mem  = barrier->in(LoadBarrierNode::Memory);
 823   Node* in_val  = barrier->in(LoadBarrierNode::Oop);
 824   Node* in_adr  = barrier->in(LoadBarrierNode::Address);
 825 
 826   Node* out_ctrl = barrier->proj_out(LoadBarrierNode::Control);
 827   Node* out_res  = barrier->proj_out(LoadBarrierNode::Oop);
 828 
 829   float unlikely  = PROB_UNLIKELY(0.999);
 830   const Type* in_val_maybe_null_t = igvn.type(in_val);
 831 
 832   Node* jthread = igvn.transform(new ThreadLocalNode());
 833   Node* adr = phase->basic_plus_adr(jthread, in_bytes(ZThreadLocalData::address_bad_mask_offset()));
 834   Node* bad_mask = igvn.transform(LoadNode::make(igvn, in_ctrl, in_mem, adr, TypeRawPtr::BOTTOM, TypeX_X, TypeX_X->basic_type(), MemNode::unordered));
 835   Node* cast = igvn.transform(new CastP2XNode(in_ctrl, in_val));
 836   Node* obj_masked = igvn.transform(new AndXNode(cast, bad_mask));
 837   Node* cmp = igvn.transform(new CmpXNode(obj_masked, igvn.zerocon(TypeX_X->basic_type())));
 838   Node *bol = igvn.transform(new BoolNode(cmp, BoolTest::ne))->as_Bool();
 839   IfNode* iff = igvn.transform(new IfNode(in_ctrl, bol, unlikely, COUNT_UNKNOWN))->as_If();
 840   Node* then = igvn.transform(new IfTrueNode(iff));
 841   Node* elsen = igvn.transform(new IfFalseNode(iff));
 842 
 843   Node* result_region;
 844   Node* result_val;
 845 
 846   result_region = new RegionNode(3);
 847   result_val = new PhiNode(result_region, TypeInstPtr::BOTTOM);
 848 
 849   result_region->set_req(1, elsen);
 850   Node* res = igvn.transform(new CastPPNode(in_val, in_val_maybe_null_t));
 851   res->init_req(0, elsen);
 852   result_val->set_req(1, res);
 853 
 854   const TypeFunc *tf = load_barrier_Type();
 855   Node* call;
 856   if (barrier->is_weak()) {
 857     call = new CallLeafNode(tf,
 858                             ZBarrierSetRuntime::load_barrier_on_weak_oop_field_preloaded_addr(),
 859                             "ZBarrierSetRuntime::load_barrier_on_weak_oop_field_preloaded",
 860                             TypeRawPtr::BOTTOM);
 861   } else {
 862     call = new CallLeafNode(tf,
 863                             ZBarrierSetRuntime::load_barrier_on_oop_field_preloaded_addr(),
 864                             "ZBarrierSetRuntime::load_barrier_on_oop_field_preloaded",
 865                             TypeRawPtr::BOTTOM);
 866   }
 867 
 868   call->init_req(TypeFunc::Control, then);
 869   call->init_req(TypeFunc::I_O    , phase->top());
 870   call->init_req(TypeFunc::Memory , in_mem);
 871   call->init_req(TypeFunc::FramePtr, phase->top());
 872   call->init_req(TypeFunc::ReturnAdr, phase->top());
 873   call->init_req(TypeFunc::Parms+0, in_val);
 874   if (barrier->is_writeback()) {
 875     call->init_req(TypeFunc::Parms+1, in_adr);
 876   } else {
 877     // when slow path is called with a null adr, the healed oop will not be written back
 878     call->init_req(TypeFunc::Parms+1, igvn.zerocon(T_OBJECT));
 879   }
 880   call = igvn.transform(call);
 881 
 882   Node* ctrl = igvn.transform(new ProjNode(call, TypeFunc::Control));
 883   res = igvn.transform(new ProjNode(call, TypeFunc::Parms));
 884   res = igvn.transform(new CheckCastPPNode(ctrl, res, in_val_maybe_null_t));
 885 
 886   result_region->set_req(2, ctrl);
 887   result_val->set_req(2, res);
 888 
 889   result_region = igvn.transform(result_region);
 890   result_val = igvn.transform(result_val);
 891 
 892   if (out_ctrl != NULL) {
 893     igvn.replace_node(out_ctrl, result_region);
 894   }
 895   igvn.replace_node(out_res, result_val);
 896 }
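
// Conceptually, the graph built above implements the standard ZGC load barrier
// fast-path/slow-path split (a sketch, not the emitted IR):
//
//   uintptr_t bad_mask = <load from ZThreadLocalData::address_bad_mask_offset()>;
//   if (((uintptr_t)val & bad_mask) != 0) {
//     // Slow path: leaf call that heals the oop and, when adr was passed,
//     // writes the healed oop back to the field. Weak barriers use the
//     // load_barrier_on_weak_oop_field_preloaded entry point instead.
//     val = ZBarrierSetRuntime::load_barrier_on_oop_field_preloaded(val, adr);
//   }
//   // val is now a good oop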
 897 
 898 // Optimized, low-spill load barrier variant using a stub specialized on the register used
 899 void ZBarrierSetC2::expand_loadbarrier_optimized(PhaseMacroExpand* phase, LoadBarrierNode *barrier) const {
 900   PhaseIterGVN &igvn = phase->igvn();
 901 #ifdef PRINT_NODE_TRAVERSALS
 902   Node* preceding_barrier_node = barrier->in(LoadBarrierNode::Oop);
 903 #endif
 904 
 905   Node* in_ctrl = barrier->in(LoadBarrierNode::Control);
 906   Node* in_mem = barrier->in(LoadBarrierNode::Memory);
 907   Node* in_val = barrier->in(LoadBarrierNode::Oop);
 908   Node* in_adr = barrier->in(LoadBarrierNode::Address);
 909 
 910   Node* out_ctrl = barrier->proj_out(LoadBarrierNode::Control);
 911   Node* out_res = barrier->proj_out(LoadBarrierNode::Oop);
 912 
 913   assert(barrier->in(LoadBarrierNode::Oop) != NULL, "oop to loadbarrier node cannot be null");
 914 
 915 #ifdef PRINT_NODE_TRAVERSALS
 916   tty->print("\n\n\nBefore barrier optimization:\n");
 917   traverse(barrier, out_ctrl, out_res, -1);
 918 
 919   tty->print("\nBefore barrier optimization:  preceding_barrier_node\n");
 920   traverse(preceding_barrier_node, out_ctrl, out_res, -1);
 921 #endif
 922 
 923   float unlikely  = PROB_UNLIKELY(0.999);
 924 
 925   Node* jthread = igvn.transform(new ThreadLocalNode());
 926   Node* adr = phase->basic_plus_adr(jthread, in_bytes(ZThreadLocalData::address_bad_mask_offset()));
 927   Node* bad_mask = igvn.transform(LoadNode::make(igvn, in_ctrl, in_mem, adr,
 928                                                  TypeRawPtr::BOTTOM, TypeX_X, TypeX_X->basic_type(),
 929                                                  MemNode::unordered));
 930   Node* cast = igvn.transform(new CastP2XNode(in_ctrl, in_val));
 931   Node* obj_masked = igvn.transform(new AndXNode(cast, bad_mask));
 932   Node* cmp = igvn.transform(new CmpXNode(obj_masked, igvn.zerocon(TypeX_X->basic_type())));
 933   Node *bol = igvn.transform(new BoolNode(cmp, BoolTest::ne))->as_Bool();
 934   IfNode* iff = igvn.transform(new IfNode(in_ctrl, bol, unlikely, COUNT_UNKNOWN))->as_If();
 935   Node* then = igvn.transform(new IfTrueNode(iff));
 936   Node* elsen = igvn.transform(new IfFalseNode(iff));
 937 
 938   Node* slow_path_surrogate;
 939   if (!barrier->is_weak()) {
 940     slow_path_surrogate = igvn.transform(new LoadBarrierSlowRegNode(then, in_mem, in_adr, in_val->adr_type(),
 941                                                                     (const TypePtr*) in_val->bottom_type(), MemNode::unordered));
 942   } else {
 943     slow_path_surrogate = igvn.transform(new LoadBarrierWeakSlowRegNode(then, in_mem, in_adr, in_val->adr_type(),
 944                                                                         (const TypePtr*) in_val->bottom_type(), MemNode::unordered));
 945   }
 946 
 947   Node* new_loadp = slow_path_surrogate;
 949   // Create the final region/phi pair to converge control/data paths to downstream code
 950   Node* result_region = igvn.transform(new RegionNode(3));
 951   result_region->set_req(1, then);
 952   result_region->set_req(2, elsen);
 953 
 954   Node* result_phi = igvn.transform(new PhiNode(result_region, TypeInstPtr::BOTTOM));
 955   result_phi->set_req(1, new_loadp);
 956   result_phi->set_req(2, barrier->in(LoadBarrierNode::Oop));
 957 
 958   // finally, connect the original outputs to the barrier region and phi to complete the expansion/substitution
 960   if (out_ctrl != NULL) {
 961     igvn.replace_node(out_ctrl, result_region);
 962   }
 963   igvn.replace_node(out_res, result_phi);
 964 
 965   assert(barrier->outcnt() == 0, "LoadBarrier macro node has non-null outputs after expansion!");
 966 
 967 #ifdef PRINT_NODE_TRAVERSALS
 968   tty->print("\nAfter barrier optimization:  old out_ctrl\n");
 969   traverse(out_ctrl, out_ctrl, out_res, -1);
 970   tty->print("\nAfter barrier optimization:  old out_res\n");
 971   traverse(out_res, out_ctrl, out_res, -1);
 972   tty->print("\nAfter barrier optimization:  old barrier\n");
 973   traverse(barrier, out_ctrl, out_res, -1);
 974   tty->print("\nAfter barrier optimization:  preceding_barrier_node\n");
 975   traverse(preceding_barrier_node, result_region, result_phi, -1);
 976 #endif
 977 
 978   return;
 979 }
 980 
 981 bool ZBarrierSetC2::expand_macro_nodes(PhaseMacroExpand* macro) const {
 982   Compile* C = Compile::current();
 983   PhaseIterGVN &igvn = macro->igvn();
 984   ZBarrierSetC2State* s = state();
 985   if (s->load_barrier_count() > 0) {
 986 #ifdef ASSERT
 987     verify_gc_barriers(false);
 988 #endif
 989     igvn.set_delay_transform(true);
 990     int skipped = 0;
 991     while (s->load_barrier_count() > skipped) {
 992       int load_barrier_count = s->load_barrier_count();
 993       LoadBarrierNode * n = s->load_barrier_node(load_barrier_count-1-skipped);
 994       if (igvn.type(n) == Type::TOP || (n->in(0) != NULL && n->in(0)->is_top())) {
 995         // node is unreachable, so don't try to expand it
 996         s->remove_load_barrier_node(n);
 997         continue;
 998       }
 999       if (!n->can_be_eliminated()) {
1000         skipped++;
1001         continue;
1002       }
1003       expand_loadbarrier_node(macro, n);
1004       assert(s->load_barrier_count() < load_barrier_count, "must have deleted a node from load barrier list");
1005       if (C->failing())  return true;
1006     }
1007     while (s->load_barrier_count() > 0) {
1008       int load_barrier_count = s->load_barrier_count();
1009       LoadBarrierNode* n = s->load_barrier_node(load_barrier_count - 1);
1010       assert(!(igvn.type(n) == Type::TOP || (n->in(0) != NULL && n->in(0)->is_top())), "should have been processed already");
1011       assert(!n->can_be_eliminated(), "should have been processed already");
1012       expand_loadbarrier_node(macro, n);
1013       assert(s->load_barrier_count() < load_barrier_count, "must have deleted a node from load barrier list");
1014       if (C->failing())  return true;
1015     }
1016     igvn.set_delay_transform(false);
1017     igvn.optimize();
1018     if (C->failing())  return true;
1019   }
1020   return false;
1021 }
1022 
1023 // == Loop optimization ==
1024 
1025 static bool replace_with_dominating_barrier(PhaseIdealLoop* phase, LoadBarrierNode* lb, bool last_round) {
1026   PhaseIterGVN &igvn = phase->igvn();
1027   Compile* C = Compile::current();
1028 
1029   LoadBarrierNode* lb2 = lb->has_dominating_barrier(phase, false, last_round);
1030   if (lb2 != NULL) {
1031     if (lb->in(LoadBarrierNode::Oop) != lb2->in(LoadBarrierNode::Oop)) {
1032       assert(lb->in(LoadBarrierNode::Address) == lb2->in(LoadBarrierNode::Address), "");
1033       igvn.replace_input_of(lb, LoadBarrierNode::Similar, lb2->proj_out(LoadBarrierNode::Oop));
1034       C->set_major_progress();
1035     } else  {
1036       // That transformation may cause the Similar edge on dominated load barriers to be invalid
1037       lb->fix_similar_in_uses(&igvn);
1038 
1039       Node* val = lb->proj_out(LoadBarrierNode::Oop);
1040       assert(lb2->has_true_uses(), "");
1041       assert(lb2->in(LoadBarrierNode::Oop) == lb->in(LoadBarrierNode::Oop), "");
1042 
1043       phase->lazy_update(lb, lb->in(LoadBarrierNode::Control));
1044       phase->lazy_replace(lb->proj_out(LoadBarrierNode::Control), lb->in(LoadBarrierNode::Control));
1045       igvn.replace_node(val, lb2->proj_out(LoadBarrierNode::Oop));
1046 
1047       return true;
1048     }
1049   }
1050   return false;
1051 }
1052 
1053 static Node* find_dominating_memory(PhaseIdealLoop* phase, Node* mem, Node* dom, int i) {
1054   assert(dom->is_Region() || i == -1, "");
1055   Node* m = mem;
1056   while (phase->is_dominator(dom, phase->has_ctrl(m) ? phase->get_ctrl(m) : m->in(0))) {
1057     if (m->is_Mem()) {
1058       assert(m->as_Mem()->adr_type() == TypeRawPtr::BOTTOM, "");
1059       m = m->in(MemNode::Memory);
1060     } else if (m->is_MergeMem()) {
1061       m = m->as_MergeMem()->memory_at(Compile::AliasIdxRaw);
1062     } else if (m->is_Phi()) {
1063       if (m->in(0) == dom && i != -1) {
1064         m = m->in(i);
1065         break;
1066       } else {
1067         m = m->in(LoopNode::EntryControl);
1068       }
1069     } else if (m->is_Proj()) {
1070       m = m->in(0);
1071     } else if (m->is_SafePoint() || m->is_MemBar()) {
1072       m = m->in(TypeFunc::Memory);
1073     } else {
1074 #ifdef ASSERT
1075       m->dump();
1076 #endif
1077       ShouldNotReachHere();
1078     }
1079   }
1080   return m;
1081 }
1082 
1083 static LoadBarrierNode* clone_load_barrier(PhaseIdealLoop* phase, LoadBarrierNode* lb, Node* ctl, Node* mem, Node* oop_in) {
1084   PhaseIterGVN &igvn = phase->igvn();
1085   Compile* C = Compile::current();
1086   Node* the_clone = lb->clone();
1087   the_clone->set_req(LoadBarrierNode::Control, ctl);
1088   the_clone->set_req(LoadBarrierNode::Memory, mem);
1089   if (oop_in != NULL) {
1090     the_clone->set_req(LoadBarrierNode::Oop, oop_in);
1091   }
1092 
1093   LoadBarrierNode* new_lb = the_clone->as_LoadBarrier();
1094   igvn.register_new_node_with_optimizer(new_lb);
1095   IdealLoopTree *loop = phase->get_loop(new_lb->in(0));
1096   phase->set_ctrl(new_lb, new_lb->in(0));
1097   phase->set_loop(new_lb, loop);
1098   phase->set_idom(new_lb, new_lb->in(0), phase->dom_depth(new_lb->in(0))+1);
1099   if (!loop->_child) {
1100     loop->_body.push(new_lb);
1101   }
1102 
1103   Node* proj_ctl = new ProjNode(new_lb, LoadBarrierNode::Control);
1104   igvn.register_new_node_with_optimizer(proj_ctl);
1105   phase->set_ctrl(proj_ctl, proj_ctl->in(0));
1106   phase->set_loop(proj_ctl, loop);
1107   phase->set_idom(proj_ctl, new_lb, phase->dom_depth(new_lb)+1);
1108   if (!loop->_child) {
1109     loop->_body.push(proj_ctl);
1110   }
1111 
1112   Node* proj_oop = new ProjNode(new_lb, LoadBarrierNode::Oop);
1113   phase->register_new_node(proj_oop, new_lb);
1114 
1115   if (!new_lb->in(LoadBarrierNode::Similar)->is_top()) {
1116     LoadBarrierNode* similar = new_lb->in(LoadBarrierNode::Similar)->in(0)->as_LoadBarrier();
1117     if (!phase->is_dominator(similar, ctl)) {
1118       igvn.replace_input_of(new_lb, LoadBarrierNode::Similar, C->top());
1119     }
1120   }
1121 
1122   return new_lb;
1123 }
1124 
1125 static void replace_barrier(PhaseIdealLoop* phase, LoadBarrierNode* lb, Node* new_val) {
1126   PhaseIterGVN &igvn = phase->igvn();
1127   Node* val = lb->proj_out(LoadBarrierNode::Oop);
1128   igvn.replace_node(val, new_val);
1129   phase->lazy_update(lb, lb->in(LoadBarrierNode::Control));
1130   phase->lazy_replace(lb->proj_out(LoadBarrierNode::Control), lb->in(LoadBarrierNode::Control));
1131 }
1132 
1133 static bool split_barrier_thru_phi(PhaseIdealLoop* phase, LoadBarrierNode* lb) {
1134   PhaseIterGVN &igvn = phase->igvn();
1135   Compile* C = Compile::current();
1136 
1137   if (lb->in(LoadBarrierNode::Oop)->is_Phi()) {
1138     Node* oop_phi = lb->in(LoadBarrierNode::Oop);
1139 
1140     if (oop_phi->req() == 2) {
1141       // Ignore phis with only one input
1142       return false;
1143     }
1144 
1145     if (phase->is_dominator(phase->get_ctrl(lb->in(LoadBarrierNode::Address)),
1146                             oop_phi->in(0)) && phase->get_ctrl(lb->in(LoadBarrierNode::Address)) != oop_phi->in(0)) {
1147       // That transformation may cause the Similar edge on dominated load barriers to be invalid
1148       lb->fix_similar_in_uses(&igvn);
1149 
1150       RegionNode* region = oop_phi->in(0)->as_Region();
1151 
1152       int backedge = LoopNode::LoopBackControl;
1153       if (region->is_Loop() && region->in(backedge)->is_Proj() && region->in(backedge)->in(0)->is_If()) {
1154         Node* c = region->in(backedge)->in(0)->in(0);
1155         assert(c->unique_ctrl_out() == region->in(backedge)->in(0), "");
1156         Node* oop = lb->in(LoadBarrierNode::Oop)->in(backedge);
1157         Node* oop_c = phase->has_ctrl(oop) ? phase->get_ctrl(oop) : oop;
1158         if (!phase->is_dominator(oop_c, c)) {
1159           return false;
1160         }
1161       }
1162 
1163       // If the phi's input on the backedge is this barrier's own Oop projection,
1164       // we have a self loop. Don't clone - this will be folded later.
1165       if (oop_phi->in(LoopNode::LoopBackControl) == lb->proj_out(LoadBarrierNode::Oop)) {
1166         return false;
1167       }
1168 
1169       bool is_strip_mined = region->is_CountedLoop() && region->as_CountedLoop()->is_strip_mined();
1170       Node *phi = oop_phi->clone();
1171 
1172       for (uint i = 1; i < region->req(); i++) {
1173         Node* ctrl = region->in(i);
1174         if (ctrl != C->top()) {
1175           assert(!phase->is_dominator(ctrl, region) || region->is_Loop(), "");
1176 
1177           Node* mem = lb->in(LoadBarrierNode::Memory);
1178           Node* m = find_dominating_memory(phase, mem, region, i);
1179 
1180           if (region->is_Loop() && i == LoopNode::LoopBackControl && ctrl->is_Proj() && ctrl->in(0)->is_If()) {
1181             ctrl = ctrl->in(0)->in(0);
1182           } else if (region->is_Loop() && is_strip_mined) {
1183             // If this is a strip mined loop, control must move above OuterStripMinedLoop
1184             assert(i == LoopNode::EntryControl, "check");
1185             assert(ctrl->is_OuterStripMinedLoop(), "sanity");
1186             ctrl = ctrl->as_OuterStripMinedLoop()->in(LoopNode::EntryControl);
1187           }
1188 
1189           LoadBarrierNode* new_lb = clone_load_barrier(phase, lb, ctrl, m, lb->in(LoadBarrierNode::Oop)->in(i));
1190           Node* out_ctrl = new_lb->proj_out(LoadBarrierNode::Control);
1191 
1192           if (is_strip_mined && (i == LoopNode::EntryControl)) {
1193             assert(region->in(i)->is_OuterStripMinedLoop(), "");
1194             igvn.replace_input_of(region->in(i), i, out_ctrl);
1195           } else if (ctrl == region->in(i)) {
1196             igvn.replace_input_of(region, i, out_ctrl);
1197           } else {
1198             Node* iff = region->in(i)->in(0);
1199             igvn.replace_input_of(iff, 0, out_ctrl);
1200             phase->set_idom(iff, out_ctrl, phase->dom_depth(out_ctrl)+1);
1201           }
1202           phi->set_req(i, new_lb->proj_out(LoadBarrierNode::Oop));
1203         }
1204       }
1205       phase->register_new_node(phi, region);
1206       replace_barrier(phase, lb, phi);
1207 
1208       if (region->is_Loop()) {
1209         // A load barrier moved to the back edge of the loop may now
1210         // have a safepoint on the path to the barrier on its Similar
1211         // edge, so that edge must be cleared
1212         igvn.replace_input_of(phi->in(LoopNode::LoopBackControl)->in(0), LoadBarrierNode::Similar, C->top());
1213         Node* head = region->in(LoopNode::EntryControl);
1214         phase->set_idom(region, head, phase->dom_depth(head)+1);
1215         phase->recompute_dom_depth();
1216         if (head->is_CountedLoop() && head->as_CountedLoop()->is_main_loop()) {
1217           head->as_CountedLoop()->set_normal_loop();
1218         }
1219       }
1220 
1221       return true;
1222     }
1223   }
1224 
1225   return false;
1226 }
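
// The transformation above pushes the barrier through the phi so each input is
// healed on its own incoming path (a sketch of the rewrite, not real IR):
//
//   before:  x = LoadBarrier(phi(a, b))
//   after:   x = phi(LoadBarrier(a),   // clone on the path delivering a
//                    LoadBarrier(b))   // clone on the path delivering b
//
// Each clone can then be commoned, hoisted or eliminated on its own path, which
// the single barrier below the merge could not be.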
1227 
1228 static bool move_out_of_loop(PhaseIdealLoop* phase, LoadBarrierNode* lb) {
1229   PhaseIterGVN &igvn = phase->igvn();
1230   IdealLoopTree *lb_loop = phase->get_loop(lb->in(0));
1231   if (lb_loop != phase->ltree_root() && !lb_loop->_irreducible) {
1232     Node* oop_ctrl = phase->get_ctrl(lb->in(LoadBarrierNode::Oop));
1233     IdealLoopTree *oop_loop = phase->get_loop(oop_ctrl);
1234     IdealLoopTree* adr_loop = phase->get_loop(phase->get_ctrl(lb->in(LoadBarrierNode::Address)));
1235     if (!lb_loop->is_member(oop_loop) && !lb_loop->is_member(adr_loop)) {
1236       // That transformation may cause the Similar edge on dominated load barriers to be invalid
1237       lb->fix_similar_in_uses(&igvn);
1238 
1239       Node* head = lb_loop->_head;
1240       assert(head->is_Loop(), "");
1241 
1242       if (phase->is_dominator(head, oop_ctrl)) {
1243         assert(oop_ctrl->Opcode() == Op_CProj && oop_ctrl->in(0)->Opcode() == Op_NeverBranch, "");
1244         assert(lb_loop->is_member(phase->get_loop(oop_ctrl->in(0)->in(0))), "");
1245         return false;
1246       }
1247 
1248       if (head->is_CountedLoop()) {
1249         CountedLoopNode* cloop = head->as_CountedLoop();
1250         if (cloop->is_main_loop()) {
1251           cloop->set_normal_loop();
1252         }
1253         // When we are moving a barrier out of a counted loop,
1254         // make sure we move it all the way out of the strip-mined outer loop.
1255         if (cloop->is_strip_mined()) {
1256           head = cloop->outer_loop();
1257         }
1258       }
1259 
1260       Node* mem = lb->in(LoadBarrierNode::Memory);
1261       Node* m = find_dominating_memory(phase, mem, head, -1);
1262 
1263       LoadBarrierNode* new_lb = clone_load_barrier(phase, lb, head->in(LoopNode::EntryControl), m, NULL);
1264 
1265       assert(phase->idom(head) == head->in(LoopNode::EntryControl), "");
1266       Node* proj_ctl = new_lb->proj_out(LoadBarrierNode::Control);
1267       igvn.replace_input_of(head, LoopNode::EntryControl, proj_ctl);
1268       phase->set_idom(head, proj_ctl, phase->dom_depth(proj_ctl) + 1);
1269 
1270       replace_barrier(phase, lb, new_lb->proj_out(LoadBarrierNode::Oop));
1271 
1272       phase->recompute_dom_depth();
1273 
1274       return true;
1275     }
1276   }
1277 
1278   return false;
1279 }
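
// Sketch of the hoisting performed above (not real IR): a barrier whose Oop and
// Address inputs are defined outside the loop is cloned in front of the loop
// entry and the in-loop barrier is removed, so the oop is healed once instead of
// on every iteration:
//
//   before:  loop { ... use(LoadBarrier(x)) ... }       // x defined before the loop
//   after:   xh = LoadBarrier(x); loop { ... use(xh) ... }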
1280 
1281 static bool common_barriers(PhaseIdealLoop* phase, LoadBarrierNode* lb) {
1282   PhaseIterGVN &igvn = phase->igvn();
1283   Node* in_val = lb->in(LoadBarrierNode::Oop);
1284   for (DUIterator_Fast imax, i = in_val->fast_outs(imax); i < imax; i++) {
1285     Node* u = in_val->fast_out(i);
1286     if (u != lb && u->is_LoadBarrier() && u->as_LoadBarrier()->has_true_uses()) {
1287       Node* this_ctrl = lb->in(LoadBarrierNode::Control);
1288       Node* other_ctrl = u->in(LoadBarrierNode::Control);
1289 
1290       Node* lca = phase->dom_lca(this_ctrl, other_ctrl);
1291       bool ok = true;
1292 
1293       Node* proj1 = NULL;
1294       Node* proj2 = NULL;
1295 
1296       while (this_ctrl != lca && ok) {
1297         if (this_ctrl->in(0) != NULL &&
1298             this_ctrl->in(0)->is_MultiBranch()) {
1299           if (this_ctrl->in(0)->in(0) == lca) {
1300             assert(proj1 == NULL, "");
1301             assert(this_ctrl->is_Proj(), "");
1302             proj1 = this_ctrl;
1303           } else if (!(this_ctrl->in(0)->is_If() && this_ctrl->as_Proj()->is_uncommon_trap_if_pattern(Deoptimization::Reason_none))) {
1304             ok = false;
1305           }
1306         }
1307         this_ctrl = phase->idom(this_ctrl);
1308       }
1309       while (other_ctrl != lca && ok) {
1310         if (other_ctrl->in(0) != NULL &&
1311             other_ctrl->in(0)->is_MultiBranch()) {
1312           if (other_ctrl->in(0)->in(0) == lca) {
1313             assert(other_ctrl->is_Proj(), "");
1314             assert(proj2 == NULL, "");
1315             proj2 = other_ctrl;
1316           } else if (!(other_ctrl->in(0)->is_If() && other_ctrl->as_Proj()->is_uncommon_trap_if_pattern(Deoptimization::Reason_none))) {
1317             ok = false;
1318           }
1319         }
1320         other_ctrl = phase->idom(other_ctrl);
1321       }
1322       assert(proj1 == NULL || proj2 == NULL || proj1->in(0) == proj2->in(0), "");
1323       if (ok && proj1 && proj2 && proj1 != proj2 && proj1->in(0)->is_If()) {
1324         // That transformation may cause the Similar edge on dominated load barriers to be invalid
1325         lb->fix_similar_in_uses(&igvn);
1326         u->as_LoadBarrier()->fix_similar_in_uses(&igvn);
1327 
1328         Node* split = lca->unique_ctrl_out();
1329         assert(split->in(0) == lca, "");
1330 
1331         Node* mem = lb->in(LoadBarrierNode::Memory);
1332         Node* m = find_dominating_memory(phase, mem, split, -1);
1333         LoadBarrierNode* new_lb = clone_load_barrier(phase, lb, lca, m, NULL);
1334 
1335         Node* proj_ctl = new_lb->proj_out(LoadBarrierNode::Control);
1336         igvn.replace_input_of(split, 0, new_lb->proj_out(LoadBarrierNode::Control));
1337         phase->set_idom(split, proj_ctl, phase->dom_depth(proj_ctl)+1);
1338 
1339         Node* proj_oop = new_lb->proj_out(LoadBarrierNode::Oop);
1340         replace_barrier(phase, lb, proj_oop);
1341         replace_barrier(phase, u->as_LoadBarrier(), proj_oop);
1342 
1343         phase->recompute_dom_depth();
1344 
1345         return true;
1346       }
1347     }
1348   }
1349 
1350   return false;
1351 }
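
// Sketch of the commoning performed above (not real IR): two barriers on the same
// oop sitting on the two arms of a diamond are replaced by one barrier at the
// dominating split point:
//
//   before:  if (c) { ... LoadBarrier(x) ... } else { ... LoadBarrier(x) ... }
//   after:   y = LoadBarrier(x); if (c) { ... y ... } else { ... y ... }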
1352 
1353 static void optimize_load_barrier(PhaseIdealLoop* phase, LoadBarrierNode* lb, bool last_round) {
1354   Compile* C = Compile::current();
1355 
1356   if (!C->directive()->ZOptimizeLoadBarriersOption) {
1357     return;
1358   }
1359 
1360   if (lb->has_true_uses()) {
1361     if (replace_with_dominating_barrier(phase, lb, last_round)) {
1362       return;
1363     }
1364 
1365     if (split_barrier_thru_phi(phase, lb)) {
1366       return;
1367     }
1368 
1369     if (move_out_of_loop(phase, lb)) {
1370       return;
1371     }
1372 
1373     if (common_barriers(phase, lb)) {
1374       return;
1375     }
1376   }
1377 }
1378 
1379 void ZBarrierSetC2::loop_optimize_gc_barrier(PhaseIdealLoop* phase, Node* node, bool last_round) {
1380   if (node->is_LoadBarrier()) {
1381     optimize_load_barrier(phase, node->as_LoadBarrier(), last_round);
1382   }
1383 }
1384 
1385 // == Verification ==
1386 
1387 #ifdef ASSERT
1388 
1389 static bool look_for_barrier(Node* n, bool post_parse, VectorSet& visited) {
1390   if (visited.test_set(n->_idx)) {
1391     return true;
1392   }
1393 
1394   for (DUIterator_Fast imax, i = n->fast_outs(imax); i < imax; i++) {
1395     Node* u = n->fast_out(i);
1396     if (u->is_LoadBarrier()) {
1397     } else if ((u->is_Phi() || u->is_CMove()) && !post_parse) {
1398       if (!look_for_barrier(u, post_parse, visited)) {
1399         return false;
1400       }
1401     } else if (u->Opcode() == Op_EncodeP || u->Opcode() == Op_DecodeN) {
1402       if (!look_for_barrier(u, post_parse, visited)) {
1403         return false;
1404       }
1405     } else if (u->Opcode() != Op_SCMemProj) {
1406       tty->print("bad use"); u->dump();
1407       return false;
1408     }
1409   }
1410 
1411   return true;
1412 }
1413 
1414 void ZBarrierSetC2::verify_gc_barriers(bool post_parse) const {
1415   ZBarrierSetC2State* s = state();
1416   Compile* C = Compile::current();
1417   ResourceMark rm;
1418   VectorSet visited(Thread::current()->resource_area());
1419   for (int i = 0; i < s->load_barrier_count(); i++) {
1420     LoadBarrierNode* n = s->load_barrier_node(i);
1421 
1422     // The dominating barrier on the same address, if it exists, and
1423     // this barrier must not be applied to the value from the same
1424     // load, otherwise the value is not reloaded before it is used the
1425     // second time.
1426     assert(n->in(LoadBarrierNode::Similar)->is_top() ||
1427            (n->in(LoadBarrierNode::Similar)->in(0)->is_LoadBarrier() &&
1428             n->in(LoadBarrierNode::Similar)->in(0)->in(LoadBarrierNode::Address) == n->in(LoadBarrierNode::Address) &&
1429             n->in(LoadBarrierNode::Similar)->in(0)->in(LoadBarrierNode::Oop) != n->in(LoadBarrierNode::Oop)),
1430            "broken similar edge");
1431 
1432     assert(post_parse || n->as_LoadBarrier()->has_true_uses(),
1433            "found unneeded load barrier");
1434 
1435     // Several load barrier nodes chained through their Similar edge
1436     // break the code that removes the barriers in final graph reshape.
1437     assert(n->in(LoadBarrierNode::Similar)->is_top() ||
1438            (n->in(LoadBarrierNode::Similar)->in(0)->is_LoadBarrier() &&
1439             n->in(LoadBarrierNode::Similar)->in(0)->in(LoadBarrierNode::Similar)->is_top()),
1440            "chain of Similar load barriers");
1441 
1442     if (!n->in(LoadBarrierNode::Similar)->is_top()) {
1443       ResourceMark rm;
1444       Unique_Node_List wq;
1445       Node* other = n->in(LoadBarrierNode::Similar)->in(0);
1446       wq.push(n);
1447       bool ok = true;
1448       bool dom_found = false;
1449       for (uint next = 0; next < wq.size(); ++next) {
1450         Node *n = wq.at(next);
1451         assert(n->is_CFG(), "");
1452         assert(!n->is_SafePoint(), "");
1453 
1454         if (n == other) {
1455           continue;
1456         }
1457 
1458         if (n->is_Region()) {
1459           for (uint i = 1; i < n->req(); i++) {
1460             Node* m = n->in(i);
1461             if (m != NULL) {
1462               wq.push(m);
1463             }
1464           }
1465         } else {
1466           Node* m = n->in(0);
1467           if (m != NULL) {
1468             wq.push(m);
1469           }
1470         }
1471       }
1472     }
1473 
1474     if (ZVerifyLoadBarriers) {
1475       if ((n->is_Load() || n->is_LoadStore()) && n->bottom_type()->make_oopptr() != NULL) {
1476         visited.Clear();
1477         bool found = look_for_barrier(n, post_parse, visited);
1478         if (!found) {
1479           n->dump(1);
1480           n->dump(-3);
1481           stringStream ss;
1482           C->method()->print_short_name(&ss);
1483           tty->print_cr("-%s-", ss.as_string());
1484           assert(found, "");
1485         }
1486       }
1487     }
1488   }
1489 }
1490 
1491 #endif