hotspot/src/share/vm/opto/graphKit.cpp

rev 611 : Merge

*** 1,10 ****
  #ifdef USE_PRAGMA_IDENT_SRC
  #pragma ident "@(#)graphKit.cpp 1.132 07/10/04 14:36:00 JVM"
  #endif
  /*
!  * Copyright 2001-2007 Sun Microsystems, Inc. All Rights Reserved.
   * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
   *
   * This code is free software; you can redistribute it and/or modify it
   * under the terms of the GNU General Public License version 2 only, as
   * published by the Free Software Foundation.
--- 1,10 ----
  #ifdef USE_PRAGMA_IDENT_SRC
  #pragma ident "@(#)graphKit.cpp 1.132 07/10/04 14:36:00 JVM"
  #endif
  /*
!  * Copyright 2001-2008 Sun Microsystems, Inc. All Rights Reserved.
   * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
   *
   * This code is free software; you can redistribute it and/or modify it
   * under the terms of the GNU General Public License version 2 only, as
   * published by the Free Software Foundation.
*** 533,543 ****
      // Cheat with a preallocated exception object.
      if (C->log() != NULL)
        C->log()->elem("hot_throw preallocated='1' reason='%s'",
                       Deoptimization::trap_reason_name(reason));
      const TypeInstPtr* ex_con = TypeInstPtr::make(ex_obj);
!     Node* ex_node = _gvn.transform(new (C, 1) ConPNode(ex_con));

      // Clear the detail message of the preallocated exception object.
      // Weblogic sometimes mutates the detail message of exceptions
      // using reflection.
      int offset = java_lang_Throwable::get_detailMessage_offset();
--- 533,543 ----
      // Cheat with a preallocated exception object.
      if (C->log() != NULL)
        C->log()->elem("hot_throw preallocated='1' reason='%s'",
                       Deoptimization::trap_reason_name(reason));
      const TypeInstPtr* ex_con = TypeInstPtr::make(ex_obj);
!     Node* ex_node = _gvn.transform( ConNode::make(C, ex_con) );

      // Clear the detail message of the preallocated exception object.
      // Weblogic sometimes mutates the detail message of exceptions
      // using reflection.
      int offset = java_lang_Throwable::get_detailMessage_offset();
*** 588,607 ****
    _sp = kit->sp();
    kit->set_map(clone_map ? kit->clone_map() : NULL);
  #ifdef ASSERT
    _bci = kit->bci();
    Parse* parser = kit->is_Parse();
!   int block = (parser == NULL || parser->block() == NULL) ? -1 : parser->block()->pre_order();
    _block = block;
  #endif
  }
  PreserveJVMState::~PreserveJVMState() {
    GraphKit* kit = _kit;
  #ifdef ASSERT
    assert(kit->bci() == _bci, "bci must not shift");
    Parse* parser = kit->is_Parse();
!   int block = (parser == NULL || parser->block() == NULL) ? -1 : parser->block()->pre_order();
    assert(block == _block, "block must not shift");
  #endif
    kit->set_map(_map);
    kit->set_sp(_sp);
  }
--- 588,607 ----
    _sp = kit->sp();
    kit->set_map(clone_map ? kit->clone_map() : NULL);
  #ifdef ASSERT
    _bci = kit->bci();
    Parse* parser = kit->is_Parse();
!   int block = (parser == NULL || parser->block() == NULL) ? -1 : parser->block()->rpo();
    _block = block;
  #endif
  }
  PreserveJVMState::~PreserveJVMState() {
    GraphKit* kit = _kit;
  #ifdef ASSERT
    assert(kit->bci() == _bci, "bci must not shift");
    Parse* parser = kit->is_Parse();
!   int block = (parser == NULL || parser->block() == NULL) ? -1 : parser->block()->rpo();
    assert(block == _block, "block must not shift");
  #endif
    kit->set_map(_map);
    kit->set_sp(_sp);
  }
*** 858,874 ****
--- 858,882 ----
    l = in_jvms->mon_size();
    out_jvms->set_monoff(p);
    for (j = 0; j < l; j++)
      call->set_req(p++, in_map->in(k+j));

+   // Copy any scalar object fields.
+   k = in_jvms->scloff();
+   l = in_jvms->scl_size();
+   out_jvms->set_scloff(p);
+   for (j = 0; j < l; j++)
+     call->set_req(p++, in_map->in(k+j));
+ 
    // Finish the new jvms.
    out_jvms->set_endoff(p);
    assert(out_jvms->endoff()     == debug_end,             "fill ptr must match");
    assert(out_jvms->depth()      == in_jvms->depth(),      "depth must match");
    assert(out_jvms->loc_size()   == in_jvms->loc_size(),   "size must match");
    assert(out_jvms->mon_size()   == in_jvms->mon_size(),   "size must match");
+   assert(out_jvms->scl_size()   == in_jvms->scl_size(),   "size must match");
    assert(out_jvms->debug_size() == in_jvms->debug_size(), "size must match");

    // Update the two tail pointers in parallel.
    out_jvms = out_jvms->caller();
    in_jvms  = in_jvms->caller();
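The new scloff/scl_size region extends the debug information carried by a call or safepoint node. A rough picture of the resulting layout, inferred from the copy loops and asserts in the hunk above together with the existing locoff/stkoff/monoff accessors (illustration only, not code from the change):

    // JVMState debug-info layout within a call/safepoint node (sketch):
    //
    //   [ locals | expression stack | monitors | scalar-replaced object fields ]
    //   ^locoff   ^stkoff            ^monoff    ^scloff                         ^endoff
    //
    // The scalar region carries the field values of escape-analyzed, scalar-replaced
    // objects so that deoptimization can reallocate and repopulate them.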
*** 1036,1055 ****
  Node* GraphKit::load_object_klass(Node* obj) {
    // Special-case a fresh allocation to avoid building nodes:
    Node* akls = AllocateNode::Ideal_klass(obj, &_gvn);
    if (akls != NULL)  return akls;
    Node* k_adr = basic_plus_adr(obj, oopDesc::klass_offset_in_bytes());
!   return _gvn.transform( new (C, 3) LoadKlassNode(0, immutable_memory(), k_adr, TypeInstPtr::KLASS) );
  }

  //-------------------------load_array_length-----------------------------------
  Node* GraphKit::load_array_length(Node* array) {
    // Special-case a fresh allocation to avoid building nodes:
!   Node* alen = AllocateArrayNode::Ideal_length(array, &_gvn);
!   if (alen != NULL)  return alen;
    Node *r_adr = basic_plus_adr(array, arrayOopDesc::length_offset_in_bytes());
!   return _gvn.transform( new (C, 3) LoadRangeNode(0, immutable_memory(), r_adr, TypeInt::POS));
  }

  //------------------------------do_null_check----------------------------------
  // Helper function to do a NULL pointer check.  Returned value is
  // the incoming address with NULL casted away.  You are allowed to use the
--- 1044,1072 ----
  Node* GraphKit::load_object_klass(Node* obj) {
    // Special-case a fresh allocation to avoid building nodes:
    Node* akls = AllocateNode::Ideal_klass(obj, &_gvn);
    if (akls != NULL)  return akls;
    Node* k_adr = basic_plus_adr(obj, oopDesc::klass_offset_in_bytes());
!   return _gvn.transform( LoadKlassNode::make(_gvn, immutable_memory(), k_adr, TypeInstPtr::KLASS) );
  }

  //-------------------------load_array_length-----------------------------------
  Node* GraphKit::load_array_length(Node* array) {
    // Special-case a fresh allocation to avoid building nodes:
!   AllocateArrayNode* alloc = AllocateArrayNode::Ideal_array_allocation(array, &_gvn);
!   Node *alen;
!   if (alloc == NULL) {
      Node *r_adr = basic_plus_adr(array, arrayOopDesc::length_offset_in_bytes());
!     alen = _gvn.transform( new (C, 3) LoadRangeNode(0, immutable_memory(), r_adr, TypeInt::POS));
!   } else {
!     alen = alloc->Ideal_length();
!     Node* ccast = alloc->make_ideal_length(_gvn.type(array)->is_aryptr(), &_gvn);
!     if (ccast != alen) {
!       alen = _gvn.transform(ccast);
!     }
!   }
!   return alen;
  }

  //------------------------------do_null_check----------------------------------
  // Helper function to do a NULL pointer check.  Returned value is
  // the incoming address with NULL casted away.  You are allowed to use the
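The reworked load_array_length() now asks whether the array is a freshly allocated AllocateArrayNode and, if so, returns the allocation's length input narrowed by make_ideal_length() instead of emitting a LoadRange. A minimal sketch of the intended effect, assuming a GraphKit context (illustration only, not code from the change):

    // Sketch of the observable effect of the new load_array_length():
    Node* arr = /* result of a fresh array allocation with a known small length */;
    Node* len = load_array_length(arr);
    // Before: len was a LoadRangeNode typed TypeInt::POS (any non-negative int).
    // After:  len is the allocation's length input, wrapped by make_ideal_length()
    //         in a CastII pinned below the allocation's guards whenever a narrower
    //         type is known from the array type (e.g. int:10 for a length-10 array),
    //         so later range checks against 'arr' can fold away.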
*** 1173,1182 ****
--- 1190,1205 ----
      else if (type == T_OBJECT)
        reason = Deoptimization::Reason_null_check;
      else
        reason = Deoptimization::Reason_div0_check;

+     // %%% Since Reason_unhandled is not recorded on a per-bytecode basis,
+     // ciMethodData::has_trap_at will return a conservative -1 if any
+     // must-be-null assertion has failed.  This could cause performance
+     // problems for a method after its first do_null_assert failure.
+     // Consider using 'Reason_class_check' instead?
+ 
      // To cause an implicit null check, we set the not-null probability
      // to the maximum (PROB_MAX).  For an explicit check the probablity
      // is set to a smaller value.
      if (null_control != NULL || too_many_traps(reason)) {
        // probability is less likely
*** 1205,1214 ****
--- 1228,1238 ----
      } else if (assert_null) {
        uncommon_trap(reason,
                      Deoptimization::Action_make_not_entrant,
                      NULL, "assert_null");
      } else {
+       replace_in_map(value, zerocon(type));
        builtin_throw(reason);
      }
    }

    // Must throw exception, fall-thru not possible?
*** 1321,1331 ****
    Node* mem = memory(adr_idx);
    Node* ld;
    if (require_atomic_access && bt == T_LONG) {
      ld = LoadLNode::make_atomic(C, ctl, mem, adr, adr_type, t);
    } else {
!     ld = LoadNode::make(C, ctl, mem, adr, adr_type, t, bt);
    }
    return _gvn.transform(ld);
  }

  Node* GraphKit::store_to_memory(Node* ctl, Node* adr, Node *val, BasicType bt,
--- 1345,1355 ----
    Node* mem = memory(adr_idx);
    Node* ld;
    if (require_atomic_access && bt == T_LONG) {
      ld = LoadLNode::make_atomic(C, ctl, mem, adr, adr_type, t);
    } else {
!     ld = LoadNode::make(_gvn, ctl, mem, adr, adr_type, t, bt);
    }
    return _gvn.transform(ld);
  }

  Node* GraphKit::store_to_memory(Node* ctl, Node* adr, Node *val, BasicType bt,
*** 1337,1347 ****
    Node *mem = memory(adr_idx);
    Node* st;
    if (require_atomic_access && bt == T_LONG) {
      st = StoreLNode::make_atomic(C, ctl, mem, adr, adr_type, val);
    } else {
!     st = StoreNode::make(C, ctl, mem, adr, adr_type, val, bt);
    }
    st = _gvn.transform(st);
    set_memory(st, adr_idx);
    // Back-to-back stores can only remove intermediate store with DU info
    // so push on worklist for optimizer.
--- 1361,1371 ----
    Node *mem = memory(adr_idx);
    Node* st;
    if (require_atomic_access && bt == T_LONG) {
      st = StoreLNode::make_atomic(C, ctl, mem, adr, adr_type, val);
    } else {
!     st = StoreNode::make(_gvn, ctl, mem, adr, adr_type, val, bt);
    }
    st = _gvn.transform(st);
    set_memory(st, adr_idx);
    // Back-to-back stores can only remove intermediate store with DU info
    // so push on worklist for optimizer.
*** 1359,1368 ****
--- 1383,1396 ----
                     const Type* val_type,
                     BasicType bt) {
    BarrierSet* bs = Universe::heap()->barrier_set();
    set_control(ctl);
    switch (bs->kind()) {
+     case BarrierSet::G1SATBCT:
+     case BarrierSet::G1SATBCTLogging:
+       g1_write_barrier_pre(obj, adr, adr_idx, val, val_type, bt);
+       break;

      case BarrierSet::CardTableModRef:
      case BarrierSet::CardTableExtension:
      case BarrierSet::ModRef:
        break;
*** 1383,1392 ****
--- 1411,1424 ----
                     BasicType bt,
                     bool use_precise) {
    BarrierSet* bs = Universe::heap()->barrier_set();
    set_control(ctl);
    switch (bs->kind()) {
+     case BarrierSet::G1SATBCT:
+     case BarrierSet::G1SATBCTLogging:
+       g1_write_barrier_post(store, obj, adr, adr_idx, val, bt, use_precise);
+       break;

      case BarrierSet::CardTableModRef:
      case BarrierSet::CardTableExtension:
        write_barrier_post(store, obj, adr, val, use_precise);
        break;
*** 1448,1458 ****

  //-------------------------array_element_address-------------------------
  Node* GraphKit::array_element_address(Node* ary, Node* idx, BasicType elembt,
                                        const TypeInt* sizetype) {
!   uint shift  = exact_log2(type2aelembytes[elembt]);
    uint header = arrayOopDesc::base_offset_in_bytes(elembt);

    // short-circuit a common case (saves lots of confusing waste motion)
    jint idx_con = find_int_con(idx, -1);
    if (idx_con >= 0) {
--- 1480,1490 ----

  //-------------------------array_element_address-------------------------
  Node* GraphKit::array_element_address(Node* ary, Node* idx, BasicType elembt,
                                        const TypeInt* sizetype) {
!   uint shift  = exact_log2(type2aelembytes(elembt));
    uint header = arrayOopDesc::base_offset_in_bytes(elembt);

    // short-circuit a common case (saves lots of confusing waste motion)
    jint idx_con = find_int_con(idx, -1);
    if (idx_con >= 0) {
*** 1953,1962 ****
--- 1985,1995 ----
      // recompile; the offending check-cast will be compiled to handle NULLs.
      // If we see more than one offending BCI, then all checkcasts in the
      // method will be compiled to handle NULLs.
      PreserveJVMState pjvms(this);
      set_control(*null_control);
+     replace_in_map(value, null());
      uncommon_trap(Deoptimization::Reason_null_check,
                    Deoptimization::Action_make_not_entrant);
      (*null_control) = top();    // NULL path is dead
    }
*** 2203,2213 ****
    Node *p2 = _gvn.transform( new (C, 4) AddPNode(subklass,subklass,chk_off_X) );
    // For some types like interfaces the following loadKlass is from a 1-word
    // cache which is mutable so can't use immutable memory.  Other
    // types load from the super-class display table which is immutable.
    Node *kmem = might_be_cache ? memory(p2) : immutable_memory();
!   Node *nkls = _gvn.transform( new (C, 3) LoadKlassNode( NULL, kmem, p2, _gvn.type(p2)->is_ptr(), TypeKlassPtr::OBJECT_OR_NULL ) );

    // Compile speed common case: ARE a subtype and we canNOT fail
    if( superklass == nkls )
      return top();             // false path is dead; no test needed.
--- 2236,2246 ----
    Node *p2 = _gvn.transform( new (C, 4) AddPNode(subklass,subklass,chk_off_X) );
    // For some types like interfaces the following loadKlass is from a 1-word
    // cache which is mutable so can't use immutable memory.  Other
    // types load from the super-class display table which is immutable.
    Node *kmem = might_be_cache ? memory(p2) : immutable_memory();
!   Node *nkls = _gvn.transform( LoadKlassNode::make( _gvn, kmem, p2, _gvn.type(p2)->is_ptr(), TypeKlassPtr::OBJECT_OR_NULL ) );

    // Compile speed common case: ARE a subtype and we canNOT fail
    if( superklass == nkls )
      return top();             // false path is dead; no test needed.
*** 2794,2804 ****
    if (ReduceFieldZeroing && !raw_mem_only) {
      // Extract memory strands which may participate in the new object's
      // initialization, and source them from the new InitializeNode.
      // This will allow us to observe initializations when they occur,
      // and link them properly (as a group) to the InitializeNode.
-     Node* klass_node = alloc->in(AllocateNode::KlassNode);
      assert(init->in(InitializeNode::Memory) == malloc, "");
      MergeMemNode* minit_in = MergeMemNode::make(C, malloc);
      init->set_req(InitializeNode::Memory, minit_in);
      record_for_igvn(minit_in); // fold it up later, if possible
      Node* minit_out = memory(rawidx);
--- 2827,2836 ----
*** 2809,2819 ****
        hook_memory_on_init(*this, elemidx, minit_in, minit_out);
      } else if (oop_type->isa_instptr()) {
        ciInstanceKlass* ik = oop_type->klass()->as_instance_klass();
        for (int i = 0, len = ik->nof_nonstatic_fields(); i < len; i++) {
          ciField* field = ik->nonstatic_field_at(i);
!         if (field->offset() >= TrackedInitializationLimit)
            continue;  // do not bother to track really large numbers of fields
          // Find (or create) the alias category for this field:
          int fieldidx = C->alias_type(field)->index();
          hook_memory_on_init(*this, fieldidx, minit_in, minit_out);
        }
--- 2841,2851 ----
        hook_memory_on_init(*this, elemidx, minit_in, minit_out);
      } else if (oop_type->isa_instptr()) {
        ciInstanceKlass* ik = oop_type->klass()->as_instance_klass();
        for (int i = 0, len = ik->nof_nonstatic_fields(); i < len; i++) {
          ciField* field = ik->nonstatic_field_at(i);
!         if (field->offset() >= TrackedInitializationLimit * HeapWordSize)
            continue;  // do not bother to track really large numbers of fields
          // Find (or create) the alias category for this field:
          int fieldidx = C->alias_type(field)->index();
          hook_memory_on_init(*this, fieldidx, minit_in, minit_out);
        }
*** 2825,2848 ****
    javaoop = _gvn.transform(javaoop);
    C->set_recent_alloc(control(), javaoop);
    assert(just_allocated_object(control()) == javaoop, "just allocated");

  #ifdef ASSERT
!   { // Verify that the AllocateNode::Ideal_foo recognizers work:
!     Node* kn = alloc->in(AllocateNode::KlassNode);
!     Node* ln = alloc->in(AllocateNode::ALength);
!     assert(AllocateNode::Ideal_klass(rawoop, &_gvn) == kn,
!            "Ideal_klass works");
!     assert(AllocateNode::Ideal_klass(javaoop, &_gvn) == kn,
!            "Ideal_klass works");
      if (alloc->is_AllocateArray()) {
!       assert(AllocateArrayNode::Ideal_length(rawoop, &_gvn) == ln,
!              "Ideal_length works");
!       assert(AllocateArrayNode::Ideal_length(javaoop, &_gvn) == ln,
!              "Ideal_length works");
      } else {
!       assert(ln->is_top(), "no length, please");
      }
    }
  #endif //ASSERT

    return javaoop;
--- 2857,2878 ----
    javaoop = _gvn.transform(javaoop);
    C->set_recent_alloc(control(), javaoop);
    assert(just_allocated_object(control()) == javaoop, "just allocated");

  #ifdef ASSERT
!   { // Verify that the AllocateNode::Ideal_allocation recognizers work:
!     assert(AllocateNode::Ideal_allocation(rawoop, &_gvn) == alloc,
!            "Ideal_allocation works");
!     assert(AllocateNode::Ideal_allocation(javaoop, &_gvn) == alloc,
!            "Ideal_allocation works");
      if (alloc->is_AllocateArray()) {
!       assert(AllocateArrayNode::Ideal_array_allocation(rawoop, &_gvn) == alloc->as_AllocateArray(),
!              "Ideal_allocation works");
!       assert(AllocateArrayNode::Ideal_array_allocation(javaoop, &_gvn) == alloc->as_AllocateArray(),
!              "Ideal_allocation works");
      } else {
!       assert(alloc->in(AllocateNode::ALength)->is_top(), "no length, please");
      }
    }
  #endif //ASSERT

    return javaoop;
*** 2915,2928 ****
    const TypeKlassPtr* tklass = _gvn.type(klass_node)->isa_klassptr();
    if (!tklass)  tklass = TypeKlassPtr::OBJECT;
    const TypeOopPtr* oop_type = tklass->as_instance_type();

    // Now generate allocation code
    AllocateNode* alloc
      = new (C, AllocateNode::ParmLimit)
          AllocateNode(C, AllocateNode::alloc_type(),
!                      control(), memory(Compile::AliasIdxRaw), i_o(),
                       size, klass_node,
                       initial_slow_test);

    return set_output_for_allocation(alloc, oop_type, raw_mem_only);
  }
--- 2945,2970 ----
    const TypeKlassPtr* tklass = _gvn.type(klass_node)->isa_klassptr();
    if (!tklass)  tklass = TypeKlassPtr::OBJECT;
    const TypeOopPtr* oop_type = tklass->as_instance_type();

    // Now generate allocation code
+ 
+   // With escape analysis, the entire memory state is needed to be able to
+   // eliminate the allocation.  If the allocations cannot be eliminated, this
+   // will be optimized to the raw slice when the allocation is expanded.
+   Node *mem;
+   if (C->do_escape_analysis()) {
+     mem = reset_memory();
+     set_all_memory(mem);
+   } else {
+     mem = memory(Compile::AliasIdxRaw);
+   }
+ 
    AllocateNode* alloc
      = new (C, AllocateNode::ParmLimit)
          AllocateNode(C, AllocateNode::alloc_type(),
!                      control(), mem, i_o(),
                       size, klass_node,
                       initial_slow_test);

    return set_output_for_allocation(alloc, oop_type, raw_mem_only);
  }
*** 3049,3091 ****
      // This is the size
      (*return_size_val) = size;
    }

    // Now generate allocation code
    // Create the AllocateArrayNode and its result projections
    AllocateArrayNode* alloc
      = new (C, AllocateArrayNode::ParmLimit)
          AllocateArrayNode(C, AllocateArrayNode::alloc_type(),
!                           control(), memory(Compile::AliasIdxRaw), i_o(),
                            size, klass_node,
                            initial_slow_test,
                            length);

    // Cast to correct type.  Note that the klass_node may be constant or not,
    // and in the latter case the actual array type will be inexact also.
    // (This happens via a non-constant argument to inline_native_newArray.)
    // In any case, the value of klass_node provides the desired array type.
    const TypeInt* length_type = _gvn.find_int_type(length);
-   const TypeInt* narrow_length_type = NULL;
    const TypeOopPtr* ary_type = _gvn.type(klass_node)->is_klassptr()->as_instance_type();
    if (ary_type->isa_aryptr() && length_type != NULL) {
      // Try to get a better type than POS for the size
      ary_type = ary_type->is_aryptr()->cast_to_size(length_type);
-     narrow_length_type = ary_type->is_aryptr()->size();
-     if (narrow_length_type == length_type)
-       narrow_length_type = NULL;
    }

    Node* javaoop = set_output_for_allocation(alloc, ary_type, raw_mem_only);

!   // Cast length on remaining path to be positive:
!   if (narrow_length_type != NULL) {
!     Node* ccast = new (C, 2) CastIINode(length, narrow_length_type);
!     ccast->set_req(0, control());
      _gvn.set_type_bottom(ccast);
      record_for_igvn(ccast);
-     if (map()->find_edge(length) >= 0) {
        replace_in_map(length, ccast);
      }
    }

    return javaoop;
--- 3091,3140 ----
      // This is the size
      (*return_size_val) = size;
    }

    // Now generate allocation code
+ 
+   // With escape analysis, the entire memory state is needed to be able to
+   // eliminate the allocation.  If the allocations cannot be eliminated, this
+   // will be optimized to the raw slice when the allocation is expanded.
+   Node *mem;
+   if (C->do_escape_analysis()) {
+     mem = reset_memory();
+     set_all_memory(mem);
+   } else {
+     mem = memory(Compile::AliasIdxRaw);
+   }
+ 
    // Create the AllocateArrayNode and its result projections
    AllocateArrayNode* alloc
      = new (C, AllocateArrayNode::ParmLimit)
          AllocateArrayNode(C, AllocateArrayNode::alloc_type(),
!                           control(), mem, i_o(),
                            size, klass_node,
                            initial_slow_test,
                            length);

    // Cast to correct type.  Note that the klass_node may be constant or not,
    // and in the latter case the actual array type will be inexact also.
    // (This happens via a non-constant argument to inline_native_newArray.)
    // In any case, the value of klass_node provides the desired array type.
    const TypeInt* length_type = _gvn.find_int_type(length);
    const TypeOopPtr* ary_type = _gvn.type(klass_node)->is_klassptr()->as_instance_type();
    if (ary_type->isa_aryptr() && length_type != NULL) {
      // Try to get a better type than POS for the size
      ary_type = ary_type->is_aryptr()->cast_to_size(length_type);
    }

    Node* javaoop = set_output_for_allocation(alloc, ary_type, raw_mem_only);

!   // Cast length on remaining path to be as narrow as possible
!   if (map()->find_edge(length) >= 0) {
!     Node* ccast = alloc->make_ideal_length(ary_type, &_gvn);
!     if (ccast != length) {
        _gvn.set_type_bottom(ccast);
        record_for_igvn(ccast);
        replace_in_map(length, ccast);
      }
    }

    return javaoop;
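Both new_instance() and new_array() now feed the AllocateNode either the whole memory state (when escape analysis is enabled) or just the raw slice. The repeated pattern can be read as the small helper sketched below; the helper and its name are hypothetical and only summarize the decision the two hunks above make inline, assuming the surrounding GraphKit context:

    // Hypothetical refactoring of the repeated pattern above (assumes GraphKit context).
    Node* allocation_memory_input() {
      if (C->do_escape_analysis()) {
        // Give the allocation the entire memory state so escape analysis can
        // eliminate it; if it survives, macro expansion narrows this back to
        // the raw slice when the allocation is expanded.
        Node* mem = reset_memory();
        set_all_memory(mem);
        return mem;
      }
      return memory(Compile::AliasIdxRaw);   // raw slice is sufficient without EA
    }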
*** 3145,3149 ****
--- 3194,3446 ----
        return init->as_Initialize();
      }
    }
    return NULL;
  }
+ 
+ void GraphKit::g1_write_barrier_pre(Node* obj,
+                                     Node* adr,
+                                     uint alias_idx,
+                                     Node* val,
+                                     const Type* val_type,
+                                     BasicType bt) {
+   IdealKit ideal(gvn(), control(), merged_memory(), true);
+ #define __ ideal.
+   __ declares_done();
+ 
+   Node* thread = __ thread();
+ 
+   Node* no_ctrl = NULL;
+   Node* no_base = __ top();
+   Node* zero = __ ConI(0);
+ 
+   float likely = PROB_LIKELY(0.999);
+   float unlikely = PROB_UNLIKELY(0.999);
+ 
+   BasicType active_type = in_bytes(PtrQueue::byte_width_of_active()) == 4 ? T_INT : T_BYTE;
+   assert(in_bytes(PtrQueue::byte_width_of_active()) == 4 || in_bytes(PtrQueue::byte_width_of_active()) == 1, "flag width");
+ 
+   // Offsets into the thread
+   const int marking_offset = in_bytes(JavaThread::satb_mark_queue_offset() +  // 648
+                                       PtrQueue::byte_offset_of_active());
+   const int index_offset   = in_bytes(JavaThread::satb_mark_queue_offset() +  // 656
+                                       PtrQueue::byte_offset_of_index());
+   const int buffer_offset  = in_bytes(JavaThread::satb_mark_queue_offset() +  // 652
+                                       PtrQueue::byte_offset_of_buf());
+   // Now the actual pointers into the thread
+ 
+   // set_control( ctl);
+ 
+   Node* marking_adr = __ AddP(no_base, thread, __ ConX(marking_offset));
+   Node* buffer_adr  = __ AddP(no_base, thread, __ ConX(buffer_offset));
+   Node* index_adr   = __ AddP(no_base, thread, __ ConX(index_offset));
+ 
+   // Now some of the values
+ 
+   Node* marking = __ load(__ ctrl(), marking_adr, TypeInt::INT, active_type, Compile::AliasIdxRaw);
+ 
+   // if (!marking)
+   __ if_then(marking, BoolTest::ne, zero); {
+     Node* index = __ load(__ ctrl(), index_adr, TypeInt::INT, T_INT, Compile::AliasIdxRaw);
+ 
+     const Type* t1 = adr->bottom_type();
+     const Type* t2 = val->bottom_type();
+ 
+     Node* orig = __ load(no_ctrl, adr, val_type, bt, alias_idx);
+     // if (orig != NULL)
+     __ if_then(orig, BoolTest::ne, null()); {
+       Node* buffer = __ load(__ ctrl(), buffer_adr, TypeRawPtr::NOTNULL, T_ADDRESS, Compile::AliasIdxRaw);
+ 
+       // load original value
+       // alias_idx correct??
+ 
+       // is the queue for this thread full?
+       __ if_then(index, BoolTest::ne, zero, likely); {
+ 
+         // decrement the index
+         Node* next_index = __ SubI(index, __ ConI(sizeof(intptr_t)));
+         Node* next_indexX = next_index;
+ #ifdef _LP64
+         // We could refine the type for what it's worth
+         // const TypeLong* lidxtype = TypeLong::make(CONST64(0), get_size_from_queue);
+         next_indexX = _gvn.transform( new (C, 2) ConvI2LNode(next_index, TypeLong::make(0, max_jlong, Type::WidenMax)) );
+ #endif // _LP64
+ 
+         // Now get the buffer location we will log the original value into and store it
+ 
+         Node *log_addr = __ AddP(no_base, buffer, next_indexX);
+         // __ store(__ ctrl(), log_addr, orig, T_OBJECT, C->get_alias_index(TypeOopPtr::BOTTOM));
+         __ store(__ ctrl(), log_addr, orig, T_OBJECT, Compile::AliasIdxRaw);
+ 
+ 
+         // update the index
+         // __ store(__ ctrl(), index_adr, next_index, T_INT, Compile::AliasIdxRaw);
+         // This is a hack to force this store to occur before the oop store that is coming up
+         __ store(__ ctrl(), index_adr, next_index, T_INT, C->get_alias_index(TypeOopPtr::BOTTOM));
+ 
+       } __ else_(); {
+ 
+         // logging buffer is full, call the runtime
+         const TypeFunc *tf = OptoRuntime::g1_wb_pre_Type();
+         // __ make_leaf_call(tf, OptoRuntime::g1_wb_pre_Java(), "g1_wb_pre", orig, thread);
+         __ make_leaf_call(tf, CAST_FROM_FN_PTR(address, SharedRuntime::g1_wb_pre), "g1_wb_pre", orig, thread);
+       } __ end_if();
+     } __ end_if();
+   } __ end_if();
+ 
+   __ drain_delay_transform();
+   set_control( __ ctrl());
+   set_all_memory( __ merged_memory());
+ 
+ #undef __
+ }
+ 
+ //
+ // Update the card table and add card address to the queue
+ //
+ void GraphKit::g1_mark_card(IdealKit* ideal, Node* card_adr, Node* store, Node* index, Node* index_adr, Node* buffer, const TypeFunc* tf) {
+ #define __ ideal->
+   Node* zero = __ ConI(0);
+   Node* no_base = __ top();
+   BasicType card_bt = T_BYTE;
+   // Smash zero into card. MUST BE ORDERED WRT TO STORE
+   __ storeCM(__ ctrl(), card_adr, zero, store, card_bt, Compile::AliasIdxRaw);
+ 
+   // Now do the queue work
+   __ if_then(index, BoolTest::ne, zero); {
+ 
+     Node* next_index = __ SubI(index, __ ConI(sizeof(intptr_t)));
+     Node* next_indexX = next_index;
+ #ifdef _LP64
+     // We could refine the type for what it's worth
+     // const TypeLong* lidxtype = TypeLong::make(CONST64(0), get_size_from_queue);
+     next_indexX = _gvn.transform( new (C, 2) ConvI2LNode(next_index, TypeLong::make(0, max_jlong, Type::WidenMax)) );
+ #endif // _LP64
+     Node* log_addr = __ AddP(no_base, buffer, next_indexX);
+ 
+     __ store(__ ctrl(), log_addr, card_adr, T_ADDRESS, Compile::AliasIdxRaw);
+     __ store(__ ctrl(), index_adr, next_index, T_INT, Compile::AliasIdxRaw);
+ 
+   } __ else_(); {
+     __ make_leaf_call(tf, CAST_FROM_FN_PTR(address, SharedRuntime::g1_wb_post), "g1_wb_post", card_adr, __ thread());
+   } __ end_if();
+ #undef __
+ }
+ 
+ void GraphKit::g1_write_barrier_post(Node* store,
+                                      Node* obj,
+                                      Node* adr,
+                                      uint alias_idx,
+                                      Node* val,
+                                      BasicType bt,
+                                      bool use_precise) {
+   // If we are writing a NULL then we need no post barrier
+ 
+   if (val != NULL && val->is_Con() && val->bottom_type() == TypePtr::NULL_PTR) {
+     // Must be NULL
+     const Type* t = val->bottom_type();
+     assert(t == Type::TOP || t == TypePtr::NULL_PTR, "must be NULL");
+     // No post barrier if writing NULLx
+     return;
+   }
+ 
+   if (!use_precise) {
+     // All card marks for a (non-array) instance are in one place:
+     adr = obj;
+   }
+   // (Else it's an array (or unknown), and we want more precise card marks.)
+   assert(adr != NULL, "");
+ 
+   IdealKit ideal(gvn(), control(), merged_memory(), true);
+ #define __ ideal.
+   __ declares_done();
+ 
+   Node* thread = __ thread();
+ 
+   Node* no_ctrl = NULL;
+   Node* no_base = __ top();
+   float likely = PROB_LIKELY(0.999);
+   float unlikely = PROB_UNLIKELY(0.999);
+   Node* zero = __ ConI(0);
+   Node* zeroX = __ ConX(0);
+ 
+   // Get the alias_index for raw card-mark memory
+   const TypePtr* card_type = TypeRawPtr::BOTTOM;
+ 
+   const TypeFunc *tf = OptoRuntime::g1_wb_post_Type();
+ 
+   // Get the address of the card table
+   CardTableModRefBS* ct =
+     (CardTableModRefBS*)(Universe::heap()->barrier_set());
+   Node *card_table = __ makecon(TypeRawPtr::make((address)ct->byte_map_base));
+   // Get base of card map
+   assert(sizeof(*ct->byte_map_base) == sizeof(jbyte), "adjust this code");
+ 
+ 
+   // Offsets into the thread
+   const int index_offset  = in_bytes(JavaThread::dirty_card_queue_offset() +
+                                      PtrQueue::byte_offset_of_index());
+   const int buffer_offset = in_bytes(JavaThread::dirty_card_queue_offset() +
+                                      PtrQueue::byte_offset_of_buf());
+ 
+   // Pointers into the thread
+ 
+   Node* buffer_adr = __ AddP(no_base, thread, __ ConX(buffer_offset));
+   Node* index_adr  = __ AddP(no_base, thread, __ ConX(index_offset));
+ 
+   // Now some values
+ 
+   Node* index  = __ load(no_ctrl, index_adr, TypeInt::INT, T_INT, Compile::AliasIdxRaw);
+   Node* buffer = __ load(no_ctrl, buffer_adr, TypeRawPtr::NOTNULL, T_ADDRESS, Compile::AliasIdxRaw);
+ 
+ 
+   // Convert the store obj pointer to an int prior to doing math on it
+   // Use addr not obj gets accurate card marks
+ 
+   // Node* cast = __ CastPX(no_ctrl, adr /* obj */);
+ 
+   // Must use ctrl to prevent "integerized oop" existing across safepoint
+   Node* cast = __ CastPX(__ ctrl(), ( use_precise ? adr : obj ));
+ 
+   // Divide pointer by card size
+   Node* card_offset = __ URShiftX( cast, __ ConI(CardTableModRefBS::card_shift) );
+ 
+   // Combine card table base and card offset
+   Node *card_adr = __ AddP(no_base, card_table, card_offset );
+ 
+   // If we know the value being stored does it cross regions?
+ 
+   if (val != NULL) {
+     // Does the store cause us to cross regions?
+ 
+     // Should be able to do an unsigned compare of region_size instead of
+     // and extra shift. Do we have an unsigned compare??
+     // Node* region_size = __ ConI(1 << HeapRegion::LogOfHRGrainBytes);
+     Node* xor_res = __ URShiftX ( __ XorX( cast, __ CastPX(__ ctrl(), val)), __ ConI(HeapRegion::LogOfHRGrainBytes));
+ 
+     // if (xor_res == 0) same region so skip
+     __ if_then(xor_res, BoolTest::ne, zeroX); {
+ 
+       // No barrier if we are storing a NULL
+       __ if_then(val, BoolTest::ne, null(), unlikely); {
+ 
+         // Ok must mark the card if not already dirty
+ 
+         // load the original value of the card
+         Node* card_val = __ load(__ ctrl(), card_adr, TypeInt::INT, T_BYTE, Compile::AliasIdxRaw);
+ 
+         __ if_then(card_val, BoolTest::ne, zero); {
+           g1_mark_card(&ideal, card_adr, store, index, index_adr, buffer, tf);
+         } __ end_if();
+       } __ end_if();
+     } __ end_if();
+   } else {
+     g1_mark_card(&ideal, card_adr, store, index, index_adr, buffer, tf);
+   }
+ 
+ 
+   __ drain_delay_transform();
+   set_control( __ ctrl());
+   set_all_memory( __ merged_memory());
+ #undef __
+ 
+ }
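For readers new to the G1 write barriers emitted above, the following standalone C++ sketch models the runtime behaviour the generated IR corresponds to: the SATB pre-barrier logs the value being overwritten while concurrent marking is active, and the post-barrier dirties and logs the card when a store creates a cross-region pointer. All names here (PtrQueueModel, enqueue, the runtime_* slow paths, the constants) are illustrative stand-ins rather than HotSpot APIs, and buffer management is simplified; the "dirty card == 0" convention mirrors the storeCM-of-zero pattern in the change above.

    #include <cstddef>
    #include <cstdint>

    // Illustrative per-thread queue; the real PtrQueue fills its buffer from the
    // end toward index 0, and index == 0 means "buffer full".
    struct PtrQueueModel {
      void** buf;
      size_t index;
    };

    static PtrQueueModel satb_queue;           // models JavaThread::satb_mark_queue
    static PtrQueueModel dirty_card_queue;     // models JavaThread::dirty_card_queue
    static bool          satb_marking_active;  // models the per-thread "active" flag
    static uint8_t*      card_table_base;      // models the card table byte map base
    static const int     card_shift = 9;           // 512-byte cards (CardTableModRefBS::card_shift)
    static const int     log_hr_grain_bytes = 20;  // example HeapRegion::LogOfHRGrainBytes

    static void runtime_g1_wb_pre(void* /*old_val*/)   { /* slow path: hand SATB entry to the runtime */ }
    static void runtime_g1_wb_post(void* /*card_adr*/) { /* slow path: hand card entry to the runtime */ }

    static void enqueue(PtrQueueModel& q, void* value, void (*slow_path)(void*)) {
      if (q.index != 0) {                        // fast path: room left in the buffer
        q.index -= sizeof(intptr_t);
        *(void**)((char*)q.buf + q.index) = value;
      } else {
        slow_path(value);                        // buffer full: call into the runtime
      }
    }

    // SATB pre-barrier: run before an oop field is overwritten.
    void g1_pre_barrier_model(void** field_adr) {
      if (!satb_marking_active) return;          // only needed during concurrent marking
      void* orig = *field_adr;                   // the value about to be overwritten
      if (orig != nullptr)
        enqueue(satb_queue, orig, runtime_g1_wb_pre);
    }

    // Post-barrier: run after storing new_val into *field_adr within obj
    // (the case where the stored value is available to the barrier).
    void g1_post_barrier_model(void* obj, void** field_adr, void* new_val, bool use_precise) {
      if (new_val == nullptr) return;            // storing NULL needs no remembered-set entry
      char* adr = (char*)(use_precise ? (void*)field_adr : obj);
      // Same-region stores need no card mark: compare the region numbers.
      if ((((uintptr_t)adr ^ (uintptr_t)new_val) >> log_hr_grain_bytes) == 0) return;
      uint8_t* card_adr = card_table_base + ((uintptr_t)adr >> card_shift);
      if (*card_adr != 0) {                      // not already dirty (dirty == 0 in this scheme)
        *card_adr = 0;                           // dirty the card ...
        enqueue(dirty_card_queue, card_adr, runtime_g1_wb_post);  // ... and log its address
      }
    }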