
src/cpu/sparc/vm/stubGenerator_sparc.cpp


*** 214,226 ****
      // setup parameters
      const Register t = G3_scratch;
      __ ld_ptr(parameter_size.as_in().as_address(), t); // get parameter size (in words)
      __ sll(t, Interpreter::logStackElementSize, t);    // compute number of bytes
      __ sub(FP, t, Gargs);                              // setup parameter pointer
- #ifdef _LP64
      __ add( Gargs, STACK_BIAS, Gargs );                // Account for LP64 stack bias
- #endif
      __ mov(SP, O5_savedSP);

      // do the call
      //
--- 214,224 ----

*** 269,299 ****
    __ BIND(is_double);
    __ ba(exit);
    __ delayed()->stf(FloatRegisterImpl::D, F0, addr, G0);

    __ BIND(is_long);
- #ifdef _LP64
    __ ba(exit);
    __ delayed()->st_long(O0, addr, G0);      // store entire long
- #else
- #if defined(COMPILER2)
-   // All return values are where we want them, except for Longs. C2 returns
-   // longs in G1 in the 32-bit build whereas the interpreter wants them in O0/O1.
-   // Since the interpreter will return longs in G1 and O0/O1 in the 32bit
-   // build we simply always use G1.
-   // Note: I tried to make c2 return longs in O0/O1 and G1 so we wouldn't have to
-   // do this here. Unfortunately if we did a rethrow we'd see an machepilog node
-   // first which would move g1 -> O0/O1 and destroy the exception we were throwing.
-
-   __ ba(exit);
-   __ delayed()->stx(G1, addr, G0);  // store entire long
- #else
-   __ st(O1, addr, BytesPerInt);
-   __ ba(exit);
-   __ delayed()->st(O0, addr, G0);
- #endif /* COMPILER2 */
- #endif /* _LP64 */
    }
    return start;
  }
--- 267,278 ----

*** 744,769 ****
    __ align(CodeEntryAlignment);
    StubCodeMark mark(this, "StubRoutines", "partial_subtype_check");
    address start = __ pc();
    Label miss;

- #if defined(COMPILER2) && !defined(_LP64)
-   // Do not use a 'save' because it blows the 64-bit O registers.
-   __ add(SP,-4*wordSize,SP);        // Make space for 4 temps (stack must be 2 words aligned)
-   __ st_ptr(L0,SP,(frame::register_save_words+0)*wordSize);
-   __ st_ptr(L1,SP,(frame::register_save_words+1)*wordSize);
-   __ st_ptr(L2,SP,(frame::register_save_words+2)*wordSize);
-   __ st_ptr(L3,SP,(frame::register_save_words+3)*wordSize);
-   Register Rret   = O0;
-   Register Rsub   = O1;
-   Register Rsuper = O2;
- #else
    __ save_frame(0);
    Register Rret   = I0;
    Register Rsub   = I1;
    Register Rsuper = I2;
- #endif

    Register L0_ary_len = L0;
    Register L1_ary_ptr = L1;
    Register L2_super   = L2;
    Register L3_index   = L3;
--- 723,736 ----

*** 773,808 ****
                                       NULL, &miss);

    // Match falls through here.
    __ addcc(G0,0,Rret);        // set Z flags, Z result

- #if defined(COMPILER2) && !defined(_LP64)
-   __ ld_ptr(SP,(frame::register_save_words+0)*wordSize,L0);
-   __ ld_ptr(SP,(frame::register_save_words+1)*wordSize,L1);
-   __ ld_ptr(SP,(frame::register_save_words+2)*wordSize,L2);
-   __ ld_ptr(SP,(frame::register_save_words+3)*wordSize,L3);
-   __ retl();                  // Result in Rret is zero; flags set to Z
-   __ delayed()->add(SP,4*wordSize,SP);
- #else
    __ ret();                   // Result in Rret is zero; flags set to Z
    __ delayed()->restore();
- #endif

    __ BIND(miss);
    __ addcc(G0,1,Rret);        // set NZ flags, NZ result

- #if defined(COMPILER2) && !defined(_LP64)
-   __ ld_ptr(SP,(frame::register_save_words+0)*wordSize,L0);
-   __ ld_ptr(SP,(frame::register_save_words+1)*wordSize,L1);
-   __ ld_ptr(SP,(frame::register_save_words+2)*wordSize,L2);
-   __ ld_ptr(SP,(frame::register_save_words+3)*wordSize,L3);
-   __ retl();                  // Result in Rret is != 0; flags set to NZ
-   __ delayed()->add(SP,4*wordSize,SP);
- #else
    __ ret();                   // Result in Rret is != 0; flags set to NZ
    __ delayed()->restore();
- #endif

    return start;
  }
--- 740,757 ----

*** 826,840 ****
  //  Input:
  //    Rint  -  32-bits value
  //    Rtmp  -  scratch
  //
  void assert_clean_int(Register Rint, Register Rtmp) {
- #if defined(ASSERT) && defined(_LP64)
-   __ signx(Rint, Rtmp);
-   __ cmp(Rint, Rtmp);
-   __ breakpoint_trap(Assembler::notEqual, Assembler::xcc);
- #endif
  }

  //
  //  Generate overlap test for array copy stubs
  //
--- 775,784 ----

*** 1267,1287 ****
      // are HeapWordSize aligned (see LibraryCallKit::basictype2arraycopy()).
      //
      // Aligned arrays have 4 bytes alignment in 32-bits VM
      // and 8 bytes - in 64-bits VM. So we do it only for 32-bits VM
      //
- #ifndef _LP64
-     // copy a 4-bytes word if necessary to align 'to' to 8 bytes
-     __ andcc(to, 7, G0);
-     __ br(Assembler::zero, false, Assembler::pn, L_skip_alignment);
-     __ delayed()->ld(from, 0, O3);
-     __ inc(from, 4);
-     __ inc(to, 4);
-     __ dec(count, 4);
-     __ st(O3, to, -4);
-     __ BIND(L_skip_alignment);
- #endif
    } else {
      // copy bytes to align 'to' on 8 byte boundary
      __ andcc(to, 7, G1); // misaligned bytes
      __ br(Assembler::zero, false, Assembler::pt, L_skip_alignment);
      __ delayed()->neg(G1);
--- 1211,1220 ----

*** 1294,1306 ****
        __ stb(O3, to, 0);
        __ br(Assembler::notZero, false, Assembler::pt, L_align);
        __ delayed()->inc(to);
      __ BIND(L_skip_alignment);
    }
- #ifdef _LP64
    if (!aligned)
- #endif
    {
      // Copy with shift 16 bytes per iteration if arrays do not have
      // the same alignment mod 8, otherwise fall through to the next
      // code for aligned copy.
      // The compare above (count >= 23) guarantes 'count' >= 16 bytes.
--- 1227,1237 ----

*** 1393,1410 ****
        __ deccc(G1);
        __ brx(Assembler::notZero, false, Assembler::pt, L_align);
        __ delayed()->stb(O3, end_to, 0);
      __ BIND(L_skip_alignment);
    }
- #ifdef _LP64
    if (aligned) {
      // Both arrays are aligned to 8-bytes in 64-bits VM.
      // The 'count' is decremented in copy_16_bytes_backward_with_shift()
      // in unaligned case.
      __ dec(count, 16);
    } else
- #endif
    {
      // Copy with shift 16 bytes per iteration if arrays do not have
      // the same alignment mod 8, otherwise jump to the next
      // code for aligned copy (and substracting 16 from 'count' before jump).
      // The compare above (count >= 11) guarantes 'count' >= 16 bytes.
--- 1324,1339 ----

*** 1488,1508 ****
      // are HeapWordSize aligned (see LibraryCallKit::basictype2arraycopy()).
      //
      // Aligned arrays have 4 bytes alignment in 32-bits VM
      // and 8 bytes - in 64-bits VM.
      //
- #ifndef _LP64
-     // copy a 2-elements word if necessary to align 'to' to 8 bytes
-     __ andcc(to, 7, G0);
-     __ br(Assembler::zero, false, Assembler::pt, L_skip_alignment);
-     __ delayed()->ld(from, 0, O3);
-     __ inc(from, 4);
-     __ inc(to, 4);
-     __ dec(count, 2);
-     __ st(O3, to, -4);
-     __ BIND(L_skip_alignment);
- #endif
    } else {
      // copy 1 element if necessary to align 'to' on an 4 bytes
      __ andcc(to, 3, G0);
      __ br(Assembler::zero, false, Assembler::pt, L_skip_alignment);
      __ delayed()->lduh(from, 0, O3);
--- 1417,1426 ----

*** 1522,1534 ****
        __ inc(to, 4);
        __ sth(O3, to, -4);
        __ sth(O4, to, -2);
      __ BIND(L_skip_alignment2);
    }
- #ifdef _LP64
    if (!aligned)
- #endif
    {
      // Copy with shift 16 bytes per iteration if arrays do not have
      // the same alignment mod 8, otherwise fall through to the next
      // code for aligned copy.
      // The compare above (count >= 11) guarantes 'count' >= 16 bytes.
--- 1440,1450 ----

*** 1641,1664 ****
        __ sth(value, to, 0);
        __ inc(to, 2);
        __ dec(count, 1 << (shift - 1));
      __ BIND(L_skip_align2);
    }
- #ifdef _LP64
    if (!aligned) {
- #endif
    // align to 8 bytes, we know we are 4 byte aligned to start
    __ andcc(to, 7, G0);
    __ br(Assembler::zero, false, Assembler::pt, L_fill_32_bytes);
    __ delayed()->nop();
    __ stw(value, to, 0);
    __ inc(to, 4);
    __ dec(count, 1 << shift);
    __ BIND(L_fill_32_bytes);
- #ifdef _LP64
    }
- #endif

    if (t == T_INT) {
      // Zero extend value
      __ srl(value, 0, value);
    }
--- 1557,1576 ----

*** 1855,1872 ****
        __ dec(end_to, 4);
        __ sth(O3, end_to, 2);
        __ sth(O4, end_to, 0);
      __ BIND(L_skip_alignment2);
    }
- #ifdef _LP64
    if (aligned) {
      // Both arrays are aligned to 8-bytes in 64-bits VM.
      // The 'count' is decremented in copy_16_bytes_backward_with_shift()
      // in unaligned case.
      __ dec(count, 8);
    } else
- #endif
    {
      // Copy with shift 16 bytes per iteration if arrays do not have
      // the same alignment mod 8, otherwise jump to the next
      // code for aligned copy (and substracting 8 from 'count' before jump).
      // The compare above (count >= 11) guarantes 'count' >= 16 bytes.
--- 1767,1782 ----

*** 1972,1984 ****
      // are HeapWordSize aligned (see LibraryCallKit::basictype2arraycopy()).
      //
      // Aligned arrays have 4 bytes alignment in 32-bits VM
      // and 8 bytes - in 64-bits VM.
      //
- #ifdef _LP64
    if (!aligned)
- #endif
    {
      // The next check could be put under 'ifndef' since the code in
      // generate_disjoint_long_copy_core() has own checks and set 'offset'.

      // for short arrays, just do single element copy
--- 1882,1892 ----

*** 2461,2480 ****
      // save arguments for barrier generation
      __ mov(to, G1);
      __ mov(count, G5);
      gen_write_ref_array_pre_barrier(G1, G5, dest_uninitialized);
- #ifdef _LP64
      assert_clean_int(count, O3);     // Make sure 'count' is clean int.
      if (UseCompressedOops) {
        generate_disjoint_int_copy_core(aligned);
      } else {
        generate_disjoint_long_copy_core(aligned);
      }
- #else
-     generate_disjoint_int_copy_core(aligned);
- #endif
      // O0 is used as temp register
      gen_write_ref_array_post_barrier(G1, G5, O0);

      // O3, O4 are used as temp registers
      inc_counter_np(SharedRuntime::_oop_array_copy_ctr, O3, O4);
--- 2369,2384 ----

*** 2516,2534 ****
      // save arguments for barrier generation
      __ mov(to, G1);
      __ mov(count, G5);
      gen_write_ref_array_pre_barrier(G1, G5, dest_uninitialized);
- #ifdef _LP64
      if (UseCompressedOops) {
        generate_conjoint_int_copy_core(aligned);
      } else {
        generate_conjoint_long_copy_core(aligned);
      }
- #else
-     generate_conjoint_int_copy_core(aligned);
- #endif
      // O0 is used as temp register
      gen_write_ref_array_post_barrier(G1, G5, O0);

      // O3, O4 are used as temp registers
--- 2420,2434 ----

*** 3136,3161 ****
      // Aligned versions
      StubRoutines::_arrayof_jint_disjoint_arraycopy = generate_disjoint_int_copy(true, &entry,
                                                                                  "arrayof_jint_disjoint_arraycopy");
      StubRoutines::_arrayof_jint_arraycopy = generate_conjoint_int_copy(true, entry, &entry_jint_arraycopy,
                                                                                  "arrayof_jint_arraycopy");
- #ifdef _LP64
      // In 64 bit we need both aligned and unaligned versions of jint arraycopy.
      // entry_jint_arraycopy always points to the unaligned version (notice that we overwrite it).
      StubRoutines::_jint_disjoint_arraycopy = generate_disjoint_int_copy(false, &entry,
                                                                                  "jint_disjoint_arraycopy");
      StubRoutines::_jint_arraycopy = generate_conjoint_int_copy(false, entry, &entry_jint_arraycopy,
                                                                                  "jint_arraycopy");
- #else
-     // In 32 bit jints are always HeapWordSize aligned, so always use the aligned version
-     // (in fact in 32bit we always have a pre-loop part even in the aligned version,
-     // because it uses 64-bit loads/stores, so the aligned flag is actually ignored).
-     StubRoutines::_jint_disjoint_arraycopy = StubRoutines::_arrayof_jint_disjoint_arraycopy;
-     StubRoutines::_jint_arraycopy          = StubRoutines::_arrayof_jint_arraycopy;
- #endif

      //*** jlong
      // It is always aligned
      StubRoutines::_arrayof_jlong_disjoint_arraycopy = generate_disjoint_long_copy(true, &entry,
                                                                                    "arrayof_jlong_disjoint_arraycopy");
--- 3036,3052 ----

*** 3176,3186 ****
                                                          "arrayof_oop_disjoint_arraycopy_uninit",
                                                          /*dest_uninitialized*/true);
      StubRoutines::_arrayof_oop_arraycopy_uninit  = generate_conjoint_oop_copy(true, entry, NULL,
                                                          "arrayof_oop_arraycopy_uninit",
                                                          /*dest_uninitialized*/true);
- #ifdef _LP64
      if (UseCompressedOops) {
        // With compressed oops we need unaligned versions, notice that we overwrite entry_oop_arraycopy.
        StubRoutines::_oop_disjoint_arraycopy    = generate_disjoint_oop_copy(false, &entry,
                                                                              "oop_disjoint_arraycopy");
        StubRoutines::_oop_arraycopy             = generate_conjoint_oop_copy(false, entry, &entry_oop_arraycopy,
--- 3067,3076 ----

*** 3191,3201 ****
                                                          /*dest_uninitialized*/true);
        StubRoutines::_oop_arraycopy_uninit          = generate_conjoint_oop_copy(false, entry, NULL,
                                                          "oop_arraycopy_uninit",
                                                          /*dest_uninitialized*/true);
      } else
- #endif
      {
        // oop arraycopy is always aligned on 32bit and 64bit without compressed oops
        StubRoutines::_oop_disjoint_arraycopy        = StubRoutines::_arrayof_oop_disjoint_arraycopy;
        StubRoutines::_oop_arraycopy                 = StubRoutines::_arrayof_oop_arraycopy;
        StubRoutines::_oop_disjoint_arraycopy_uninit = StubRoutines::_arrayof_oop_disjoint_arraycopy_uninit;
--- 3081,3090 ----

*** 5102,5122 ****
      StubRoutines::Sparc::_test_stop_entry                = generate_test_stop();

      StubRoutines::Sparc::_stop_subroutine_entry          = generate_stop_subroutine();
      StubRoutines::Sparc::_flush_callers_register_windows_entry = generate_flush_callers_register_windows();

- #if !defined(COMPILER2) && !defined(_LP64)
-     StubRoutines::_atomic_xchg_entry         = generate_atomic_xchg();
-     StubRoutines::_atomic_cmpxchg_entry      = generate_atomic_cmpxchg();
-     StubRoutines::_atomic_add_entry          = generate_atomic_add();
-     StubRoutines::_atomic_xchg_ptr_entry     = StubRoutines::_atomic_xchg_entry;
-     StubRoutines::_atomic_cmpxchg_ptr_entry  = StubRoutines::_atomic_cmpxchg_entry;
-     StubRoutines::_atomic_cmpxchg_byte_entry = ShouldNotCallThisStub();
-     StubRoutines::_atomic_cmpxchg_long_entry = generate_atomic_cmpxchg_long();
-     StubRoutines::_atomic_add_ptr_entry      = StubRoutines::_atomic_add_entry;
- #endif  // COMPILER2 !=> _LP64
-
      // Build this early so it's available for the interpreter.
      StubRoutines::_throw_StackOverflowError_entry =
              generate_throw_exception("StackOverflowError throw_exception",
                                       CAST_FROM_FN_PTR(address, SharedRuntime::throw_StackOverflowError));
      StubRoutines::_throw_delayed_StackOverflowError_entry =
--- 4991,5000 ----

*** 5220,5234 ****
   private:
    int _stub_count;
    void stub_prolog(StubCodeDesc* cdesc) {
      # ifdef ASSERT
      // put extra information in the stub code, to make it more readable
- #ifdef _LP64
      // Write the high part of the address
      // [RGV] Check if there is a dependency on the size of this prolog
      __ emit_data((intptr_t)cdesc >> 32,    relocInfo::none);
- #endif
      __ emit_data((intptr_t)cdesc,    relocInfo::none);
      __ emit_data(++_stub_count, relocInfo::none);
      # endif
      align(true);
    }
--- 5098,5110 ----
