1 /*
   2  * Copyright (c) 1999, 2011, Oracle and/or its affiliates. All rights reserved.
   3  * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
   4  *
   5  * This code is free software; you can redistribute it and/or modify it
   6  * under the terms of the GNU General Public License version 2 only, as
   7  * published by the Free Software Foundation.
   8  *
   9  * This code is distributed in the hope that it will be useful, but WITHOUT
  10  * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
  11  * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
  12  * version 2 for more details (a copy is included in the LICENSE file that
  13  * accompanied this code).
  14  *
  15  * You should have received a copy of the GNU General Public License version
  16  * 2 along with this work; if not, write to the Free Software Foundation,
  17  * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
  18  *
  19  * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
  20  * or visit www.oracle.com if you need additional information or have any
  21  * questions.
  22  *
  23  */
  24 
  25 #include "precompiled.hpp"
  26 #include "c1/c1_Defs.hpp"
  27 #include "c1/c1_MacroAssembler.hpp"
  28 #include "c1/c1_Runtime1.hpp"
  29 #include "interpreter/interpreter.hpp"
  30 #include "nativeInst_sparc.hpp"
  31 #include "oops/compiledICHolderOop.hpp"
  32 #include "oops/oop.inline.hpp"
  33 #include "prims/jvmtiExport.hpp"
  34 #include "register_sparc.hpp"
  35 #include "runtime/sharedRuntime.hpp"
  36 #include "runtime/signature.hpp"
  37 #include "runtime/vframeArray.hpp"
  38 #include "vmreg_sparc.inline.hpp"
  39 
  40 // Implementation of StubAssembler
  41 
  42 int StubAssembler::call_RT(Register oop_result1, Register oop_result2, address entry_point, int number_of_arguments) {
  43   // for sparc changing the number of arguments doesn't change
  44   // anything about the frame size so we'll always lie and claim that
  45   // we are only passing 1 argument.
  46   set_num_rt_args(1);
  47 
  48   assert_not_delayed();
  49   // bang stack before going to runtime
  50   set(-os::vm_page_size() + STACK_BIAS, G3_scratch);
  51   st(G0, SP, G3_scratch);
  52 
  53   // debugging support
  54   assert(number_of_arguments >= 0   , "cannot have negative number of arguments");
  55 
  56   set_last_Java_frame(SP, noreg);
  57   if (VerifyThread)  mov(G2_thread, O0); // about to be smashed; pass early
  58   save_thread(L7_thread_cache);
  59   // do the call
  60   call(entry_point, relocInfo::runtime_call_type);
  61   if (!VerifyThread) {
  62     delayed()->mov(G2_thread, O0);  // pass thread as first argument
  63   } else {
  64     delayed()->nop();             // (thread already passed)
  65   }
  66   int call_offset = offset();  // offset of return address
  67   restore_thread(L7_thread_cache);
  68   reset_last_Java_frame();
  69 
  70   // check for pending exceptions
  71   { Label L;
  72     Address exception_addr(G2_thread, Thread::pending_exception_offset());
  73     ld_ptr(exception_addr, Gtemp);
  74     br_null_short(Gtemp, pt, L);
  75     Address vm_result_addr(G2_thread, JavaThread::vm_result_offset());
  76     st_ptr(G0, vm_result_addr);
  77     Address vm_result_addr_2(G2_thread, JavaThread::vm_result_2_offset());
  78     st_ptr(G0, vm_result_addr_2);
  79 
  80     if (frame_size() == no_frame_size) {
  81       // we use O7 linkage so that forward_exception_entry has the issuing PC
  82       call(StubRoutines::forward_exception_entry(), relocInfo::runtime_call_type);
  83       delayed()->restore();
  84     } else if (_stub_id == Runtime1::forward_exception_id) {
  85       should_not_reach_here();
  86     } else {
  87       AddressLiteral exc(Runtime1::entry_for(Runtime1::forward_exception_id));
  88       jump_to(exc, G4);
  89       delayed()->nop();
  90     }
  91     bind(L);
  92   }
  93 
  94   // get oop result if there is one and reset the value in the thread
  95   if (oop_result1->is_valid()) {                    // get oop result if there is one and reset it in the thread
  96     get_vm_result  (oop_result1);
  97   } else {
  98     // be a little paranoid and clear the result
  99     Address vm_result_addr(G2_thread, JavaThread::vm_result_offset());
 100     st_ptr(G0, vm_result_addr);
 101   }
 102 
 103   if (oop_result2->is_valid()) {
 104     get_vm_result_2(oop_result2);
 105   } else {
 106     // be a little paranoid and clear the result
 107     Address vm_result_addr_2(G2_thread, JavaThread::vm_result_2_offset());
 108     st_ptr(G0, vm_result_addr_2);
 109   }
 110 
 111   return call_offset;
 112 }
 113 
 114 
 115 int StubAssembler::call_RT(Register oop_result1, Register oop_result2, address entry, Register arg1) {
 116   // O0 is reserved for the thread
 117   mov(arg1, O1);
 118   return call_RT(oop_result1, oop_result2, entry, 1);
 119 }
 120 
 121 
 122 int StubAssembler::call_RT(Register oop_result1, Register oop_result2, address entry, Register arg1, Register arg2) {
 123   // O0 is reserved for the thread
 124   mov(arg1, O1);
 125   mov(arg2, O2); assert(arg2 != O1, "smashed argument");
 126   return call_RT(oop_result1, oop_result2, entry, 2);
 127 }
 128 
 129 
 130 int StubAssembler::call_RT(Register oop_result1, Register oop_result2, address entry, Register arg1, Register arg2, Register arg3) {
 131   // O0 is reserved for the thread
 132   mov(arg1, O1);
 133   mov(arg2, O2); assert(arg2 != O1,               "smashed argument");
 134   mov(arg3, O3); assert(arg3 != O1 && arg3 != O2, "smashed argument");
 135   return call_RT(oop_result1, oop_result2, entry, 3);
 136 }
 137 
 138 
 139 // Implementation of Runtime1
 140 
 141 #define __ sasm->
 142 
 143 static int cpu_reg_save_offsets[FrameMap::nof_cpu_regs];
 144 static int fpu_reg_save_offsets[FrameMap::nof_fpu_regs];
 145 static int reg_save_size_in_words;
 146 static int frame_size_in_bytes = -1;
 147 
 148 static OopMap* generate_oop_map(StubAssembler* sasm, bool save_fpu_registers) {
 149   assert(frame_size_in_bytes == __ total_frame_size_in_bytes(reg_save_size_in_words),
 150          "mismatch in calculation");
 151   sasm->set_frame_size(frame_size_in_bytes / BytesPerWord);
 152   int frame_size_in_slots = frame_size_in_bytes / sizeof(jint);
 153   OopMap* oop_map = new OopMap(frame_size_in_slots, 0);
 154 
 155   int i;
 156   for (i = 0; i < FrameMap::nof_cpu_regs; i++) {
 157     Register r = as_Register(i);
 158     if (r == G1 || r == G3 || r == G4 || r == G5) {
 159       int sp_offset = cpu_reg_save_offsets[i];
 160       oop_map->set_callee_saved(VMRegImpl::stack2reg(sp_offset),
 161                                 r->as_VMReg());
 162     }
 163   }
 164 
 165   if (save_fpu_registers) {
 166     for (i = 0; i < FrameMap::nof_fpu_regs; i++) {
 167       FloatRegister r = as_FloatRegister(i);
 168       int sp_offset = fpu_reg_save_offsets[i];
 169       oop_map->set_callee_saved(VMRegImpl::stack2reg(sp_offset),
 170                                 r->as_VMReg());
 171     }
 172   }
 173   return oop_map;
 174 }
 175 
 176 static OopMap* save_live_registers(StubAssembler* sasm, bool save_fpu_registers = true) {
 177   assert(frame_size_in_bytes == __ total_frame_size_in_bytes(reg_save_size_in_words),
 178          "mismatch in calculation");
 179   __ save_frame_c1(frame_size_in_bytes);
 180 
 181   // Record volatile registers as callee-save values in an OopMap so their save locations will be
 182   // propagated to the caller frame's RegisterMap during StackFrameStream construction (needed for
 183   // deoptimization; see compiledVFrame::create_stack_value).  The caller's I, L and O registers
 184   // are saved in register windows - I's and L's in the caller's frame and O's in the stub frame
 185   // (as the stub's I's) when the runtime routine called by the stub creates its frame.
 186   // OopMap frame sizes are in c2 stack slot sizes (sizeof(jint))
 187 
 188   int i;
 189   for (i = 0; i < FrameMap::nof_cpu_regs; i++) {
 190     Register r = as_Register(i);
 191     if (r == G1 || r == G3 || r == G4 || r == G5) {
 192       int sp_offset = cpu_reg_save_offsets[i];
 193       __ st_ptr(r, SP, (sp_offset * BytesPerWord) + STACK_BIAS);
 194     }
 195   }
 196 
 197   if (save_fpu_registers) {
 198     for (i = 0; i < FrameMap::nof_fpu_regs; i++) {
 199       FloatRegister r = as_FloatRegister(i);
 200       int sp_offset = fpu_reg_save_offsets[i];
 201       __ stf(FloatRegisterImpl::S, r, SP, (sp_offset * BytesPerWord) + STACK_BIAS);
 202     }
 203   }
 204 
 205   return generate_oop_map(sasm, save_fpu_registers);
 206 }
 207 
 208 static void restore_live_registers(StubAssembler* sasm, bool restore_fpu_registers = true) {
 209   for (int i = 0; i < FrameMap::nof_cpu_regs; i++) {
 210     Register r = as_Register(i);
 211     if (r == G1 || r == G3 || r == G4 || r == G5) {
 212       __ ld_ptr(SP, (cpu_reg_save_offsets[i] * BytesPerWord) + STACK_BIAS, r);
 213     }
 214   }
 215 
 216   if (restore_fpu_registers) {
 217     for (int i = 0; i < FrameMap::nof_fpu_regs; i++) {
 218       FloatRegister r = as_FloatRegister(i);
 219       __ ldf(FloatRegisterImpl::S, SP, (fpu_reg_save_offsets[i] * BytesPerWord) + STACK_BIAS, r);
 220     }
 221   }
 222 }
 223 
 224 
 225 void Runtime1::initialize_pd() {
 226   // compute word offsets from SP at which live (non-windowed) registers are captured by stub routines
 227   //
 228   // A stub routine will have a frame that is at least large enough to hold
 229   // a register window save area (obviously) and the volatile g registers
 230   // and floating registers. A user of save_live_registers can have a frame
 231   // that has more scratch area in it (although typically they will use L-regs).
 232   // in that case the frame will look like this (stack growing down)
 233   //
 234   // FP -> |             |
 235   //       | scratch mem |
 236   //       |   "      "  |
 237   //       --------------
 238   //       | float regs  |
 239   //       |   "    "    |
 240   //       ---------------
 241   //       | G regs      |
 242   //       | "  "        |
 243   //       ---------------
 244   //       | abi reg.    |
 245   //       | window save |
 246   //       | area        |
 247   // SP -> ---------------
 248   //
 249   int i;
 250   int sp_offset = round_to(frame::register_save_words, 2); //  start doubleword aligned
 251 
 252   // only G int registers are saved explicitly; others are found in register windows
 253   for (i = 0; i < FrameMap::nof_cpu_regs; i++) {
 254     Register r = as_Register(i);
 255     if (r == G1 || r == G3 || r == G4 || r == G5) {
 256       cpu_reg_save_offsets[i] = sp_offset;
 257       sp_offset++;
 258     }
 259   }
 260 
 261   // all float registers are saved explicitly
 262   assert(FrameMap::nof_fpu_regs == 32, "double registers not handled here");
 263   for (i = 0; i < FrameMap::nof_fpu_regs; i++) {
 264     fpu_reg_save_offsets[i] = sp_offset;
 265     sp_offset++;
 266   }
 267   reg_save_size_in_words = sp_offset - frame::memory_parameter_word_sp_offset;
 268   // this should match assembler::total_frame_size_in_bytes, which
 269   // isn't callable from this context.  It's checked by an assert when
 270   // it's used though.
 271   frame_size_in_bytes = align_size_up(sp_offset * wordSize, 8);
 272 }
 273 
 274 
 275 OopMapSet* Runtime1::generate_exception_throw(StubAssembler* sasm, address target, bool has_argument) {
 276   // make a frame and preserve the caller's caller-save registers
 277   OopMap* oop_map = save_live_registers(sasm);
 278   int call_offset;
 279   if (!has_argument) {
 280     call_offset = __ call_RT(noreg, noreg, target);
 281   } else {
 282     call_offset = __ call_RT(noreg, noreg, target, G4);
 283   }
 284   OopMapSet* oop_maps = new OopMapSet();
 285   oop_maps->add_gc_map(call_offset, oop_map);
 286 
 287   __ should_not_reach_here();
 288   return oop_maps;
 289 }
 290 
 291 
 292 OopMapSet* Runtime1::generate_stub_call(StubAssembler* sasm, Register result, address target,
 293                                         Register arg1, Register arg2, Register arg3) {
 294   // make a frame and preserve the caller's caller-save registers
 295   OopMap* oop_map = save_live_registers(sasm);
 296 
 297   int call_offset;
 298   if (arg1 == noreg) {
 299     call_offset = __ call_RT(result, noreg, target);
 300   } else if (arg2 == noreg) {
 301     call_offset = __ call_RT(result, noreg, target, arg1);
 302   } else if (arg3 == noreg) {
 303     call_offset = __ call_RT(result, noreg, target, arg1, arg2);
 304   } else {
 305     call_offset = __ call_RT(result, noreg, target, arg1, arg2, arg3);
 306   }
 307   OopMapSet* oop_maps = NULL;
 308 
 309   oop_maps = new OopMapSet();
 310   oop_maps->add_gc_map(call_offset, oop_map);
 311   restore_live_registers(sasm);
 312 
 313   __ ret();
 314   __ delayed()->restore();
 315 
 316   return oop_maps;
 317 }
 318 
 319 
 320 OopMapSet* Runtime1::generate_patching(StubAssembler* sasm, address target) {
 321   // make a frame and preserve the caller's caller-save registers
 322   OopMap* oop_map = save_live_registers(sasm);
 323 
 324   // call the runtime patching routine, returns non-zero if nmethod got deopted.
 325   int call_offset = __ call_RT(noreg, noreg, target);
 326   OopMapSet* oop_maps = new OopMapSet();
 327   oop_maps->add_gc_map(call_offset, oop_map);
 328 
 329   // re-execute the patched instruction or, if the nmethod was deoptmized, return to the
 330   // deoptimization handler entry that will cause re-execution of the current bytecode
 331   DeoptimizationBlob* deopt_blob = SharedRuntime::deopt_blob();
 332   assert(deopt_blob != NULL, "deoptimization blob must have been created");
 333 
 334   Label no_deopt;
 335   __ br_null_short(O0, Assembler::pt, no_deopt);
 336 
 337   // return to the deoptimization handler entry for unpacking and rexecute
 338   // if we simply returned the we'd deopt as if any call we patched had just
 339   // returned.
 340 
 341   restore_live_registers(sasm);
 342 
 343   AddressLiteral dest(deopt_blob->unpack_with_reexecution());
 344   __ jump_to(dest, O0);
 345   __ delayed()->restore();
 346 
 347   __ bind(no_deopt);
 348   restore_live_registers(sasm);
 349   __ ret();
 350   __ delayed()->restore();
 351 
 352   return oop_maps;
 353 }
 354 
 355 OopMapSet* Runtime1::generate_code_for(StubID id, StubAssembler* sasm) {
 356 
 357   OopMapSet* oop_maps = NULL;
 358   // for better readability
 359   const bool must_gc_arguments = true;
 360   const bool dont_gc_arguments = false;
 361 
 362   // stub code & info for the different stubs
 363   switch (id) {
 364     case forward_exception_id:
 365       {
 366         oop_maps = generate_handle_exception(id, sasm);
 367       }
 368       break;
 369 
 370     case new_instance_id:
 371     case fast_new_instance_id:
 372     case fast_new_instance_init_check_id:
 373       {
 374         Register G5_klass = G5; // Incoming
 375         Register O0_obj   = O0; // Outgoing
 376 
 377         if (id == new_instance_id) {
 378           __ set_info("new_instance", dont_gc_arguments);
 379         } else if (id == fast_new_instance_id) {
 380           __ set_info("fast new_instance", dont_gc_arguments);
 381         } else {
 382           assert(id == fast_new_instance_init_check_id, "bad StubID");
 383           __ set_info("fast new_instance init check", dont_gc_arguments);
 384         }
 385 
 386         if ((id == fast_new_instance_id || id == fast_new_instance_init_check_id) &&
 387             UseTLAB && FastTLABRefill) {
 388           Label slow_path;
 389           Register G1_obj_size = G1;
 390           Register G3_t1 = G3;
 391           Register G4_t2 = G4;
 392           assert_different_registers(G5_klass, G1_obj_size, G3_t1, G4_t2);
 393 
 394           // Push a frame since we may do dtrace notification for the
 395           // allocation which requires calling out and we don't want
 396           // to stomp the real return address.
 397           __ save_frame(0);
 398 
 399           if (id == fast_new_instance_init_check_id) {
 400             // make sure the klass is initialized
 401             __ ld(G5_klass, instanceKlass::init_state_offset_in_bytes() + sizeof(oopDesc), G3_t1);
 402             __ cmp_and_br_short(G3_t1, instanceKlass::fully_initialized, Assembler::notEqual, Assembler::pn, slow_path);
 403           }
 404 #ifdef ASSERT
 405           // assert object can be fast path allocated
 406           {
 407             Label ok, not_ok;
 408           __ ld(G5_klass, Klass::layout_helper_offset_in_bytes() + sizeof(oopDesc), G1_obj_size);
 409           // make sure it's an instance (LH > 0)
 410           __ cmp_and_br_short(G1_obj_size, 0, Assembler::lessEqual, Assembler::pn, not_ok);
 411           __ btst(Klass::_lh_instance_slow_path_bit, G1_obj_size);
 412           __ br(Assembler::zero, false, Assembler::pn, ok);
 413           __ delayed()->nop();
 414           __ bind(not_ok);
 415           __ stop("assert(can be fast path allocated)");
 416           __ should_not_reach_here();
 417           __ bind(ok);
 418           }
 419 #endif // ASSERT
 420           // if we got here then the TLAB allocation failed, so try
 421           // refilling the TLAB or allocating directly from eden.
 422           Label retry_tlab, try_eden;
 423           __ tlab_refill(retry_tlab, try_eden, slow_path); // preserves G5_klass
 424 
 425           __ bind(retry_tlab);
 426 
 427           // get the instance size
 428           __ ld(G5_klass, klassOopDesc::header_size() * HeapWordSize + Klass::layout_helper_offset_in_bytes(), G1_obj_size);
 429 
 430           __ tlab_allocate(O0_obj, G1_obj_size, 0, G3_t1, slow_path);
 431 
 432           __ initialize_object(O0_obj, G5_klass, G1_obj_size, 0, G3_t1, G4_t2);
 433           __ verify_oop(O0_obj);
 434           __ mov(O0, I0);
 435           __ ret();
 436           __ delayed()->restore();
 437 
 438           __ bind(try_eden);
 439           // get the instance size
 440           __ ld(G5_klass, klassOopDesc::header_size() * HeapWordSize + Klass::layout_helper_offset_in_bytes(), G1_obj_size);
 441           __ eden_allocate(O0_obj, G1_obj_size, 0, G3_t1, G4_t2, slow_path);
 442           __ incr_allocated_bytes(G1_obj_size, G3_t1, G4_t2);
 443 
 444           __ initialize_object(O0_obj, G5_klass, G1_obj_size, 0, G3_t1, G4_t2);
 445           __ verify_oop(O0_obj);
 446           __ mov(O0, I0);
 447           __ ret();
 448           __ delayed()->restore();
 449 
 450           __ bind(slow_path);
 451 
 452           // pop this frame so generate_stub_call can push it's own
 453           __ restore();
 454         }
 455 
 456         oop_maps = generate_stub_call(sasm, I0, CAST_FROM_FN_PTR(address, new_instance), G5_klass);
 457         // I0->O0: new instance
 458       }
 459 
 460       break;
 461 
 462     case counter_overflow_id:
 463         // G4 contains bci, G5 contains method
 464       oop_maps = generate_stub_call(sasm, noreg, CAST_FROM_FN_PTR(address, counter_overflow), G4, G5);
 465       break;
 466 
 467     case new_type_array_id:
 468     case new_object_array_id:
 469       {
 470         Register G5_klass = G5; // Incoming
 471         Register G4_length = G4; // Incoming
 472         Register O0_obj   = O0; // Outgoing
 473 
 474         Address klass_lh(G5_klass, ((klassOopDesc::header_size() * HeapWordSize)
 475                                     + Klass::layout_helper_offset_in_bytes()));
 476         assert(Klass::_lh_header_size_shift % BitsPerByte == 0, "bytewise");
 477         assert(Klass::_lh_header_size_mask == 0xFF, "bytewise");
 478         // Use this offset to pick out an individual byte of the layout_helper:
 479         const int klass_lh_header_size_offset = ((BytesPerInt - 1)  // 3 - 2 selects byte {0,1,0,0}
 480                                                  - Klass::_lh_header_size_shift / BitsPerByte);
 481 
 482         if (id == new_type_array_id) {
 483           __ set_info("new_type_array", dont_gc_arguments);
 484         } else {
 485           __ set_info("new_object_array", dont_gc_arguments);
 486         }
 487 
 488 #ifdef ASSERT
 489         // assert object type is really an array of the proper kind
 490         {
 491           Label ok;
 492           Register G3_t1 = G3;
 493           __ ld(klass_lh, G3_t1);
 494           __ sra(G3_t1, Klass::_lh_array_tag_shift, G3_t1);
 495           int tag = ((id == new_type_array_id)
 496                      ? Klass::_lh_array_tag_type_value
 497                      : Klass::_lh_array_tag_obj_value);
 498           __ cmp_and_brx_short(G3_t1, tag, Assembler::equal, Assembler::pt, ok);
 499           __ stop("assert(is an array klass)");
 500           __ should_not_reach_here();
 501           __ bind(ok);
 502         }
 503 #endif // ASSERT
 504 
 505         if (UseTLAB && FastTLABRefill) {
 506           Label slow_path;
 507           Register G1_arr_size = G1;
 508           Register G3_t1 = G3;
 509           Register O1_t2 = O1;
 510           assert_different_registers(G5_klass, G4_length, G1_arr_size, G3_t1, O1_t2);
 511 
 512           // check that array length is small enough for fast path
 513           __ set(C1_MacroAssembler::max_array_allocation_length, G3_t1);
 514           __ cmp_and_br_short(G4_length, G3_t1, Assembler::greaterUnsigned, Assembler::pn, slow_path);
 515 
 516           // if we got here then the TLAB allocation failed, so try
 517           // refilling the TLAB or allocating directly from eden.
 518           Label retry_tlab, try_eden;
 519           __ tlab_refill(retry_tlab, try_eden, slow_path); // preserves G4_length and G5_klass
 520 
 521           __ bind(retry_tlab);
 522 
 523           // get the allocation size: (length << (layout_helper & 0x1F)) + header_size
 524           __ ld(klass_lh, G3_t1);
 525           __ sll(G4_length, G3_t1, G1_arr_size);
 526           __ srl(G3_t1, Klass::_lh_header_size_shift, G3_t1);
 527           __ and3(G3_t1, Klass::_lh_header_size_mask, G3_t1);
 528           __ add(G1_arr_size, G3_t1, G1_arr_size);
 529           __ add(G1_arr_size, MinObjAlignmentInBytesMask, G1_arr_size);  // align up
 530           __ and3(G1_arr_size, ~MinObjAlignmentInBytesMask, G1_arr_size);
 531 
 532           __ tlab_allocate(O0_obj, G1_arr_size, 0, G3_t1, slow_path);  // preserves G1_arr_size
 533 
 534           __ initialize_header(O0_obj, G5_klass, G4_length, G3_t1, O1_t2);
 535           __ ldub(klass_lh, G3_t1, klass_lh_header_size_offset);
 536           __ sub(G1_arr_size, G3_t1, O1_t2);  // body length
 537           __ add(O0_obj, G3_t1, G3_t1);       // body start
 538           __ initialize_body(G3_t1, O1_t2);
 539           __ verify_oop(O0_obj);
 540           __ retl();
 541           __ delayed()->nop();
 542 
 543           __ bind(try_eden);
 544           // get the allocation size: (length << (layout_helper & 0x1F)) + header_size
 545           __ ld(klass_lh, G3_t1);
 546           __ sll(G4_length, G3_t1, G1_arr_size);
 547           __ srl(G3_t1, Klass::_lh_header_size_shift, G3_t1);
 548           __ and3(G3_t1, Klass::_lh_header_size_mask, G3_t1);
 549           __ add(G1_arr_size, G3_t1, G1_arr_size);
 550           __ add(G1_arr_size, MinObjAlignmentInBytesMask, G1_arr_size);
 551           __ and3(G1_arr_size, ~MinObjAlignmentInBytesMask, G1_arr_size);
 552 
 553           __ eden_allocate(O0_obj, G1_arr_size, 0, G3_t1, O1_t2, slow_path);  // preserves G1_arr_size
 554           __ incr_allocated_bytes(G1_arr_size, G3_t1, O1_t2);
 555 
 556           __ initialize_header(O0_obj, G5_klass, G4_length, G3_t1, O1_t2);
 557           __ ldub(klass_lh, G3_t1, klass_lh_header_size_offset);
 558           __ sub(G1_arr_size, G3_t1, O1_t2);  // body length
 559           __ add(O0_obj, G3_t1, G3_t1);       // body start
 560           __ initialize_body(G3_t1, O1_t2);
 561           __ verify_oop(O0_obj);
 562           __ retl();
 563           __ delayed()->nop();
 564 
 565           __ bind(slow_path);
 566         }
 567 
 568         if (id == new_type_array_id) {
 569           oop_maps = generate_stub_call(sasm, I0, CAST_FROM_FN_PTR(address, new_type_array), G5_klass, G4_length);
 570         } else {
 571           oop_maps = generate_stub_call(sasm, I0, CAST_FROM_FN_PTR(address, new_object_array), G5_klass, G4_length);
 572         }
 573         // I0 -> O0: new array
 574       }
 575       break;
 576 
 577     case new_multi_array_id:
 578       { // O0: klass
 579         // O1: rank
 580         // O2: address of 1st dimension
 581         __ set_info("new_multi_array", dont_gc_arguments);
 582         oop_maps = generate_stub_call(sasm, I0, CAST_FROM_FN_PTR(address, new_multi_array), I0, I1, I2);
 583         // I0 -> O0: new multi array
 584       }
 585       break;
 586 
 587     case register_finalizer_id:
 588       {
 589         __ set_info("register_finalizer", dont_gc_arguments);
 590 
 591         // load the klass and check the has finalizer flag
 592         Label register_finalizer;
 593         Register t = O1;
 594         __ load_klass(O0, t);
 595         __ ld(t, Klass::access_flags_offset_in_bytes() + sizeof(oopDesc), t);
 596         __ set(JVM_ACC_HAS_FINALIZER, G3);
 597         __ andcc(G3, t, G0);
 598         __ br(Assembler::notZero, false, Assembler::pt, register_finalizer);
 599         __ delayed()->nop();
 600 
 601         // do a leaf return
 602         __ retl();
 603         __ delayed()->nop();
 604 
 605         __ bind(register_finalizer);
 606         OopMap* oop_map = save_live_registers(sasm);
 607         int call_offset = __ call_RT(noreg, noreg,
 608                                      CAST_FROM_FN_PTR(address, SharedRuntime::register_finalizer), I0);
 609         oop_maps = new OopMapSet();
 610         oop_maps->add_gc_map(call_offset, oop_map);
 611 
 612         // Now restore all the live registers
 613         restore_live_registers(sasm);
 614 
 615         __ ret();
 616         __ delayed()->restore();
 617       }
 618       break;
 619 
 620     case throw_range_check_failed_id:
 621       { __ set_info("range_check_failed", dont_gc_arguments); // arguments will be discarded
 622         // G4: index
 623         oop_maps = generate_exception_throw(sasm, CAST_FROM_FN_PTR(address, throw_range_check_exception), true);
 624       }
 625       break;
 626 
 627     case throw_index_exception_id:
 628       { __ set_info("index_range_check_failed", dont_gc_arguments); // arguments will be discarded
 629         // G4: index
 630         oop_maps = generate_exception_throw(sasm, CAST_FROM_FN_PTR(address, throw_index_exception), true);
 631       }
 632       break;
 633 
 634     case throw_div0_exception_id:
 635       { __ set_info("throw_div0_exception", dont_gc_arguments);
 636         oop_maps = generate_exception_throw(sasm, CAST_FROM_FN_PTR(address, throw_div0_exception), false);
 637       }
 638       break;
 639 
 640     case throw_null_pointer_exception_id:
 641       { __ set_info("throw_null_pointer_exception", dont_gc_arguments);
 642         oop_maps = generate_exception_throw(sasm, CAST_FROM_FN_PTR(address, throw_null_pointer_exception), false);
 643       }
 644       break;
 645 
 646     case handle_exception_id:
 647       { __ set_info("handle_exception", dont_gc_arguments);
 648         oop_maps = generate_handle_exception(id, sasm);
 649       }
 650       break;
 651 
 652     case handle_exception_from_callee_id:
 653       { __ set_info("handle_exception_from_callee", dont_gc_arguments);
 654         oop_maps = generate_handle_exception(id, sasm);
 655       }
 656       break;
 657 
 658     case unwind_exception_id:
 659       {
 660         // O0: exception
 661         // I7: address of call to this method
 662 
 663         __ set_info("unwind_exception", dont_gc_arguments);
 664         __ mov(Oexception, Oexception->after_save());
 665         __ add(I7, frame::pc_return_offset, Oissuing_pc->after_save());
 666 
 667         __ call_VM_leaf(L7_thread_cache, CAST_FROM_FN_PTR(address, SharedRuntime::exception_handler_for_return_address),
 668                         G2_thread, Oissuing_pc->after_save());
 669         __ verify_not_null_oop(Oexception->after_save());
 670 
 671         // Restore SP from L7 if the exception PC is a method handle call site.
 672         __ mov(O0, G5);  // Save the target address.
 673         __ lduw(Address(G2_thread, JavaThread::is_method_handle_return_offset()), L0);
 674         __ tst(L0);  // Condition codes are preserved over the restore.
 675         __ restore();
 676 
 677         __ jmp(G5, 0);
 678         __ delayed()->movcc(Assembler::notZero, false, Assembler::icc, L7_mh_SP_save, SP);  // Restore SP if required.
 679       }
 680       break;
 681 
 682     case throw_array_store_exception_id:
 683       {
 684         __ set_info("throw_array_store_exception", dont_gc_arguments);
 685         oop_maps = generate_exception_throw(sasm, CAST_FROM_FN_PTR(address, throw_array_store_exception), true);
 686       }
 687       break;
 688 
 689     case throw_class_cast_exception_id:
 690       {
 691         // G4: object
 692         __ set_info("throw_class_cast_exception", dont_gc_arguments);
 693         oop_maps = generate_exception_throw(sasm, CAST_FROM_FN_PTR(address, throw_class_cast_exception), true);
 694       }
 695       break;
 696 
 697     case throw_incompatible_class_change_error_id:
 698       {
 699         __ set_info("throw_incompatible_class_cast_exception", dont_gc_arguments);
 700         oop_maps = generate_exception_throw(sasm, CAST_FROM_FN_PTR(address, throw_incompatible_class_change_error), false);
 701       }
 702       break;
 703 
 704     case invalidate_profile_inlining_id:
 705       { 
 706         OopMap* oop_map = save_live_registers(sasm);
 707 
 708         int call_offset = __ call_RT(noreg, noreg, CAST_FROM_FN_PTR(address, invalidate_profile_inlining), G4, G5);
 709 
 710         oop_maps = new OopMapSet();
 711         oop_maps->add_gc_map(call_offset, oop_map);
 712 
 713         DeoptimizationBlob* deopt_blob = SharedRuntime::deopt_blob();
 714         assert(deopt_blob != NULL, "deoptimization blob must have been created");
 715         restore_live_registers(sasm);
 716         __ restore();
 717         // Invalid inlining is detected before the body of the
 718         // inlinined method is executed so we need deoptimization to
 719         // trigger "re-execution" of the method call.
 720         __ br(Assembler::always, false, Assembler::pt, deopt_blob->unpack_with_reexecution(), relocInfo::runtime_call_type);
 721         __ delayed()->nop();
 722       }
 723       break;
 724 
 725     case slow_subtype_check_id:
 726       { // Support for uint StubRoutine::partial_subtype_check( Klass sub, Klass super );
 727         // Arguments :
 728         //
 729         //      ret  : G3
 730         //      sub  : G3, argument, destroyed
 731         //      super: G1, argument, not changed
 732         //      raddr: O7, blown by call
 733         Label miss;
 734 
 735         __ save_frame(0);               // Blow no registers!
 736 
 737         __ check_klass_subtype_slow_path(G3, G1, L0, L1, L2, L4, NULL, &miss);
 738 
 739         __ mov(1, G3);
 740         __ ret();                       // Result in G5 is 'true'
 741         __ delayed()->restore();        // free copy or add can go here
 742 
 743         __ bind(miss);
 744         __ mov(0, G3);
 745         __ ret();                       // Result in G5 is 'false'
 746         __ delayed()->restore();        // free copy or add can go here
 747       }
 748 
 749     case monitorenter_nofpu_id:
 750     case monitorenter_id:
 751       { // G4: object
 752         // G5: lock address
 753         __ set_info("monitorenter", dont_gc_arguments);
 754 
 755         int save_fpu_registers = (id == monitorenter_id);
 756         // make a frame and preserve the caller's caller-save registers
 757         OopMap* oop_map = save_live_registers(sasm, save_fpu_registers);
 758 
 759         int call_offset = __ call_RT(noreg, noreg, CAST_FROM_FN_PTR(address, monitorenter), G4, G5);
 760 
 761         oop_maps = new OopMapSet();
 762         oop_maps->add_gc_map(call_offset, oop_map);
 763         restore_live_registers(sasm, save_fpu_registers);
 764 
 765         __ ret();
 766         __ delayed()->restore();
 767       }
 768       break;
 769 
 770     case monitorexit_nofpu_id:
 771     case monitorexit_id:
 772       { // G4: lock address
 773         // note: really a leaf routine but must setup last java sp
 774         //       => use call_RT for now (speed can be improved by
 775         //       doing last java sp setup manually)
 776         __ set_info("monitorexit", dont_gc_arguments);
 777 
 778         int save_fpu_registers = (id == monitorexit_id);
 779         // make a frame and preserve the caller's caller-save registers
 780         OopMap* oop_map = save_live_registers(sasm, save_fpu_registers);
 781 
 782         int call_offset = __ call_RT(noreg, noreg, CAST_FROM_FN_PTR(address, monitorexit), G4);
 783 
 784         oop_maps = new OopMapSet();
 785         oop_maps->add_gc_map(call_offset, oop_map);
 786         restore_live_registers(sasm, save_fpu_registers);
 787 
 788         __ ret();
 789         __ delayed()->restore();
 790       }
 791       break;
 792 
 793     case deoptimize_id:
 794       {
 795         __ set_info("deoptimize", dont_gc_arguments);
 796         OopMap* oop_map = save_live_registers(sasm);
 797         int call_offset = __ call_RT(noreg, noreg, CAST_FROM_FN_PTR(address, deoptimize));
 798         oop_maps = new OopMapSet();
 799         oop_maps->add_gc_map(call_offset, oop_map);
 800         restore_live_registers(sasm);
 801         DeoptimizationBlob* deopt_blob = SharedRuntime::deopt_blob();
 802         assert(deopt_blob != NULL, "deoptimization blob must have been created");
 803         AddressLiteral dest(deopt_blob->unpack_with_reexecution());
 804         __ jump_to(dest, O0);
 805         __ delayed()->restore();
 806       }
 807       break;
 808 
 809     case access_field_patching_id:
 810       { __ set_info("access_field_patching", dont_gc_arguments);
 811         oop_maps = generate_patching(sasm, CAST_FROM_FN_PTR(address, access_field_patching));
 812       }
 813       break;
 814 
 815     case load_klass_patching_id:
 816       { __ set_info("load_klass_patching", dont_gc_arguments);
 817         oop_maps = generate_patching(sasm, CAST_FROM_FN_PTR(address, move_klass_patching));
 818       }
 819       break;
 820 
 821     case dtrace_object_alloc_id:
 822       { // O0: object
 823         __ set_info("dtrace_object_alloc", dont_gc_arguments);
 824         // we can't gc here so skip the oopmap but make sure that all
 825         // the live registers get saved.
 826         save_live_registers(sasm);
 827 
 828         __ save_thread(L7_thread_cache);
 829         __ call(CAST_FROM_FN_PTR(address, SharedRuntime::dtrace_object_alloc),
 830                 relocInfo::runtime_call_type);
 831         __ delayed()->mov(I0, O0);
 832         __ restore_thread(L7_thread_cache);
 833 
 834         restore_live_registers(sasm);
 835         __ ret();
 836         __ delayed()->restore();
 837       }
 838       break;
 839 
 840 #ifndef SERIALGC
 841     case g1_pre_barrier_slow_id:
 842       { // G4: previous value of memory
 843         BarrierSet* bs = Universe::heap()->barrier_set();
 844         if (bs->kind() != BarrierSet::G1SATBCTLogging) {
 845           __ save_frame(0);
 846           __ set((int)id, O1);
 847           __ call_RT(noreg, noreg, CAST_FROM_FN_PTR(address, unimplemented_entry), I0);
 848           __ should_not_reach_here();
 849           break;
 850         }
 851 
 852         __ set_info("g1_pre_barrier_slow_id", dont_gc_arguments);
 853 
 854         Register pre_val = G4;
 855         Register tmp  = G1_scratch;
 856         Register tmp2 = G3_scratch;
 857 
 858         Label refill, restart;
 859         bool with_frame = false; // I don't know if we can do with-frame.
 860         int satb_q_index_byte_offset =
 861           in_bytes(JavaThread::satb_mark_queue_offset() +
 862                    PtrQueue::byte_offset_of_index());
 863         int satb_q_buf_byte_offset =
 864           in_bytes(JavaThread::satb_mark_queue_offset() +
 865                    PtrQueue::byte_offset_of_buf());
 866 
 867         __ bind(restart);
 868         // Load the index into the SATB buffer. PtrQueue::_index is a
 869         // size_t so ld_ptr is appropriate
 870         __ ld_ptr(G2_thread, satb_q_index_byte_offset, tmp);
 871 
 872         // index == 0?
 873         __ cmp_and_brx_short(tmp, G0, Assembler::equal, Assembler::pn, refill);
 874 
 875         __ ld_ptr(G2_thread, satb_q_buf_byte_offset, tmp2);
 876         __ sub(tmp, oopSize, tmp);
 877 
 878         __ st_ptr(pre_val, tmp2, tmp);  // [_buf + index] := <address_of_card>
 879         // Use return-from-leaf
 880         __ retl();
 881         __ delayed()->st_ptr(tmp, G2_thread, satb_q_index_byte_offset);
 882 
 883         __ bind(refill);
 884         __ save_frame(0);
 885 
 886         __ mov(pre_val, L0);
 887         __ mov(tmp,     L1);
 888         __ mov(tmp2,    L2);
 889 
 890         __ call_VM_leaf(L7_thread_cache,
 891                         CAST_FROM_FN_PTR(address,
 892                                          SATBMarkQueueSet::handle_zero_index_for_thread),
 893                                          G2_thread);
 894 
 895         __ mov(L0, pre_val);
 896         __ mov(L1, tmp);
 897         __ mov(L2, tmp2);
 898 
 899         __ br(Assembler::always, /*annul*/false, Assembler::pt, restart);
 900         __ delayed()->restore();
 901       }
 902       break;
 903 
 904     case g1_post_barrier_slow_id:
 905       {
 906         BarrierSet* bs = Universe::heap()->barrier_set();
 907         if (bs->kind() != BarrierSet::G1SATBCTLogging) {
 908           __ save_frame(0);
 909           __ set((int)id, O1);
 910           __ call_RT(noreg, noreg, CAST_FROM_FN_PTR(address, unimplemented_entry), I0);
 911           __ should_not_reach_here();
 912           break;
 913         }
 914 
 915         __ set_info("g1_post_barrier_slow_id", dont_gc_arguments);
 916 
 917         Register addr = G4;
 918         Register cardtable = G5;
 919         Register tmp  = G1_scratch;
 920         Register tmp2 = G3_scratch;
 921         jbyte* byte_map_base = ((CardTableModRefBS*)bs)->byte_map_base;
 922 
 923         Label not_already_dirty, restart, refill;
 924 
 925 #ifdef _LP64
 926         __ srlx(addr, CardTableModRefBS::card_shift, addr);
 927 #else
 928         __ srl(addr, CardTableModRefBS::card_shift, addr);
 929 #endif
 930 
 931         AddressLiteral rs(byte_map_base);
 932         __ set(rs, cardtable);         // cardtable := <card table base>
 933         __ ldub(addr, cardtable, tmp); // tmp := [addr + cardtable]
 934 
 935         assert(CardTableModRefBS::dirty_card_val() == 0, "otherwise check this code");
 936         __ cmp_and_br_short(tmp, G0, Assembler::notEqual, Assembler::pt, not_already_dirty);
 937 
 938         // We didn't take the branch, so we're already dirty: return.
 939         // Use return-from-leaf
 940         __ retl();
 941         __ delayed()->nop();
 942 
 943         // Not dirty.
 944         __ bind(not_already_dirty);
 945 
 946         // Get cardtable + tmp into a reg by itself
 947         __ add(addr, cardtable, tmp2);
 948 
 949         // First, dirty it.
 950         __ stb(G0, tmp2, 0);  // [cardPtr] := 0  (i.e., dirty).
 951 
 952         Register tmp3 = cardtable;
 953         Register tmp4 = tmp;
 954 
 955         // these registers are now dead
 956         addr = cardtable = tmp = noreg;
 957 
 958         int dirty_card_q_index_byte_offset =
 959           in_bytes(JavaThread::dirty_card_queue_offset() +
 960                    PtrQueue::byte_offset_of_index());
 961         int dirty_card_q_buf_byte_offset =
 962           in_bytes(JavaThread::dirty_card_queue_offset() +
 963                    PtrQueue::byte_offset_of_buf());
 964 
 965         __ bind(restart);
 966 
 967         // Get the index into the update buffer. PtrQueue::_index is
 968         // a size_t so ld_ptr is appropriate here.
 969         __ ld_ptr(G2_thread, dirty_card_q_index_byte_offset, tmp3);
 970 
 971         // index == 0?
 972         __ cmp_and_brx_short(tmp3, G0, Assembler::equal,  Assembler::pn, refill);
 973 
 974         __ ld_ptr(G2_thread, dirty_card_q_buf_byte_offset, tmp4);
 975         __ sub(tmp3, oopSize, tmp3);
 976 
 977         __ st_ptr(tmp2, tmp4, tmp3);  // [_buf + index] := <address_of_card>
 978         // Use return-from-leaf
 979         __ retl();
 980         __ delayed()->st_ptr(tmp3, G2_thread, dirty_card_q_index_byte_offset);
 981 
 982         __ bind(refill);
 983         __ save_frame(0);
 984 
 985         __ mov(tmp2, L0);
 986         __ mov(tmp3, L1);
 987         __ mov(tmp4, L2);
 988 
 989         __ call_VM_leaf(L7_thread_cache,
 990                         CAST_FROM_FN_PTR(address,
 991                                          DirtyCardQueueSet::handle_zero_index_for_thread),
 992                                          G2_thread);
 993 
 994         __ mov(L0, tmp2);
 995         __ mov(L1, tmp3);
 996         __ mov(L2, tmp4);
 997 
 998         __ br(Assembler::always, /*annul*/false, Assembler::pt, restart);
 999         __ delayed()->restore();
1000       }
1001       break;
1002 #endif // !SERIALGC
1003 
1004     default:
1005       { __ set_info("unimplemented entry", dont_gc_arguments);
1006         __ save_frame(0);
1007         __ set((int)id, O1);
1008         __ call_RT(noreg, noreg, CAST_FROM_FN_PTR(address, unimplemented_entry), O1);
1009         __ should_not_reach_here();
1010       }
1011       break;
1012   }
1013   return oop_maps;
1014 }
1015 
1016 
1017 OopMapSet* Runtime1::generate_handle_exception(StubID id, StubAssembler* sasm) {
1018   __ block_comment("generate_handle_exception");
1019 
1020   // Save registers, if required.
1021   OopMapSet* oop_maps = new OopMapSet();
1022   OopMap* oop_map = NULL;
1023   switch (id) {
1024   case forward_exception_id:
1025     // We're handling an exception in the context of a compiled frame.
1026     // The registers have been saved in the standard places.  Perform
1027     // an exception lookup in the caller and dispatch to the handler
1028     // if found.  Otherwise unwind and dispatch to the callers
1029     // exception handler.
1030      oop_map = generate_oop_map(sasm, true);
1031 
1032      // transfer the pending exception to the exception_oop
1033      __ ld_ptr(G2_thread, in_bytes(JavaThread::pending_exception_offset()), Oexception);
1034      __ ld_ptr(Oexception, 0, G0);
1035      __ st_ptr(G0, G2_thread, in_bytes(JavaThread::pending_exception_offset()));
1036      __ add(I7, frame::pc_return_offset, Oissuing_pc);
1037     break;
1038   case handle_exception_id:
1039     // At this point all registers MAY be live.
1040     oop_map = save_live_registers(sasm);
1041     __ mov(Oexception->after_save(),  Oexception);
1042     __ mov(Oissuing_pc->after_save(), Oissuing_pc);
1043     break;
1044   case handle_exception_from_callee_id:
1045     // At this point all registers except exception oop (Oexception)
1046     // and exception pc (Oissuing_pc) are dead.
1047     oop_map = new OopMap(frame_size_in_bytes / sizeof(jint), 0);
1048     sasm->set_frame_size(frame_size_in_bytes / BytesPerWord);
1049     __ save_frame_c1(frame_size_in_bytes);
1050     __ mov(Oexception->after_save(),  Oexception);
1051     __ mov(Oissuing_pc->after_save(), Oissuing_pc);
1052     break;
1053   default:  ShouldNotReachHere();
1054   }
1055 
1056   __ verify_not_null_oop(Oexception);
1057 
1058   // save the exception and issuing pc in the thread
1059   __ st_ptr(Oexception,  G2_thread, in_bytes(JavaThread::exception_oop_offset()));
1060   __ st_ptr(Oissuing_pc, G2_thread, in_bytes(JavaThread::exception_pc_offset()));
1061 
1062   // use the throwing pc as the return address to lookup (has bci & oop map)
1063   __ mov(Oissuing_pc, I7);
1064   __ sub(I7, frame::pc_return_offset, I7);
1065   int call_offset = __ call_RT(noreg, noreg, CAST_FROM_FN_PTR(address, exception_handler_for_pc));
1066   oop_maps->add_gc_map(call_offset, oop_map);
1067 
1068   // Note: if nmethod has been deoptimized then regardless of
1069   // whether it had a handler or not we will deoptimize
1070   // by entering the deopt blob with a pending exception.
1071 
1072   // Restore the registers that were saved at the beginning, remove
1073   // the frame and jump to the exception handler.
1074   switch (id) {
1075   case forward_exception_id:
1076   case handle_exception_id:
1077     restore_live_registers(sasm);
1078     __ jmp(O0, 0);
1079     __ delayed()->restore();
1080     break;
1081   case handle_exception_from_callee_id:
1082     // Restore SP from L7 if the exception PC is a method handle call site.
1083     __ mov(O0, G5);  // Save the target address.
1084     __ lduw(Address(G2_thread, JavaThread::is_method_handle_return_offset()), L0);
1085     __ tst(L0);  // Condition codes are preserved over the restore.
1086     __ restore();
1087 
1088     __ jmp(G5, 0);  // jump to the exception handler
1089     __ delayed()->movcc(Assembler::notZero, false, Assembler::icc, L7_mh_SP_save, SP);  // Restore SP if required.
1090     break;
1091   default:  ShouldNotReachHere();
1092   }
1093 
1094   return oop_maps;
1095 }
1096 
1097 
1098 #undef __
1099 
1100 const char *Runtime1::pd_name_for_address(address entry) {
1101   return "<unknown function>";
1102 }