1 /* 2 * Copyright (c) 2015, Oracle and/or its affiliates. All rights reserved. 3 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. 4 * 5 * This code is free software; you can redistribute it and/or modify it 6 * under the terms of the GNU General Public License version 2 only, as 7 * published by the Free Software Foundation. 8 * 9 * This code is distributed in the hope that it will be useful, but WITHOUT 10 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or 11 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License 12 * version 2 for more details (a copy is included in the LICENSE file that 13 * accompanied this code). 14 * 15 * You should have received a copy of the GNU General Public License version 16 * 2 along with this work; if not, write to the Free Software Foundation, 17 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA. 18 * 19 * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA 20 * or visit www.oracle.com if you need additional information or have any 21 * questions. 22 * 23 */ 24 25 #include "precompiled.hpp" 26 #include "interpreter/interpreter.hpp" 27 #include "oops/constMethod.hpp" 28 #include "oops/method.hpp" 29 #include "runtime/frame.inline.hpp" 30 #include "utilities/debug.hpp" 31 #include "utilities/macros.hpp" 32 33 34 int AbstractInterpreter::BasicType_as_index(BasicType type) { 35 int i = 0; 36 switch (type) { 37 case T_BOOLEAN: i = 0; break; 38 case T_CHAR : i = 1; break; 39 case T_BYTE : i = 2; break; 40 case T_SHORT : i = 3; break; 41 case T_INT : i = 4; break; 42 case T_LONG : i = 5; break; 43 case T_VOID : i = 6; break; 44 case T_FLOAT : i = 7; break; 45 case T_DOUBLE : i = 8; break; 46 case T_OBJECT : i = 9; break; 47 case T_ARRAY : i = 9; break; 48 default : ShouldNotReachHere(); 49 } 50 assert(0 <= i && i < AbstractInterpreter::number_of_result_handlers, "index out of bounds"); 51 return i; 52 } 53 54 static int size_activation_helper(int callee_extra_locals, int max_stack, int monitor_size) { 55 56 // Figure out the size of an interpreter frame (in words) given that we have a fully allocated 57 // expression stack, the callee will have callee_extra_locals (so we can account for 58 // frame extension) and monitor_size for monitors. Basically we need to calculate 59 // this exactly like generate_fixed_frame/generate_compute_interpreter_state. 60 // 61 // 62 // The big complicating thing here is that we must ensure that the stack stays properly 63 // aligned. This would be even uglier if monitor size wasn't modulo what the stack 64 // needs to be aligned for). We are given that the sp (fp) is already aligned by 65 // the caller so we must ensure that it is properly aligned for our callee. 66 // 67 const int rounded_vm_local_words = 68 round_to(frame::interpreter_frame_vm_local_words,WordsPerLong); 69 // callee_locals and max_stack are counts, not the size in frame. 70 const int locals_size = 71 round_to(callee_extra_locals * Interpreter::stackElementWords, WordsPerLong); 72 const int max_stack_words = max_stack * Interpreter::stackElementWords; 73 return (round_to((max_stack_words 74 + rounded_vm_local_words 75 + frame::memory_parameter_word_sp_offset), WordsPerLong) 76 // already rounded 77 + locals_size + monitor_size); 78 } 79 80 // How much stack a method top interpreter activation needs in words. 81 int AbstractInterpreter::size_top_interpreter_activation(Method* method) { 82 83 // See call_stub code 84 int call_stub_size = round_to(7 + frame::memory_parameter_word_sp_offset, 85 WordsPerLong); // 7 + register save area 86 87 // Save space for one monitor to get into the interpreted method in case 88 // the method is synchronized 89 int monitor_size = method->is_synchronized() ? 90 1*frame::interpreter_frame_monitor_size() : 0; 91 return size_activation_helper(method->max_locals(), method->max_stack(), 92 monitor_size) + call_stub_size; 93 } 94 95 int AbstractInterpreter::size_activation(int max_stack, 96 int temps, 97 int extra_args, 98 int monitors, 99 int callee_params, 100 int callee_locals, 101 bool is_top_frame) { 102 // Note: This calculation must exactly parallel the frame setup 103 // in InterpreterGenerator::generate_fixed_frame. 104 105 int monitor_size = monitors * frame::interpreter_frame_monitor_size(); 106 107 assert(monitor_size == round_to(monitor_size, WordsPerLong), "must align"); 108 109 // 110 // Note: if you look closely this appears to be doing something much different 111 // than generate_fixed_frame. What is happening is this. On sparc we have to do 112 // this dance with interpreter_sp_adjustment because the window save area would 113 // appear just below the bottom (tos) of the caller's java expression stack. Because 114 // the interpreter want to have the locals completely contiguous generate_fixed_frame 115 // will adjust the caller's sp for the "extra locals" (max_locals - parameter_size). 116 // Now in generate_fixed_frame the extension of the caller's sp happens in the callee. 117 // In this code the opposite occurs the caller adjusts it's own stack base on the callee. 118 // This is mostly ok but it does cause a problem when we get to the initial frame (the oldest) 119 // because the oldest frame would have adjust its callers frame and yet that frame 120 // already exists and isn't part of this array of frames we are unpacking. So at first 121 // glance this would seem to mess up that frame. However Deoptimization::fetch_unroll_info_helper() 122 // will after it calculates all of the frame's on_stack_size()'s will then figure out the 123 // amount to adjust the caller of the initial (oldest) frame and the calculation will all 124 // add up. It does seem like it simpler to account for the adjustment here (and remove the 125 // callee... parameters here). However this would mean that this routine would have to take 126 // the caller frame as input so we could adjust its sp (and set it's interpreter_sp_adjustment) 127 // and run the calling loop in the reverse order. This would also would appear to mean making 128 // this code aware of what the interactions are when that initial caller fram was an osr or 129 // other adapter frame. deoptimization is complicated enough and hard enough to debug that 130 // there is no sense in messing working code. 131 // 132 133 int rounded_cls = round_to((callee_locals - callee_params), WordsPerLong); 134 assert(rounded_cls == round_to(rounded_cls, WordsPerLong), "must align"); 135 136 int raw_frame_size = size_activation_helper(rounded_cls, max_stack, monitor_size); 137 138 return raw_frame_size; 139 } 140 141 void AbstractInterpreter::layout_activation(Method* method, 142 int tempcount, 143 int popframe_extra_args, 144 int moncount, 145 int caller_actual_parameters, 146 int callee_param_count, 147 int callee_local_count, 148 frame* caller, 149 frame* interpreter_frame, 150 bool is_top_frame, 151 bool is_bottom_frame) { 152 // Set up the following variables: 153 // - Lmethod 154 // - Llocals 155 // - Lmonitors (to the indicated number of monitors) 156 // - Lesp (to the indicated number of temps) 157 // The frame caller on entry is a description of the caller of the 158 // frame we are about to layout. We are guaranteed that we will be 159 // able to fill in a new interpreter frame as its callee (i.e. the 160 // stack space is allocated and the amount was determined by an 161 // earlier call to the size_activation() method). On return caller 162 // while describe the interpreter frame we just layed out. 163 164 // The skeleton frame must already look like an interpreter frame 165 // even if not fully filled out. 166 assert(interpreter_frame->is_interpreted_frame(), "Must be interpreted frame"); 167 168 int rounded_vm_local_words = round_to(frame::interpreter_frame_vm_local_words,WordsPerLong); 169 int monitor_size = moncount * frame::interpreter_frame_monitor_size(); 170 assert(monitor_size == round_to(monitor_size, WordsPerLong), "must align"); 171 172 intptr_t* fp = interpreter_frame->fp(); 173 174 JavaThread* thread = JavaThread::current(); 175 RegisterMap map(thread, false); 176 // More verification that skeleton frame is properly walkable 177 assert(fp == caller->sp(), "fp must match"); 178 179 intptr_t* montop = fp - rounded_vm_local_words; 180 181 // preallocate monitors (cf. __ add_monitor_to_stack) 182 intptr_t* monitors = montop - monitor_size; 183 184 // preallocate stack space 185 intptr_t* esp = monitors - 1 - 186 (tempcount * Interpreter::stackElementWords) - 187 popframe_extra_args; 188 189 int local_words = method->max_locals() * Interpreter::stackElementWords; 190 NEEDS_CLEANUP; 191 intptr_t* locals; 192 if (caller->is_interpreted_frame()) { 193 // Can force the locals area to end up properly overlapping the top of the expression stack. 194 intptr_t* Lesp_ptr = caller->interpreter_frame_tos_address() - 1; 195 // Note that this computation means we replace size_of_parameters() values from the caller 196 // interpreter frame's expression stack with our argument locals 197 int parm_words = caller_actual_parameters * Interpreter::stackElementWords; 198 locals = Lesp_ptr + parm_words; 199 int delta = local_words - parm_words; 200 int computed_sp_adjustment = (delta > 0) ? round_to(delta, WordsPerLong) : 0; 201 *interpreter_frame->register_addr(I5_savedSP) = (intptr_t) (fp + computed_sp_adjustment) - STACK_BIAS; 202 if (!is_bottom_frame) { 203 // Llast_SP is set below for the current frame to SP (with the 204 // extra space for the callee's locals). Here we adjust 205 // Llast_SP for the caller's frame, removing the extra space 206 // for the current method's locals. 207 *caller->register_addr(Llast_SP) = *interpreter_frame->register_addr(I5_savedSP); 208 } else { 209 assert(*caller->register_addr(Llast_SP) >= *interpreter_frame->register_addr(I5_savedSP), "strange Llast_SP"); 210 } 211 } else { 212 assert(caller->is_compiled_frame() || caller->is_entry_frame(), "only possible cases"); 213 // Don't have Lesp available; lay out locals block in the caller 214 // adjacent to the register window save area. 215 // 216 // Compiled frames do not allocate a varargs area which is why this if 217 // statement is needed. 218 // 219 if (caller->is_compiled_frame()) { 220 locals = fp + frame::register_save_words + local_words - 1; 221 } else { 222 locals = fp + frame::memory_parameter_word_sp_offset + local_words - 1; 223 } 224 if (!caller->is_entry_frame()) { 225 // Caller wants his own SP back 226 int caller_frame_size = caller->cb()->frame_size(); 227 *interpreter_frame->register_addr(I5_savedSP) = (intptr_t)(caller->fp() - caller_frame_size) - STACK_BIAS; 228 } 229 } 230 if (TraceDeoptimization) { 231 if (caller->is_entry_frame()) { 232 // make sure I5_savedSP and the entry frames notion of saved SP 233 // agree. This assertion duplicate a check in entry frame code 234 // but catches the failure earlier. 235 assert(*caller->register_addr(Lscratch) == *interpreter_frame->register_addr(I5_savedSP), 236 "would change callers SP"); 237 } 238 if (caller->is_entry_frame()) { 239 tty->print("entry "); 240 } 241 if (caller->is_compiled_frame()) { 242 tty->print("compiled "); 243 if (caller->is_deoptimized_frame()) { 244 tty->print("(deopt) "); 245 } 246 } 247 if (caller->is_interpreted_frame()) { 248 tty->print("interpreted "); 249 } 250 tty->print_cr("caller fp=" INTPTR_FORMAT " sp=" INTPTR_FORMAT, p2i(caller->fp()), p2i(caller->sp())); 251 tty->print_cr("save area = " INTPTR_FORMAT ", " INTPTR_FORMAT, p2i(caller->sp()), p2i(caller->sp() + 16)); 252 tty->print_cr("save area = " INTPTR_FORMAT ", " INTPTR_FORMAT, p2i(caller->fp()), p2i(caller->fp() + 16)); 253 tty->print_cr("interpreter fp=" INTPTR_FORMAT ", " INTPTR_FORMAT, p2i(interpreter_frame->fp()), p2i(interpreter_frame->sp())); 254 tty->print_cr("save area = " INTPTR_FORMAT ", " INTPTR_FORMAT, p2i(interpreter_frame->sp()), p2i(interpreter_frame->sp() + 16)); 255 tty->print_cr("save area = " INTPTR_FORMAT ", " INTPTR_FORMAT, p2i(interpreter_frame->fp()), p2i(interpreter_frame->fp() + 16)); 256 tty->print_cr("Llocals = " INTPTR_FORMAT, p2i(locals)); 257 tty->print_cr("Lesp = " INTPTR_FORMAT, p2i(esp)); 258 tty->print_cr("Lmonitors = " INTPTR_FORMAT, p2i(monitors)); 259 } 260 261 if (method->max_locals() > 0) { 262 assert(locals < caller->sp() || locals >= (caller->sp() + 16), "locals in save area"); 263 assert(locals < caller->fp() || locals > (caller->fp() + 16), "locals in save area"); 264 assert(locals < interpreter_frame->sp() || locals > (interpreter_frame->sp() + 16), "locals in save area"); 265 assert(locals < interpreter_frame->fp() || locals >= (interpreter_frame->fp() + 16), "locals in save area"); 266 } 267 #ifdef _LP64 268 assert(*interpreter_frame->register_addr(I5_savedSP) & 1, "must be odd"); 269 #endif 270 271 *interpreter_frame->register_addr(Lmethod) = (intptr_t) method; 272 *interpreter_frame->register_addr(Llocals) = (intptr_t) locals; 273 *interpreter_frame->register_addr(Lmonitors) = (intptr_t) monitors; 274 *interpreter_frame->register_addr(Lesp) = (intptr_t) esp; 275 // Llast_SP will be same as SP as there is no adapter space 276 *interpreter_frame->register_addr(Llast_SP) = (intptr_t) interpreter_frame->sp() - STACK_BIAS; 277 *interpreter_frame->register_addr(LcpoolCache) = (intptr_t) method->constants()->cache(); 278 #ifdef FAST_DISPATCH 279 *interpreter_frame->register_addr(IdispatchTables) = (intptr_t) Interpreter::dispatch_table(); 280 #endif 281 282 283 #ifdef ASSERT 284 BasicObjectLock* mp = (BasicObjectLock*)monitors; 285 286 assert(interpreter_frame->interpreter_frame_method() == method, "method matches"); 287 assert(interpreter_frame->interpreter_frame_local_at(9) == (intptr_t *)((intptr_t)locals - (9 * Interpreter::stackElementSize)), "locals match"); 288 assert(interpreter_frame->interpreter_frame_monitor_end() == mp, "monitor_end matches"); 289 assert(((intptr_t *)interpreter_frame->interpreter_frame_monitor_begin()) == ((intptr_t *)mp)+monitor_size, "monitor_begin matches"); 290 assert(interpreter_frame->interpreter_frame_tos_address()-1 == esp, "esp matches"); 291 292 // check bounds 293 intptr_t* lo = interpreter_frame->sp() + (frame::memory_parameter_word_sp_offset - 1); 294 intptr_t* hi = interpreter_frame->fp() - rounded_vm_local_words; 295 assert(lo < monitors && montop <= hi, "monitors in bounds"); 296 assert(lo <= esp && esp < monitors, "esp in bounds"); 297 #endif // ASSERT 298 } 299