1 /*
   2  * Copyright (c) 2004, 2010, Oracle and/or its affiliates. All rights reserved.
   3  * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
   4  *
   5  * This code is free software; you can redistribute it and/or modify it
   6  * under the terms of the GNU General Public License version 2 only, as
   7  * published by the Free Software Foundation.
   8  *
   9  * This code is distributed in the hope that it will be useful, but WITHOUT
  10  * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
  11  * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
  12  * version 2 for more details (a copy is included in the LICENSE file that
  13  * accompanied this code).
  14  *
  15  * You should have received a copy of the GNU General Public License version
  16  * 2 along with this work; if not, write to the Free Software Foundation,
  17  * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
  18  *
  19  * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
  20  * or visit www.oracle.com if you need additional information or have any
  21  * questions.
  22  *
  23  */
  24 
  25 #include "precompiled.hpp"
  26 #include "asm/macroAssembler.hpp"
  27 #include "memory/resourceArea.hpp"
  28 #include "prims/jniFastGetField.hpp"
  29 #include "prims/jvm_misc.hpp"
  30 #include "runtime/safepoint.hpp"
  31 
// Shorthand used by the generators below: "__ insn(...)" expands to
// "masm->insn(...)", so emitted instructions read like an assembly listing.
#define __ masm->

// Multiplied by wordSize to give the size requested from BufferBlob::create()
// for each generated stub.
#define BUFFER_SIZE 30
  35 
#ifdef _WINDOWS
// Definitions of the per-type function pointers used on Windows. Each
// generator in this file stores its generated entry point in the matching
// pointer and then returns os::win32::fast_jni_accessor_wrapper(type) instead
// of the raw entry.
GetBooleanField_t JNI_FastGetField::jni_fast_GetBooleanField_fp;
GetByteField_t    JNI_FastGetField::jni_fast_GetByteField_fp;
GetCharField_t    JNI_FastGetField::jni_fast_GetCharField_fp;
GetShortField_t   JNI_FastGetField::jni_fast_GetShortField_fp;
GetIntField_t     JNI_FastGetField::jni_fast_GetIntField_fp;
GetLongField_t    JNI_FastGetField::jni_fast_GetLongField_fp;
GetFloatField_t   JNI_FastGetField::jni_fast_GetFloatField_fp;
GetDoubleField_t  JNI_FastGetField::jni_fast_GetDoubleField_fp;
#endif
  46 
// Instead of issuing an lfence as a LoadLoad barrier, we create a data
// dependency between the loads, which is much more efficient than an lfence.
  49 
  50 address JNI_FastGetField::generate_fast_get_int_field0(BasicType type) {
  51   const char *name;
  52   switch (type) {
  53     case T_BOOLEAN: name = "jni_fast_GetBooleanField"; break;
  54     case T_BYTE:    name = "jni_fast_GetByteField";    break;
  55     case T_CHAR:    name = "jni_fast_GetCharField";    break;
  56     case T_SHORT:   name = "jni_fast_GetShortField";   break;
  57     case T_INT:     name = "jni_fast_GetIntField";     break;
  58     default:        ShouldNotReachHere();
  59   }
  60   ResourceMark rm;
  61   BufferBlob* blob = BufferBlob::create(name, BUFFER_SIZE*wordSize);
  62   CodeBuffer cbuf(blob);
  63   MacroAssembler* masm = new MacroAssembler(&cbuf);
  64   address fast_entry = __ pc();
  65 
  66   Label slow;
  67 
  68   // stack layout:    offset from rsp (in words):
  69   //  return pc        0
  70   //  jni env          1
  71   //  obj              2
  72   //  jfieldID         3
  73 
  74   ExternalAddress counter(SafepointSynchronize::safepoint_counter_addr());
  75   __ mov32 (rcx, counter);
  76   __ testb (rcx, 1);
  77   __ jcc (Assembler::notZero, slow);
  78   if (os::is_MP()) {
  79     __ mov(rax, rcx);
  80     __ andptr(rax, 1);                         // rax, must end up 0
  81     __ movptr(rdx, Address(rsp, rax, Address::times_1, 2*wordSize));
  82                                               // obj, notice rax, is 0.
  83                                               // rdx is data dependent on rcx.
  84   } else {
  85     __ movptr (rdx, Address(rsp, 2*wordSize));  // obj
  86   }
  87   __ movptr(rax, Address(rsp, 3*wordSize));  // jfieldID
  88   __ movptr(rdx, Address(rdx, 0));           // *obj
  89   __ shrptr (rax, 2);                         // offset
  90 
  91   assert(count < LIST_CAPACITY, "LIST_CAPACITY too small");
  92   speculative_load_pclist[count] = __ pc();
  93   switch (type) {
  94     case T_BOOLEAN: __ movzbl (rax, Address(rdx, rax, Address::times_1)); break;
  95     case T_BYTE:    __ movsbl (rax, Address(rdx, rax, Address::times_1)); break;
  96     case T_CHAR:    __ movzwl (rax, Address(rdx, rax, Address::times_1)); break;
  97     case T_SHORT:   __ movswl (rax, Address(rdx, rax, Address::times_1)); break;
  98     case T_INT:     __ movl   (rax, Address(rdx, rax, Address::times_1)); break;
  99     default:        ShouldNotReachHere();
 100   }
 101 
 102   Address ca1;
 103   if (os::is_MP()) {
 104     __ lea(rdx, counter);
 105     __ xorptr(rdx, rax);
 106     __ xorptr(rdx, rax);
 107     __ cmp32(rcx, Address(rdx, 0));
 108     // ca1 is the same as ca because
 109     // rax, ^ counter_addr ^ rax, = address
 110     // ca1 is data dependent on rax,.
 111   } else {
 112     __ cmp32(rcx, counter);
 113   }
 114   __ jcc (Assembler::notEqual, slow);
 115 
 116 #ifndef _WINDOWS
 117   __ ret (0);
 118 #else
 119   // __stdcall calling convention
 120   __ ret (3*wordSize);
 121 #endif
 122 
 123   slowcase_entry_pclist[count++] = __ pc();
 124   __ bind (slow);
 125   address slow_case_addr;
 126   switch (type) {
 127     case T_BOOLEAN: slow_case_addr = jni_GetBooleanField_addr(); break;
 128     case T_BYTE:    slow_case_addr = jni_GetByteField_addr();    break;
 129     case T_CHAR:    slow_case_addr = jni_GetCharField_addr();    break;
 130     case T_SHORT:   slow_case_addr = jni_GetShortField_addr();   break;
 131     case T_INT:     slow_case_addr = jni_GetIntField_addr();
 132   }
 133   // tail call
 134   __ jump (ExternalAddress(slow_case_addr));
 135 
 136   __ flush ();
 137 
 138 #ifndef _WINDOWS
 139   return fast_entry;
 140 #else
 141   switch (type) {
 142   case T_BOOLEAN: jni_fast_GetBooleanField_fp = (GetBooleanField_t) fast_entry; break;
 143   case T_BYTE:    jni_fast_GetByteField_fp    = (GetByteField_t)    fast_entry; break;
 144   case T_CHAR:    jni_fast_GetCharField_fp    = (GetCharField_t)    fast_entry; break;
 145   case T_SHORT:   jni_fast_GetShortField_fp   = (GetShortField_t)   fast_entry; break;
 146   case T_INT:     jni_fast_GetIntField_fp     = (GetIntField_t)     fast_entry; break;
 147   }
 148   return os::win32::fast_jni_accessor_wrapper(type);
 149 #endif
 150 }
 151 
// Generates the fast accessor stub for boolean fields by delegating to the
// shared integer-family generator with T_BOOLEAN.
address JNI_FastGetField::generate_fast_get_boolean_field() {
  return generate_fast_get_int_field0(T_BOOLEAN);
}
 155 
// Generates the fast accessor stub for byte fields by delegating to the
// shared integer-family generator with T_BYTE.
address JNI_FastGetField::generate_fast_get_byte_field() {
  return generate_fast_get_int_field0(T_BYTE);
}
 159 
// Generates the fast accessor stub for char fields by delegating to the
// shared integer-family generator with T_CHAR.
address JNI_FastGetField::generate_fast_get_char_field() {
  return generate_fast_get_int_field0(T_CHAR);
}
 163 
// Generates the fast accessor stub for short fields by delegating to the
// shared integer-family generator with T_SHORT.
address JNI_FastGetField::generate_fast_get_short_field() {
  return generate_fast_get_int_field0(T_SHORT);
}
 167 
// Generates the fast accessor stub for int fields by delegating to the
// shared integer-family generator with T_INT.
address JNI_FastGetField::generate_fast_get_int_field() {
  return generate_fast_get_int_field0(T_INT);
}
 171 
 172 address JNI_FastGetField::generate_fast_get_long_field() {
 173   const char *name = "jni_fast_GetLongField";
 174   ResourceMark rm;
 175   BufferBlob* blob = BufferBlob::create(name, BUFFER_SIZE*wordSize);
 176   CodeBuffer cbuf(blob);
 177   MacroAssembler* masm = new MacroAssembler(&cbuf);
 178   address fast_entry = __ pc();
 179 
 180   Label slow;
 181 
 182   // stack layout:    offset from rsp (in words):
 183   //  old rsi          0
 184   //  return pc        1
 185   //  jni env          2
 186   //  obj              3
 187   //  jfieldID         4
 188 
 189   ExternalAddress counter(SafepointSynchronize::safepoint_counter_addr());
 190 
 191   __ push  (rsi);
 192   __ mov32 (rcx, counter);
 193   __ testb (rcx, 1);
 194   __ jcc (Assembler::notZero, slow);
 195   if (os::is_MP()) {
 196     __ mov(rax, rcx);
 197     __ andptr(rax, 1);                         // rax, must end up 0
 198     __ movptr(rdx, Address(rsp, rax, Address::times_1, 3*wordSize));
 199                                               // obj, notice rax, is 0.
 200                                               // rdx is data dependent on rcx.
 201   } else {
 202     __ movptr(rdx, Address(rsp, 3*wordSize));  // obj
 203   }
 204   __ movptr(rsi, Address(rsp, 4*wordSize));  // jfieldID
 205   __ movptr(rdx, Address(rdx, 0));           // *obj
 206   __ shrptr(rsi, 2);                         // offset
 207 
 208   assert(count < LIST_CAPACITY-1, "LIST_CAPACITY too small");
 209   speculative_load_pclist[count++] = __ pc();
 210   __ movptr(rax, Address(rdx, rsi, Address::times_1));
 211 #ifndef _LP64
 212   speculative_load_pclist[count] = __ pc();
 213   __ movl(rdx, Address(rdx, rsi, Address::times_1, 4));
 214 #endif // _LP64
 215 
 216   if (os::is_MP()) {
 217     __ lea(rsi, counter);
 218     __ xorptr(rsi, rdx);
 219     __ xorptr(rsi, rax);
 220     __ xorptr(rsi, rdx);
 221     __ xorptr(rsi, rax);
 222     __ cmp32(rcx, Address(rsi, 0));
 223     // ca1 is the same as ca because
 224     // rax, ^ rdx ^ counter_addr ^ rax, ^ rdx = address
 225     // ca1 is data dependent on both rax, and rdx.
 226   } else {
 227     __ cmp32(rcx, counter);
 228   }
 229   __ jcc (Assembler::notEqual, slow);
 230 
 231   __ pop (rsi);
 232 
 233 #ifndef _WINDOWS
 234   __ ret (0);
 235 #else
 236   // __stdcall calling convention
 237   __ ret (3*wordSize);
 238 #endif
 239 
 240   slowcase_entry_pclist[count-1] = __ pc();
 241   slowcase_entry_pclist[count++] = __ pc();
 242   __ bind (slow);
 243   __ pop  (rsi);
 244   address slow_case_addr = jni_GetLongField_addr();;
 245   // tail call
 246   __ jump (ExternalAddress(slow_case_addr));
 247 
 248   __ flush ();
 249 
 250 #ifndef _WINDOWS
 251   return fast_entry;
 252 #else
 253   jni_fast_GetLongField_fp = (GetLongField_t) fast_entry;
 254   return os::win32::fast_jni_accessor_wrapper(T_LONG);
 255 #endif
 256 }
 257 
 258 address JNI_FastGetField::generate_fast_get_float_field0(BasicType type) {
 259   const char *name;
 260   switch (type) {
 261     case T_FLOAT:  name = "jni_fast_GetFloatField";  break;
 262     case T_DOUBLE: name = "jni_fast_GetDoubleField"; break;
 263     default:       ShouldNotReachHere();
 264   }
 265   ResourceMark rm;
 266   BufferBlob* blob = BufferBlob::create(name, BUFFER_SIZE*wordSize);
 267   CodeBuffer cbuf(blob);
 268   MacroAssembler* masm = new MacroAssembler(&cbuf);
 269   address fast_entry = __ pc();
 270 
 271   Label slow_with_pop, slow;
 272 
 273   // stack layout:    offset from rsp (in words):
 274   //  return pc        0
 275   //  jni env          1
 276   //  obj              2
 277   //  jfieldID         3
 278 
 279   ExternalAddress counter(SafepointSynchronize::safepoint_counter_addr());
 280 
 281   __ mov32 (rcx, counter);
 282   __ testb (rcx, 1);
 283   __ jcc (Assembler::notZero, slow);
 284   if (os::is_MP()) {
 285     __ mov(rax, rcx);
 286     __ andptr(rax, 1);                         // rax, must end up 0
 287     __ movptr(rdx, Address(rsp, rax, Address::times_1, 2*wordSize));
 288                                               // obj, notice rax, is 0.
 289                                               // rdx is data dependent on rcx.
 290   } else {
 291     __ movptr(rdx, Address(rsp, 2*wordSize)); // obj
 292   }
 293   __ movptr(rax, Address(rsp, 3*wordSize));  // jfieldID
 294   __ movptr(rdx, Address(rdx, 0));           // *obj
 295   __ shrptr(rax, 2);                         // offset
 296 
 297   assert(count < LIST_CAPACITY, "LIST_CAPACITY too small");
 298   speculative_load_pclist[count] = __ pc();
 299   switch (type) {
 300 #ifndef _LP64
 301     case T_FLOAT:  __ fld_s (Address(rdx, rax, Address::times_1)); break;
 302     case T_DOUBLE: __ fld_d (Address(rdx, rax, Address::times_1)); break;
 303 #else
 304     case T_FLOAT:  __ movflt (xmm0, Address(robj, roffset, Address::times_1)); break;
 305     case T_DOUBLE: __ movdbl (xmm0, Address(robj, roffset, Address::times_1)); break;
 306 #endif // _LP64
 307     default:       ShouldNotReachHere();
 308   }
 309 
 310   Address ca1;
 311   if (os::is_MP()) {
 312     __ fst_s (Address(rsp, -4));
 313     __ lea(rdx, counter);
 314     __ movl (rax, Address(rsp, -4));
 315     // garbage hi-order bits on 64bit are harmless.
 316     __ xorptr(rdx, rax);
 317     __ xorptr(rdx, rax);
 318     __ cmp32(rcx, Address(rdx, 0));
 319                                           // rax, ^ counter_addr ^ rax, = address
 320                                           // ca1 is data dependent on the field
 321                                           // access.
 322   } else {
 323     __ cmp32(rcx, counter);
 324   }
 325   __ jcc (Assembler::notEqual, slow_with_pop);
 326 
 327 #ifndef _WINDOWS
 328   __ ret (0);
 329 #else
 330   // __stdcall calling convention
 331   __ ret (3*wordSize);
 332 #endif
 333 
 334   __ bind (slow_with_pop);
 335   // invalid load. pop FPU stack.
 336   __ fstp_d (0);
 337 
 338   slowcase_entry_pclist[count++] = __ pc();
 339   __ bind (slow);
 340   address slow_case_addr;
 341   switch (type) {
 342     case T_FLOAT:  slow_case_addr = jni_GetFloatField_addr();  break;
 343     case T_DOUBLE: slow_case_addr = jni_GetDoubleField_addr(); break;
 344     default:       ShouldNotReachHere();
 345   }
 346   // tail call
 347   __ jump (ExternalAddress(slow_case_addr));
 348 
 349   __ flush ();
 350 
 351 #ifndef _WINDOWS
 352   return fast_entry;
 353 #else
 354   switch (type) {
 355   case T_FLOAT:  jni_fast_GetFloatField_fp  = (GetFloatField_t)  fast_entry; break;
 356   case T_DOUBLE: jni_fast_GetDoubleField_fp = (GetDoubleField_t) fast_entry; break;
 357   }
 358   return os::win32::fast_jni_accessor_wrapper(type);
 359 #endif
 360 }
 361 
// Generates the fast accessor stub for float fields by delegating to the
// shared floating-point generator with T_FLOAT.
address JNI_FastGetField::generate_fast_get_float_field() {
  return generate_fast_get_float_field0(T_FLOAT);
}
 365 
// Generates the fast accessor stub for double fields by delegating to the
// shared floating-point generator with T_DOUBLE.
address JNI_FastGetField::generate_fast_get_double_field() {
  return generate_fast_get_float_field0(T_DOUBLE);
}