1 /*
2  * Copyright (c) 2004, 2020, Oracle and/or its affiliates. All rights reserved.
3  * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
4  *
5  * This code is free software; you can redistribute it and/or modify it
6  * under the terms of the GNU General Public License version 2 only, as
7  * published by the Free Software Foundation.
8  *
9  * This code is distributed in the hope that it will be useful, but WITHOUT
10  * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
11  * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
12  * version 2 for more details (a copy is included in the LICENSE file that
13  * accompanied this code).
14  *
15  * You should have received a copy of the GNU General Public License version
16  * 2 along with this work; if not, write to the Free Software Foundation,
17  * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
18  *
19  * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
20  * or visit www.oracle.com if you need additional information or have any
21  * questions.
22  *
23  */
24 
25 #include "precompiled.hpp"
26 #include "asm/macroAssembler.hpp"
27 #include "memory/resourceArea.hpp"
28 #include "prims/jniFastGetField.hpp"
29 #include "prims/jvm_misc.hpp"
30 #include "prims/jvmtiExport.hpp"
31 #include "runtime/safepoint.hpp"
32 #include "runtime/stubRoutines.hpp"
33 
// Assembler shorthand: "__ insn(...)" expands to "masm->insn(...)". Every
// generator in this file declares a local MacroAssembler* named masm.
#define __ masm->

// Size, in machine words, of the BufferBlob allocated for each generated stub
// (the generators pass BUFFER_SIZE*wordSize to BufferBlob::create).
#define BUFFER_SIZE 30
37 
#ifdef _WINDOWS
// Definitions of the per-type function pointers that receive the generated
// fast-path entry points. On Windows the generators in this file store
// fast_entry here and return os::win32::fast_jni_accessor_wrapper(type)
// to their caller instead of the raw entry address.
GetBooleanField_t JNI_FastGetField::jni_fast_GetBooleanField_fp;
GetByteField_t    JNI_FastGetField::jni_fast_GetByteField_fp;
GetCharField_t    JNI_FastGetField::jni_fast_GetCharField_fp;
GetShortField_t   JNI_FastGetField::jni_fast_GetShortField_fp;
GetIntField_t     JNI_FastGetField::jni_fast_GetIntField_fp;
GetLongField_t    JNI_FastGetField::jni_fast_GetLongField_fp;
GetFloatField_t   JNI_FastGetField::jni_fast_GetFloatField_fp;
GetDoubleField_t  JNI_FastGetField::jni_fast_GetDoubleField_fp;
#endif
48 
// Instead of issuing an lfence as a LoadLoad barrier, the generated stubs
// create a data dependency between consecutive loads, which is much more
// efficient than an lfence.
51 
generate_fast_get_int_field0(BasicType type)52 address JNI_FastGetField::generate_fast_get_int_field0(BasicType type) {
53   const char *name = NULL;
54   switch (type) {
55     case T_BOOLEAN: name = "jni_fast_GetBooleanField"; break;
56     case T_BYTE:    name = "jni_fast_GetByteField";    break;
57     case T_CHAR:    name = "jni_fast_GetCharField";    break;
58     case T_SHORT:   name = "jni_fast_GetShortField";   break;
59     case T_INT:     name = "jni_fast_GetIntField";     break;
60     default:        ShouldNotReachHere();
61   }
62   ResourceMark rm;
63   BufferBlob* blob = BufferBlob::create(name, BUFFER_SIZE*wordSize);
64   CodeBuffer cbuf(blob);
65   MacroAssembler* masm = new MacroAssembler(&cbuf);
66   address fast_entry = __ pc();
67 
68   Label slow;
69 
70   // stack layout:    offset from rsp (in words):
71   //  return pc        0
72   //  jni env          1
73   //  obj              2
74   //  jfieldID         3
75 
76   ExternalAddress counter(SafepointSynchronize::safepoint_counter_addr());
77   __ mov32 (rcx, counter);
78   __ testb (rcx, 1);
79   __ jcc (Assembler::notZero, slow);
80 
81   if (JvmtiExport::can_post_field_access()) {
82     // Check to see if a field access watch has been set before we
83     // take the fast path.
84     __ cmp32(ExternalAddress((address) JvmtiExport::get_field_access_count_addr()), 0);
85     __ jcc(Assembler::notZero, slow);
86   }
87 
88   __ mov(rax, rcx);
89   __ andptr(rax, 1);                         // rax, must end up 0
90   __ movptr(rdx, Address(rsp, rax, Address::times_1, 2*wordSize));
91                                             // obj, notice rax, is 0.
92                                             // rdx is data dependent on rcx.
93   __ movptr(rax, Address(rsp, 3*wordSize));  // jfieldID
94 
95   __ clear_jweak_tag(rdx);
96 
97   __ movptr(rdx, Address(rdx, 0));           // *obj
98   __ shrptr (rax, 2);                         // offset
99 
100   assert(count < LIST_CAPACITY, "LIST_CAPACITY too small");
101   speculative_load_pclist[count] = __ pc();
102   switch (type) {
103     case T_BOOLEAN: __ movzbl (rax, Address(rdx, rax, Address::times_1)); break;
104     case T_BYTE:    __ movsbl (rax, Address(rdx, rax, Address::times_1)); break;
105     case T_CHAR:    __ movzwl (rax, Address(rdx, rax, Address::times_1)); break;
106     case T_SHORT:   __ movswl (rax, Address(rdx, rax, Address::times_1)); break;
107     case T_INT:     __ movl   (rax, Address(rdx, rax, Address::times_1)); break;
108     default:        ShouldNotReachHere();
109   }
110 
111   Address ca1;
112   __ lea(rdx, counter);
113   __ xorptr(rdx, rax);
114   __ xorptr(rdx, rax);
115   __ cmp32(rcx, Address(rdx, 0));
116   // ca1 is the same as ca because
117   // rax, ^ counter_addr ^ rax, = address
118   // ca1 is data dependent on rax,.
119   __ jcc (Assembler::notEqual, slow);
120 
121 #ifndef _WINDOWS
122   __ ret (0);
123 #else
124   // __stdcall calling convention
125   __ ret (3*wordSize);
126 #endif
127 
128   slowcase_entry_pclist[count++] = __ pc();
129   __ bind (slow);
130   address slow_case_addr = NULL;
131   switch (type) {
132     case T_BOOLEAN: slow_case_addr = jni_GetBooleanField_addr(); break;
133     case T_BYTE:    slow_case_addr = jni_GetByteField_addr();    break;
134     case T_CHAR:    slow_case_addr = jni_GetCharField_addr();    break;
135     case T_SHORT:   slow_case_addr = jni_GetShortField_addr();   break;
136     case T_INT:     slow_case_addr = jni_GetIntField_addr();     break;
137     default:        ShouldNotReachHere();
138   }
139   // tail call
140   __ jump (ExternalAddress(slow_case_addr));
141 
142   __ flush ();
143 
144 #ifndef _WINDOWS
145   return fast_entry;
146 #else
147   switch (type) {
148   case T_BOOLEAN: jni_fast_GetBooleanField_fp = (GetBooleanField_t) fast_entry; break;
149   case T_BYTE:    jni_fast_GetByteField_fp    = (GetByteField_t)    fast_entry; break;
150   case T_CHAR:    jni_fast_GetCharField_fp    = (GetCharField_t)    fast_entry; break;
151   case T_SHORT:   jni_fast_GetShortField_fp   = (GetShortField_t)   fast_entry; break;
152   case T_INT:     jni_fast_GetIntField_fp     = (GetIntField_t)     fast_entry; break;
153   }
154   return os::win32::fast_jni_accessor_wrapper(type);
155 #endif
156 }
157 
generate_fast_get_boolean_field()158 address JNI_FastGetField::generate_fast_get_boolean_field() {
159   return generate_fast_get_int_field0(T_BOOLEAN);
160 }
161 
generate_fast_get_byte_field()162 address JNI_FastGetField::generate_fast_get_byte_field() {
163   return generate_fast_get_int_field0(T_BYTE);
164 }
165 
generate_fast_get_char_field()166 address JNI_FastGetField::generate_fast_get_char_field() {
167   return generate_fast_get_int_field0(T_CHAR);
168 }
169 
generate_fast_get_short_field()170 address JNI_FastGetField::generate_fast_get_short_field() {
171   return generate_fast_get_int_field0(T_SHORT);
172 }
173 
generate_fast_get_int_field()174 address JNI_FastGetField::generate_fast_get_int_field() {
175   return generate_fast_get_int_field0(T_INT);
176 }
177 
generate_fast_get_long_field()178 address JNI_FastGetField::generate_fast_get_long_field() {
179   const char *name = "jni_fast_GetLongField";
180   ResourceMark rm;
181   BufferBlob* blob = BufferBlob::create(name, BUFFER_SIZE*wordSize);
182   CodeBuffer cbuf(blob);
183   MacroAssembler* masm = new MacroAssembler(&cbuf);
184   address fast_entry = __ pc();
185 
186   Label slow;
187 
188   // stack layout:    offset from rsp (in words):
189   //  old rsi          0
190   //  return pc        1
191   //  jni env          2
192   //  obj              3
193   //  jfieldID         4
194 
195   ExternalAddress counter(SafepointSynchronize::safepoint_counter_addr());
196 
197   __ push  (rsi);
198   __ mov32 (rcx, counter);
199   __ testb (rcx, 1);
200   __ jcc (Assembler::notZero, slow);
201 
202   if (JvmtiExport::can_post_field_access()) {
203     // Check to see if a field access watch has been set before we
204     // take the fast path.
205     __ cmp32(ExternalAddress((address) JvmtiExport::get_field_access_count_addr()), 0);
206     __ jcc(Assembler::notZero, slow);
207   }
208 
209   __ mov(rax, rcx);
210   __ andptr(rax, 1);                         // rax, must end up 0
211   __ movptr(rdx, Address(rsp, rax, Address::times_1, 3*wordSize));
212                                             // obj, notice rax, is 0.
213                                             // rdx is data dependent on rcx.
214   __ movptr(rsi, Address(rsp, 4*wordSize));  // jfieldID
215 
216   __ clear_jweak_tag(rdx);
217 
218   __ movptr(rdx, Address(rdx, 0));           // *obj
219   __ shrptr(rsi, 2);                         // offset
220 
221   assert(count < LIST_CAPACITY-1, "LIST_CAPACITY too small");
222   speculative_load_pclist[count++] = __ pc();
223   __ movptr(rax, Address(rdx, rsi, Address::times_1));
224 #ifndef _LP64
225   speculative_load_pclist[count] = __ pc();
226   __ movl(rdx, Address(rdx, rsi, Address::times_1, 4));
227 #endif // _LP64
228 
229   __ lea(rsi, counter);
230   __ xorptr(rsi, rdx);
231   __ xorptr(rsi, rax);
232   __ xorptr(rsi, rdx);
233   __ xorptr(rsi, rax);
234   __ cmp32(rcx, Address(rsi, 0));
235   // ca1 is the same as ca because
236   // rax, ^ rdx ^ counter_addr ^ rax, ^ rdx = address
237   // ca1 is data dependent on both rax, and rdx.
238   __ jcc (Assembler::notEqual, slow);
239 
240   __ pop (rsi);
241 
242 #ifndef _WINDOWS
243   __ ret (0);
244 #else
245   // __stdcall calling convention
246   __ ret (3*wordSize);
247 #endif
248 
249   slowcase_entry_pclist[count-1] = __ pc();
250   slowcase_entry_pclist[count++] = __ pc();
251   __ bind (slow);
252   __ pop  (rsi);
253   address slow_case_addr = jni_GetLongField_addr();;
254   // tail call
255   __ jump (ExternalAddress(slow_case_addr));
256 
257   __ flush ();
258 
259 #ifndef _WINDOWS
260   return fast_entry;
261 #else
262   jni_fast_GetLongField_fp = (GetLongField_t) fast_entry;
263   return os::win32::fast_jni_accessor_wrapper(T_LONG);
264 #endif
265 }
266 
generate_fast_get_float_field0(BasicType type)267 address JNI_FastGetField::generate_fast_get_float_field0(BasicType type) {
268   const char *name = NULL;
269   switch (type) {
270     case T_FLOAT:  name = "jni_fast_GetFloatField";  break;
271     case T_DOUBLE: name = "jni_fast_GetDoubleField"; break;
272     default:       ShouldNotReachHere();
273   }
274   ResourceMark rm;
275   BufferBlob* blob = BufferBlob::create(name, BUFFER_SIZE*wordSize);
276   CodeBuffer cbuf(blob);
277   MacroAssembler* masm = new MacroAssembler(&cbuf);
278   address fast_entry = __ pc();
279 
280   Label slow_with_pop, slow;
281 
282   // stack layout:    offset from rsp (in words):
283   //  return pc        0
284   //  jni env          1
285   //  obj              2
286   //  jfieldID         3
287 
288   ExternalAddress counter(SafepointSynchronize::safepoint_counter_addr());
289 
290   __ mov32 (rcx, counter);
291   __ testb (rcx, 1);
292   __ jcc (Assembler::notZero, slow);
293 
294   if (JvmtiExport::can_post_field_access()) {
295     // Check to see if a field access watch has been set before we
296     // take the fast path.
297     __ cmp32(ExternalAddress((address) JvmtiExport::get_field_access_count_addr()), 0);
298     __ jcc(Assembler::notZero, slow);
299   }
300 
301   __ mov(rax, rcx);
302   __ andptr(rax, 1);                         // rax, must end up 0
303   __ movptr(rdx, Address(rsp, rax, Address::times_1, 2*wordSize));
304                                             // obj, notice rax, is 0.
305                                             // rdx is data dependent on rcx.
306   __ movptr(rax, Address(rsp, 3*wordSize));  // jfieldID
307 
308   __ clear_jweak_tag(rdx);
309 
310   __ movptr(rdx, Address(rdx, 0));           // *obj
311   __ shrptr(rax, 2);                         // offset
312 
313   assert(count < LIST_CAPACITY, "LIST_CAPACITY too small");
314   speculative_load_pclist[count] = __ pc();
315   switch (type) {
316 #ifndef _LP64
317     case T_FLOAT:  __ fld_s (Address(rdx, rax, Address::times_1)); break;
318     case T_DOUBLE: __ fld_d (Address(rdx, rax, Address::times_1)); break;
319 #else
320     case T_FLOAT:  __ movflt (xmm0, Address(robj, roffset, Address::times_1)); break;
321     case T_DOUBLE: __ movdbl (xmm0, Address(robj, roffset, Address::times_1)); break;
322 #endif // _LP64
323     default:       ShouldNotReachHere();
324   }
325 
326   Address ca1;
327   __ fst_s (Address(rsp, -4));
328   __ lea(rdx, counter);
329   __ movl (rax, Address(rsp, -4));
330   // garbage hi-order bits on 64bit are harmless.
331   __ xorptr(rdx, rax);
332   __ xorptr(rdx, rax);
333   __ cmp32(rcx, Address(rdx, 0));
334   // rax, ^ counter_addr ^ rax, = address
335   // ca1 is data dependent on the field
336   // access.
337   __ jcc (Assembler::notEqual, slow_with_pop);
338 
339 #ifndef _WINDOWS
340   __ ret (0);
341 #else
342   // __stdcall calling convention
343   __ ret (3*wordSize);
344 #endif
345 
346   __ bind (slow_with_pop);
347   // invalid load. pop FPU stack.
348   __ fstp_d (0);
349 
350   slowcase_entry_pclist[count++] = __ pc();
351   __ bind (slow);
352   address slow_case_addr = NULL;
353   switch (type) {
354     case T_FLOAT:  slow_case_addr = jni_GetFloatField_addr();  break;
355     case T_DOUBLE: slow_case_addr = jni_GetDoubleField_addr(); break;
356     default:       ShouldNotReachHere();
357   }
358   // tail call
359   __ jump (ExternalAddress(slow_case_addr));
360 
361   __ flush ();
362 
363 #ifndef _WINDOWS
364   return fast_entry;
365 #else
366   switch (type) {
367   case T_FLOAT:  jni_fast_GetFloatField_fp  = (GetFloatField_t)  fast_entry; break;
368   case T_DOUBLE: jni_fast_GetDoubleField_fp = (GetDoubleField_t) fast_entry; break;
369   }
370   return os::win32::fast_jni_accessor_wrapper(type);
371 #endif
372 }
373 
generate_fast_get_float_field()374 address JNI_FastGetField::generate_fast_get_float_field() {
375   return generate_fast_get_float_field0(T_FLOAT);
376 }
377 
generate_fast_get_double_field()378 address JNI_FastGetField::generate_fast_get_double_field() {
379   return generate_fast_get_float_field0(T_DOUBLE);
380 }
381