jniFastGetField_x86_32.cpp revision 9244:825cee2cd7a6
1/*
2 * Copyright (c) 2004, 2010, Oracle and/or its affiliates. All rights reserved.
3 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
4 *
5 * This code is free software; you can redistribute it and/or modify it
6 * under the terms of the GNU General Public License version 2 only, as
7 * published by the Free Software Foundation.
8 *
9 * This code is distributed in the hope that it will be useful, but WITHOUT
10 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
11 * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
12 * version 2 for more details (a copy is included in the LICENSE file that
13 * accompanied this code).
14 *
15 * You should have received a copy of the GNU General Public License version
16 * 2 along with this work; if not, write to the Free Software Foundation,
17 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
18 *
19 * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
20 * or visit www.oracle.com if you need additional information or have any
21 * questions.
22 *
23 */
24
25#include "precompiled.hpp"
26#include "asm/macroAssembler.hpp"
27#include "memory/resourceArea.hpp"
28#include "prims/jniFastGetField.hpp"
29#include "prims/jvm_misc.hpp"
30#include "runtime/safepoint.hpp"
31
32#define __ masm->
33
34#define BUFFER_SIZE 30
35
36#ifdef _WINDOWS
37GetBooleanField_t JNI_FastGetField::jni_fast_GetBooleanField_fp;
38GetByteField_t    JNI_FastGetField::jni_fast_GetByteField_fp;
39GetCharField_t    JNI_FastGetField::jni_fast_GetCharField_fp;
40GetShortField_t   JNI_FastGetField::jni_fast_GetShortField_fp;
41GetIntField_t     JNI_FastGetField::jni_fast_GetIntField_fp;
42GetLongField_t    JNI_FastGetField::jni_fast_GetLongField_fp;
43GetFloatField_t   JNI_FastGetField::jni_fast_GetFloatField_fp;
44GetDoubleField_t  JNI_FastGetField::jni_fast_GetDoubleField_fp;
45#endif
46
47// Instead of issuing lfence for LoadLoad barrier, we create data dependency
48// between loads, which is much more efficient than lfence.
49
50address JNI_FastGetField::generate_fast_get_int_field0(BasicType type) {
51  const char *name = NULL;
52  switch (type) {
53    case T_BOOLEAN: name = "jni_fast_GetBooleanField"; break;
54    case T_BYTE:    name = "jni_fast_GetByteField";    break;
55    case T_CHAR:    name = "jni_fast_GetCharField";    break;
56    case T_SHORT:   name = "jni_fast_GetShortField";   break;
57    case T_INT:     name = "jni_fast_GetIntField";     break;
58    default:        ShouldNotReachHere();
59  }
60  ResourceMark rm;
61  BufferBlob* blob = BufferBlob::create(name, BUFFER_SIZE*wordSize);
62  CodeBuffer cbuf(blob);
63  MacroAssembler* masm = new MacroAssembler(&cbuf);
64  address fast_entry = __ pc();
65
66  Label slow;
67
68  // stack layout:    offset from rsp (in words):
69  //  return pc        0
70  //  jni env          1
71  //  obj              2
72  //  jfieldID         3
73
74  ExternalAddress counter(SafepointSynchronize::safepoint_counter_addr());
75  __ mov32 (rcx, counter);
76  __ testb (rcx, 1);
77  __ jcc (Assembler::notZero, slow);
78  if (os::is_MP()) {
79    __ mov(rax, rcx);
80    __ andptr(rax, 1);                         // rax, must end up 0
81    __ movptr(rdx, Address(rsp, rax, Address::times_1, 2*wordSize));
82                                              // obj, notice rax, is 0.
83                                              // rdx is data dependent on rcx.
84  } else {
85    __ movptr (rdx, Address(rsp, 2*wordSize));  // obj
86  }
87  __ movptr(rax, Address(rsp, 3*wordSize));  // jfieldID
88  __ movptr(rdx, Address(rdx, 0));           // *obj
89  __ shrptr (rax, 2);                         // offset
90
91  assert(count < LIST_CAPACITY, "LIST_CAPACITY too small");
92  speculative_load_pclist[count] = __ pc();
93  switch (type) {
94    case T_BOOLEAN: __ movzbl (rax, Address(rdx, rax, Address::times_1)); break;
95    case T_BYTE:    __ movsbl (rax, Address(rdx, rax, Address::times_1)); break;
96    case T_CHAR:    __ movzwl (rax, Address(rdx, rax, Address::times_1)); break;
97    case T_SHORT:   __ movswl (rax, Address(rdx, rax, Address::times_1)); break;
98    case T_INT:     __ movl   (rax, Address(rdx, rax, Address::times_1)); break;
99    default:        ShouldNotReachHere();
100  }
101
102  Address ca1;
103  if (os::is_MP()) {
104    __ lea(rdx, counter);
105    __ xorptr(rdx, rax);
106    __ xorptr(rdx, rax);
107    __ cmp32(rcx, Address(rdx, 0));
108    // ca1 is the same as ca because
109    // rax, ^ counter_addr ^ rax, = address
110    // ca1 is data dependent on rax,.
111  } else {
112    __ cmp32(rcx, counter);
113  }
114  __ jcc (Assembler::notEqual, slow);
115
116#ifndef _WINDOWS
117  __ ret (0);
118#else
119  // __stdcall calling convention
120  __ ret (3*wordSize);
121#endif
122
123  slowcase_entry_pclist[count++] = __ pc();
124  __ bind (slow);
125  address slow_case_addr = NULL;
126  switch (type) {
127    case T_BOOLEAN: slow_case_addr = jni_GetBooleanField_addr(); break;
128    case T_BYTE:    slow_case_addr = jni_GetByteField_addr();    break;
129    case T_CHAR:    slow_case_addr = jni_GetCharField_addr();    break;
130    case T_SHORT:   slow_case_addr = jni_GetShortField_addr();   break;
131    case T_INT:     slow_case_addr = jni_GetIntField_addr();
132  }
133  // tail call
134  __ jump (ExternalAddress(slow_case_addr));
135
136  __ flush ();
137
138#ifndef _WINDOWS
139  return fast_entry;
140#else
141  switch (type) {
142  case T_BOOLEAN: jni_fast_GetBooleanField_fp = (GetBooleanField_t) fast_entry; break;
143  case T_BYTE:    jni_fast_GetByteField_fp    = (GetByteField_t)    fast_entry; break;
144  case T_CHAR:    jni_fast_GetCharField_fp    = (GetCharField_t)    fast_entry; break;
145  case T_SHORT:   jni_fast_GetShortField_fp   = (GetShortField_t)   fast_entry; break;
146  case T_INT:     jni_fast_GetIntField_fp     = (GetIntField_t)     fast_entry; break;
147  }
148  return os::win32::fast_jni_accessor_wrapper(type);
149#endif
150}
151
152address JNI_FastGetField::generate_fast_get_boolean_field() {
153  return generate_fast_get_int_field0(T_BOOLEAN);
154}
155
156address JNI_FastGetField::generate_fast_get_byte_field() {
157  return generate_fast_get_int_field0(T_BYTE);
158}
159
160address JNI_FastGetField::generate_fast_get_char_field() {
161  return generate_fast_get_int_field0(T_CHAR);
162}
163
164address JNI_FastGetField::generate_fast_get_short_field() {
165  return generate_fast_get_int_field0(T_SHORT);
166}
167
168address JNI_FastGetField::generate_fast_get_int_field() {
169  return generate_fast_get_int_field0(T_INT);
170}
171
172address JNI_FastGetField::generate_fast_get_long_field() {
173  const char *name = "jni_fast_GetLongField";
174  ResourceMark rm;
175  BufferBlob* blob = BufferBlob::create(name, BUFFER_SIZE*wordSize);
176  CodeBuffer cbuf(blob);
177  MacroAssembler* masm = new MacroAssembler(&cbuf);
178  address fast_entry = __ pc();
179
180  Label slow;
181
182  // stack layout:    offset from rsp (in words):
183  //  old rsi          0
184  //  return pc        1
185  //  jni env          2
186  //  obj              3
187  //  jfieldID         4
188
189  ExternalAddress counter(SafepointSynchronize::safepoint_counter_addr());
190
191  __ push  (rsi);
192  __ mov32 (rcx, counter);
193  __ testb (rcx, 1);
194  __ jcc (Assembler::notZero, slow);
195  if (os::is_MP()) {
196    __ mov(rax, rcx);
197    __ andptr(rax, 1);                         // rax, must end up 0
198    __ movptr(rdx, Address(rsp, rax, Address::times_1, 3*wordSize));
199                                              // obj, notice rax, is 0.
200                                              // rdx is data dependent on rcx.
201  } else {
202    __ movptr(rdx, Address(rsp, 3*wordSize));  // obj
203  }
204  __ movptr(rsi, Address(rsp, 4*wordSize));  // jfieldID
205  __ movptr(rdx, Address(rdx, 0));           // *obj
206  __ shrptr(rsi, 2);                         // offset
207
208  assert(count < LIST_CAPACITY-1, "LIST_CAPACITY too small");
209  speculative_load_pclist[count++] = __ pc();
210  __ movptr(rax, Address(rdx, rsi, Address::times_1));
211#ifndef _LP64
212  speculative_load_pclist[count] = __ pc();
213  __ movl(rdx, Address(rdx, rsi, Address::times_1, 4));
214#endif // _LP64
215
216  if (os::is_MP()) {
217    __ lea(rsi, counter);
218    __ xorptr(rsi, rdx);
219    __ xorptr(rsi, rax);
220    __ xorptr(rsi, rdx);
221    __ xorptr(rsi, rax);
222    __ cmp32(rcx, Address(rsi, 0));
223    // ca1 is the same as ca because
224    // rax, ^ rdx ^ counter_addr ^ rax, ^ rdx = address
225    // ca1 is data dependent on both rax, and rdx.
226  } else {
227    __ cmp32(rcx, counter);
228  }
229  __ jcc (Assembler::notEqual, slow);
230
231  __ pop (rsi);
232
233#ifndef _WINDOWS
234  __ ret (0);
235#else
236  // __stdcall calling convention
237  __ ret (3*wordSize);
238#endif
239
240  slowcase_entry_pclist[count-1] = __ pc();
241  slowcase_entry_pclist[count++] = __ pc();
242  __ bind (slow);
243  __ pop  (rsi);
244  address slow_case_addr = jni_GetLongField_addr();;
245  // tail call
246  __ jump (ExternalAddress(slow_case_addr));
247
248  __ flush ();
249
250#ifndef _WINDOWS
251  return fast_entry;
252#else
253  jni_fast_GetLongField_fp = (GetLongField_t) fast_entry;
254  return os::win32::fast_jni_accessor_wrapper(T_LONG);
255#endif
256}
257
258address JNI_FastGetField::generate_fast_get_float_field0(BasicType type) {
259  const char *name = NULL;
260  switch (type) {
261    case T_FLOAT:  name = "jni_fast_GetFloatField";  break;
262    case T_DOUBLE: name = "jni_fast_GetDoubleField"; break;
263    default:       ShouldNotReachHere();
264  }
265  ResourceMark rm;
266  BufferBlob* blob = BufferBlob::create(name, BUFFER_SIZE*wordSize);
267  CodeBuffer cbuf(blob);
268  MacroAssembler* masm = new MacroAssembler(&cbuf);
269  address fast_entry = __ pc();
270
271  Label slow_with_pop, slow;
272
273  // stack layout:    offset from rsp (in words):
274  //  return pc        0
275  //  jni env          1
276  //  obj              2
277  //  jfieldID         3
278
279  ExternalAddress counter(SafepointSynchronize::safepoint_counter_addr());
280
281  __ mov32 (rcx, counter);
282  __ testb (rcx, 1);
283  __ jcc (Assembler::notZero, slow);
284  if (os::is_MP()) {
285    __ mov(rax, rcx);
286    __ andptr(rax, 1);                         // rax, must end up 0
287    __ movptr(rdx, Address(rsp, rax, Address::times_1, 2*wordSize));
288                                              // obj, notice rax, is 0.
289                                              // rdx is data dependent on rcx.
290  } else {
291    __ movptr(rdx, Address(rsp, 2*wordSize)); // obj
292  }
293  __ movptr(rax, Address(rsp, 3*wordSize));  // jfieldID
294  __ movptr(rdx, Address(rdx, 0));           // *obj
295  __ shrptr(rax, 2);                         // offset
296
297  assert(count < LIST_CAPACITY, "LIST_CAPACITY too small");
298  speculative_load_pclist[count] = __ pc();
299  switch (type) {
300#ifndef _LP64
301    case T_FLOAT:  __ fld_s (Address(rdx, rax, Address::times_1)); break;
302    case T_DOUBLE: __ fld_d (Address(rdx, rax, Address::times_1)); break;
303#else
304    case T_FLOAT:  __ movflt (xmm0, Address(robj, roffset, Address::times_1)); break;
305    case T_DOUBLE: __ movdbl (xmm0, Address(robj, roffset, Address::times_1)); break;
306#endif // _LP64
307    default:       ShouldNotReachHere();
308  }
309
310  Address ca1;
311  if (os::is_MP()) {
312    __ fst_s (Address(rsp, -4));
313    __ lea(rdx, counter);
314    __ movl (rax, Address(rsp, -4));
315    // garbage hi-order bits on 64bit are harmless.
316    __ xorptr(rdx, rax);
317    __ xorptr(rdx, rax);
318    __ cmp32(rcx, Address(rdx, 0));
319                                          // rax, ^ counter_addr ^ rax, = address
320                                          // ca1 is data dependent on the field
321                                          // access.
322  } else {
323    __ cmp32(rcx, counter);
324  }
325  __ jcc (Assembler::notEqual, slow_with_pop);
326
327#ifndef _WINDOWS
328  __ ret (0);
329#else
330  // __stdcall calling convention
331  __ ret (3*wordSize);
332#endif
333
334  __ bind (slow_with_pop);
335  // invalid load. pop FPU stack.
336  __ fstp_d (0);
337
338  slowcase_entry_pclist[count++] = __ pc();
339  __ bind (slow);
340  address slow_case_addr = NULL;
341  switch (type) {
342    case T_FLOAT:  slow_case_addr = jni_GetFloatField_addr();  break;
343    case T_DOUBLE: slow_case_addr = jni_GetDoubleField_addr(); break;
344    default:       ShouldNotReachHere();
345  }
346  // tail call
347  __ jump (ExternalAddress(slow_case_addr));
348
349  __ flush ();
350
351#ifndef _WINDOWS
352  return fast_entry;
353#else
354  switch (type) {
355  case T_FLOAT:  jni_fast_GetFloatField_fp  = (GetFloatField_t)  fast_entry; break;
356  case T_DOUBLE: jni_fast_GetDoubleField_fp = (GetDoubleField_t) fast_entry; break;
357  }
358  return os::win32::fast_jni_accessor_wrapper(type);
359#endif
360}
361
362address JNI_FastGetField::generate_fast_get_float_field() {
363  return generate_fast_get_float_field0(T_FLOAT);
364}
365
366address JNI_FastGetField::generate_fast_get_double_field() {
367  return generate_fast_get_float_field0(T_DOUBLE);
368}
369