94e3514d8f
Always create interpreter method entries for intrinsified methods but replace them with vanilla entries if the intrinsic is disabled at runtime. Reviewed-by: kvn, iklam
471 lines
16 KiB
C++
471 lines
16 KiB
C++
/*
|
|
* Copyright (c) 1997, 2016, Oracle and/or its affiliates. All rights reserved.
|
|
* DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
|
|
*
|
|
* This code is free software; you can redistribute it and/or modify it
|
|
* under the terms of the GNU General Public License version 2 only, as
|
|
* published by the Free Software Foundation.
|
|
*
|
|
* This code is distributed in the hope that it will be useful, but WITHOUT
|
|
* ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
|
|
* FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
|
|
* version 2 for more details (a copy is included in the LICENSE file that
|
|
* accompanied this code).
|
|
*
|
|
* You should have received a copy of the GNU General Public License version
|
|
* 2 along with this work; if not, write to the Free Software Foundation,
|
|
* Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
|
|
*
|
|
* Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
|
|
* or visit www.oracle.com if you need additional information or have any
|
|
* questions.
|
|
*
|
|
*/
|
|
|
|
#include "precompiled.hpp"
|
|
#include "asm/macroAssembler.hpp"
|
|
#include "interpreter/interp_masm.hpp"
|
|
#include "interpreter/interpreter.hpp"
|
|
#include "interpreter/interpreterRuntime.hpp"
|
|
#include "interpreter/templateInterpreterGenerator.hpp"
|
|
#include "runtime/arguments.hpp"
|
|
#include "runtime/sharedRuntime.hpp"
|
|
|
|
#define __ _masm->
|
|
|
|
|
|
address TemplateInterpreterGenerator::generate_slow_signature_handler() {
|
|
address entry = __ pc();
|
|
// rbx,: method
|
|
// rcx: temporary
|
|
// rdi: pointer to locals
|
|
// rsp: end of copied parameters area
|
|
__ mov(rcx, rsp);
|
|
__ call_VM(noreg, CAST_FROM_FN_PTR(address, InterpreterRuntime::slow_signature_handler), rbx, rdi, rcx);
|
|
__ ret(0);
|
|
return entry;
|
|
}
|
|
|
|
/**
|
|
* Method entry for static native methods:
|
|
* int java.util.zip.CRC32.update(int crc, int b)
|
|
*/
|
|
address TemplateInterpreterGenerator::generate_CRC32_update_entry() {
|
|
if (UseCRC32Intrinsics) {
|
|
address entry = __ pc();
|
|
|
|
// rbx: Method*
|
|
// rsi: senderSP must preserved for slow path, set SP to it on fast path
|
|
// rdx: scratch
|
|
// rdi: scratch
|
|
|
|
Label slow_path;
|
|
// If we need a safepoint check, generate full interpreter entry.
|
|
ExternalAddress state(SafepointSynchronize::address_of_state());
|
|
__ cmp32(ExternalAddress(SafepointSynchronize::address_of_state()),
|
|
SafepointSynchronize::_not_synchronized);
|
|
__ jcc(Assembler::notEqual, slow_path);
|
|
|
|
// We don't generate local frame and don't align stack because
|
|
// we call stub code and there is no safepoint on this path.
|
|
|
|
// Load parameters
|
|
const Register crc = rax; // crc
|
|
const Register val = rdx; // source java byte value
|
|
const Register tbl = rdi; // scratch
|
|
|
|
// Arguments are reversed on java expression stack
|
|
__ movl(val, Address(rsp, wordSize)); // byte value
|
|
__ movl(crc, Address(rsp, 2*wordSize)); // Initial CRC
|
|
|
|
__ lea(tbl, ExternalAddress(StubRoutines::crc_table_addr()));
|
|
__ notl(crc); // ~crc
|
|
__ update_byte_crc32(crc, val, tbl);
|
|
__ notl(crc); // ~crc
|
|
// result in rax
|
|
|
|
// _areturn
|
|
__ pop(rdi); // get return address
|
|
__ mov(rsp, rsi); // set sp to sender sp
|
|
__ jmp(rdi);
|
|
|
|
// generate a vanilla native entry as the slow path
|
|
__ bind(slow_path);
|
|
__ jump_to_entry(Interpreter::entry_for_kind(Interpreter::native));
|
|
return entry;
|
|
}
|
|
return NULL;
|
|
}
|
|
|
|
/**
|
|
* Method entry for static native methods:
|
|
* int java.util.zip.CRC32.updateBytes(int crc, byte[] b, int off, int len)
|
|
* int java.util.zip.CRC32.updateByteBuffer(int crc, long buf, int off, int len)
|
|
*/
|
|
address TemplateInterpreterGenerator::generate_CRC32_updateBytes_entry(AbstractInterpreter::MethodKind kind) {
|
|
if (UseCRC32Intrinsics) {
|
|
address entry = __ pc();
|
|
|
|
// rbx,: Method*
|
|
// rsi: senderSP must preserved for slow path, set SP to it on fast path
|
|
// rdx: scratch
|
|
// rdi: scratch
|
|
|
|
Label slow_path;
|
|
// If we need a safepoint check, generate full interpreter entry.
|
|
ExternalAddress state(SafepointSynchronize::address_of_state());
|
|
__ cmp32(ExternalAddress(SafepointSynchronize::address_of_state()),
|
|
SafepointSynchronize::_not_synchronized);
|
|
__ jcc(Assembler::notEqual, slow_path);
|
|
|
|
// We don't generate local frame and don't align stack because
|
|
// we call stub code and there is no safepoint on this path.
|
|
|
|
// Load parameters
|
|
const Register crc = rax; // crc
|
|
const Register buf = rdx; // source java byte array address
|
|
const Register len = rdi; // length
|
|
|
|
// value x86_32
|
|
// interp. arg ptr ESP + 4
|
|
// int java.util.zip.CRC32.updateBytes(int crc, byte[] b, int off, int len)
|
|
// 3 2 1 0
|
|
// int java.util.zip.CRC32.updateByteBuffer(int crc, long buf, int off, int len)
|
|
// 4 2,3 1 0
|
|
|
|
// Arguments are reversed on java expression stack
|
|
__ movl(len, Address(rsp, 4 + 0)); // Length
|
|
// Calculate address of start element
|
|
if (kind == Interpreter::java_util_zip_CRC32_updateByteBuffer) {
|
|
__ movptr(buf, Address(rsp, 4 + 2 * wordSize)); // long buf
|
|
__ addptr(buf, Address(rsp, 4 + 1 * wordSize)); // + offset
|
|
__ movl(crc, Address(rsp, 4 + 4 * wordSize)); // Initial CRC
|
|
} else {
|
|
__ movptr(buf, Address(rsp, 4 + 2 * wordSize)); // byte[] array
|
|
__ addptr(buf, arrayOopDesc::base_offset_in_bytes(T_BYTE)); // + header size
|
|
__ addptr(buf, Address(rsp, 4 + 1 * wordSize)); // + offset
|
|
__ movl(crc, Address(rsp, 4 + 3 * wordSize)); // Initial CRC
|
|
}
|
|
|
|
__ super_call_VM_leaf(CAST_FROM_FN_PTR(address, StubRoutines::updateBytesCRC32()), crc, buf, len);
|
|
// result in rax
|
|
|
|
// _areturn
|
|
__ pop(rdi); // get return address
|
|
__ mov(rsp, rsi); // set sp to sender sp
|
|
__ jmp(rdi);
|
|
|
|
// generate a vanilla native entry as the slow path
|
|
__ bind(slow_path);
|
|
__ jump_to_entry(Interpreter::entry_for_kind(Interpreter::native));
|
|
return entry;
|
|
}
|
|
return NULL;
|
|
}
|
|
|
|
/**
|
|
* Method entry for static native methods:
|
|
* int java.util.zip.CRC32C.updateBytes(int crc, byte[] b, int off, int end)
|
|
* int java.util.zip.CRC32C.updateByteBuffer(int crc, long address, int off, int end)
|
|
*/
|
|
address TemplateInterpreterGenerator::generate_CRC32C_updateBytes_entry(AbstractInterpreter::MethodKind kind) {
|
|
if (UseCRC32CIntrinsics) {
|
|
address entry = __ pc();
|
|
// Load parameters
|
|
const Register crc = rax; // crc
|
|
const Register buf = rcx; // source java byte array address
|
|
const Register len = rdx; // length
|
|
const Register end = len;
|
|
|
|
// value x86_32
|
|
// interp. arg ptr ESP + 4
|
|
// int java.util.zip.CRC32.updateBytes(int crc, byte[] b, int off, int end)
|
|
// 3 2 1 0
|
|
// int java.util.zip.CRC32.updateByteBuffer(int crc, long address, int off, int end)
|
|
// 4 2,3 1 0
|
|
|
|
// Arguments are reversed on java expression stack
|
|
__ movl(end, Address(rsp, 4 + 0)); // end
|
|
__ subl(len, Address(rsp, 4 + 1 * wordSize)); // end - offset == length
|
|
// Calculate address of start element
|
|
if (kind == Interpreter::java_util_zip_CRC32C_updateDirectByteBuffer) {
|
|
__ movptr(buf, Address(rsp, 4 + 2 * wordSize)); // long address
|
|
__ addptr(buf, Address(rsp, 4 + 1 * wordSize)); // + offset
|
|
__ movl(crc, Address(rsp, 4 + 4 * wordSize)); // Initial CRC
|
|
} else {
|
|
__ movptr(buf, Address(rsp, 4 + 2 * wordSize)); // byte[] array
|
|
__ addptr(buf, arrayOopDesc::base_offset_in_bytes(T_BYTE)); // + header size
|
|
__ addptr(buf, Address(rsp, 4 + 1 * wordSize)); // + offset
|
|
__ movl(crc, Address(rsp, 4 + 3 * wordSize)); // Initial CRC
|
|
}
|
|
__ super_call_VM_leaf(CAST_FROM_FN_PTR(address, StubRoutines::updateBytesCRC32C()), crc, buf, len);
|
|
// result in rax
|
|
// _areturn
|
|
__ pop(rdi); // get return address
|
|
__ mov(rsp, rsi); // set sp to sender sp
|
|
__ jmp(rdi);
|
|
|
|
return entry;
|
|
}
|
|
return NULL;
|
|
}
|
|
|
|
/**
|
|
* Method entry for static native method:
|
|
* java.lang.Float.intBitsToFloat(int bits)
|
|
*/
|
|
address TemplateInterpreterGenerator::generate_Float_intBitsToFloat_entry() {
|
|
if (UseSSE >= 1) {
|
|
address entry = __ pc();
|
|
|
|
// rsi: the sender's SP
|
|
|
|
// Skip safepoint check (compiler intrinsic versions of this method
|
|
// do not perform safepoint checks either).
|
|
|
|
// Load 'bits' into xmm0 (interpreter returns results in xmm0)
|
|
__ movflt(xmm0, Address(rsp, wordSize));
|
|
|
|
// Return
|
|
__ pop(rdi); // get return address
|
|
__ mov(rsp, rsi); // set rsp to the sender's SP
|
|
__ jmp(rdi);
|
|
return entry;
|
|
}
|
|
|
|
return NULL;
|
|
}
|
|
|
|
/**
|
|
* Method entry for static native method:
|
|
* java.lang.Float.floatToRawIntBits(float value)
|
|
*/
|
|
address TemplateInterpreterGenerator::generate_Float_floatToRawIntBits_entry() {
|
|
if (UseSSE >= 1) {
|
|
address entry = __ pc();
|
|
|
|
// rsi: the sender's SP
|
|
|
|
// Skip safepoint check (compiler intrinsic versions of this method
|
|
// do not perform safepoint checks either).
|
|
|
|
// Load the parameter (a floating-point value) into rax.
|
|
__ movl(rax, Address(rsp, wordSize));
|
|
|
|
// Return
|
|
__ pop(rdi); // get return address
|
|
__ mov(rsp, rsi); // set rsp to the sender's SP
|
|
__ jmp(rdi);
|
|
return entry;
|
|
}
|
|
|
|
return NULL;
|
|
}
|
|
|
|
|
|
/**
|
|
* Method entry for static native method:
|
|
* java.lang.Double.longBitsToDouble(long bits)
|
|
*/
|
|
address TemplateInterpreterGenerator::generate_Double_longBitsToDouble_entry() {
|
|
if (UseSSE >= 2) {
|
|
address entry = __ pc();
|
|
|
|
// rsi: the sender's SP
|
|
|
|
// Skip safepoint check (compiler intrinsic versions of this method
|
|
// do not perform safepoint checks either).
|
|
|
|
// Load 'bits' into xmm0 (interpreter returns results in xmm0)
|
|
__ movdbl(xmm0, Address(rsp, wordSize));
|
|
|
|
// Return
|
|
__ pop(rdi); // get return address
|
|
__ mov(rsp, rsi); // set rsp to the sender's SP
|
|
__ jmp(rdi);
|
|
return entry;
|
|
}
|
|
|
|
return NULL;
|
|
}
|
|
|
|
/**
|
|
* Method entry for static native method:
|
|
* java.lang.Double.doubleToRawLongBits(double value)
|
|
*/
|
|
address TemplateInterpreterGenerator::generate_Double_doubleToRawLongBits_entry() {
|
|
if (UseSSE >= 2) {
|
|
address entry = __ pc();
|
|
|
|
// rsi: the sender's SP
|
|
|
|
// Skip safepoint check (compiler intrinsic versions of this method
|
|
// do not perform safepoint checks either).
|
|
|
|
// Load the parameter (a floating-point value) into rax.
|
|
__ movl(rdx, Address(rsp, 2*wordSize));
|
|
__ movl(rax, Address(rsp, wordSize));
|
|
|
|
// Return
|
|
__ pop(rdi); // get return address
|
|
__ mov(rsp, rsi); // set rsp to the sender's SP
|
|
__ jmp(rdi);
|
|
return entry;
|
|
}
|
|
|
|
return NULL;
|
|
}
|
|
|
|
address TemplateInterpreterGenerator::generate_math_entry(AbstractInterpreter::MethodKind kind) {
|
|
|
|
// rbx,: Method*
|
|
// rcx: scratrch
|
|
// rsi: sender sp
|
|
|
|
if (!InlineIntrinsics) return NULL; // Generate a vanilla entry
|
|
|
|
address entry_point = __ pc();
|
|
|
|
// These don't need a safepoint check because they aren't virtually
|
|
// callable. We won't enter these intrinsics from compiled code.
|
|
// If in the future we added an intrinsic which was virtually callable
|
|
// we'd have to worry about how to safepoint so that this code is used.
|
|
|
|
// mathematical functions inlined by compiler
|
|
// (interpreter must provide identical implementation
|
|
// in order to avoid monotonicity bugs when switching
|
|
// from interpreter to compiler in the middle of some
|
|
// computation)
|
|
//
|
|
// stack: [ ret adr ] <-- rsp
|
|
// [ lo(arg) ]
|
|
// [ hi(arg) ]
|
|
//
|
|
if (kind == Interpreter::java_lang_math_fmaD) {
|
|
if (!UseFMA) {
|
|
return NULL; // Generate a vanilla entry
|
|
}
|
|
__ movdbl(xmm2, Address(rsp, 5 * wordSize));
|
|
__ movdbl(xmm1, Address(rsp, 3 * wordSize));
|
|
__ movdbl(xmm0, Address(rsp, 1 * wordSize));
|
|
__ fmad(xmm0, xmm1, xmm2, xmm0);
|
|
__ pop(rdi); // get return address
|
|
__ mov(rsp, rsi); // set sp to sender sp
|
|
__ jmp(rdi);
|
|
|
|
return entry_point;
|
|
} else if (kind == Interpreter::java_lang_math_fmaF) {
|
|
if (!UseFMA) {
|
|
return NULL; // Generate a vanilla entry
|
|
}
|
|
__ movflt(xmm2, Address(rsp, 3 * wordSize));
|
|
__ movflt(xmm1, Address(rsp, 2 * wordSize));
|
|
__ movflt(xmm0, Address(rsp, 1 * wordSize));
|
|
__ fmaf(xmm0, xmm1, xmm2, xmm0);
|
|
__ pop(rdi); // get return address
|
|
__ mov(rsp, rsi); // set sp to sender sp
|
|
__ jmp(rdi);
|
|
|
|
return entry_point;
|
|
}
|
|
|
|
__ fld_d(Address(rsp, 1*wordSize));
|
|
switch (kind) {
|
|
case Interpreter::java_lang_math_sin :
|
|
__ subptr(rsp, 2 * wordSize);
|
|
__ fstp_d(Address(rsp, 0));
|
|
if (VM_Version::supports_sse2() && StubRoutines::dsin() != NULL) {
|
|
__ call(RuntimeAddress(CAST_FROM_FN_PTR(address, StubRoutines::dsin())));
|
|
} else {
|
|
__ call_VM_leaf0(CAST_FROM_FN_PTR(address, SharedRuntime::dsin));
|
|
}
|
|
__ addptr(rsp, 2 * wordSize);
|
|
break;
|
|
case Interpreter::java_lang_math_cos :
|
|
__ subptr(rsp, 2 * wordSize);
|
|
__ fstp_d(Address(rsp, 0));
|
|
if (VM_Version::supports_sse2() && StubRoutines::dcos() != NULL) {
|
|
__ call(RuntimeAddress(CAST_FROM_FN_PTR(address, StubRoutines::dcos())));
|
|
} else {
|
|
__ call_VM_leaf0(CAST_FROM_FN_PTR(address, SharedRuntime::dcos));
|
|
}
|
|
__ addptr(rsp, 2 * wordSize);
|
|
break;
|
|
case Interpreter::java_lang_math_tan :
|
|
__ subptr(rsp, 2 * wordSize);
|
|
__ fstp_d(Address(rsp, 0));
|
|
if (StubRoutines::dtan() != NULL) {
|
|
__ call(RuntimeAddress(CAST_FROM_FN_PTR(address, StubRoutines::dtan())));
|
|
} else {
|
|
__ call_VM_leaf0(CAST_FROM_FN_PTR(address, SharedRuntime::dtan));
|
|
}
|
|
__ addptr(rsp, 2 * wordSize);
|
|
break;
|
|
case Interpreter::java_lang_math_sqrt:
|
|
__ fsqrt();
|
|
break;
|
|
case Interpreter::java_lang_math_abs:
|
|
__ fabs();
|
|
break;
|
|
case Interpreter::java_lang_math_log:
|
|
__ subptr(rsp, 2 * wordSize);
|
|
__ fstp_d(Address(rsp, 0));
|
|
if (StubRoutines::dlog() != NULL) {
|
|
__ call(RuntimeAddress(CAST_FROM_FN_PTR(address, StubRoutines::dlog())));
|
|
} else {
|
|
__ call_VM_leaf0(CAST_FROM_FN_PTR(address, SharedRuntime::dlog));
|
|
}
|
|
__ addptr(rsp, 2 * wordSize);
|
|
break;
|
|
case Interpreter::java_lang_math_log10:
|
|
__ subptr(rsp, 2 * wordSize);
|
|
__ fstp_d(Address(rsp, 0));
|
|
if (StubRoutines::dlog10() != NULL) {
|
|
__ call(RuntimeAddress(CAST_FROM_FN_PTR(address, StubRoutines::dlog10())));
|
|
} else {
|
|
__ call_VM_leaf0(CAST_FROM_FN_PTR(address, SharedRuntime::dlog10));
|
|
}
|
|
__ addptr(rsp, 2 * wordSize);
|
|
break;
|
|
case Interpreter::java_lang_math_pow:
|
|
__ fld_d(Address(rsp, 3*wordSize)); // second argument
|
|
__ subptr(rsp, 4 * wordSize);
|
|
__ fstp_d(Address(rsp, 0));
|
|
__ fstp_d(Address(rsp, 2 * wordSize));
|
|
if (StubRoutines::dpow() != NULL) {
|
|
__ call(RuntimeAddress(CAST_FROM_FN_PTR(address, StubRoutines::dpow())));
|
|
} else {
|
|
__ call_VM_leaf0(CAST_FROM_FN_PTR(address, SharedRuntime::dpow));
|
|
}
|
|
__ addptr(rsp, 4 * wordSize);
|
|
break;
|
|
case Interpreter::java_lang_math_exp:
|
|
__ subptr(rsp, 2*wordSize);
|
|
__ fstp_d(Address(rsp, 0));
|
|
if (StubRoutines::dexp() != NULL) {
|
|
__ call(RuntimeAddress(CAST_FROM_FN_PTR(address, StubRoutines::dexp())));
|
|
} else {
|
|
__ call_VM_leaf0(CAST_FROM_FN_PTR(address, SharedRuntime::dexp));
|
|
}
|
|
__ addptr(rsp, 2*wordSize);
|
|
break;
|
|
default :
|
|
ShouldNotReachHere();
|
|
}
|
|
|
|
// return double result in xmm0 for interpreter and compilers.
|
|
if (UseSSE >= 2) {
|
|
__ subptr(rsp, 2*wordSize);
|
|
__ fstp_d(Address(rsp, 0));
|
|
__ movdbl(xmm0, Address(rsp, 0));
|
|
__ addptr(rsp, 2*wordSize);
|
|
}
|
|
|
|
// done, result in FPU ST(0) or XMM0
|
|
__ pop(rdi); // get return address
|
|
__ mov(rsp, rsi); // set sp to sender sp
|
|
__ jmp(rdi);
|
|
|
|
return entry_point;
|
|
}
|