8295276: AArch64: Add backend support for half float conversion intrinsics
Reviewed-by: ngasson, aph, njian
This commit is contained in:
parent
3c0949824e
commit
891c706a10
@ -14577,6 +14577,32 @@ instruct convF2L_reg_reg(iRegLNoSp dst, vRegF src) %{
|
|||||||
ins_pipe(fp_f2l);
|
ins_pipe(fp_f2l);
|
||||||
%}
|
%}
|
||||||
|
|
||||||
|
instruct convF2HF_reg_reg(iRegINoSp dst, vRegF src, vRegF tmp) %{
|
||||||
|
match(Set dst (ConvF2HF src));
|
||||||
|
format %{ "fcvt $tmp, $src\t# convert single to half precision\n\t"
|
||||||
|
"smov $dst, $tmp\t# move result from $tmp to $dst"
|
||||||
|
%}
|
||||||
|
effect(TEMP tmp);
|
||||||
|
ins_encode %{
|
||||||
|
__ fcvtsh($tmp$$FloatRegister, $src$$FloatRegister);
|
||||||
|
__ smov($dst$$Register, $tmp$$FloatRegister, __ H, 0);
|
||||||
|
%}
|
||||||
|
ins_pipe(pipe_slow);
|
||||||
|
%}
|
||||||
|
|
||||||
|
instruct convHF2F_reg_reg(vRegF dst, iRegINoSp src, vRegF tmp) %{
|
||||||
|
match(Set dst (ConvHF2F src));
|
||||||
|
format %{ "mov $tmp, $src\t# move source from $src to $tmp\n\t"
|
||||||
|
"fcvt $dst, $tmp\t# convert half to single precision"
|
||||||
|
%}
|
||||||
|
effect(TEMP tmp);
|
||||||
|
ins_encode %{
|
||||||
|
__ mov($tmp$$FloatRegister, __ H, 0, $src$$Register);
|
||||||
|
__ fcvths($dst$$FloatRegister, $tmp$$FloatRegister);
|
||||||
|
%}
|
||||||
|
ins_pipe(pipe_slow);
|
||||||
|
%}
|
||||||
|
|
||||||
instruct convI2F_reg_reg(vRegF dst, iRegIorL2I src) %{
|
instruct convI2F_reg_reg(vRegF dst, iRegIorL2I src) %{
|
||||||
match(Set dst (ConvI2F src));
|
match(Set dst (ConvI2F src));
|
||||||
|
|
||||||
|
@ -1895,31 +1895,33 @@ void mvnw(Register Rd, Register Rm,
|
|||||||
#undef INSN
|
#undef INSN
|
||||||
|
|
||||||
// Floating-point data-processing (1 source)
|
// Floating-point data-processing (1 source)
|
||||||
void data_processing(unsigned op31, unsigned type, unsigned opcode,
|
void data_processing(unsigned type, unsigned opcode,
|
||||||
FloatRegister Vd, FloatRegister Vn) {
|
FloatRegister Vd, FloatRegister Vn) {
|
||||||
starti;
|
starti;
|
||||||
f(op31, 31, 29);
|
f(0b000, 31, 29);
|
||||||
f(0b11110, 28, 24);
|
f(0b11110, 28, 24);
|
||||||
f(type, 23, 22), f(1, 21), f(opcode, 20, 15), f(0b10000, 14, 10);
|
f(type, 23, 22), f(1, 21), f(opcode, 20, 15), f(0b10000, 14, 10);
|
||||||
rf(Vn, 5), rf(Vd, 0);
|
rf(Vn, 5), rf(Vd, 0);
|
||||||
}
|
}
|
||||||
|
|
||||||
#define INSN(NAME, op31, type, opcode) \
|
#define INSN(NAME, type, opcode) \
|
||||||
void NAME(FloatRegister Vd, FloatRegister Vn) { \
|
void NAME(FloatRegister Vd, FloatRegister Vn) { \
|
||||||
data_processing(op31, type, opcode, Vd, Vn); \
|
data_processing(type, opcode, Vd, Vn); \
|
||||||
}
|
}
|
||||||
|
|
||||||
INSN(fmovs, 0b000, 0b00, 0b000000);
|
INSN(fmovs, 0b00, 0b000000);
|
||||||
INSN(fabss, 0b000, 0b00, 0b000001);
|
INSN(fabss, 0b00, 0b000001);
|
||||||
INSN(fnegs, 0b000, 0b00, 0b000010);
|
INSN(fnegs, 0b00, 0b000010);
|
||||||
INSN(fsqrts, 0b000, 0b00, 0b000011);
|
INSN(fsqrts, 0b00, 0b000011);
|
||||||
INSN(fcvts, 0b000, 0b00, 0b000101); // Single-precision to double-precision
|
INSN(fcvts, 0b00, 0b000101); // Single-precision to double-precision
|
||||||
|
INSN(fcvths, 0b11, 0b000100); // Half-precision to single-precision
|
||||||
|
INSN(fcvtsh, 0b00, 0b000111); // Single-precision to half-precision
|
||||||
|
|
||||||
INSN(fmovd, 0b000, 0b01, 0b000000);
|
INSN(fmovd, 0b01, 0b000000);
|
||||||
INSN(fabsd, 0b000, 0b01, 0b000001);
|
INSN(fabsd, 0b01, 0b000001);
|
||||||
INSN(fnegd, 0b000, 0b01, 0b000010);
|
INSN(fnegd, 0b01, 0b000010);
|
||||||
INSN(fsqrtd, 0b000, 0b01, 0b000011);
|
INSN(fsqrtd, 0b01, 0b000011);
|
||||||
INSN(fcvtd, 0b000, 0b01, 0b000100); // Double-precision to single-precision
|
INSN(fcvtd, 0b01, 0b000100); // Double-precision to single-precision
|
||||||
|
|
||||||
private:
|
private:
|
||||||
void _fcvt_narrow_extend(FloatRegister Vd, SIMD_Arrangement Ta,
|
void _fcvt_narrow_extend(FloatRegister Vd, SIMD_Arrangement Ta,
|
||||||
|
@ -957,7 +957,9 @@ class LoadStorePairOp(InstructionWithModes):
|
|||||||
class FloatInstruction(Instruction):
|
class FloatInstruction(Instruction):
|
||||||
|
|
||||||
def aname(self):
|
def aname(self):
|
||||||
if (self._name.endswith("s") | self._name.endswith("d")):
|
if (self._name in ["fcvtsh", "fcvths"]):
|
||||||
|
return self._name[:len(self._name)-2]
|
||||||
|
elif (self._name.endswith("s") | self._name.endswith("d")):
|
||||||
return self._name[:len(self._name)-1]
|
return self._name[:len(self._name)-1]
|
||||||
else:
|
else:
|
||||||
return self._name
|
return self._name
|
||||||
@ -1012,6 +1014,8 @@ class SVEVectorOp(Instruction):
|
|||||||
elif not self._isPredicated and (name in ["and", "eor", "orr", "bic"]):
|
elif not self._isPredicated and (name in ["and", "eor", "orr", "bic"]):
|
||||||
self._width = RegVariant(3, 3)
|
self._width = RegVariant(3, 3)
|
||||||
self._bitwiseop = True
|
self._bitwiseop = True
|
||||||
|
elif name == "revb":
|
||||||
|
self._width = RegVariant(1, 3)
|
||||||
else:
|
else:
|
||||||
self._width = RegVariant(0, 3)
|
self._width = RegVariant(0, 3)
|
||||||
|
|
||||||
@ -1458,7 +1462,7 @@ generate(FourRegFloatOp,
|
|||||||
|
|
||||||
generate(TwoRegFloatOp,
|
generate(TwoRegFloatOp,
|
||||||
[["fmovs", "ss"], ["fabss", "ss"], ["fnegs", "ss"], ["fsqrts", "ss"],
|
[["fmovs", "ss"], ["fabss", "ss"], ["fnegs", "ss"], ["fsqrts", "ss"],
|
||||||
["fcvts", "ds"],
|
["fcvts", "ds"], ["fcvtsh", "hs"], ["fcvths", "sh"],
|
||||||
["fmovd", "dd"], ["fabsd", "dd"], ["fnegd", "dd"], ["fsqrtd", "dd"],
|
["fmovd", "dd"], ["fabsd", "dd"], ["fnegd", "dd"], ["fsqrtd", "dd"],
|
||||||
["fcvtd", "sd"],
|
["fcvtd", "sd"],
|
||||||
])
|
])
|
||||||
|
File diff suppressed because it is too large
Load Diff
Loading…
x
Reference in New Issue
Block a user