8295276: AArch64: Add backend support for half float conversion intrinsics

Reviewed-by: ngasson, aph, njian
This commit is contained in:
Bhavana Kilambi 2022-11-21 09:56:38 +00:00 committed by Ningsheng Jian
parent 3c0949824e
commit 891c706a10
4 changed files with 655 additions and 621 deletions

View File

@ -14577,6 +14577,32 @@ instruct convF2L_reg_reg(iRegLNoSp dst, vRegF src) %{
ins_pipe(fp_f2l); ins_pipe(fp_f2l);
%} %}
instruct convF2HF_reg_reg(iRegINoSp dst, vRegF src, vRegF tmp) %{
match(Set dst (ConvF2HF src));
format %{ "fcvt $tmp, $src\t# convert single to half precision\n\t"
"smov $dst, $tmp\t# move result from $tmp to $dst"
%}
effect(TEMP tmp);
ins_encode %{
__ fcvtsh($tmp$$FloatRegister, $src$$FloatRegister);
__ smov($dst$$Register, $tmp$$FloatRegister, __ H, 0);
%}
ins_pipe(pipe_slow);
%}
instruct convHF2F_reg_reg(vRegF dst, iRegINoSp src, vRegF tmp) %{
match(Set dst (ConvHF2F src));
format %{ "mov $tmp, $src\t# move source from $src to $tmp\n\t"
"fcvt $dst, $tmp\t# convert half to single precision"
%}
effect(TEMP tmp);
ins_encode %{
__ mov($tmp$$FloatRegister, __ H, 0, $src$$Register);
__ fcvths($dst$$FloatRegister, $tmp$$FloatRegister);
%}
ins_pipe(pipe_slow);
%}
instruct convI2F_reg_reg(vRegF dst, iRegIorL2I src) %{ instruct convI2F_reg_reg(vRegF dst, iRegIorL2I src) %{
match(Set dst (ConvI2F src)); match(Set dst (ConvI2F src));

View File

@ -1895,31 +1895,33 @@ void mvnw(Register Rd, Register Rm,
#undef INSN #undef INSN
// Floating-point data-processing (1 source) // Floating-point data-processing (1 source)
void data_processing(unsigned op31, unsigned type, unsigned opcode, void data_processing(unsigned type, unsigned opcode,
FloatRegister Vd, FloatRegister Vn) { FloatRegister Vd, FloatRegister Vn) {
starti; starti;
f(op31, 31, 29); f(0b000, 31, 29);
f(0b11110, 28, 24); f(0b11110, 28, 24);
f(type, 23, 22), f(1, 21), f(opcode, 20, 15), f(0b10000, 14, 10); f(type, 23, 22), f(1, 21), f(opcode, 20, 15), f(0b10000, 14, 10);
rf(Vn, 5), rf(Vd, 0); rf(Vn, 5), rf(Vd, 0);
} }
#define INSN(NAME, op31, type, opcode) \ #define INSN(NAME, type, opcode) \
void NAME(FloatRegister Vd, FloatRegister Vn) { \ void NAME(FloatRegister Vd, FloatRegister Vn) { \
data_processing(op31, type, opcode, Vd, Vn); \ data_processing(type, opcode, Vd, Vn); \
} }
INSN(fmovs, 0b000, 0b00, 0b000000); INSN(fmovs, 0b00, 0b000000);
INSN(fabss, 0b000, 0b00, 0b000001); INSN(fabss, 0b00, 0b000001);
INSN(fnegs, 0b000, 0b00, 0b000010); INSN(fnegs, 0b00, 0b000010);
INSN(fsqrts, 0b000, 0b00, 0b000011); INSN(fsqrts, 0b00, 0b000011);
INSN(fcvts, 0b000, 0b00, 0b000101); // Single-precision to double-precision INSN(fcvts, 0b00, 0b000101); // Single-precision to double-precision
INSN(fcvths, 0b11, 0b000100); // Half-precision to single-precision
INSN(fcvtsh, 0b00, 0b000111); // Single-precision to half-precision
INSN(fmovd, 0b000, 0b01, 0b000000); INSN(fmovd, 0b01, 0b000000);
INSN(fabsd, 0b000, 0b01, 0b000001); INSN(fabsd, 0b01, 0b000001);
INSN(fnegd, 0b000, 0b01, 0b000010); INSN(fnegd, 0b01, 0b000010);
INSN(fsqrtd, 0b000, 0b01, 0b000011); INSN(fsqrtd, 0b01, 0b000011);
INSN(fcvtd, 0b000, 0b01, 0b000100); // Double-precision to single-precision INSN(fcvtd, 0b01, 0b000100); // Double-precision to single-precision
private: private:
void _fcvt_narrow_extend(FloatRegister Vd, SIMD_Arrangement Ta, void _fcvt_narrow_extend(FloatRegister Vd, SIMD_Arrangement Ta,

View File

@ -957,7 +957,9 @@ class LoadStorePairOp(InstructionWithModes):
class FloatInstruction(Instruction): class FloatInstruction(Instruction):
def aname(self): def aname(self):
if (self._name.endswith("s") | self._name.endswith("d")): if (self._name in ["fcvtsh", "fcvths"]):
return self._name[:len(self._name)-2]
elif (self._name.endswith("s") | self._name.endswith("d")):
return self._name[:len(self._name)-1] return self._name[:len(self._name)-1]
else: else:
return self._name return self._name
@ -1012,6 +1014,8 @@ class SVEVectorOp(Instruction):
elif not self._isPredicated and (name in ["and", "eor", "orr", "bic"]): elif not self._isPredicated and (name in ["and", "eor", "orr", "bic"]):
self._width = RegVariant(3, 3) self._width = RegVariant(3, 3)
self._bitwiseop = True self._bitwiseop = True
elif name == "revb":
self._width = RegVariant(1, 3)
else: else:
self._width = RegVariant(0, 3) self._width = RegVariant(0, 3)
@ -1458,7 +1462,7 @@ generate(FourRegFloatOp,
generate(TwoRegFloatOp, generate(TwoRegFloatOp,
[["fmovs", "ss"], ["fabss", "ss"], ["fnegs", "ss"], ["fsqrts", "ss"], [["fmovs", "ss"], ["fabss", "ss"], ["fnegs", "ss"], ["fsqrts", "ss"],
["fcvts", "ds"], ["fcvts", "ds"], ["fcvtsh", "hs"], ["fcvths", "sh"],
["fmovd", "dd"], ["fabsd", "dd"], ["fnegd", "dd"], ["fsqrtd", "dd"], ["fmovd", "dd"], ["fabsd", "dd"], ["fnegd", "dd"], ["fsqrtd", "dd"],
["fcvtd", "sd"], ["fcvtd", "sd"],
]) ])

File diff suppressed because it is too large Load Diff