8284125: AArch64: Remove partial masked operations for SVE

Reviewed-by: njian, ngasson
This commit is contained in:
Eric Liu 2022-04-12 13:17:27 +00:00 committed by Nick Gasson
parent 83466434fd
commit a5378fb8c0
2 changed files with 342 additions and 1292 deletions

File diff suppressed because it is too large Load Diff

View File

@ -279,8 +279,7 @@ instruct storeV_partial(vReg src, vmemA mem, pRegGov pgtmp, rFlagsReg cr) %{
// vector load/store - predicated // vector load/store - predicated
instruct loadV_masked(vReg dst, vmemA mem, pRegGov pg) %{ instruct loadV_masked(vReg dst, vmemA mem, pRegGov pg) %{
predicate(UseSVE > 0 && predicate(UseSVE > 0);
n->as_LoadVector()->memory_size() == MaxVectorSize);
match(Set dst (LoadVectorMasked mem pg)); match(Set dst (LoadVectorMasked mem pg));
ins_cost(4 * SVE_COST); ins_cost(4 * SVE_COST);
format %{ "sve_ldr $dst, $pg, $mem\t# load vector predicated (sve)" %} format %{ "sve_ldr $dst, $pg, $mem\t# load vector predicated (sve)" %}
@ -293,29 +292,8 @@ instruct loadV_masked(vReg dst, vmemA mem, pRegGov pg) %{
ins_pipe(pipe_slow); ins_pipe(pipe_slow);
%} %}
instruct loadV_masked_partial(vReg dst, vmemA mem, pRegGov pg, pRegGov pgtmp, rFlagsReg cr) %{
predicate(UseSVE > 0 &&
n->as_LoadVector()->memory_size() < MaxVectorSize);
match(Set dst (LoadVectorMasked mem pg));
effect(TEMP pgtmp, KILL cr);
ins_cost(6 * SVE_COST);
format %{ "sve_ldr $dst, $pg, $mem\t# load vector predicated partial (sve)" %}
ins_encode %{
BasicType bt = Matcher::vector_element_basic_type(this);
__ sve_ptrue_lanecnt(as_PRegister($pgtmp$$reg), __ elemType_to_regVariant(bt),
Matcher::vector_length(this));
__ sve_and(as_PRegister($pgtmp$$reg), as_PRegister($pgtmp$$reg),
as_PRegister($pg$$reg), as_PRegister($pg$$reg));
loadStoreA_predicated(C2_MacroAssembler(&cbuf), false, as_FloatRegister($dst$$reg),
as_PRegister($pgtmp$$reg), bt, bt, $mem->opcode(),
as_Register($mem$$base), $mem$$index, $mem$$scale, $mem$$disp);
%}
ins_pipe(pipe_slow);
%}
instruct storeV_masked(vReg src, vmemA mem, pRegGov pg) %{ instruct storeV_masked(vReg src, vmemA mem, pRegGov pg) %{
predicate(UseSVE > 0 && predicate(UseSVE > 0);
n->as_StoreVector()->memory_size() == MaxVectorSize);
match(Set mem (StoreVectorMasked mem (Binary src pg))); match(Set mem (StoreVectorMasked mem (Binary src pg)));
ins_cost(4 * SVE_COST); ins_cost(4 * SVE_COST);
format %{ "sve_str $mem, $pg, $src\t# store vector predicated (sve)" %} format %{ "sve_str $mem, $pg, $src\t# store vector predicated (sve)" %}
@ -328,82 +306,6 @@ instruct storeV_masked(vReg src, vmemA mem, pRegGov pg) %{
ins_pipe(pipe_slow); ins_pipe(pipe_slow);
%} %}
instruct storeV_masked_partial(vReg src, vmemA mem, pRegGov pg, pRegGov pgtmp, rFlagsReg cr) %{
predicate(UseSVE > 0 &&
n->as_StoreVector()->memory_size() < MaxVectorSize);
match(Set mem (StoreVectorMasked mem (Binary src pg)));
effect(TEMP pgtmp, KILL cr);
ins_cost(6 * SVE_COST);
format %{ "sve_str $mem, $pg, $src\t# store vector predicated partial (sve)" %}
ins_encode %{
BasicType bt = Matcher::vector_element_basic_type(this, $src);
__ sve_ptrue_lanecnt(as_PRegister($pgtmp$$reg), __ elemType_to_regVariant(bt),
Matcher::vector_length(this, $src));
__ sve_and(as_PRegister($pgtmp$$reg), as_PRegister($pgtmp$$reg),
as_PRegister($pg$$reg), as_PRegister($pg$$reg));
loadStoreA_predicated(C2_MacroAssembler(&cbuf), true, as_FloatRegister($src$$reg),
as_PRegister($pgtmp$$reg), bt, bt, $mem->opcode(),
as_Register($mem$$base), $mem$$index, $mem$$scale, $mem$$disp);
%}
ins_pipe(pipe_slow);
%}
dnl
dnl MASKALL_IMM($1, $2 )
dnl MASKALL_IMM(type, size)
define(`MASKALL_IMM', `
instruct vmaskAll_imm$1(pRegGov dst, imm$1 src) %{
predicate(UseSVE > 0);
match(Set dst (MaskAll src));
ins_cost(SVE_COST);
format %{ "sve_ptrue_lanecnt/sve_pfalse $dst\t# mask all (sve) ($2)" %}
ins_encode %{
ifelse($1, `I', int, long) con = (ifelse($1, `I', int, long))$src$$constant;
if (con == 0) {
__ sve_pfalse(as_PRegister($dst$$reg));
} else {
assert(con == -1, "invalid constant value for mask");
BasicType bt = Matcher::vector_element_basic_type(this);
__ sve_ptrue_lanecnt(as_PRegister($dst$$reg), __ elemType_to_regVariant(bt),
Matcher::vector_length(this));
}
%}
ins_pipe(pipe_slow);
%}')dnl
dnl
dnl MASKALL($1, $2 )
dnl MASKALL(type, size)
define(`MASKALL', `
instruct vmaskAll$1(pRegGov dst, ifelse($1, `I', iRegIorL2I, iRegL) src, vReg tmp, rFlagsReg cr) %{
predicate(UseSVE > 0);
match(Set dst (MaskAll src));
effect(TEMP tmp, KILL cr);
ins_cost(3 * SVE_COST);
format %{ "sve_dup $tmp, $src\n\t"
"sve_ptrue $dst, vector_length\n\t"
"sve_cmpne $dst, $dst, $tmp, 0\t# mask all (sve) ($2)" %}
ins_encode %{
BasicType bt = Matcher::vector_element_basic_type(this);
Assembler::SIMD_RegVariant size = __ elemType_to_regVariant(bt);
uint length_in_bytes = Matcher::vector_length_in_bytes(this);
__ sve_dup(as_FloatRegister($tmp$$reg), size, as_Register($src$$reg));
if (length_in_bytes < MaxVectorSize) {
__ sve_ptrue_lanecnt(as_PRegister($dst$$reg), size, Matcher::vector_length(this));
__ sve_cmp(Assembler::NE, as_PRegister($dst$$reg), size,
as_PRegister($dst$$reg), as_FloatRegister($tmp$$reg), 0);
} else {
__ sve_cmp(Assembler::NE, as_PRegister($dst$$reg), size, ptrue, as_FloatRegister($tmp$$reg), 0);
}
%}
ins_pipe(pipe_slow);
%}')dnl
dnl
// maskAll (full or partial predicate size)
MASKALL_IMM(I, B/H/S)
MASKALL(I, B/H/S)
MASKALL_IMM(L, D)
MASKALL(L, D)
dnl dnl
dnl MASK_LOGICAL_OP($1, $2, $3 ) dnl MASK_LOGICAL_OP($1, $2, $3 )
dnl MASK_LOGICAL_OP(insn_name, op_name, insn) dnl MASK_LOGICAL_OP(insn_name, op_name, insn)
@ -1281,36 +1183,6 @@ instruct vpopcountI(vReg dst, vReg src) %{
ins_pipe(pipe_slow); ins_pipe(pipe_slow);
%} %}
// vector mask compare
instruct vmaskcmp(pRegGov dst, vReg src1, vReg src2, immI cond, rFlagsReg cr) %{
predicate(UseSVE > 0);
match(Set dst (VectorMaskCmp (Binary src1 src2) cond));
effect(KILL cr);
ins_cost(SVE_COST);
format %{ "sve_cmp $dst, $src1, $src2\t# vector mask cmp (sve)" %}
ins_encode %{
BasicType bt = Matcher::vector_element_basic_type(this);
__ sve_compare(as_PRegister($dst$$reg), bt, ptrue, as_FloatRegister($src1$$reg),
as_FloatRegister($src2$$reg), (int)$cond$$constant);
%}
ins_pipe(pipe_slow);
%}
instruct vmaskcmp_masked(pRegGov dst, vReg src1, vReg src2, immI cond, pRegGov pg, rFlagsReg cr) %{
predicate(UseSVE > 0);
match(Set dst (VectorMaskCmp (Binary src1 src2) (Binary cond pg)));
effect(KILL cr);
ins_cost(SVE_COST);
format %{ "sve_cmp $dst, $pg, $src1, $src2\t# vector mask cmp (sve)" %}
ins_encode %{
BasicType bt = Matcher::vector_element_basic_type(this);
__ sve_compare(as_PRegister($dst$$reg), bt, as_PRegister($pg$$reg), as_FloatRegister($src1$$reg),
as_FloatRegister($src2$$reg), (int)$cond$$constant);
%}
ins_pipe(pipe_slow);
%}
// vector blend // vector blend
instruct vblend(vReg dst, vReg src1, vReg src2, pRegGov pg) %{ instruct vblend(vReg dst, vReg src1, vReg src2, pRegGov pg) %{
@ -1327,37 +1199,6 @@ instruct vblend(vReg dst, vReg src1, vReg src2, pRegGov pg) %{
ins_pipe(pipe_slow); ins_pipe(pipe_slow);
%} %}
// vector load mask
instruct vloadmaskB(pRegGov dst, vReg src, rFlagsReg cr) %{
predicate(UseSVE > 0 &&
n->bottom_type()->is_vect()->element_basic_type() == T_BYTE);
match(Set dst (VectorLoadMask src));
effect(KILL cr);
ins_cost(SVE_COST);
format %{ "vloadmaskB $dst, $src\t# vector load mask (sve) (B)" %}
ins_encode %{
__ sve_cmp(Assembler::NE, as_PRegister($dst$$reg), __ B,
ptrue, as_FloatRegister($src$$reg), 0);
%}
ins_pipe(pipe_slow);
%}
instruct vloadmask_extend(pRegGov dst, vReg src, vReg tmp, rFlagsReg cr) %{
predicate(UseSVE > 0 && n->bottom_type()->is_vect()->element_basic_type() != T_BYTE);
match(Set dst (VectorLoadMask src));
effect(TEMP tmp, KILL cr);
ins_cost(3 * SVE_COST);
format %{ "vloadmask $dst, $src\t# vector load mask (sve) (H/S/D)" %}
ins_encode %{
BasicType bt = Matcher::vector_element_basic_type(this);
Assembler::SIMD_RegVariant size = __ elemType_to_regVariant(bt);
__ sve_vector_extend(as_FloatRegister($tmp$$reg), size, as_FloatRegister($src$$reg), __ B);
__ sve_cmp(Assembler::NE, as_PRegister($dst$$reg), size, ptrue, as_FloatRegister($tmp$$reg), 0);
%}
ins_pipe(pipe_slow);
%}
// vector store mask // vector store mask
instruct vstoremaskB(vReg dst, pRegGov src, immI_1 size) %{ instruct vstoremaskB(vReg dst, pRegGov src, immI_1 size) %{
@ -1616,11 +1457,9 @@ dnl REDUCE_I_PREDICATE(insn_name, op_name)
define(`REDUCE_I_PREDICATE', ` define(`REDUCE_I_PREDICATE', `
instruct reduce_$1I_masked(iRegINoSp dst, iRegIorL2I src1, vReg src2, vRegD tmp, pRegGov pg) %{ instruct reduce_$1I_masked(iRegINoSp dst, iRegIorL2I src1, vReg src2, vRegD tmp, pRegGov pg) %{
ifelse($2, AddReductionVI, ifelse($2, AddReductionVI,
`predicate(UseSVE > 0);',
`predicate(UseSVE > 0 && `predicate(UseSVE > 0 &&
n->in(1)->in(2)->bottom_type()->is_vect()->length_in_bytes() == MaxVectorSize);', n->in(1)->in(2)->bottom_type()->is_vect()->element_basic_type() != T_LONG);')
`predicate(UseSVE > 0 &&
n->in(1)->in(2)->bottom_type()->is_vect()->element_basic_type() != T_LONG &&
n->in(1)->in(2)->bottom_type()->is_vect()->length_in_bytes() == MaxVectorSize);')
match(Set dst ($2 (Binary src1 src2) pg)); match(Set dst ($2 (Binary src1 src2) pg));
effect(TEMP_DEF dst, TEMP tmp); effect(TEMP_DEF dst, TEMP tmp);
ins_cost(SVE_COST); ins_cost(SVE_COST);
@ -1639,11 +1478,9 @@ dnl REDUCE_L_PREDICATE(insn_name, op_name)
define(`REDUCE_L_PREDICATE', ` define(`REDUCE_L_PREDICATE', `
instruct reduce_$1L_masked(iRegLNoSp dst, iRegL src1, vReg src2, vRegD tmp, pRegGov pg) %{ instruct reduce_$1L_masked(iRegLNoSp dst, iRegL src1, vReg src2, vRegD tmp, pRegGov pg) %{
ifelse($2, AddReductionVL, ifelse($2, AddReductionVL,
`predicate(UseSVE > 0);',
`predicate(UseSVE > 0 && `predicate(UseSVE > 0 &&
n->in(1)->in(2)->bottom_type()->is_vect()->length_in_bytes() == MaxVectorSize);', n->in(1)->in(2)->bottom_type()->is_vect()->element_basic_type() == T_LONG);')
`predicate(UseSVE > 0 &&
n->in(1)->in(2)->bottom_type()->is_vect()->element_basic_type() == T_LONG &&
n->in(1)->in(2)->bottom_type()->is_vect()->length_in_bytes() == MaxVectorSize);')
match(Set dst ($2 (Binary src1 src2) pg)); match(Set dst ($2 (Binary src1 src2) pg));
effect(TEMP_DEF dst, TEMP tmp); effect(TEMP_DEF dst, TEMP tmp);
ins_cost(SVE_COST); ins_cost(SVE_COST);
@ -1656,66 +1493,11 @@ instruct reduce_$1L_masked(iRegLNoSp dst, iRegL src1, vReg src2, vRegD tmp, pReg
ins_pipe(pipe_slow); ins_pipe(pipe_slow);
%}')dnl %}')dnl
dnl dnl
dnl REDUCE_I_PREDICATE_PARTIAL($1, $2 )
dnl REDUCE_I_PREDICATE_PARTIAL(insn_name, op_name)
define(`REDUCE_I_PREDICATE_PARTIAL', `
instruct reduce_$1I_masked_partial(iRegINoSp dst, iRegIorL2I src1, vReg src2, vRegD vtmp,
pRegGov pg, pRegGov ptmp, rFlagsReg cr) %{
ifelse($2, AddReductionVI,
`predicate(UseSVE > 0 &&
n->in(1)->in(2)->bottom_type()->is_vect()->length_in_bytes() < MaxVectorSize);',
`predicate(UseSVE > 0 &&
n->in(1)->in(2)->bottom_type()->is_vect()->element_basic_type() != T_LONG &&
n->in(1)->in(2)->bottom_type()->is_vect()->length_in_bytes() < MaxVectorSize);')
match(Set dst ($2 (Binary src1 src2) pg));
effect(TEMP_DEF dst, TEMP vtmp, TEMP ptmp, KILL cr);
ins_cost(3 * SVE_COST);
format %{ "sve_reduce_$1I $dst, $src1, $pg, $src2\t# $1I reduction predicated partial (sve) (may extend)" %}
ins_encode %{
BasicType bt = Matcher::vector_element_basic_type(this, $src2);
Assembler::SIMD_RegVariant variant = __ elemType_to_regVariant(bt);
__ sve_ptrue_lanecnt(as_PRegister($ptmp$$reg), variant, Matcher::vector_length(this, $src2));
__ sve_and(as_PRegister($ptmp$$reg), as_PRegister($ptmp$$reg),
as_PRegister($pg$$reg), as_PRegister($pg$$reg));
__ sve_reduce_integral(this->ideal_Opcode(), $dst$$Register, bt,
$src1$$Register, as_FloatRegister($src2$$reg),
as_PRegister($ptmp$$reg), as_FloatRegister($vtmp$$reg));
%}
ins_pipe(pipe_slow);
%}')dnl
dnl
dnl REDUCE_L_PREDICATE_PARTIAL($1, $2 )
dnl REDUCE_L_PREDICATE_PARTIAL(insn_name, op_name)
define(`REDUCE_L_PREDICATE_PARTIAL', `
instruct reduce_$1L_masked_partial(iRegLNoSp dst, iRegL src1, vReg src2, vRegD vtmp,
pRegGov pg, pRegGov ptmp, rFlagsReg cr) %{
ifelse($2, AddReductionVL,
`predicate(UseSVE > 0 &&
n->in(1)->in(2)->bottom_type()->is_vect()->length_in_bytes() < MaxVectorSize);',
`predicate(UseSVE > 0 &&
n->in(1)->in(2)->bottom_type()->is_vect()->element_basic_type() == T_LONG &&
n->in(1)->in(2)->bottom_type()->is_vect()->length_in_bytes() < MaxVectorSize);')
match(Set dst ($2 (Binary src1 src2) pg));
effect(TEMP_DEF dst, TEMP vtmp, TEMP ptmp, KILL cr);
ins_cost(3 * SVE_COST);
format %{ "sve_reduce_$1L $dst, $src1, $pg, $src2\t# $1L reduction predicated partial (sve)" %}
ins_encode %{
__ sve_ptrue_lanecnt(as_PRegister($ptmp$$reg), __ D, Matcher::vector_length(this, $src2));
__ sve_and(as_PRegister($ptmp$$reg), as_PRegister($ptmp$$reg),
as_PRegister($pg$$reg), as_PRegister($pg$$reg));
__ sve_reduce_integral(this->ideal_Opcode(), $dst$$Register, T_LONG,
$src1$$Register, as_FloatRegister($src2$$reg),
as_PRegister($ptmp$$reg), as_FloatRegister($vtmp$$reg));
%}
ins_pipe(pipe_slow);
%}')dnl
dnl
dnl REDUCE_ADDF_PREDICATE($1, $2, $3, $4 ) dnl REDUCE_ADDF_PREDICATE($1, $2, $3, $4 )
dnl REDUCE_ADDF_PREDICATE(insn_name, op_name, reg_dst, size) dnl REDUCE_ADDF_PREDICATE(insn_name, op_name, reg_dst, size)
define(`REDUCE_ADDF_PREDICATE', ` define(`REDUCE_ADDF_PREDICATE', `
instruct reduce_$1_masked($3 src1_dst, vReg src2, pRegGov pg) %{ instruct reduce_$1_masked($3 src1_dst, vReg src2, pRegGov pg) %{
predicate(UseSVE > 0 && predicate(UseSVE > 0);
n->in(1)->in(2)->bottom_type()->is_vect()->length_in_bytes() == MaxVectorSize);
match(Set src1_dst ($2 (Binary src1_dst src2) pg)); match(Set src1_dst ($2 (Binary src1_dst src2) pg));
ins_cost(SVE_COST); ins_cost(SVE_COST);
format %{ "sve_reduce_$1 $src1_dst, $pg, $src2\t# $1 reduction predicated (sve)" %} format %{ "sve_reduce_$1 $src1_dst, $pg, $src2\t# $1 reduction predicated (sve)" %}
@ -1726,26 +1508,6 @@ instruct reduce_$1_masked($3 src1_dst, vReg src2, pRegGov pg) %{
ins_pipe(pipe_slow); ins_pipe(pipe_slow);
%}')dnl %}')dnl
dnl dnl
dnl REDUCE_ADDF_PREDICATE_PARTIAL($1, $2, $3, $4 )
dnl REDUCE_ADDF_PREDICATE_PARTIAL(insn_name, op_name, reg_dst, size)
define(`REDUCE_ADDF_PREDICATE_PARTIAL', `
instruct reduce_$1_masked_partial($3 src1_dst, vReg src2, pRegGov pg, pRegGov ptmp, rFlagsReg cr) %{
predicate(UseSVE > 0 &&
n->in(1)->in(2)->bottom_type()->is_vect()->length_in_bytes() < MaxVectorSize);
match(Set src1_dst ($2 (Binary src1_dst src2) pg));
effect(TEMP ptmp, KILL cr);
ins_cost(SVE_COST);
format %{ "sve_reduce_$1 $src1_dst, $pg, $src2\t# $1 reduction predicated partial (sve)" %}
ins_encode %{
__ sve_ptrue_lanecnt(as_PRegister($ptmp$$reg), __ $4, Matcher::vector_length(this, $src2));
__ sve_and(as_PRegister($ptmp$$reg), as_PRegister($ptmp$$reg),
as_PRegister($pg$$reg), as_PRegister($pg$$reg));
__ sve_fadda(as_FloatRegister($src1_dst$$reg), __ $4,
as_PRegister($ptmp$$reg), as_FloatRegister($src2$$reg));
%}
ins_pipe(pipe_slow);
%}')dnl
dnl
// vector add reduction // vector add reduction
REDUCE_I(add, AddReductionVI) REDUCE_I(add, AddReductionVI)
@ -1762,10 +1524,6 @@ REDUCE_I_PREDICATE(add, AddReductionVI)
REDUCE_L_PREDICATE(add, AddReductionVL) REDUCE_L_PREDICATE(add, AddReductionVL)
REDUCE_ADDF_PREDICATE(addF, AddReductionVF, vRegF, S) REDUCE_ADDF_PREDICATE(addF, AddReductionVF, vRegF, S)
REDUCE_ADDF_PREDICATE(addD, AddReductionVD, vRegD, D) REDUCE_ADDF_PREDICATE(addD, AddReductionVD, vRegD, D)
REDUCE_I_PREDICATE_PARTIAL(add, AddReductionVI)
REDUCE_L_PREDICATE_PARTIAL(add, AddReductionVL)
REDUCE_ADDF_PREDICATE_PARTIAL(addF, AddReductionVF, vRegF, S)
REDUCE_ADDF_PREDICATE_PARTIAL(addD, AddReductionVD, vRegD, D)
// vector and reduction // vector and reduction
REDUCE_I(and, AndReductionV) REDUCE_I(and, AndReductionV)
@ -1776,8 +1534,6 @@ REDUCE_L_PARTIAL(and, AndReductionV)
// vector and reduction - predicated // vector and reduction - predicated
REDUCE_I_PREDICATE(and, AndReductionV) REDUCE_I_PREDICATE(and, AndReductionV)
REDUCE_L_PREDICATE(and, AndReductionV) REDUCE_L_PREDICATE(and, AndReductionV)
REDUCE_I_PREDICATE_PARTIAL(and, AndReductionV)
REDUCE_L_PREDICATE_PARTIAL(and, AndReductionV)
// vector or reduction // vector or reduction
REDUCE_I(or, OrReductionV) REDUCE_I(or, OrReductionV)
@ -1788,8 +1544,6 @@ REDUCE_L_PARTIAL(or, OrReductionV)
// vector or reduction - predicated // vector or reduction - predicated
REDUCE_I_PREDICATE(or, OrReductionV) REDUCE_I_PREDICATE(or, OrReductionV)
REDUCE_L_PREDICATE(or, OrReductionV) REDUCE_L_PREDICATE(or, OrReductionV)
REDUCE_I_PREDICATE_PARTIAL(or, OrReductionV)
REDUCE_L_PREDICATE_PARTIAL(or, OrReductionV)
// vector xor reduction // vector xor reduction
REDUCE_I(eor, XorReductionV) REDUCE_I(eor, XorReductionV)
@ -1800,8 +1554,6 @@ REDUCE_L_PARTIAL(eor, XorReductionV)
// vector xor reduction - predicated // vector xor reduction - predicated
REDUCE_I_PREDICATE(eor, XorReductionV) REDUCE_I_PREDICATE(eor, XorReductionV)
REDUCE_L_PREDICATE(eor, XorReductionV) REDUCE_L_PREDICATE(eor, XorReductionV)
REDUCE_I_PREDICATE_PARTIAL(eor, XorReductionV)
REDUCE_L_PREDICATE_PARTIAL(eor, XorReductionV)
dnl dnl
dnl REDUCE_MAXMIN_I($1, $2 ) dnl REDUCE_MAXMIN_I($1, $2 )
@ -1895,7 +1647,6 @@ define(`REDUCE_MAXMIN_I_PREDICATE', `
instruct reduce_$1I_masked(iRegINoSp dst, iRegIorL2I src1, vReg src2, vRegD tmp, instruct reduce_$1I_masked(iRegINoSp dst, iRegIorL2I src1, vReg src2, vRegD tmp,
pRegGov pg, rFlagsReg cr) %{ pRegGov pg, rFlagsReg cr) %{
predicate(UseSVE > 0 && predicate(UseSVE > 0 &&
n->in(1)->in(2)->bottom_type()->is_vect()->length_in_bytes() == MaxVectorSize &&
n->in(1)->in(2)->bottom_type()->is_vect()->element_basic_type() != T_LONG && n->in(1)->in(2)->bottom_type()->is_vect()->element_basic_type() != T_LONG &&
is_integral_type(n->in(1)->in(2)->bottom_type()->is_vect()->element_basic_type())); is_integral_type(n->in(1)->in(2)->bottom_type()->is_vect()->element_basic_type()));
match(Set dst ($2 (Binary src1 src2) pg)); match(Set dst ($2 (Binary src1 src2) pg));
@ -1917,7 +1668,6 @@ define(`REDUCE_MAXMIN_L_PREDICATE', `
instruct reduce_$1L_masked(iRegLNoSp dst, iRegL src1, vReg src2, vRegD tmp, instruct reduce_$1L_masked(iRegLNoSp dst, iRegL src1, vReg src2, vRegD tmp,
pRegGov pg, rFlagsReg cr) %{ pRegGov pg, rFlagsReg cr) %{
predicate(UseSVE > 0 && predicate(UseSVE > 0 &&
n->in(1)->in(2)->bottom_type()->is_vect()->length_in_bytes() == MaxVectorSize &&
n->in(1)->in(2)->bottom_type()->is_vect()->element_basic_type() == T_LONG); n->in(1)->in(2)->bottom_type()->is_vect()->element_basic_type() == T_LONG);
match(Set dst ($2 (Binary src1 src2) pg)); match(Set dst ($2 (Binary src1 src2) pg));
effect(TEMP_DEF dst, TEMP tmp, KILL cr); effect(TEMP_DEF dst, TEMP tmp, KILL cr);
@ -1931,55 +1681,6 @@ instruct reduce_$1L_masked(iRegLNoSp dst, iRegL src1, vReg src2, vRegD tmp,
ins_pipe(pipe_slow); ins_pipe(pipe_slow);
%}')dnl %}')dnl
dnl dnl
dnl REDUCE_MAXMIN_I_PREDICATE_PARTIAL($1 , $2 )
dnl REDUCE_MAXMIN_I_PREDICATE_PARTIAL(min_max, op_name)
define(`REDUCE_MAXMIN_I_PREDICATE_PARTIAL', `
instruct reduce_$1I_masked_partial(iRegINoSp dst, iRegIorL2I src1, vReg src2, vRegD vtmp,
pRegGov pg, pRegGov ptmp, rFlagsReg cr) %{
predicate(UseSVE > 0 &&
n->in(1)->in(2)->bottom_type()->is_vect()->length_in_bytes() < MaxVectorSize &&
n->in(1)->in(2)->bottom_type()->is_vect()->element_basic_type() != T_LONG &&
is_integral_type(n->in(1)->in(2)->bottom_type()->is_vect()->element_basic_type()));
match(Set dst ($2 (Binary src1 src2) pg));
effect(TEMP_DEF dst, TEMP vtmp, TEMP ptmp, KILL cr);
ins_cost(3 * SVE_COST);
format %{ "sve_reduce_$1I $dst, $src1, $pg, $src2\t# $1I reduction predicated partial (sve)" %}
ins_encode %{
BasicType bt = Matcher::vector_element_basic_type(this, $src2);
Assembler::SIMD_RegVariant variant = __ elemType_to_regVariant(bt);
__ sve_ptrue_lanecnt(as_PRegister($ptmp$$reg), variant, Matcher::vector_length(this, $src2));
__ sve_and(as_PRegister($ptmp$$reg), as_PRegister($ptmp$$reg),
as_PRegister($pg$$reg), as_PRegister($pg$$reg));
__ sve_reduce_integral(this->ideal_Opcode(), $dst$$Register, bt,
$src1$$Register, as_FloatRegister($src2$$reg),
as_PRegister($ptmp$$reg), as_FloatRegister($vtmp$$reg));
%}
ins_pipe(pipe_slow);
%}')dnl
dnl
dnl REDUCE_MAXMIN_L_PREDICATE_PARTIAL($1 , $2 )
dnl REDUCE_MAXMIN_L_PREDICATE_PARTIAL(min_max, op_name)
define(`REDUCE_MAXMIN_L_PREDICATE_PARTIAL', `
instruct reduce_$1L_masked_partial(iRegLNoSp dst, iRegL src1, vReg src2, vRegD vtmp,
pRegGov pg, pRegGov ptmp, rFlagsReg cr) %{
predicate(UseSVE > 0 &&
n->in(1)->in(2)->bottom_type()->is_vect()->length_in_bytes() < MaxVectorSize &&
n->in(1)->in(2)->bottom_type()->is_vect()->element_basic_type() == T_LONG);
match(Set dst ($2 (Binary src1 src2) pg));
effect(TEMP_DEF dst, TEMP vtmp, TEMP ptmp, KILL cr);
ins_cost(3 * SVE_COST);
format %{ "sve_reduce_$1L $dst, $src1, $pg, $src2\t# $1L reduction predicated partial (sve)" %}
ins_encode %{
__ sve_ptrue_lanecnt(as_PRegister($ptmp$$reg), __ D, Matcher::vector_length(this, $src2));
__ sve_and(as_PRegister($ptmp$$reg), as_PRegister($ptmp$$reg),
as_PRegister($pg$$reg), as_PRegister($pg$$reg));
__ sve_reduce_integral(this->ideal_Opcode(), $dst$$Register, T_LONG,
$src1$$Register, as_FloatRegister($src2$$reg),
as_PRegister($ptmp$$reg), as_FloatRegister($vtmp$$reg));
%}
ins_pipe(pipe_slow);
%}')dnl
dnl
dnl REDUCE_FMINMAX($1, $2, $3, $4, $5 ) dnl REDUCE_FMINMAX($1, $2, $3, $4, $5 )
dnl REDUCE_FMINMAX(min_max, name_suffix, element_type, size, reg_src_dst) dnl REDUCE_FMINMAX(min_max, name_suffix, element_type, size, reg_src_dst)
define(`REDUCE_FMINMAX', ` define(`REDUCE_FMINMAX', `
@ -2023,8 +1724,7 @@ dnl REDUCE_FMINMAX_PREDICATE(min_max, name_suffix, element_type, size, reg_src_d
define(`REDUCE_FMINMAX_PREDICATE', ` define(`REDUCE_FMINMAX_PREDICATE', `
instruct reduce_$1$2_masked($5 dst, $5 src1, vReg src2, pRegGov pg) %{ instruct reduce_$1$2_masked($5 dst, $5 src1, vReg src2, pRegGov pg) %{
predicate(UseSVE > 0 && predicate(UseSVE > 0 &&
n->in(1)->in(2)->bottom_type()->is_vect()->element_basic_type() == $3 && n->in(1)->in(2)->bottom_type()->is_vect()->element_basic_type() == $3);
n->in(1)->in(2)->bottom_type()->is_vect()->length_in_bytes() == MaxVectorSize);
match(Set dst (translit($1, `m', `M')ReductionV (Binary src1 src2) pg)); match(Set dst (translit($1, `m', `M')ReductionV (Binary src1 src2) pg));
ins_cost(SVE_COST); ins_cost(SVE_COST);
effect(TEMP_DEF dst); effect(TEMP_DEF dst);
@ -2036,28 +1736,6 @@ instruct reduce_$1$2_masked($5 dst, $5 src1, vReg src2, pRegGov pg) %{
ins_pipe(pipe_slow); ins_pipe(pipe_slow);
%}')dnl %}')dnl
dnl dnl
dnl REDUCE_FMINMAX_PREDICATE_PARTIAL($1, $2, $3, $4, $5 )
dnl REDUCE_FMINMAX_PREDICATE_PARTIAL(min_max, name_suffix, element_type, size, reg_src_dst)
define(`REDUCE_FMINMAX_PREDICATE_PARTIAL', `
instruct reduce_$1$2_masked_partial($5 dst, $5 src1, vReg src2, pRegGov pg,
pRegGov ptmp, rFlagsReg cr) %{
predicate(UseSVE > 0 &&
n->in(1)->in(2)->bottom_type()->is_vect()->element_basic_type() == $3 &&
n->in(1)->in(2)->bottom_type()->is_vect()->length_in_bytes() < MaxVectorSize);
match(Set dst (translit($1, `m', `M')ReductionV (Binary src1 src2) pg));
effect(TEMP_DEF dst, TEMP ptmp, KILL cr);
ins_cost(3 * SVE_COST);
format %{ "sve_reduce_$1$2 $dst, $src1, $pg, $src2\t# $1$2 reduction predicated partial (sve)" %}
ins_encode %{
__ sve_ptrue_lanecnt(as_PRegister($ptmp$$reg), __ $4, Matcher::vector_length(this, $src2));
__ sve_and(as_PRegister($ptmp$$reg), as_PRegister($ptmp$$reg),
as_PRegister($pg$$reg), as_PRegister($pg$$reg));
__ sve_f$1v(as_FloatRegister($dst$$reg), __ $4,
as_PRegister($ptmp$$reg), as_FloatRegister($src2$$reg));
__ f`$1'translit($4, `SD', `sd')(as_FloatRegister($dst$$reg), as_FloatRegister($dst$$reg), as_FloatRegister($src1$$reg));
%}
ins_pipe(pipe_slow);
%}')dnl
// vector max reduction // vector max reduction
REDUCE_MAXMIN_I(max, MaxReductionV) REDUCE_MAXMIN_I(max, MaxReductionV)
REDUCE_MAXMIN_L(max, MaxReductionV) REDUCE_MAXMIN_L(max, MaxReductionV)
@ -2071,12 +1749,8 @@ REDUCE_FMINMAX_PARTIAL(max, D, T_DOUBLE, D, vRegD)
// vector max reduction - predicated // vector max reduction - predicated
REDUCE_MAXMIN_I_PREDICATE(max, MaxReductionV) REDUCE_MAXMIN_I_PREDICATE(max, MaxReductionV)
REDUCE_MAXMIN_L_PREDICATE(max, MaxReductionV) REDUCE_MAXMIN_L_PREDICATE(max, MaxReductionV)
REDUCE_MAXMIN_I_PREDICATE_PARTIAL(max, MaxReductionV)
REDUCE_MAXMIN_L_PREDICATE_PARTIAL(max, MaxReductionV)
REDUCE_FMINMAX_PREDICATE(max, F, T_FLOAT, S, vRegF) REDUCE_FMINMAX_PREDICATE(max, F, T_FLOAT, S, vRegF)
REDUCE_FMINMAX_PREDICATE(max, D, T_DOUBLE, D, vRegD) REDUCE_FMINMAX_PREDICATE(max, D, T_DOUBLE, D, vRegD)
REDUCE_FMINMAX_PREDICATE_PARTIAL(max, F, T_FLOAT, S, vRegF)
REDUCE_FMINMAX_PREDICATE_PARTIAL(max, D, T_DOUBLE, D, vRegD)
// vector min reduction // vector min reduction
REDUCE_MAXMIN_I(min, MinReductionV) REDUCE_MAXMIN_I(min, MinReductionV)
@ -2091,12 +1765,8 @@ REDUCE_FMINMAX_PARTIAL(min, D, T_DOUBLE, D, vRegD)
// vector min reduction - predicated // vector min reduction - predicated
REDUCE_MAXMIN_I_PREDICATE(min, MinReductionV) REDUCE_MAXMIN_I_PREDICATE(min, MinReductionV)
REDUCE_MAXMIN_L_PREDICATE(min, MinReductionV) REDUCE_MAXMIN_L_PREDICATE(min, MinReductionV)
REDUCE_MAXMIN_I_PREDICATE_PARTIAL(min, MinReductionV)
REDUCE_MAXMIN_L_PREDICATE_PARTIAL(min, MinReductionV)
REDUCE_FMINMAX_PREDICATE(min, F, T_FLOAT, S, vRegF) REDUCE_FMINMAX_PREDICATE(min, F, T_FLOAT, S, vRegF)
REDUCE_FMINMAX_PREDICATE(min, D, T_DOUBLE, D, vRegD) REDUCE_FMINMAX_PREDICATE(min, D, T_DOUBLE, D, vRegD)
REDUCE_FMINMAX_PREDICATE_PARTIAL(min, F, T_FLOAT, S, vRegF)
REDUCE_FMINMAX_PREDICATE_PARTIAL(min, D, T_DOUBLE, D, vRegD)
// vector Math.rint, floor, ceil // vector Math.rint, floor, ceil
@ -2704,7 +2374,6 @@ VECTOR_EXTRACT(D, vRegD, D, FloatRegister)
instruct vtest_alltrue(iRegINoSp dst, pRegGov src1, pRegGov src2, pReg ptmp, rFlagsReg cr) instruct vtest_alltrue(iRegINoSp dst, pRegGov src1, pRegGov src2, pReg ptmp, rFlagsReg cr)
%{ %{
predicate(UseSVE > 0 && predicate(UseSVE > 0 &&
n->in(1)->bottom_type()->is_vect()->length_in_bytes() == MaxVectorSize &&
static_cast<const VectorTestNode*>(n)->get_predicate() == BoolTest::overflow); static_cast<const VectorTestNode*>(n)->get_predicate() == BoolTest::overflow);
match(Set dst (VectorTest src1 src2)); match(Set dst (VectorTest src1 src2));
effect(TEMP ptmp, KILL cr); effect(TEMP ptmp, KILL cr);
@ -2722,7 +2391,6 @@ instruct vtest_alltrue(iRegINoSp dst, pRegGov src1, pRegGov src2, pReg ptmp, rFl
instruct vtest_anytrue(iRegINoSp dst, pRegGov src1, pRegGov src2, rFlagsReg cr) instruct vtest_anytrue(iRegINoSp dst, pRegGov src1, pRegGov src2, rFlagsReg cr)
%{ %{
predicate(UseSVE > 0 && predicate(UseSVE > 0 &&
n->in(1)->bottom_type()->is_vect()->length_in_bytes() == MaxVectorSize &&
static_cast<const VectorTestNode*>(n)->get_predicate() == BoolTest::ne); static_cast<const VectorTestNode*>(n)->get_predicate() == BoolTest::ne);
match(Set dst (VectorTest src1 src2)); match(Set dst (VectorTest src1 src2));
effect(KILL cr); effect(KILL cr);
@ -2737,33 +2405,6 @@ instruct vtest_anytrue(iRegINoSp dst, pRegGov src1, pRegGov src2, rFlagsReg cr)
ins_pipe(pipe_slow); ins_pipe(pipe_slow);
%} %}
dnl dnl
dnl
dnl VTEST_PARTIAL($1, $2, $3, $4 )
dnl VTEST_PARTIAL(op_name, pred, inst, cond)
define(`VTEST_PARTIAL', `
instruct vtest_$1_partial`'(iRegINoSp dst, pRegGov src1, pRegGov src2, pRegGov ptmp, rFlagsReg cr)
%{
predicate(UseSVE > 0 &&
n->in(1)->bottom_type()->is_vect()->length_in_bytes() < MaxVectorSize &&
static_cast<const VectorTestNode*>(n)->get_predicate() == BoolTest::$2);
match(Set dst (VectorTest src1 src2));
effect(TEMP ptmp, KILL cr);
ins_cost(SVE_COST);
format %{ "vtest_$1_partial $dst, $src1, $src2\t# VectorTest partial (sve) - $1" %}
ins_encode %{
BasicType bt = Matcher::vector_element_basic_type(this, $src1);
Assembler::SIMD_RegVariant size = __ elemType_to_regVariant(bt);
__ sve_ptrue_lanecnt(as_PRegister($ptmp$$reg), size, Matcher::vector_length(this, $src1));
__ $3(as_PRegister($ptmp$$reg), as_PRegister($ptmp$$reg),
as_PRegister($src1$$reg), as_PRegister($src2$$reg));
__ csetw(as_Register($dst$$reg), Assembler::$4);
%}
ins_pipe(pipe_slow);
%}')dnl
dnl
VTEST_PARTIAL(alltrue, overflow, sve_eors, EQ)
VTEST_PARTIAL(anytrue, ne, sve_ands, NE)
// ------------------------------ Vector insert --------------------------------- // ------------------------------ Vector insert ---------------------------------
instruct insertI_small(vReg dst, vReg src, iRegIorL2I val, immI idx, pRegGov pgtmp, rFlagsReg cr) instruct insertI_small(vReg dst, vReg src, iRegIorL2I val, immI idx, pRegGov pgtmp, rFlagsReg cr)
@ -3004,7 +2645,6 @@ instruct gatherL_partial(vReg dst, indirect mem, vReg idx, pRegGov ptmp, rFlagsR
instruct gatherI_masked(vReg dst, indirect mem, vReg idx, pRegGov pg) %{ instruct gatherI_masked(vReg dst, indirect mem, vReg idx, pRegGov pg) %{
predicate(UseSVE > 0 && predicate(UseSVE > 0 &&
n->as_LoadVector()->memory_size() == MaxVectorSize &&
(n->bottom_type()->is_vect()->element_basic_type() == T_INT || (n->bottom_type()->is_vect()->element_basic_type() == T_INT ||
n->bottom_type()->is_vect()->element_basic_type() == T_FLOAT)); n->bottom_type()->is_vect()->element_basic_type() == T_FLOAT));
match(Set dst (LoadVectorGatherMasked mem (Binary idx pg))); match(Set dst (LoadVectorGatherMasked mem (Binary idx pg)));
@ -3019,7 +2659,6 @@ instruct gatherI_masked(vReg dst, indirect mem, vReg idx, pRegGov pg) %{
instruct gatherL_masked(vReg dst, indirect mem, vReg idx, pRegGov pg) %{ instruct gatherL_masked(vReg dst, indirect mem, vReg idx, pRegGov pg) %{
predicate(UseSVE > 0 && predicate(UseSVE > 0 &&
n->as_LoadVector()->memory_size() == MaxVectorSize &&
(n->bottom_type()->is_vect()->element_basic_type() == T_LONG || (n->bottom_type()->is_vect()->element_basic_type() == T_LONG ||
n->bottom_type()->is_vect()->element_basic_type() == T_DOUBLE)); n->bottom_type()->is_vect()->element_basic_type() == T_DOUBLE));
match(Set dst (LoadVectorGatherMasked mem (Binary idx pg))); match(Set dst (LoadVectorGatherMasked mem (Binary idx pg)));
@ -3033,47 +2672,6 @@ instruct gatherL_masked(vReg dst, indirect mem, vReg idx, pRegGov pg) %{
ins_pipe(pipe_slow); ins_pipe(pipe_slow);
%} %}
// ------------------------------ Vector Load Gather Predicated Partial -------------------------------
instruct gatherI_masked_partial(vReg dst, indirect mem, vReg idx, pRegGov pg, pRegGov ptmp, rFlagsReg cr) %{
predicate(UseSVE > 0 &&
n->as_LoadVector()->memory_size() < MaxVectorSize &&
(n->bottom_type()->is_vect()->element_basic_type() == T_INT ||
n->bottom_type()->is_vect()->element_basic_type() == T_FLOAT));
match(Set dst (LoadVectorGatherMasked mem (Binary idx pg)));
effect(TEMP ptmp, KILL cr);
ins_cost(3 * SVE_COST);
format %{ "load_vector_gather $dst, $pg, $mem, $idx\t# vector load gather predicated partial (S)" %}
ins_encode %{
__ sve_ptrue_lanecnt(as_PRegister($ptmp$$reg), __ S, Matcher::vector_length(this));
__ sve_and(as_PRegister($ptmp$$reg), as_PRegister($ptmp$$reg),
as_PRegister($pg$$reg), as_PRegister($pg$$reg));
__ sve_ld1w_gather(as_FloatRegister($dst$$reg), as_PRegister($ptmp$$reg),
as_Register($mem$$base), as_FloatRegister($idx$$reg));
%}
ins_pipe(pipe_slow);
%}
instruct gatherL_masked_partial(vReg dst, indirect mem, vReg idx, pRegGov pg, pRegGov ptmp, rFlagsReg cr) %{
predicate(UseSVE > 0 &&
n->as_LoadVector()->memory_size() < MaxVectorSize &&
(n->bottom_type()->is_vect()->element_basic_type() == T_LONG ||
n->bottom_type()->is_vect()->element_basic_type() == T_DOUBLE));
match(Set dst (LoadVectorGatherMasked mem (Binary idx pg)));
effect(TEMP ptmp, KILL cr);
ins_cost(4 * SVE_COST);
format %{ "load_vector_gather $dst, $pg, $mem, $idx\t# vector load gather predicated partial (D)" %}
ins_encode %{
__ sve_ptrue_lanecnt(as_PRegister($ptmp$$reg), __ D, Matcher::vector_length(this));
__ sve_and(as_PRegister($ptmp$$reg), as_PRegister($ptmp$$reg),
as_PRegister($pg$$reg), as_PRegister($pg$$reg));
__ sve_uunpklo(as_FloatRegister($idx$$reg), __ D, as_FloatRegister($idx$$reg));
__ sve_ld1d_gather(as_FloatRegister($dst$$reg), as_PRegister($ptmp$$reg),
as_Register($mem$$base), as_FloatRegister($idx$$reg));
%}
ins_pipe(pipe_slow);
%}
// ------------------------------ Vector Store Scatter ------------------------------- // ------------------------------ Vector Store Scatter -------------------------------
instruct scatterI(indirect mem, vReg src, vReg idx) %{ instruct scatterI(indirect mem, vReg src, vReg idx) %{
@ -3148,7 +2746,6 @@ instruct scatterL_partial(indirect mem, vReg src, vReg idx, pRegGov ptmp, rFlags
instruct scatterI_masked(indirect mem, vReg src, vReg idx, pRegGov pg) %{ instruct scatterI_masked(indirect mem, vReg src, vReg idx, pRegGov pg) %{
predicate(UseSVE > 0 && predicate(UseSVE > 0 &&
n->as_StoreVector()->memory_size() == MaxVectorSize &&
(n->in(3)->in(1)->bottom_type()->is_vect()->element_basic_type() == T_INT || (n->in(3)->in(1)->bottom_type()->is_vect()->element_basic_type() == T_INT ||
n->in(3)->in(1)->bottom_type()->is_vect()->element_basic_type() == T_FLOAT)); n->in(3)->in(1)->bottom_type()->is_vect()->element_basic_type() == T_FLOAT));
match(Set mem (StoreVectorScatterMasked mem (Binary src (Binary idx pg)))); match(Set mem (StoreVectorScatterMasked mem (Binary src (Binary idx pg))));
@ -3163,7 +2760,6 @@ instruct scatterI_masked(indirect mem, vReg src, vReg idx, pRegGov pg) %{
instruct scatterL_masked(indirect mem, vReg src, vReg idx, pRegGov pg) %{ instruct scatterL_masked(indirect mem, vReg src, vReg idx, pRegGov pg) %{
predicate(UseSVE > 0 && predicate(UseSVE > 0 &&
n->as_StoreVector()->memory_size() == MaxVectorSize &&
(n->in(3)->in(1)->bottom_type()->is_vect()->element_basic_type() == T_LONG || (n->in(3)->in(1)->bottom_type()->is_vect()->element_basic_type() == T_LONG ||
n->in(3)->in(1)->bottom_type()->is_vect()->element_basic_type() == T_DOUBLE)); n->in(3)->in(1)->bottom_type()->is_vect()->element_basic_type() == T_DOUBLE));
match(Set mem (StoreVectorScatterMasked mem (Binary src (Binary idx pg)))); match(Set mem (StoreVectorScatterMasked mem (Binary src (Binary idx pg))));
@ -3177,47 +2773,6 @@ instruct scatterL_masked(indirect mem, vReg src, vReg idx, pRegGov pg) %{
ins_pipe(pipe_slow); ins_pipe(pipe_slow);
%} %}
// ------------------------------ Vector Store Scatter Predicated Partial -------------------------------
instruct scatterI_masked_partial(indirect mem, vReg src, vReg idx, pRegGov pg, pRegGov ptmp, rFlagsReg cr) %{
predicate(UseSVE > 0 &&
n->as_StoreVector()->memory_size() < MaxVectorSize &&
(n->in(3)->in(1)->bottom_type()->is_vect()->element_basic_type() == T_INT ||
n->in(3)->in(1)->bottom_type()->is_vect()->element_basic_type() == T_FLOAT));
match(Set mem (StoreVectorScatterMasked mem (Binary src (Binary idx pg))));
effect(TEMP ptmp, KILL cr);
ins_cost(3 * SVE_COST);
format %{ "store_vector_scatter $mem, $pg, $idx, $src\t# vector store scatter predicated partial (S)" %}
ins_encode %{
__ sve_ptrue_lanecnt(as_PRegister($ptmp$$reg), __ S, Matcher::vector_length(this, $src));
__ sve_and(as_PRegister($ptmp$$reg), as_PRegister($ptmp$$reg),
as_PRegister($pg$$reg), as_PRegister($pg$$reg));
__ sve_st1w_scatter(as_FloatRegister($src$$reg), as_PRegister($ptmp$$reg),
as_Register($mem$$base), as_FloatRegister($idx$$reg));
%}
ins_pipe(pipe_slow);
%}
instruct scatterL_masked_partial(indirect mem, vReg src, vReg idx, pRegGov pg, pRegGov ptmp, rFlagsReg cr) %{
predicate(UseSVE > 0 &&
n->as_StoreVector()->memory_size() < MaxVectorSize &&
(n->in(3)->in(1)->bottom_type()->is_vect()->element_basic_type() == T_LONG ||
n->in(3)->in(1)->bottom_type()->is_vect()->element_basic_type() == T_DOUBLE));
match(Set mem (StoreVectorScatterMasked mem (Binary src (Binary idx pg))));
effect(TEMP ptmp, KILL cr);
ins_cost(4 * SVE_COST);
format %{ "store_vector_scatter $mem, $pg, $idx, $src\t# vector store scatter predicated partial (D)" %}
ins_encode %{
__ sve_ptrue_lanecnt(as_PRegister($ptmp$$reg), __ D, Matcher::vector_length(this, $src));
__ sve_and(as_PRegister($ptmp$$reg), as_PRegister($ptmp$$reg),
as_PRegister($pg$$reg), as_PRegister($pg$$reg));
__ sve_uunpklo(as_FloatRegister($idx$$reg), __ D, as_FloatRegister($idx$$reg));
__ sve_st1d_scatter(as_FloatRegister($src$$reg), as_PRegister($ptmp$$reg),
as_Register($mem$$base), as_FloatRegister($idx$$reg));
%}
ins_pipe(pipe_slow);
%}
// ------------------------------ Vector Load Const ------------------------------- // ------------------------------ Vector Load Const -------------------------------
instruct loadconB(vReg dst, immI0 src) %{ instruct loadconB(vReg dst, immI0 src) %{
@ -3259,8 +2814,7 @@ STRING_INDEXOF_CHAR(U, UTF16, false)
// ---------------------------- Vector mask reductions --------------------------- // ---------------------------- Vector mask reductions ---------------------------
instruct vmask_truecount(iRegINoSp dst, pReg src) %{ instruct vmask_truecount(iRegINoSp dst, pReg src) %{
predicate(UseSVE > 0 && predicate(UseSVE > 0);
n->in(1)->bottom_type()->is_vect()->length_in_bytes() == MaxVectorSize);
match(Set dst (VectorMaskTrueCount src)); match(Set dst (VectorMaskTrueCount src));
ins_cost(SVE_COST); ins_cost(SVE_COST);
format %{ "vmask_truecount $dst, $src\t# vector mask truecount (sve)" %} format %{ "vmask_truecount $dst, $src\t# vector mask truecount (sve)" %}
@ -3272,25 +2826,33 @@ instruct vmask_truecount(iRegINoSp dst, pReg src) %{
ins_pipe(pipe_slow); ins_pipe(pipe_slow);
%} %}
// Return the index of the first mask lane that is set, or vector length if none of
// them are set.
instruct vmask_firsttrue(iRegINoSp dst, pReg src, pReg ptmp) %{ instruct vmask_firsttrue(iRegINoSp dst, pReg src, pReg ptmp) %{
predicate(UseSVE > 0 && predicate(UseSVE > 0);
n->in(1)->bottom_type()->is_vect()->length_in_bytes() == MaxVectorSize);
match(Set dst (VectorMaskFirstTrue src)); match(Set dst (VectorMaskFirstTrue src));
effect(TEMP ptmp); effect(TEMP ptmp);
ins_cost(2 * SVE_COST); ins_cost(3 * SVE_COST);
format %{ "vmask_firsttrue $dst, $src\t# vector mask firsttrue (sve)" %} format %{ "vmask_firsttrue $dst, $src\t# vector mask firsttrue (sve)" %}
ins_encode %{ ins_encode %{
uint length_in_bytes = Matcher::vector_length_in_bytes(this, $src);
BasicType bt = Matcher::vector_element_basic_type(this, $src); BasicType bt = Matcher::vector_element_basic_type(this, $src);
Assembler::SIMD_RegVariant size = __ elemType_to_regVariant(bt); Assembler::SIMD_RegVariant size = __ elemType_to_regVariant(bt);
__ sve_brkb(as_PRegister($ptmp$$reg), ptrue, as_PRegister($src$$reg), false); // When the input predicate is all-false, the result should be the vector length
// instead of max vector register size.
if (length_in_bytes == MaxVectorSize) {
__ sve_brkb(as_PRegister($ptmp$$reg), ptrue, as_PRegister($src$$reg), false);
} else {
__ sve_ptrue_lanecnt(as_PRegister($ptmp$$reg), size, Matcher::vector_length(this, $src));
__ sve_brkb(as_PRegister($ptmp$$reg), as_PRegister($ptmp$$reg), as_PRegister($src$$reg), false);
}
__ sve_cntp($dst$$Register, size, ptrue, as_PRegister($ptmp$$reg)); __ sve_cntp($dst$$Register, size, ptrue, as_PRegister($ptmp$$reg));
%} %}
ins_pipe(pipe_slow); ins_pipe(pipe_slow);
%} %}
instruct vmask_lasttrue(iRegINoSp dst, pReg src, pReg ptmp) %{ instruct vmask_lasttrue(iRegINoSp dst, pReg src, pReg ptmp) %{
predicate(UseSVE > 0 && predicate(UseSVE > 0);
n->in(1)->bottom_type()->is_vect()->length_in_bytes() == MaxVectorSize);
match(Set dst (VectorMaskLastTrue src)); match(Set dst (VectorMaskLastTrue src));
effect(TEMP ptmp); effect(TEMP ptmp);
ins_cost(3 * SVE_COST); ins_cost(3 * SVE_COST);
@ -3302,57 +2864,6 @@ instruct vmask_lasttrue(iRegINoSp dst, pReg src, pReg ptmp) %{
ins_pipe(pipe_slow); ins_pipe(pipe_slow);
%} %}
instruct vmask_truecount_partial(iRegINoSp dst, pReg src, pReg ptmp, rFlagsReg cr) %{
predicate(UseSVE > 0 &&
n->in(1)->bottom_type()->is_vect()->length_in_bytes() < MaxVectorSize);
match(Set dst (VectorMaskTrueCount src));
effect(TEMP ptmp, KILL cr);
ins_cost(2 * SVE_COST);
format %{ "vmask_truecount_partial $dst, $src\t# vector mask truecount partial (sve)" %}
ins_encode %{
BasicType bt = Matcher::vector_element_basic_type(this, $src);
Assembler::SIMD_RegVariant size = __ elemType_to_regVariant(bt);
__ sve_ptrue_lanecnt(as_PRegister($ptmp$$reg), size, Matcher::vector_length(this, $src));
__ sve_cntp($dst$$Register, size, as_PRegister($ptmp$$reg), as_PRegister($src$$reg));
%}
ins_pipe(pipe_slow);
%}
instruct vmask_firsttrue_partial(iRegINoSp dst, pReg src, pReg ptmp1, pReg ptmp2, rFlagsReg cr) %{
predicate(UseSVE > 0 &&
n->in(1)->bottom_type()->is_vect()->length_in_bytes() < MaxVectorSize);
match(Set dst (VectorMaskFirstTrue src));
effect(TEMP ptmp1, TEMP ptmp2, KILL cr);
ins_cost(3 * SVE_COST);
format %{ "vmask_firsttrue_partial $dst, $src\t# vector mask firsttrue partial (sve)" %}
ins_encode %{
BasicType bt = Matcher::vector_element_basic_type(this, $src);
Assembler::SIMD_RegVariant size = __ elemType_to_regVariant(bt);
__ sve_ptrue_lanecnt(as_PRegister($ptmp1$$reg), size,
Matcher::vector_length(this, $src));
__ sve_brkb(as_PRegister($ptmp2$$reg), as_PRegister($ptmp1$$reg), as_PRegister($src$$reg), false);
__ sve_cntp($dst$$Register, size, as_PRegister($ptmp1$$reg), as_PRegister($ptmp2$$reg));
%}
ins_pipe(pipe_slow);
%}
instruct vmask_lasttrue_partial(iRegINoSp dst, pReg src, pReg ptmp, rFlagsReg cr) %{
predicate(UseSVE > 0 &&
n->in(1)->bottom_type()->is_vect()->length_in_bytes() < MaxVectorSize);
match(Set dst (VectorMaskLastTrue src));
effect(TEMP ptmp, KILL cr);
ins_cost(5 * SVE_COST);
format %{ "vmask_lasttrue_partial $dst, $src\t# vector mask lasttrue partial (sve)" %}
ins_encode %{
BasicType bt = Matcher::vector_element_basic_type(this, $src);
Assembler::SIMD_RegVariant size = __ elemType_to_regVariant(bt);
__ sve_ptrue_lanecnt(as_PRegister($ptmp$$reg), size, Matcher::vector_length(this, $src));
__ sve_and(as_PRegister($ptmp$$reg), ptrue, as_PRegister($ptmp$$reg), as_PRegister($src$$reg));
__ sve_vmask_lasttrue($dst$$Register, bt, as_PRegister($ptmp$$reg), as_PRegister($ptmp$$reg));
%}
ins_pipe(pipe_slow);
%}
instruct vmask_tolong(iRegLNoSp dst, pReg src, vReg vtmp1, vReg vtmp2, pRegGov pgtmp, rFlagsReg cr) %{ instruct vmask_tolong(iRegLNoSp dst, pReg src, vReg vtmp1, vReg vtmp2, pRegGov pgtmp, rFlagsReg cr) %{
predicate(UseSVE > 0 && predicate(UseSVE > 0 &&
n->in(1)->bottom_type()->is_vect()->length() <= 64); n->in(1)->bottom_type()->is_vect()->length() <= 64);
@ -3368,9 +2879,133 @@ instruct vmask_tolong(iRegLNoSp dst, pReg src, vReg vtmp1, vReg vtmp2, pRegGov p
as_PRegister($pgtmp$$reg)); as_PRegister($pgtmp$$reg));
%} %}
ins_pipe(pipe_slow); ins_pipe(pipe_slow);
%}dnl %}
// ---------------------------- Vector mask generation --------------------------- // ---------------------------- Vector mask generation ---------------------------
// The rules below set predicate registers. They can guarantee the high bits of dst
// are cleared with zero when the vector length is less than the full size of
// hardware vector register width.
define(`MASKALL_IMM', `
instruct vmaskAll_imm$1(pRegGov dst, imm$1 src) %{
predicate(UseSVE > 0);
match(Set dst (MaskAll src));
ins_cost(SVE_COST);
format %{ "sve_ptrue_lanecnt/sve_pfalse $dst\t# mask all (sve) ($2)" %}
ins_encode %{
ifelse($1, `I', int, long) con = (ifelse($1, `I', int, long))$src$$constant;
if (con == 0) {
__ sve_pfalse(as_PRegister($dst$$reg));
} else {
assert(con == -1, "invalid constant value for mask");
BasicType bt = Matcher::vector_element_basic_type(this);
__ sve_ptrue_lanecnt(as_PRegister($dst$$reg), __ elemType_to_regVariant(bt),
Matcher::vector_length(this));
}
%}
ins_pipe(pipe_slow);
%}')dnl
define(`MASKALL', `
instruct vmaskAll$1(pRegGov dst, ifelse($1, `I', iRegIorL2I, iRegL) src, vReg tmp, rFlagsReg cr) %{
predicate(UseSVE > 0);
match(Set dst (MaskAll src));
effect(TEMP tmp, KILL cr);
ins_cost(3 * SVE_COST);
format %{ "sve_dup $tmp, $src\n\t"
"sve_ptrue $dst, vector_length\n\t"
"sve_cmpne $dst, $dst, $tmp, 0\t# mask all (sve) ($2)" %}
ins_encode %{
BasicType bt = Matcher::vector_element_basic_type(this);
Assembler::SIMD_RegVariant size = __ elemType_to_regVariant(bt);
uint length_in_bytes = Matcher::vector_length_in_bytes(this);
__ sve_dup(as_FloatRegister($tmp$$reg), size, as_Register($src$$reg));
if (length_in_bytes < MaxVectorSize) {
__ sve_ptrue_lanecnt(as_PRegister($dst$$reg), size, Matcher::vector_length(this));
__ sve_cmp(Assembler::NE, as_PRegister($dst$$reg), size,
as_PRegister($dst$$reg), as_FloatRegister($tmp$$reg), 0);
} else {
__ sve_cmp(Assembler::NE, as_PRegister($dst$$reg), size, ptrue, as_FloatRegister($tmp$$reg), 0);
}
%}
ins_pipe(pipe_slow);
%}')dnl
dnl
// maskAll (full or partial predicate size)
MASKALL_IMM(I, B/H/S)
MASKALL(I, B/H/S)
MASKALL_IMM(L, D)
MASKALL(L, D)
// vector mask compare
instruct vmaskcmp(pRegGov dst, vReg src1, vReg src2, immI cond, rFlagsReg cr) %{
predicate(UseSVE > 0);
match(Set dst (VectorMaskCmp (Binary src1 src2) cond));
effect(KILL cr);
ins_cost(2 * SVE_COST);
format %{ "sve_cmp $dst, $src1, $src2\t# vector mask cmp (sve)" %}
ins_encode %{
uint length_in_bytes = Matcher::vector_length_in_bytes(this);
BasicType bt = Matcher::vector_element_basic_type(this);
if (length_in_bytes == MaxVectorSize) {
__ sve_compare(as_PRegister($dst$$reg), bt, ptrue, as_FloatRegister($src1$$reg),
as_FloatRegister($src2$$reg), (int)$cond$$constant);
} else {
__ sve_ptrue_lanecnt(as_PRegister($dst$$reg), __ elemType_to_regVariant(bt),
Matcher::vector_length(this));
__ sve_compare(as_PRegister($dst$$reg), bt, as_PRegister($dst$$reg), as_FloatRegister($src1$$reg),
as_FloatRegister($src2$$reg), (int)$cond$$constant);
}
%}
ins_pipe(pipe_slow);
%}
instruct vmaskcmp_masked(pRegGov dst, vReg src1, vReg src2, immI cond, pRegGov pg, rFlagsReg cr) %{
predicate(UseSVE > 0);
match(Set dst (VectorMaskCmp (Binary src1 src2) (Binary cond pg)));
effect(KILL cr);
ins_cost(SVE_COST);
format %{ "sve_cmp $dst, $pg, $src1, $src2\t# vector mask cmp (sve)" %}
ins_encode %{
BasicType bt = Matcher::vector_element_basic_type(this);
__ sve_compare(as_PRegister($dst$$reg), bt, as_PRegister($pg$$reg), as_FloatRegister($src1$$reg),
as_FloatRegister($src2$$reg), (int)$cond$$constant);
%}
ins_pipe(pipe_slow);
%}
// vector load mask
instruct vloadmaskB(pRegGov dst, vReg src, rFlagsReg cr) %{
predicate(UseSVE > 0 &&
n->bottom_type()->is_vect()->element_basic_type() == T_BYTE);
match(Set dst (VectorLoadMask src));
effect(KILL cr);
ins_cost(SVE_COST);
format %{ "vloadmaskB $dst, $src\t# vector load mask (sve) (B)" %}
ins_encode %{
__ sve_cmp(Assembler::NE, as_PRegister($dst$$reg), __ B,
ptrue, as_FloatRegister($src$$reg), 0);
%}
ins_pipe(pipe_slow);
%}
instruct vloadmask_extend(pRegGov dst, vReg src, vReg tmp, rFlagsReg cr) %{
predicate(UseSVE > 0 && n->bottom_type()->is_vect()->element_basic_type() != T_BYTE);
match(Set dst (VectorLoadMask src));
effect(TEMP tmp, KILL cr);
ins_cost(3 * SVE_COST);
format %{ "vloadmask $dst, $src\t# vector load mask (sve) (H/S/D)" %}
ins_encode %{
BasicType bt = Matcher::vector_element_basic_type(this);
Assembler::SIMD_RegVariant size = __ elemType_to_regVariant(bt);
__ sve_vector_extend(as_FloatRegister($tmp$$reg), size, as_FloatRegister($src$$reg), __ B);
__ sve_cmp(Assembler::NE, as_PRegister($dst$$reg), size, ptrue, as_FloatRegister($tmp$$reg), 0);
%}
ins_pipe(pipe_slow);
%}
instruct vmask_gen(pRegGov pg, iRegL len, rFlagsReg cr) %{ instruct vmask_gen(pRegGov pg, iRegL len, rFlagsReg cr) %{
predicate(UseSVE > 0); predicate(UseSVE > 0);
match(Set pg (VectorMaskGen len)); match(Set pg (VectorMaskGen len));