e95f092862
Reviewed-by: fyang
212 lines
7.8 KiB
Java
212 lines
7.8 KiB
Java
/*
|
|
* Copyright (c) 2024, Arm Limited. All rights reserved.
|
|
* DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
|
|
*
|
|
* This code is free software; you can redistribute it and/or modify it
|
|
* under the terms of the GNU General Public License version 2 only, as
|
|
* published by the Free Software Foundation.
|
|
*
|
|
* This code is distributed in the hope that it will be useful, but WITHOUT
|
|
* ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
|
|
* FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
|
|
* version 2 for more details (a copy is included in the LICENSE file that
|
|
* accompanied this code).
|
|
*
|
|
* You should have received a copy of the GNU General Public License version
|
|
* 2 along with this work; if not, write to the Free Software Foundation,
|
|
* Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
|
|
*
|
|
* Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
|
|
* or visit www.oracle.com if you need additional information or have any
|
|
* questions.
|
|
*/
|
|
|
|
package compiler.vectorapi;
|
|
|
|
import compiler.lib.ir_framework.*;
|
|
|
|
import jdk.incubator.vector.DoubleVector;
|
|
import jdk.incubator.vector.FloatVector;
|
|
import jdk.incubator.vector.VectorOperators;
|
|
import jdk.incubator.vector.VectorSpecies;
|
|
|
|
import java.util.Random;
|
|
|
|
import jdk.test.lib.Asserts;
|
|
import jdk.test.lib.Utils;
|
|
|
|
/**
|
|
* @test
|
|
* @bug 8320725
|
|
* @library /test/lib /
|
|
* @summary Verify non-strictly ordered AddReductionVF/VD and MulReductionVF/VD
|
|
* nodes are generated in VectorAPI
|
|
* @modules jdk.incubator.vector
|
|
* @run driver compiler.vectorapi.TestVectorAddMulReduction
|
|
*/
|
|
|
|
public class TestVectorAddMulReduction {
|
|
|
|
private static final int SIZE = 1024;
|
|
private static final Random RD = Utils.getRandomInstance();
|
|
|
|
private static float[] fa;
|
|
private static float fres;
|
|
private static double[] da;
|
|
private static double dres;
|
|
|
|
static {
|
|
fa = new float[SIZE];
|
|
da = new double[SIZE];
|
|
fres = 1;
|
|
dres = 1;
|
|
for (int i = 0; i < SIZE; i++) {
|
|
fa[i] = RD.nextFloat();
|
|
da[i] = RD.nextDouble();
|
|
}
|
|
}
|
|
|
|
// Test add reduction operation for floats
|
|
@ForceInline
|
|
public static void testFloatAddKernel(VectorSpecies SPECIES, float[] f) {
|
|
for (int i = 0; i < SPECIES.loopBound(f.length); i += SPECIES.length()) {
|
|
var av = FloatVector.fromArray(SPECIES, f, i);
|
|
fres += av.reduceLanes(VectorOperators.ADD);
|
|
}
|
|
}
|
|
|
|
@Test
|
|
@IR(counts = {IRNode.ADD_REDUCTION_VF, ">=1", "no_strict_order", ">=1"},
|
|
failOn = {"requires_strict_order"},
|
|
applyIfCPUFeatureOr = {"asimd", "true", "sse2", "true", "rvv", "true"},
|
|
applyIf = {"MaxVectorSize", ">=8"},
|
|
phase = CompilePhase.PRINT_IDEAL)
|
|
public static void testFloatAdd_64() {
|
|
testFloatAddKernel(FloatVector.SPECIES_64, fa);
|
|
}
|
|
|
|
@Test
|
|
@IR(counts = {IRNode.ADD_REDUCTION_VF, ">=1", "no_strict_order", ">=1"},
|
|
failOn = {"requires_strict_order"},
|
|
applyIfCPUFeatureOr = {"asimd", "true", "sse2", "true", "rvv", "true"},
|
|
applyIf = {"MaxVectorSize", ">=16"},
|
|
phase = CompilePhase.PRINT_IDEAL)
|
|
public static void testFloatAdd_128() {
|
|
testFloatAddKernel(FloatVector.SPECIES_128, fa);
|
|
}
|
|
|
|
@Test
|
|
@IR(counts = {IRNode.ADD_REDUCTION_VF, ">=1", "no_strict_order", ">=1"},
|
|
failOn = {"requires_strict_order"},
|
|
applyIfCPUFeatureOr = {"asimd", "true", "sse2", "true", "rvv", "true"},
|
|
applyIf = {"MaxVectorSize", ">=32"},
|
|
phase = CompilePhase.PRINT_IDEAL)
|
|
public static void testFloatAdd_256() {
|
|
testFloatAddKernel(FloatVector.SPECIES_256, fa);
|
|
}
|
|
|
|
@Test
|
|
@IR(counts = {IRNode.ADD_REDUCTION_VF, ">=1", "no_strict_order", ">=1"},
|
|
failOn = {"requires_strict_order"},
|
|
applyIfCPUFeatureOr = {"asimd", "true", "sse2", "true", "rvv", "true"},
|
|
applyIf = {"MaxVectorSize", ">=64"},
|
|
phase = CompilePhase.PRINT_IDEAL)
|
|
public static void testFloatAdd_512() {
|
|
testFloatAddKernel(FloatVector.SPECIES_512, fa);
|
|
}
|
|
|
|
// Test add reduction operation for doubles
|
|
@ForceInline
|
|
public static void testDoubleAddKernel(VectorSpecies SPECIES, double[] d) {
|
|
for (int i = 0; i < SPECIES.loopBound(d.length); i += SPECIES.length()) {
|
|
var av = DoubleVector.fromArray(SPECIES, d, i);
|
|
dres += av.reduceLanes(VectorOperators.ADD);
|
|
}
|
|
}
|
|
|
|
@Test
|
|
@IR(counts = {IRNode.ADD_REDUCTION_VD, ">=1", "no_strict_order", ">=1"},
|
|
failOn = {"requires_strict_order"},
|
|
applyIfCPUFeatureOr = {"asimd", "true", "sse2", "true", "rvv", "true"},
|
|
applyIf = {"MaxVectorSize", ">=16"},
|
|
phase = CompilePhase.PRINT_IDEAL)
|
|
public static void testDoubleAdd_128() {
|
|
testDoubleAddKernel(DoubleVector.SPECIES_128, da);
|
|
}
|
|
|
|
@Test
|
|
@IR(counts = {IRNode.ADD_REDUCTION_VD, ">=1", "no_strict_order", ">=1"},
|
|
failOn = {"requires_strict_order"},
|
|
applyIfCPUFeatureOr = {"asimd", "true", "sse2", "true", "rvv", "true"},
|
|
applyIf = {"MaxVectorSize", ">=32"},
|
|
phase = CompilePhase.PRINT_IDEAL)
|
|
public static void testDoubleAdd_256() {
|
|
testDoubleAddKernel(DoubleVector.SPECIES_256, da);
|
|
}
|
|
|
|
@Test
|
|
@IR(counts = {IRNode.ADD_REDUCTION_VD, ">=1", "no_strict_order", ">=1"},
|
|
failOn = {"requires_strict_order"},
|
|
applyIfCPUFeatureOr = {"asimd", "true", "sse2", "true", "rvv", "true"},
|
|
applyIf = {"MaxVectorSize", ">=64"},
|
|
phase = CompilePhase.PRINT_IDEAL)
|
|
public static void testDoubleAdd_512() {
|
|
testDoubleAddKernel(DoubleVector.SPECIES_512, da);
|
|
}
|
|
|
|
// Test mul reduction operation for floats
|
|
// On aarch64, there are no direct vector mul reduction instructions for float/double mul reduction
|
|
// and scalar instructions are emitted for 64-bit/128-bit vectors. Thus MulReductionVF/VD nodes are generated
|
|
// only for vector length of 8B/16B on vectorAPI.
|
|
@ForceInline
|
|
public static void testFloatMulKernel(VectorSpecies SPECIES, float[] f) {
|
|
for (int i = 0; i < SPECIES.loopBound(f.length); i += SPECIES.length()) {
|
|
var av = FloatVector.fromArray(SPECIES, f, i);
|
|
fres += av.reduceLanes(VectorOperators.MUL);
|
|
}
|
|
}
|
|
|
|
@Test
|
|
@IR(counts = {IRNode.MUL_REDUCTION_VF, ">=1", "no_strict_order", ">=1"},
|
|
failOn = {"requires_strict_order"},
|
|
applyIfCPUFeatureOr = {"asimd", "true", "sse2", "true"},
|
|
applyIf = {"MaxVectorSize", ">=8"},
|
|
phase = CompilePhase.PRINT_IDEAL)
|
|
public static void testFloatMul_64() {
|
|
testFloatMulKernel(FloatVector.SPECIES_64, fa);
|
|
}
|
|
|
|
@Test
|
|
@IR(counts = {IRNode.MUL_REDUCTION_VF, ">=1", "no_strict_order", ">=1"},
|
|
failOn = {"requires_strict_order"},
|
|
applyIfCPUFeatureOr = {"asimd", "true", "sse2", "true"},
|
|
applyIf = {"MaxVectorSize", ">=16"},
|
|
phase = CompilePhase.PRINT_IDEAL)
|
|
public static void testFloatMul_128() {
|
|
testFloatMulKernel(FloatVector.SPECIES_128, fa);
|
|
}
|
|
|
|
// Test mul reduction operation for doubles
|
|
@ForceInline
|
|
public static void testDoubleMulKernel(VectorSpecies SPECIES, double[] d) {
|
|
for (int i = 0; i < SPECIES.loopBound(d.length); i += SPECIES.length()) {
|
|
var av = DoubleVector.fromArray(SPECIES, d, i);
|
|
dres += av.reduceLanes(VectorOperators.MUL);
|
|
}
|
|
}
|
|
|
|
@Test
|
|
@IR(counts = {IRNode.MUL_REDUCTION_VD, ">=1", "no_strict_order", ">=1"},
|
|
failOn = {"requires_strict_order"},
|
|
applyIfCPUFeatureOr = {"asimd", "true", "sse2", "true"},
|
|
applyIf = {"MaxVectorSize", ">=16"},
|
|
phase = CompilePhase.PRINT_IDEAL)
|
|
public static void testDoubleMul_128() {
|
|
testDoubleMulKernel(DoubleVector.SPECIES_128, da);
|
|
}
|
|
|
|
public static void main(String[] args) {
|
|
TestFramework.runWithFlags("--add-modules=jdk.incubator.vector");
|
|
}
|
|
}
|