811d08c0a4
Reviewed-by: chagedorn, rkennke, mli
183 lines
7.5 KiB
Java
183 lines
7.5 KiB
Java
/*
|
|
* Copyright (c) 2022, 2024, Oracle and/or its affiliates. All rights reserved.
|
|
* DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
|
|
*
|
|
* This code is free software; you can redistribute it and/or modify it
|
|
* under the terms of the GNU General Public License version 2 only, as
|
|
* published by the Free Software Foundation.
|
|
*
|
|
* This code is distributed in the hope that it will be useful, but WITHOUT
|
|
* ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
|
|
* FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
|
|
* version 2 for more details (a copy is included in the LICENSE file that
|
|
* accompanied this code).
|
|
*
|
|
* You should have received a copy of the GNU General Public License version
|
|
* 2 along with this work; if not, write to the Free Software Foundation,
|
|
* Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
|
|
*
|
|
* Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
|
|
* or visit www.oracle.com if you need additional information or have any
|
|
* questions.
|
|
*/
|
|
|
|
/**
|
|
* @test
|
|
* @bug 8294588
|
|
* @summary Auto-vectorize Float.floatToFloat16, Float.float16ToFloat APIs
|
|
* @requires vm.compiler2.enabled
|
|
* @library /test/lib /
|
|
* @run driver compiler.vectorization.TestFloatConversionsVector nCOH_nAV
|
|
* @run driver compiler.vectorization.TestFloatConversionsVector nCOH_yAV
|
|
* @run driver compiler.vectorization.TestFloatConversionsVector yCOH_nAV
|
|
* @run driver compiler.vectorization.TestFloatConversionsVector yCOH_yAV
|
|
*/
|
|
|
|
package compiler.vectorization;
|
|
|
|
import compiler.lib.ir_framework.*;
|
|
import jdk.test.lib.Asserts;
|
|
|
|
public class TestFloatConversionsVector {
|
|
private static final int ARRLEN = 1024;
|
|
private static final int ITERS = 11000;
|
|
private static float [] finp;
|
|
private static short [] sout;
|
|
private static short [] sinp;
|
|
private static float [] fout;
|
|
|
|
public static void main(String args[]) {
|
|
TestFramework framework = new TestFramework(TestFloatConversionsVector.class);
|
|
framework.addFlags("-XX:-TieredCompilation", "-XX:CompileThresholdScaling=0.3");
|
|
switch (args[0]) {
|
|
case "nCOH_nAV" -> { framework.addFlags("-XX:+UnlockExperimentalVMOptions", "-XX:-UseCompactObjectHeaders", "-XX:-AlignVector"); }
|
|
case "nCOH_yAV" -> { framework.addFlags("-XX:+UnlockExperimentalVMOptions", "-XX:-UseCompactObjectHeaders", "-XX:+AlignVector"); }
|
|
case "yCOH_nAV" -> { framework.addFlags("-XX:+UnlockExperimentalVMOptions", "-XX:+UseCompactObjectHeaders", "-XX:-AlignVector"); }
|
|
case "yCOH_yAV" -> { framework.addFlags("-XX:+UnlockExperimentalVMOptions", "-XX:+UseCompactObjectHeaders", "-XX:+AlignVector"); }
|
|
default -> { throw new RuntimeException("Test argument not recognized: " + args[0]); }
|
|
};
|
|
framework.start();
|
|
System.out.println("PASSED");
|
|
}
|
|
|
|
@Test
|
|
@IR(counts = {IRNode.VECTOR_CAST_F2HF, IRNode.VECTOR_SIZE + "min(max_float, max_short)", "> 0"},
|
|
applyIfOr = {"UseCompactObjectHeaders", "false", "AlignVector", "false"},
|
|
applyIfPlatformOr = {"x64", "true", "aarch64", "true", "riscv64", "true"},
|
|
applyIfCPUFeatureOr = {"f16c", "true", "avx512f", "true", "zvfh", "true", "asimd", "true", "sve", "true"})
|
|
public void test_float_float16(short[] sout, float[] finp) {
|
|
for (int i = 0; i < finp.length; i++) {
|
|
sout[i] = Float.floatToFloat16(finp[i]);
|
|
// With AlignVector, we need 8-byte alignment of vector loads/stores.
|
|
// UseCompactObjectHeaders=false UseCompactObjectHeaders=true
|
|
// F_adr = base + 16 + 4*i -> i % 2 = 0 F_adr = base + 12 + 4*i -> i % 2 = 1
|
|
// S_adr = base + 16 + 2*i -> i % 4 = 0 S_adr = base + 12 + 2*i -> i % 4 = 2
|
|
// -> vectorize -> no vectorization
|
|
}
|
|
}
|
|
|
|
@Test
|
|
public void test_float_float16_strided(short[] sout, float[] finp) {
|
|
for (int i = 0; i < finp.length/2; i++) {
|
|
sout[i*2] = Float.floatToFloat16(finp[i*2]);
|
|
}
|
|
}
|
|
|
|
@Test
|
|
public void test_float_float16_short_vector(short[] sout, float[] finp) {
|
|
for (int i = 0; i < finp.length; i+= 4) {
|
|
sout[i+0] = Float.floatToFloat16(finp[i+0]);
|
|
sout[i+1] = Float.floatToFloat16(finp[i+1]);
|
|
}
|
|
}
|
|
|
|
@Run(test = {"test_float_float16", "test_float_float16_strided",
|
|
"test_float_float16_short_vector"}, mode = RunMode.STANDALONE)
|
|
public void kernel_test_float_float16() {
|
|
finp = new float[ARRLEN];
|
|
sout = new short[ARRLEN];
|
|
|
|
for (int i = 0; i < ARRLEN; i++) {
|
|
finp[i] = (float) i * 1.4f;
|
|
}
|
|
|
|
for (int i = 0; i < ITERS; i++) {
|
|
test_float_float16(sout, finp);
|
|
}
|
|
|
|
// Verifying the result
|
|
for (int i = 0; i < ARRLEN; i++) {
|
|
Asserts.assertEquals(Float.floatToFloat16(finp[i]), sout[i]);
|
|
}
|
|
|
|
for (int i = 0; i < ITERS; i++) {
|
|
test_float_float16_strided(sout, finp);
|
|
}
|
|
|
|
// Verifying the result
|
|
for (int i = 0; i < ARRLEN/2; i++) {
|
|
Asserts.assertEquals(Float.floatToFloat16(finp[i*2]), sout[i*2]);
|
|
}
|
|
|
|
for (int i = 0; i < ITERS; i++) {
|
|
test_float_float16_short_vector(sout, finp);
|
|
}
|
|
|
|
// Verifying the result
|
|
for (int i = 0; i < ARRLEN; i++) {
|
|
Asserts.assertEquals(Float.floatToFloat16(finp[i]), sout[i]);
|
|
}
|
|
}
|
|
|
|
@Test
|
|
@IR(counts = {IRNode.VECTOR_CAST_HF2F, IRNode.VECTOR_SIZE + "min(max_float, max_short)", "> 0"},
|
|
applyIfOr = {"UseCompactObjectHeaders", "false", "AlignVector", "false"},
|
|
applyIfPlatformOr = {"x64", "true", "aarch64", "true", "riscv64", "true"},
|
|
applyIfCPUFeatureOr = {"f16c", "true", "avx512f", "true", "zvfh", "true", "asimd", "true", "sve", "true"})
|
|
public void test_float16_float(float[] fout, short[] sinp) {
|
|
for (int i = 0; i < sinp.length; i++) {
|
|
fout[i] = Float.float16ToFloat(sinp[i]);
|
|
// With AlignVector, we need 8-byte alignment of vector loads/stores.
|
|
// UseCompactObjectHeaders=false UseCompactObjectHeaders=true
|
|
// F_adr = base + 16 + 4*i -> i % 2 = 0 F_adr = base + 12 + 4*i -> i % 2 = 1
|
|
// S_adr = base + 16 + 2*i -> i % 4 = 0 S_adr = base + 12 + 2*i -> i % 4 = 2
|
|
// -> vectorize -> no vectorization
|
|
}
|
|
}
|
|
|
|
@Test
|
|
public void test_float16_float_strided(float[] fout, short[] sinp) {
|
|
for (int i = 0; i < sinp.length/2; i++) {
|
|
fout[i*2] = Float.float16ToFloat(sinp[i*2]);
|
|
}
|
|
}
|
|
|
|
@Run(test = {"test_float16_float", "test_float16_float_strided"}, mode = RunMode.STANDALONE)
|
|
public void kernel_test_float16_float() {
|
|
sinp = new short[ARRLEN];
|
|
fout = new float[ARRLEN];
|
|
|
|
for (int i = 0; i < ARRLEN; i++) {
|
|
sinp[i] = (short)i;
|
|
}
|
|
|
|
for (int i = 0; i < ITERS; i++) {
|
|
test_float16_float(fout, sinp);
|
|
}
|
|
|
|
// Verifying the result
|
|
for (int i = 0; i < ARRLEN; i++) {
|
|
Asserts.assertEquals(Float.float16ToFloat(sinp[i]), fout[i]);
|
|
}
|
|
|
|
for (int i = 0; i < ITERS; i++) {
|
|
test_float16_float_strided(fout, sinp);
|
|
}
|
|
|
|
// Verifying the result
|
|
for (int i = 0; i < ARRLEN/2; i++) {
|
|
Asserts.assertEquals(Float.float16ToFloat(sinp[i*2]), fout[i*2]);
|
|
}
|
|
}
|
|
}
|