b05c40ca3b
Reviewed-by: psandoz, vlivanov
227 lines
11 KiB
Java
227 lines
11 KiB
Java
/*
|
|
* Copyright (c) 2020, Oracle and/or its affiliates. All rights reserved.
|
|
* DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
|
|
*
|
|
* This code is free software; you can redistribute it and/or modify it
|
|
* under the terms of the GNU General Public License version 2 only, as
|
|
* published by the Free Software Foundation.
|
|
*
|
|
* This code is distributed in the hope that it will be useful, but WITHOUT
|
|
* ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
|
|
* FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
|
|
* version 2 for more details (a copy is included in the LICENSE file that
|
|
* accompanied this code).
|
|
*
|
|
* You should have received a copy of the GNU General Public License version
|
|
* 2 along with this work; if not, write to the Free Software Foundation,
|
|
* Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
|
|
*
|
|
* Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
|
|
* or visit www.oracle.com if you need additional information or have any
|
|
* questions.
|
|
*/
|
|
|
|
package compiler.arraycopy;
|
|
import java.util.Random;
|
|
|
|
/**
|
|
* @test
|
|
* @bug 8251871
|
|
* @summary Optimize arrayCopy using AVX-512 masked instructions.
|
|
*
|
|
* @run main/othervm/timeout=600 -XX:-TieredCompilation -Xbatch -XX:+IgnoreUnrecognizedVMOptions
|
|
* -XX:UseAVX=3 -XX:+UnlockDiagnosticVMOptions -XX:ArrayOperationPartialInlineSize=0 -XX:MaxVectorSize=32 -XX:+UnlockDiagnosticVMOptions
|
|
* compiler.arraycopy.TestArrayCopyDisjoint
|
|
* @run main/othervm/timeout=600 -XX:-TieredCompilation -Xbatch -XX:+IgnoreUnrecognizedVMOptions
|
|
* -XX:UseAVX=3 -XX:+UnlockDiagnosticVMOptions -XX:ArrayOperationPartialInlineSize=0 -XX:MaxVectorSize=64
|
|
* compiler.arraycopy.TestArrayCopyDisjoint
|
|
* @run main/othervm/timeout=600 -XX:-TieredCompilation -Xbatch -XX:+IgnoreUnrecognizedVMOptions
|
|
* -XX:UseAVX=3 -XX:+UnlockDiagnosticVMOptions -XX:ArrayOperationPartialInlineSize=32 -XX:+UnlockDiagnosticVMOptions -XX:MaxVectorSize=32 -XX:+UnlockDiagnosticVMOption
|
|
* compiler.arraycopy.TestArrayCopyDisjoint
|
|
* @run main/othervm/timeout=600 -XX:-TieredCompilation -Xbatch -XX:+IgnoreUnrecognizedVMOptions
|
|
* -XX:UseAVX=3 -XX:+UnlockDiagnosticVMOptions -XX:ArrayOperationPartialInlineSize=32 -XX:+UnlockDiagnosticVMOptions -XX:MaxVectorSize=64
|
|
* compiler.arraycopy.TestArrayCopyDisjoint
|
|
* @run main/othervm/timeout=600 -XX:-TieredCompilation -Xbatch -XX:+IgnoreUnrecognizedVMOptions
|
|
* -XX:UseAVX=3 -XX:+UnlockDiagnosticVMOptions -XX:ArrayOperationPartialInlineSize=64 -XX:MaxVectorSize=64
|
|
* compiler.arraycopy.TestArrayCopyDisjoint
|
|
* @run main/othervm/timeout=600 -XX:-TieredCompilation -Xbatch -XX:+IgnoreUnrecognizedVMOptions
|
|
* -XX:UseAVX=3 -XX:+UnlockDiagnosticVMOptions -XX:ArrayOperationPartialInlineSize=32 -XX:+UnlockDiagnosticVMOptions -XX:MaxVectorSize=32 -XX:+UnlockDiagnosticVMOption -XX:ArrayCopyLoadStoreMaxElem=16
|
|
* compiler.arraycopy.TestArrayCopyDisjoint
|
|
* @run main/othervm/timeout=600 -XX:-TieredCompilation -Xbatch -XX:+IgnoreUnrecognizedVMOptions
|
|
* -XX:UseAVX=3 -XX:+UnlockDiagnosticVMOptions -XX:ArrayOperationPartialInlineSize=64 -XX:MaxVectorSize=64 -XX:ArrayCopyLoadStoreMaxElem=16
|
|
* compiler.arraycopy.TestArrayCopyDisjoint
|
|
*
|
|
*/
|
|
|
|
public class TestArrayCopyDisjoint {
|
|
|
|
public static final int SIZE = 4096;
|
|
public static byte[] fromByteArr, toByteArr;
|
|
public static char[] fromCharArr, toCharArr;
|
|
public static int[] fromIntArr, toIntArr;
|
|
public static long[] fromLongArr, toLongArr;
|
|
|
|
static public void setup() {
|
|
// Both positions aligned
|
|
fromByteArr = new byte[SIZE];
|
|
toByteArr = new byte[SIZE];
|
|
fromCharArr = new char[SIZE];
|
|
toCharArr = new char[SIZE];
|
|
fromIntArr = new int[SIZE];
|
|
toIntArr = new int[SIZE];
|
|
fromLongArr = new long[SIZE];
|
|
toLongArr = new long[SIZE];
|
|
|
|
for (int i = 0 ; i < SIZE ; i++) {
|
|
fromByteArr[i] = (byte)i;
|
|
fromCharArr[i] = (char)i;
|
|
fromIntArr[i] = i;
|
|
fromLongArr[i] = i;
|
|
}
|
|
}
|
|
|
|
public static int validate_ctr = 0;
|
|
public static <E> void validate(String msg, E arr, int length, int fromPos, int toPos) {
|
|
validate_ctr++;
|
|
if (arr instanceof byte []) {
|
|
byte [] barr = (byte [])arr;
|
|
for(int i = 0 ; i < length; i++)
|
|
if (fromByteArr[i+fromPos] != barr[i+toPos]) {
|
|
System.out.println(msg + "[" + arr.getClass() + "] Result mismtach at i = " + i
|
|
+ " expected = " + fromByteArr[i+fromPos]
|
|
+ " actual = " + barr[i+toPos]
|
|
+ " fromPos = " + fromPos
|
|
+ " toPos = " + toPos);
|
|
throw new Error("Fail");
|
|
}
|
|
}
|
|
else if (arr instanceof char []) {
|
|
char [] carr = (char [])arr;
|
|
for(int i = 0 ; i < length; i++)
|
|
if (fromCharArr[i+fromPos] != carr[i+toPos]) {
|
|
System.out.println(msg + "[" + arr.getClass() + "] Result mismtach at i = " + i
|
|
+ " expected = " + fromCharArr[i+fromPos]
|
|
+ " actual = " + carr[i+toPos]
|
|
+ " fromPos = " + fromPos
|
|
+ " toPos = " + toPos);
|
|
throw new Error("Fail");
|
|
}
|
|
}
|
|
else if (arr instanceof int []) {
|
|
int [] iarr = (int [])arr;
|
|
for(int i = 0 ; i < length; i++)
|
|
if (fromIntArr[i+fromPos] != iarr[i+toPos]) {
|
|
System.out.println(msg + "[" + arr.getClass() + "] Result mismtach at i = " + i
|
|
+ " expected = " + fromIntArr[i+fromPos]
|
|
+ " actual = " + iarr[i+toPos]
|
|
+ " fromPos = " + fromPos
|
|
+ " toPos = " + toPos);
|
|
throw new Error("Fail");
|
|
}
|
|
}
|
|
else if (arr instanceof long []) {
|
|
long [] larr = (long [])arr;
|
|
for(int i = 0 ; i < length; i++)
|
|
if (fromLongArr[i+fromPos] != larr[i+toPos]) {
|
|
System.out.println(msg + "[" + arr.getClass() + "] Result mismtach at i = " + i
|
|
+ " expected = " + fromLongArr[i+fromPos]
|
|
+ " actual = " + larr[i+toPos]
|
|
+ " fromPos = " + fromPos
|
|
+ " toPos = " + toPos);
|
|
throw new Error("Fail");
|
|
}
|
|
}
|
|
}
|
|
|
|
public static void testByte(int length, int fromPos, int toPos) {
|
|
System.arraycopy(fromByteArr, fromPos, toByteArr, toPos, length);
|
|
validate(" Test ByteArr ", toByteArr, length, fromPos, toPos);
|
|
}
|
|
|
|
public static void testChar(int length, int fromPos, int toPos) {
|
|
System.arraycopy(fromCharArr, fromPos, toCharArr, toPos, length);
|
|
validate(" Test CharArr ", toCharArr, length, fromPos, toPos);
|
|
}
|
|
|
|
public static void testInt(int length, int fromPos, int toPos) {
|
|
System.arraycopy(fromIntArr, fromPos, toIntArr, toPos, length);
|
|
validate(" Test IntArr ", toIntArr, length, fromPos, toPos);
|
|
}
|
|
|
|
public static void testLong(int length, int fromPos, int toPos) {
|
|
System.arraycopy(fromLongArr, fromPos, toLongArr, toPos, length);
|
|
validate(" Test LongArr ", toLongArr, length, fromPos, toPos);
|
|
}
|
|
|
|
public static void testByte_constant_LT32B(int fromPos, int toPos) {
|
|
System.arraycopy(fromByteArr, fromPos, toByteArr, toPos, 7);
|
|
validate(" Test Byte constant length 7 ", toByteArr, 7, fromPos, toPos);
|
|
}
|
|
public static void testByte_constant_LT64B(int fromPos, int toPos) {
|
|
System.arraycopy(fromByteArr, fromPos, toByteArr, toPos, 45);
|
|
validate(" Test Byte constant length 45 ", toByteArr, 45, fromPos, toPos);
|
|
}
|
|
|
|
public static void testChar_constant_LT32B(int fromPos, int toPos) {
|
|
System.arraycopy(fromCharArr, fromPos, toCharArr, toPos, 7);
|
|
validate(" Test Char constant length 7 ", toCharArr, 7, fromPos, toPos);
|
|
}
|
|
public static void testChar_constant_LT64B(int fromPos, int toPos) {
|
|
System.arraycopy(fromCharArr, fromPos, toCharArr, toPos, 22);
|
|
validate(" Test Char constant length 22 ", toCharArr, 22, fromPos, toPos);
|
|
}
|
|
|
|
public static void testInt_constant_LT32B(int fromPos, int toPos) {
|
|
System.arraycopy(fromIntArr, fromPos, toIntArr, toPos, 7);
|
|
validate(" Test Int constant length 7 ", toIntArr, 7, fromPos, toPos);
|
|
}
|
|
public static void testInt_constant_LT64B(int fromPos, int toPos) {
|
|
System.arraycopy(fromIntArr, fromPos, toIntArr, toPos, 11);
|
|
validate(" Test Int constant length 11 ", toIntArr, 11, fromPos, toPos);
|
|
}
|
|
|
|
public static void testLong_constant_LT32B(int fromPos, int toPos) {
|
|
System.arraycopy(fromLongArr, fromPos, toLongArr, toPos, 3);
|
|
validate(" Test Long constant length 3 ", toLongArr, 3, fromPos, toPos);
|
|
}
|
|
public static void testLong_constant_LT64B(int fromPos, int toPos) {
|
|
System.arraycopy(fromLongArr, fromPos, toLongArr, toPos, 6);
|
|
validate(" Test Long constant length 6 ", toLongArr, 6, fromPos, toPos);
|
|
}
|
|
|
|
|
|
public static void main(String [] args) {
|
|
// Cases to test each new optimized stub special blocks.
|
|
// Cases to test new PI handling (PI32 and PI64).
|
|
// Cases to test vectorized constant array copies for all primitive types.
|
|
// LT32B LT64B LT96B LT128B LT160B LT192B LOOP1 LOOP2
|
|
int [] lengths = { 29, 59, 89, 125, 159, 189, 194, 1024 };
|
|
Random r = new Random(1024);
|
|
|
|
setup();
|
|
|
|
try {
|
|
for (int i = 0 ; i < 1000000 ; i++ ) {
|
|
testByte(lengths[i % lengths.length], r.nextInt(2048) , r.nextInt(2048));
|
|
testByte_constant_LT32B (r.nextInt(2048) , r.nextInt(2048));
|
|
testByte_constant_LT64B (r.nextInt(2048) , r.nextInt(2048));
|
|
|
|
testChar(lengths[i % lengths.length] >> 1, r.nextInt(2048) , r.nextInt(2048));
|
|
testChar_constant_LT32B (r.nextInt(2048) , r.nextInt(2048));
|
|
testChar_constant_LT64B (r.nextInt(2048) , r.nextInt(2048));
|
|
|
|
testInt(lengths[i % lengths.length] >> 2, r.nextInt(2048) , r.nextInt(2048));
|
|
testInt_constant_LT32B (r.nextInt(2048) , r.nextInt(2048));
|
|
testInt_constant_LT64B (r.nextInt(2048) , r.nextInt(2048));
|
|
|
|
testLong(lengths[i % lengths.length] >> 3, r.nextInt(2048) , r.nextInt(2048));
|
|
testLong_constant_LT32B (r.nextInt(2048) , r.nextInt(2048));
|
|
testLong_constant_LT64B (r.nextInt(2048) , r.nextInt(2048));
|
|
}
|
|
System.out.println("PASS : " + validate_ctr);
|
|
} catch (Exception e) {
|
|
System.out.println(e.getMessage());
|
|
}
|
|
}
|
|
}
|