Sandhya Viswanathan 398ce2948c 8240248: Extend superword reduction optimizations for x86
Add support for and, or, xor reduction

Co-authored-by: Shravya Rukmannagari <shravya.rukmannagari@intel.com>
Reviewed-by: vlivanov, thartmann
2020-03-23 10:26:40 -07:00

239 lines
7.3 KiB
Java

/*
* Copyright (c) 2020, Oracle and/or its affiliates. All rights reserved.
* DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
*
* This code is free software; you can redistribute it and/or modify it
* under the terms of the GNU General Public License version 2 only, as
* published by the Free Software Foundation.
*
* This code is distributed in the hope that it will be useful, but WITHOUT
* ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
* FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
* version 2 for more details (a copy is included in the LICENSE file that
* accompanied this code).
*
* You should have received a copy of the GNU General Public License version
* 2 along with this work; if not, write to the Free Software Foundation,
* Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
*
* Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
* or visit www.oracle.com if you need additional information or have any
* questions.
*/
/**
* @test
* @bug 8240248
* @summary Add C2 x86 Superword support for scalar logical reduction optimizations : long test
*
* @run main/othervm -XX:+IgnoreUnrecognizedVMOptions -XX:LoopUnrollLimit=250
* -XX:CompileThresholdScaling=0.1
* -XX:-TieredCompilation
* -XX:+SuperWordReductions
* -XX:LoopMaxUnroll=2
* compiler.loopopts.superword.RedTest_long
* @run main/othervm -XX:+IgnoreUnrecognizedVMOptions -XX:LoopUnrollLimit=250
* -XX:CompileThresholdScaling=0.1
* -XX:-SuperWordReductions
* -XX:LoopMaxUnroll=2
* compiler.loopopts.superword.RedTest_long
*
* @run main/othervm -XX:+IgnoreUnrecognizedVMOptions -XX:LoopUnrollLimit=250
* -XX:CompileThresholdScaling=0.1
* -XX:-TieredCompilation
* -XX:+SuperWordReductions
* -XX:LoopMaxUnroll=4
* compiler.loopopts.superword.RedTest_long
* @run main/othervm -XX:+IgnoreUnrecognizedVMOptions -XX:LoopUnrollLimit=250
* -XX:CompileThresholdScaling=0.1
* -XX:-SuperWordReductions
* -XX:LoopMaxUnroll=4
* compiler.loopopts.superword.RedTest_long
*
* @run main/othervm -XX:+IgnoreUnrecognizedVMOptions -XX:LoopUnrollLimit=250
* -XX:CompileThresholdScaling=0.1
* -XX:-TieredCompilation
* -XX:+SuperWordReductions
* -XX:LoopMaxUnroll=8
* compiler.loopopts.superword.RedTest_long
* @run main/othervm -XX:+IgnoreUnrecognizedVMOptions -XX:LoopUnrollLimit=250
* -XX:CompileThresholdScaling=0.1
* -XX:-SuperWordReductions
* -XX:LoopMaxUnroll=8
* compiler.loopopts.superword.RedTest_long
*
* @run main/othervm -XX:+IgnoreUnrecognizedVMOptions -XX:LoopUnrollLimit=250
* -XX:CompileThresholdScaling=0.1
* -XX:-TieredCompilation
* -XX:+SuperWordReductions
* -XX:LoopMaxUnroll=16
* compiler.loopopts.superword.RedTest_long
* @run main/othervm -XX:+IgnoreUnrecognizedVMOptions -XX:LoopUnrollLimit=250
* -XX:CompileThresholdScaling=0.1
* -XX:-SuperWordReductions
* -XX:LoopMaxUnroll=16
* compiler.loopopts.superword.RedTest_long
*/
package compiler.loopopts.superword;
/**
 * Checks scalar reductions over {@code long} arrays: add, or, and, xor and multiply.
 *
 * <p>Every kernel writes {@code a[i]*b[i] + a[i]*c[i] + b[i]*c[i]} into {@code d[i]} and
 * folds the stored values into a single accumulator. {@link #main} calls each kernel
 * {@link #ITER} times, then recomputes the same fold from {@code d} with an independent
 * loop and compares the two results.
 */
public class RedTest_long {
    /** Length of each operand array allocated by {@link #main}. */
    static final int NUM = 512;
    /** How many times {@link #main} invokes each kernel before checking its result. */
    static final int ITER = 8000;

    /**
     * Runs the five reduction checks in order: add, or, and, xor, multiply.
     *
     * @param args unused
     * @throws Exception if any kernel result differs from the reference fold
     */
    public static void main(String[] args) throws Exception {
        final long[] srcA = new long[NUM];
        final long[] srcB = new long[NUM];
        final long[] srcC = new long[NUM];
        final long[] terms = new long[NUM];
        long result = 0;
        long expected;

        // Add, or, and, xor all run on the first data set.
        reductionInit1(srcA, srcB, srcC);

        for (int round = 0; round < ITER; round++) {
            result = sumReductionImplement(srcA, srcB, srcC, terms);
        }
        expected = 0;
        for (long term : terms) {
            expected += term;
        }
        testCorrectness(result, expected, "Add Reduction");

        for (int round = 0; round < ITER; round++) {
            result = orReductionImplement(srcA, srcB, srcC, terms);
        }
        expected = 0;
        for (long term : terms) {
            expected |= term;
        }
        testCorrectness(result, expected, "Or Reduction");

        for (int round = 0; round < ITER; round++) {
            result = andReductionImplement(srcA, srcB, srcC, terms);
        }
        expected = -1;
        for (long term : terms) {
            expected &= term;
        }
        testCorrectness(result, expected, "And Reduction");

        for (int round = 0; round < ITER; round++) {
            result = xorReductionImplement(srcA, srcB, srcC, terms);
        }
        // The xor kernel seeds its accumulator with -1, so the reference does too.
        expected = -1;
        for (long term : terms) {
            expected ^= term;
        }
        testCorrectness(result, expected, "Xor Reduction");

        // The multiply check switches to the second, constant data set.
        reductionInit2(srcA, srcB, srcC);

        for (int round = 0; round < ITER; round++) {
            result = mulReductionImplement(srcA, srcB, srcC, terms);
        }
        expected = 1;
        for (long term : terms) {
            expected *= term;
        }
        testCorrectness(result, expected, "Mul Reduction");
    }

    /**
     * Fills the inputs with values that alternate with the parity of the index:
     * {@code 0x4099}/{@code 0x409A} for {@code a}, {@code 0x1033}/{@code 0x1034} for
     * {@code b}, {@code 0x455}/{@code 0x456} for {@code c}.
     *
     * @param a first operand array; its length bounds the loop
     * @param b second operand array
     * @param c third operand array
     */
    public static void reductionInit1(long[] a, long[] b, long[] c) {
        for (int pos = 0; pos < a.length; pos++) {
            final int parity = pos % 2;
            a[pos] = parity + 0x4099;
            b[pos] = parity + 0x1033;
            c[pos] = parity + 0x455;
        }
    }

    /**
     * Fills the inputs with constants: {@code 0x11}, {@code 0x12} and {@code 0x13}.
     *
     * @param a first operand array; its length bounds the loop
     * @param b second operand array
     * @param c third operand array
     */
    public static void reductionInit2(long[] a, long[] b, long[] c) {
        for (int pos = 0; pos < a.length; pos++) {
            a[pos] = 0x11;
            b[pos] = 0x12;
            c[pos] = 0x13;
        }
    }

    /**
     * Stores the pairwise-product sum into {@code d} and returns the sum of all stored values.
     *
     * @param a first operand array; its length bounds the loop
     * @param b second operand array
     * @param c third operand array
     * @param d output array receiving one value per index
     * @return sum of the values written to {@code d}, starting from 0
     */
    public static long sumReductionImplement(long[] a, long[] b, long[] c, long[] d) {
        long acc = 0;
        for (int idx = 0; idx < a.length; idx++) {
            d[idx] = (a[idx] * b[idx]) + (a[idx] * c[idx]) + (b[idx] * c[idx]);
            acc = acc + d[idx];
        }
        return acc;
    }

    /**
     * Stores the pairwise-product sum into {@code d} and returns the bitwise OR of all
     * stored values.
     *
     * @param a first operand array; its length bounds the loop
     * @param b second operand array
     * @param c third operand array
     * @param d output array receiving one value per index
     * @return OR of the values written to {@code d}, starting from 0
     */
    public static long orReductionImplement(long[] a, long[] b, long[] c, long[] d) {
        long acc = 0;
        for (int idx = 0; idx < a.length; idx++) {
            d[idx] = (a[idx] * b[idx]) + (a[idx] * c[idx]) + (b[idx] * c[idx]);
            acc = acc | d[idx];
        }
        return acc;
    }

    /**
     * Stores the pairwise-product sum into {@code d} and returns the bitwise AND of all
     * stored values.
     *
     * @param a first operand array; its length bounds the loop
     * @param b second operand array
     * @param c third operand array
     * @param d output array receiving one value per index
     * @return AND of the values written to {@code d}, starting from -1 (all bits set)
     */
    public static long andReductionImplement(long[] a, long[] b, long[] c, long[] d) {
        long acc = -1;
        for (int idx = 0; idx < a.length; idx++) {
            d[idx] = (a[idx] * b[idx]) + (a[idx] * c[idx]) + (b[idx] * c[idx]);
            acc = acc & d[idx];
        }
        return acc;
    }

    /**
     * Stores the pairwise-product sum into {@code d} and returns the bitwise XOR of all
     * stored values.
     *
     * @param a first operand array; its length bounds the loop
     * @param b second operand array
     * @param c third operand array
     * @param d output array receiving one value per index
     * @return XOR of the values written to {@code d}, starting from -1
     */
    public static long xorReductionImplement(long[] a, long[] b, long[] c, long[] d) {
        long acc = -1;
        for (int idx = 0; idx < a.length; idx++) {
            d[idx] = (a[idx] * b[idx]) + (a[idx] * c[idx]) + (b[idx] * c[idx]);
            acc = acc ^ d[idx];
        }
        return acc;
    }

    /**
     * Stores the pairwise-product sum into {@code d} and returns the product of all
     * stored values (with ordinary {@code long} wrap-around).
     *
     * @param a first operand array; its length bounds the loop
     * @param b second operand array
     * @param c third operand array
     * @param d output array receiving one value per index
     * @return product of the values written to {@code d}, starting from 1
     */
    public static long mulReductionImplement(long[] a, long[] b, long[] c, long[] d) {
        long acc = 1;
        for (int idx = 0; idx < a.length; idx++) {
            d[idx] = (a[idx] * b[idx]) + (a[idx] * c[idx]) + (b[idx] * c[idx]);
            acc *= d[idx];
        }
        return acc;
    }

    /**
     * Compares a kernel result with its reference value and reports the outcome on stdout.
     *
     * @param total value returned by the kernel
     * @param valid reference value
     * @param op label used in the printed and thrown messages
     * @throws Exception with message {@code op + ": Failed"} when the two values differ
     */
    public static void testCorrectness(long total, long valid, String op) throws Exception {
        if (total != valid) {
            System.out.println("Invalid total: " + total);
            System.out.println("Expected value = " + valid);
            throw new Exception(op + ": Failed");
        }
        System.out.println(op + ": Success");
    }
}