89 lines
2.8 KiB
Java
89 lines
2.8 KiB
Java
|
/*
 * Copyright (C) 2021 THL A29 Limited, a Tencent company. All rights reserved.
 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
 *
 * This code is free software; you can redistribute it and/or modify it
 * under the terms of the GNU General Public License version 2 only, as
 * published by the Free Software Foundation.
 *
 * This code is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
 * version 2 for more details (a copy is included in the LICENSE file that
 * accompanied this code).
 *
 * You should have received a copy of the GNU General Public License version
 * 2 along with this work; if not, write to the Free Software Foundation,
 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
 *
 * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
 * or visit www.oracle.com if you need additional information or have any
 * questions.
 */
|
||
|
|
||
|
package org.openjdk.bench.vm.compiler;
|
||
|
|
||
|
import org.openjdk.jmh.annotations.*;
|
||
|
import org.openjdk.jmh.infra.*;
|
||
|
import java.util.concurrent.TimeUnit;
|
||
|
|
||
|
@Warmup(iterations = 3, time = 5, timeUnit = TimeUnit.SECONDS)
|
||
|
@Measurement(iterations = 4, time = 5, timeUnit = TimeUnit.SECONDS)
|
||
|
@BenchmarkMode(Mode.Throughput)
|
||
|
@OutputTimeUnit(TimeUnit.SECONDS)
|
||
|
@State(Scope.Thread)
|
||
|
@Fork(value=1)
|
||
|
public class LoopUnroll {
|
||
|
@Param({"16", "32", "64", "128", "256", "512", "1024"})
|
||
|
private int VECLEN;
|
||
|
|
||
|
private byte[][] a;
|
||
|
private byte[][] b;
|
||
|
private byte[][] c;
|
||
|
|
||
|
@Setup
|
||
|
public void init() {
|
||
|
a = new byte[VECLEN][VECLEN];
|
||
|
b = new byte[VECLEN][VECLEN];
|
||
|
c = new byte[VECLEN][VECLEN];
|
||
|
}
|
||
|
|
||
|
@CompilerControl(CompilerControl.Mode.DONT_INLINE)
|
||
|
private int run_workload1(int count, byte[][] a , byte[][] b, byte[][] c) {
|
||
|
for(int i = 0; i < a.length; i++) {
|
||
|
for (int j = 0; j < a[0].length; j++) {
|
||
|
a[i][j] = (byte)(b[i][j] + c[i][j]);
|
||
|
}
|
||
|
}
|
||
|
return a[count][count];
|
||
|
}
|
||
|
|
||
|
@Benchmark
|
||
|
public void workload1_caller(Blackhole bh) {
|
||
|
int r = 0;
|
||
|
for(int i = 0 ; i < 100; i++) {
|
||
|
r += run_workload1(i % a.length, a, b, c);
|
||
|
}
|
||
|
bh.consume(r);
|
||
|
}
|
||
|
|
||
|
@CompilerControl(CompilerControl.Mode.DONT_INLINE)
|
||
|
private int run_workload2(int count, byte[][] a , byte[][] b) {
|
||
|
for(int i = 0; i < b.length; i++) {
|
||
|
for (int j = 0; j < b[0].length; j++) {
|
||
|
a[i][j] = b[i][j];
|
||
|
}
|
||
|
}
|
||
|
return a[count][count];
|
||
|
}
|
||
|
|
||
|
@Benchmark
|
||
|
public void workload2_caller(Blackhole bh) {
|
||
|
int r = 0;
|
||
|
for(int i = 0 ; i < 100; i++) {
|
||
|
r += run_workload2(i % a.length, a, b);
|
||
|
}
|
||
|
bh.consume(r);
|
||
|
}
|
||
|
}
|