< prev index next >
test/jdk/jdk/incubator/vector/benchmark/src/main/java/benchmark/jdk/incubator/vector/LongScalar.java
Print this page
rev 55606 : 8221812: Fine-tune jmh test for vector api
Summary: To compare the performance of the Vector API and auto-vectorization, the Vector
API and scalar test cases are updated so that they stay aligned.
Reviewed-by: duke
*** 1,7 ****
/*
! * Copyright (c) 2018, Oracle and/or its affiliates. All rights reserved.
* DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
*
* This code is free software; you can redistribute it and/or modify it
* under the terms of the GNU General Public License version 2 only, as
* published by the Free Software Foundation.
--- 1,7 ----
/*
! * Copyright (c) 2018, 2019, Oracle and/or its affiliates. All rights reserved.
* DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
*
* This code is free software; you can redistribute it and/or modify it
* under the terms of the GNU General Public License version 2 only, as
* published by the Free Software Foundation.
*** 25,42 ****
--- 25,45 ----
import java.util.concurrent.TimeUnit;
import java.util.function.IntFunction;
import org.openjdk.jmh.annotations.*;
+ import org.openjdk.jmh.infra.Blackhole;
@BenchmarkMode(Mode.Throughput)
@OutputTimeUnit(TimeUnit.MILLISECONDS)
@State(Scope.Benchmark)
@Warmup(iterations = 3, time = 1)
@Measurement(iterations = 5, time = 1)
@Fork(value = 1, jvmArgsPrepend = {"--add-modules=jdk.incubator.vector"})
public class LongScalar extends AbstractVectorBenchmark {
+ static final int INVOC_COUNT = 1; // To align with vector benchmarks.
+
@Param("1024")
int size;
long[] fill(IntFunction<Long> f) {
long[] array = new long[size];
*** 70,515 ****
final IntFunction<boolean[]> fmr = vl -> rms;
final IntFunction<int[]> fs = vl -> ss;
@Benchmark
! public Object add() {
long[] as = fa.apply(size);
long[] bs = fb.apply(size);
long[] rs = fr.apply(size);
for (int i = 0; i < as.length; i++) {
long a = as[i];
long b = bs[i];
rs[i] = (long)(a + b);
}
! return rs;
}
@Benchmark
! public Object addMasked() {
long[] as = fa.apply(size);
long[] bs = fb.apply(size);
long[] rs = fr.apply(size);
boolean[] ms = fm.apply(size);
for (int i = 0; i < as.length; i++) {
long a = as[i];
long b = bs[i];
if (ms[i % ms.length]) {
rs[i] = (long)(a + b);
} else {
rs[i] = a;
}
}
! return rs;
}
@Benchmark
! public Object sub() {
long[] as = fa.apply(size);
long[] bs = fb.apply(size);
long[] rs = fr.apply(size);
for (int i = 0; i < as.length; i++) {
long a = as[i];
long b = bs[i];
rs[i] = (long)(a - b);
}
! return rs;
}
@Benchmark
! public Object subMasked() {
long[] as = fa.apply(size);
long[] bs = fb.apply(size);
long[] rs = fr.apply(size);
boolean[] ms = fm.apply(size);
for (int i = 0; i < as.length; i++) {
long a = as[i];
long b = bs[i];
if (ms[i % ms.length]) {
rs[i] = (long)(a - b);
} else {
rs[i] = a;
}
}
! return rs;
}
@Benchmark
! public Object mul() {
long[] as = fa.apply(size);
long[] bs = fb.apply(size);
long[] rs = fr.apply(size);
for (int i = 0; i < as.length; i++) {
long a = as[i];
long b = bs[i];
rs[i] = (long)(a * b);
}
! return rs;
}
@Benchmark
! public Object mulMasked() {
long[] as = fa.apply(size);
long[] bs = fb.apply(size);
long[] rs = fr.apply(size);
boolean[] ms = fm.apply(size);
for (int i = 0; i < as.length; i++) {
long a = as[i];
long b = bs[i];
if (ms[i % ms.length]) {
rs[i] = (long)(a * b);
} else {
rs[i] = a;
}
}
! return rs;
}
@Benchmark
! public Object and() {
long[] as = fa.apply(size);
long[] bs = fb.apply(size);
long[] rs = fr.apply(size);
for (int i = 0; i < as.length; i++) {
long a = as[i];
long b = bs[i];
rs[i] = (long)(a & b);
}
! return rs;
}
@Benchmark
! public Object andMasked() {
long[] as = fa.apply(size);
long[] bs = fb.apply(size);
long[] rs = fr.apply(size);
boolean[] ms = fm.apply(size);
for (int i = 0; i < as.length; i++) {
long a = as[i];
long b = bs[i];
if (ms[i % ms.length]) {
rs[i] = (long)(a & b);
} else {
rs[i] = a;
}
}
! return rs;
}
@Benchmark
! public Object or() {
long[] as = fa.apply(size);
long[] bs = fb.apply(size);
long[] rs = fr.apply(size);
for (int i = 0; i < as.length; i++) {
long a = as[i];
long b = bs[i];
rs[i] = (long)(a | b);
}
! return rs;
}
@Benchmark
! public Object orMasked() {
long[] as = fa.apply(size);
long[] bs = fb.apply(size);
long[] rs = fr.apply(size);
boolean[] ms = fm.apply(size);
for (int i = 0; i < as.length; i++) {
long a = as[i];
long b = bs[i];
if (ms[i % ms.length]) {
rs[i] = (long)(a | b);
} else {
rs[i] = a;
}
}
! return rs;
}
@Benchmark
! public Object xor() {
long[] as = fa.apply(size);
long[] bs = fb.apply(size);
long[] rs = fr.apply(size);
for (int i = 0; i < as.length; i++) {
long a = as[i];
long b = bs[i];
rs[i] = (long)(a ^ b);
}
! return rs;
}
@Benchmark
! public Object xorMasked() {
long[] as = fa.apply(size);
long[] bs = fb.apply(size);
long[] rs = fr.apply(size);
boolean[] ms = fm.apply(size);
for (int i = 0; i < as.length; i++) {
long a = as[i];
long b = bs[i];
if (ms[i % ms.length]) {
rs[i] = (long)(a ^ b);
} else {
rs[i] = a;
}
}
! return rs;
}
@Benchmark
! public Object shiftR() {
long[] as = fa.apply(size);
long[] bs = fb.apply(size);
long[] rs = fr.apply(size);
for (int i = 0; i < as.length; i++) {
long a = as[i];
long b = bs[i];
rs[i] = (long)((a >>> b));
}
! return rs;
}
@Benchmark
! public Object shiftRMasked() {
long[] as = fa.apply(size);
long[] bs = fb.apply(size);
long[] rs = fr.apply(size);
boolean[] ms = fm.apply(size);
for (int i = 0; i < as.length; i++) {
long a = as[i];
long b = bs[i];
if (ms[i % ms.length]) {
rs[i] = (long)((a >>> b));
} else {
rs[i] = a;
}
}
! return rs;
}
@Benchmark
! public Object shiftL() {
long[] as = fa.apply(size);
long[] bs = fb.apply(size);
long[] rs = fr.apply(size);
for (int i = 0; i < as.length; i++) {
long a = as[i];
long b = bs[i];
rs[i] = (long)((a << b));
}
! return rs;
}
@Benchmark
! public Object shiftLMasked() {
long[] as = fa.apply(size);
long[] bs = fb.apply(size);
long[] rs = fr.apply(size);
boolean[] ms = fm.apply(size);
for (int i = 0; i < as.length; i++) {
long a = as[i];
long b = bs[i];
if (ms[i % ms.length]) {
rs[i] = (long)((a << b));
} else {
rs[i] = a;
}
}
! return rs;
}
@Benchmark
! public Object aShiftR() {
long[] as = fa.apply(size);
long[] bs = fb.apply(size);
long[] rs = fr.apply(size);
for (int i = 0; i < as.length; i++) {
long a = as[i];
long b = bs[i];
rs[i] = (long)((a >> b));
}
! return rs;
}
@Benchmark
! public Object aShiftRMasked() {
long[] as = fa.apply(size);
long[] bs = fb.apply(size);
long[] rs = fr.apply(size);
boolean[] ms = fm.apply(size);
for (int i = 0; i < as.length; i++) {
long a = as[i];
long b = bs[i];
if (ms[i % ms.length]) {
rs[i] = (long)((a >> b));
} else {
rs[i] = a;
}
}
! return rs;
}
@Benchmark
! public Object aShiftRShift() {
long[] as = fa.apply(size);
long[] bs = fb.apply(size);
long[] rs = fr.apply(size);
for (int i = 0; i < as.length; i++) {
long a = as[i];
long b = bs[i];
rs[i] = (long)((a >> b));
}
! return rs;
}
@Benchmark
! public Object aShiftRMaskedShift() {
long[] as = fa.apply(size);
long[] bs = fb.apply(size);
long[] rs = fr.apply(size);
boolean[] ms = fm.apply(size);
for (int i = 0; i < as.length; i++) {
long a = as[i];
long b = bs[i];
boolean m = ms[i % ms.length];
rs[i] = (m ? (long)((a >> b)) : a);
}
! return rs;
}
@Benchmark
! public Object shiftRShift() {
long[] as = fa.apply(size);
long[] bs = fb.apply(size);
long[] rs = fr.apply(size);
for (int i = 0; i < as.length; i++) {
long a = as[i];
long b = bs[i];
rs[i] = (long)((a >>> b));
}
! return rs;
}
@Benchmark
! public Object shiftRMaskedShift() {
long[] as = fa.apply(size);
long[] bs = fb.apply(size);
long[] rs = fr.apply(size);
boolean[] ms = fm.apply(size);
for (int i = 0; i < as.length; i++) {
long a = as[i];
long b = bs[i];
boolean m = ms[i % ms.length];
rs[i] = (m ? (long)((a >>> b)) : a);
}
! return rs;
}
@Benchmark
! public Object shiftLShift() {
long[] as = fa.apply(size);
long[] bs = fb.apply(size);
long[] rs = fr.apply(size);
for (int i = 0; i < as.length; i++) {
long a = as[i];
long b = bs[i];
rs[i] = (long)((a << b));
}
! return rs;
}
@Benchmark
! public Object shiftLMaskedShift() {
long[] as = fa.apply(size);
long[] bs = fb.apply(size);
long[] rs = fr.apply(size);
boolean[] ms = fm.apply(size);
for (int i = 0; i < as.length; i++) {
long a = as[i];
long b = bs[i];
boolean m = ms[i % ms.length];
rs[i] = (m ? (long)((a << b)) : a);
}
! return rs;
}
--- 73,566 ----
final IntFunction<boolean[]> fmr = vl -> rms;
final IntFunction<int[]> fs = vl -> ss;
// Scalar baseline for element-wise addition: rs[i] = as[i] + bs[i].
// The outer loop repeats the whole pass INVOC_COUNT times; rs is then passed to bh.consume.
@Benchmark
! public void add(Blackhole bh) {
long[] as = fa.apply(size);
long[] bs = fb.apply(size);
long[] rs = fr.apply(size);
+ for (int ic = 0; ic < INVOC_COUNT; ic++) {
for (int i = 0; i < as.length; i++) {
long a = as[i];
long b = bs[i];
rs[i] = (long)(a + b);
}
+ }
! bh.consume(rs);
}
// Masked addition: rs[i] = as[i] + bs[i] where the mask is set, otherwise rs[i] = as[i].
// The mask index wraps modulo ms.length. The pass is repeated INVOC_COUNT times.
@Benchmark
! public void addMasked(Blackhole bh) {
long[] as = fa.apply(size);
long[] bs = fb.apply(size);
long[] rs = fr.apply(size);
boolean[] ms = fm.apply(size);
+ for (int ic = 0; ic < INVOC_COUNT; ic++) {
for (int i = 0; i < as.length; i++) {
long a = as[i];
long b = bs[i];
if (ms[i % ms.length]) {
rs[i] = (long)(a + b);
} else {
rs[i] = a;
}
}
! }
! bh.consume(rs);
}
// Scalar baseline for element-wise subtraction: rs[i] = as[i] - bs[i].
// The outer loop repeats the whole pass INVOC_COUNT times; rs is then passed to bh.consume.
@Benchmark
! public void sub(Blackhole bh) {
long[] as = fa.apply(size);
long[] bs = fb.apply(size);
long[] rs = fr.apply(size);
+ for (int ic = 0; ic < INVOC_COUNT; ic++) {
for (int i = 0; i < as.length; i++) {
long a = as[i];
long b = bs[i];
rs[i] = (long)(a - b);
}
+ }
! bh.consume(rs);
}
// Masked subtraction: rs[i] = as[i] - bs[i] where the mask is set, otherwise rs[i] = as[i].
// The mask index wraps modulo ms.length. The pass is repeated INVOC_COUNT times.
@Benchmark
! public void subMasked(Blackhole bh) {
long[] as = fa.apply(size);
long[] bs = fb.apply(size);
long[] rs = fr.apply(size);
boolean[] ms = fm.apply(size);
+ for (int ic = 0; ic < INVOC_COUNT; ic++) {
for (int i = 0; i < as.length; i++) {
long a = as[i];
long b = bs[i];
if (ms[i % ms.length]) {
rs[i] = (long)(a - b);
} else {
rs[i] = a;
}
}
! }
! bh.consume(rs);
}
// Scalar baseline for element-wise multiplication: rs[i] = as[i] * bs[i].
// The outer loop repeats the whole pass INVOC_COUNT times; rs is then passed to bh.consume.
@Benchmark
! public void mul(Blackhole bh) {
long[] as = fa.apply(size);
long[] bs = fb.apply(size);
long[] rs = fr.apply(size);
+ for (int ic = 0; ic < INVOC_COUNT; ic++) {
for (int i = 0; i < as.length; i++) {
long a = as[i];
long b = bs[i];
rs[i] = (long)(a * b);
}
+ }
! bh.consume(rs);
}
// Masked multiplication: rs[i] = as[i] * bs[i] where the mask is set, otherwise rs[i] = as[i].
// The mask index wraps modulo ms.length. The pass is repeated INVOC_COUNT times.
@Benchmark
! public void mulMasked(Blackhole bh) {
long[] as = fa.apply(size);
long[] bs = fb.apply(size);
long[] rs = fr.apply(size);
boolean[] ms = fm.apply(size);
+ for (int ic = 0; ic < INVOC_COUNT; ic++) {
for (int i = 0; i < as.length; i++) {
long a = as[i];
long b = bs[i];
if (ms[i % ms.length]) {
rs[i] = (long)(a * b);
} else {
rs[i] = a;
}
}
! }
! bh.consume(rs);
}
// Scalar baseline for element-wise bitwise AND: rs[i] = as[i] & bs[i].
// The outer loop repeats the whole pass INVOC_COUNT times; rs is then passed to bh.consume.
@Benchmark
! public void and(Blackhole bh) {
long[] as = fa.apply(size);
long[] bs = fb.apply(size);
long[] rs = fr.apply(size);
+ for (int ic = 0; ic < INVOC_COUNT; ic++) {
for (int i = 0; i < as.length; i++) {
long a = as[i];
long b = bs[i];
rs[i] = (long)(a & b);
}
+ }
! bh.consume(rs);
}
// Masked bitwise AND: rs[i] = as[i] & bs[i] where the mask is set, otherwise rs[i] = as[i].
// The mask index wraps modulo ms.length. The pass is repeated INVOC_COUNT times.
@Benchmark
! public void andMasked(Blackhole bh) {
long[] as = fa.apply(size);
long[] bs = fb.apply(size);
long[] rs = fr.apply(size);
boolean[] ms = fm.apply(size);
+ for (int ic = 0; ic < INVOC_COUNT; ic++) {
for (int i = 0; i < as.length; i++) {
long a = as[i];
long b = bs[i];
if (ms[i % ms.length]) {
rs[i] = (long)(a & b);
} else {
rs[i] = a;
}
}
! }
! bh.consume(rs);
}
// Scalar baseline for element-wise bitwise OR: rs[i] = as[i] | bs[i].
// The outer loop repeats the whole pass INVOC_COUNT times; rs is then passed to bh.consume.
@Benchmark
! public void or(Blackhole bh) {
long[] as = fa.apply(size);
long[] bs = fb.apply(size);
long[] rs = fr.apply(size);
+ for (int ic = 0; ic < INVOC_COUNT; ic++) {
for (int i = 0; i < as.length; i++) {
long a = as[i];
long b = bs[i];
rs[i] = (long)(a | b);
}
+ }
! bh.consume(rs);
}
// Masked bitwise OR: rs[i] = as[i] | bs[i] where the mask is set, otherwise rs[i] = as[i].
// The mask index wraps modulo ms.length. The pass is repeated INVOC_COUNT times.
@Benchmark
! public void orMasked(Blackhole bh) {
long[] as = fa.apply(size);
long[] bs = fb.apply(size);
long[] rs = fr.apply(size);
boolean[] ms = fm.apply(size);
+ for (int ic = 0; ic < INVOC_COUNT; ic++) {
for (int i = 0; i < as.length; i++) {
long a = as[i];
long b = bs[i];
if (ms[i % ms.length]) {
rs[i] = (long)(a | b);
} else {
rs[i] = a;
}
}
! }
! bh.consume(rs);
}
// Scalar baseline for element-wise bitwise XOR: rs[i] = as[i] ^ bs[i].
// The outer loop repeats the whole pass INVOC_COUNT times; rs is then passed to bh.consume.
@Benchmark
! public void xor(Blackhole bh) {
long[] as = fa.apply(size);
long[] bs = fb.apply(size);
long[] rs = fr.apply(size);
+ for (int ic = 0; ic < INVOC_COUNT; ic++) {
for (int i = 0; i < as.length; i++) {
long a = as[i];
long b = bs[i];
rs[i] = (long)(a ^ b);
}
+ }
! bh.consume(rs);
}
// Masked bitwise XOR: rs[i] = as[i] ^ bs[i] where the mask is set, otherwise rs[i] = as[i].
// The mask index wraps modulo ms.length. The pass is repeated INVOC_COUNT times.
@Benchmark
! public void xorMasked(Blackhole bh) {
long[] as = fa.apply(size);
long[] bs = fb.apply(size);
long[] rs = fr.apply(size);
boolean[] ms = fm.apply(size);
+ for (int ic = 0; ic < INVOC_COUNT; ic++) {
for (int i = 0; i < as.length; i++) {
long a = as[i];
long b = bs[i];
if (ms[i % ms.length]) {
rs[i] = (long)(a ^ b);
} else {
rs[i] = a;
}
}
! }
! bh.consume(rs);
}
// Scalar baseline for element-wise logical (unsigned) right shift: rs[i] = as[i] >>> bs[i].
// For a long left operand Java uses only the low six bits of the shift count.
// The outer loop repeats the whole pass INVOC_COUNT times; rs is then passed to bh.consume.
@Benchmark
! public void shiftR(Blackhole bh) {
long[] as = fa.apply(size);
long[] bs = fb.apply(size);
long[] rs = fr.apply(size);
+ for (int ic = 0; ic < INVOC_COUNT; ic++) {
for (int i = 0; i < as.length; i++) {
long a = as[i];
long b = bs[i];
rs[i] = (long)((a >>> b));
}
+ }
! bh.consume(rs);
}
// Masked logical right shift: rs[i] = as[i] >>> bs[i] where the mask is set, otherwise rs[i] = as[i].
// The mask index wraps modulo ms.length. The pass is repeated INVOC_COUNT times.
@Benchmark
! public void shiftRMasked(Blackhole bh) {
long[] as = fa.apply(size);
long[] bs = fb.apply(size);
long[] rs = fr.apply(size);
boolean[] ms = fm.apply(size);
+ for (int ic = 0; ic < INVOC_COUNT; ic++) {
for (int i = 0; i < as.length; i++) {
long a = as[i];
long b = bs[i];
if (ms[i % ms.length]) {
rs[i] = (long)((a >>> b));
} else {
rs[i] = a;
}
}
! }
! bh.consume(rs);
}
// Scalar baseline for element-wise left shift: rs[i] = as[i] << bs[i].
// For a long left operand Java uses only the low six bits of the shift count.
// The outer loop repeats the whole pass INVOC_COUNT times; rs is then passed to bh.consume.
@Benchmark
! public void shiftL(Blackhole bh) {
long[] as = fa.apply(size);
long[] bs = fb.apply(size);
long[] rs = fr.apply(size);
+ for (int ic = 0; ic < INVOC_COUNT; ic++) {
for (int i = 0; i < as.length; i++) {
long a = as[i];
long b = bs[i];
rs[i] = (long)((a << b));
}
+ }
! bh.consume(rs);
}
// Masked left shift: rs[i] = as[i] << bs[i] where the mask is set, otherwise rs[i] = as[i].
// The mask index wraps modulo ms.length. The pass is repeated INVOC_COUNT times.
@Benchmark
! public void shiftLMasked(Blackhole bh) {
long[] as = fa.apply(size);
long[] bs = fb.apply(size);
long[] rs = fr.apply(size);
boolean[] ms = fm.apply(size);
+ for (int ic = 0; ic < INVOC_COUNT; ic++) {
for (int i = 0; i < as.length; i++) {
long a = as[i];
long b = bs[i];
if (ms[i % ms.length]) {
rs[i] = (long)((a << b));
} else {
rs[i] = a;
}
}
! }
! bh.consume(rs);
}
// Scalar baseline for element-wise arithmetic (sign-propagating) right shift: rs[i] = as[i] >> bs[i].
// For a long left operand Java uses only the low six bits of the shift count.
// The outer loop repeats the whole pass INVOC_COUNT times; rs is then passed to bh.consume.
@Benchmark
! public void aShiftR(Blackhole bh) {
long[] as = fa.apply(size);
long[] bs = fb.apply(size);
long[] rs = fr.apply(size);
+ for (int ic = 0; ic < INVOC_COUNT; ic++) {
for (int i = 0; i < as.length; i++) {
long a = as[i];
long b = bs[i];
rs[i] = (long)((a >> b));
}
+ }
! bh.consume(rs);
}
// Masked arithmetic right shift: rs[i] = as[i] >> bs[i] where the mask is set, otherwise rs[i] = as[i].
// The mask index wraps modulo ms.length. The pass is repeated INVOC_COUNT times.
@Benchmark
! public void aShiftRMasked(Blackhole bh) {
long[] as = fa.apply(size);
long[] bs = fb.apply(size);
long[] rs = fr.apply(size);
boolean[] ms = fm.apply(size);
+ for (int ic = 0; ic < INVOC_COUNT; ic++) {
for (int i = 0; i < as.length; i++) {
long a = as[i];
long b = bs[i];
if (ms[i % ms.length]) {
rs[i] = (long)((a >> b));
} else {
rs[i] = a;
}
}
! }
! bh.consume(rs);
}
// Element-wise arithmetic right shift: rs[i] = as[i] >> bs[i]. The scalar loop body is the
// same expression as in aShiftR.
// NOTE(review): presumably kept as a separate benchmark to pair with a distinct
// vector-side "shift" benchmark - confirm.
@Benchmark
! public void aShiftRShift(Blackhole bh) {
long[] as = fa.apply(size);
long[] bs = fb.apply(size);
long[] rs = fr.apply(size);
+ for (int ic = 0; ic < INVOC_COUNT; ic++) {
for (int i = 0; i < as.length; i++) {
long a = as[i];
long b = bs[i];
rs[i] = (long)((a >> b));
}
+ }
! bh.consume(rs);
}
// Masked arithmetic right shift written as a ternary select: rs[i] = m ? (as[i] >> bs[i]) : as[i],
// with m = ms[i % ms.length] (mask index wraps). The pass is repeated INVOC_COUNT times.
@Benchmark
! public void aShiftRMaskedShift(Blackhole bh) {
long[] as = fa.apply(size);
long[] bs = fb.apply(size);
long[] rs = fr.apply(size);
boolean[] ms = fm.apply(size);
+ for (int ic = 0; ic < INVOC_COUNT; ic++) {
for (int i = 0; i < as.length; i++) {
long a = as[i];
long b = bs[i];
boolean m = ms[i % ms.length];
rs[i] = (m ? (long)((a >> b)) : a);
}
+ }
! bh.consume(rs);
}
// Element-wise logical right shift: rs[i] = as[i] >>> bs[i]. The scalar loop body is the
// same expression as in shiftR.
// NOTE(review): presumably kept as a separate benchmark to pair with a distinct
// vector-side "shift" benchmark - confirm.
@Benchmark
! public void shiftRShift(Blackhole bh) {
long[] as = fa.apply(size);
long[] bs = fb.apply(size);
long[] rs = fr.apply(size);
+ for (int ic = 0; ic < INVOC_COUNT; ic++) {
for (int i = 0; i < as.length; i++) {
long a = as[i];
long b = bs[i];
rs[i] = (long)((a >>> b));
}
+ }
! bh.consume(rs);
}
// Masked logical right shift written as a ternary select: rs[i] = m ? (as[i] >>> bs[i]) : as[i],
// with m = ms[i % ms.length] (mask index wraps). The pass is repeated INVOC_COUNT times.
@Benchmark
! public void shiftRMaskedShift(Blackhole bh) {
long[] as = fa.apply(size);
long[] bs = fb.apply(size);
long[] rs = fr.apply(size);
boolean[] ms = fm.apply(size);
+ for (int ic = 0; ic < INVOC_COUNT; ic++) {
for (int i = 0; i < as.length; i++) {
long a = as[i];
long b = bs[i];
boolean m = ms[i % ms.length];
rs[i] = (m ? (long)((a >>> b)) : a);
}
+ }
! bh.consume(rs);
}
// Element-wise left shift: rs[i] = as[i] << bs[i]. The scalar loop body is the
// same expression as in shiftL.
// NOTE(review): presumably kept as a separate benchmark to pair with a distinct
// vector-side "shift" benchmark - confirm.
@Benchmark
! public void shiftLShift(Blackhole bh) {
long[] as = fa.apply(size);
long[] bs = fb.apply(size);
long[] rs = fr.apply(size);
+ for (int ic = 0; ic < INVOC_COUNT; ic++) {
for (int i = 0; i < as.length; i++) {
long a = as[i];
long b = bs[i];
rs[i] = (long)((a << b));
}
+ }
! bh.consume(rs);
}
// Masked left shift written as a ternary select: rs[i] = m ? (as[i] << bs[i]) : as[i],
// with m = ms[i % ms.length] (mask index wraps). The pass is repeated INVOC_COUNT times.
@Benchmark
! public void shiftLMaskedShift(Blackhole bh) {
long[] as = fa.apply(size);
long[] bs = fb.apply(size);
long[] rs = fr.apply(size);
boolean[] ms = fm.apply(size);
+ for (int ic = 0; ic < INVOC_COUNT; ic++) {
for (int i = 0; i < as.length; i++) {
long a = as[i];
long b = bs[i];
boolean m = ms[i % ms.length];
rs[i] = (m ? (long)((a << b)) : a);
}
+ }
! bh.consume(rs);
}
*** 522,798 ****
@Benchmark
! public Object max() {
long[] as = fa.apply(size);
long[] bs = fb.apply(size);
long[] rs = fr.apply(size);
for (int i = 0; i < as.length; i++) {
long a = as[i];
long b = bs[i];
rs[i] = (long)(Math.max(a, b));
}
! return rs;
}
@Benchmark
! public Object min() {
long[] as = fa.apply(size);
long[] bs = fb.apply(size);
long[] rs = fr.apply(size);
for (int i = 0; i < as.length; i++) {
long a = as[i];
long b = bs[i];
rs[i] = (long)(Math.min(a, b));
}
! return rs;
}
@Benchmark
! public long andAll() {
long[] as = fa.apply(size);
long r = -1;
for (int i = 0; i < as.length; i++) {
r &= as[i];
}
! return r;
}
@Benchmark
! public long orAll() {
long[] as = fa.apply(size);
long r = 0;
for (int i = 0; i < as.length; i++) {
r |= as[i];
}
! return r;
}
@Benchmark
! public long xorAll() {
long[] as = fa.apply(size);
long r = 0;
for (int i = 0; i < as.length; i++) {
r ^= as[i];
}
! return r;
}
@Benchmark
! public long addAll() {
long[] as = fa.apply(size);
long r = 0;
for (int i = 0; i < as.length; i++) {
r += as[i];
}
! return r;
}
@Benchmark
! public long mulAll() {
long[] as = fa.apply(size);
long r = 1;
for (int i = 0; i < as.length; i++) {
r *= as[i];
}
! return r;
}
@Benchmark
! public long minAll() {
long[] as = fa.apply(size);
long r = Long.MAX_VALUE;
for (int i = 0; i < as.length; i++) {
r = (long)Math.min(r, as[i]);
}
! return r;
}
@Benchmark
! public long maxAll() {
long[] as = fa.apply(size);
long r = Long.MIN_VALUE;
for (int i = 0; i < as.length; i++) {
r = (long)Math.max(r, as[i]);
}
! return r;
}
@Benchmark
! public boolean anyTrue() {
boolean[] ms = fm.apply(size);
boolean r = false;
for (int i = 0; i < ms.length; i++) {
r |= ms[i];
}
! return r;
}
@Benchmark
! public boolean allTrue() {
boolean[] ms = fm.apply(size);
boolean r = true;
for (int i = 0; i < ms.length; i++) {
r &= ms[i];
}
! return r;
}
@Benchmark
! public boolean lessThan() {
long[] as = fa.apply(size);
long[] bs = fb.apply(size);
boolean r = false;
for (int i = 0; i < as.length; i++) {
boolean m = (as[i] < bs[i]);
r |= m; // accumulate so JIT can't eliminate the computation
}
! return r;
}
@Benchmark
! public boolean greaterThan() {
long[] as = fa.apply(size);
long[] bs = fb.apply(size);
boolean r = false;
for (int i = 0; i < as.length; i++) {
boolean m = (as[i] > bs[i]);
r |= m; // accumulate so JIT can't eliminate the computation
}
! return r;
}
@Benchmark
! public boolean equal() {
long[] as = fa.apply(size);
long[] bs = fb.apply(size);
boolean r = false;
for (int i = 0; i < as.length; i++) {
boolean m = (as[i] == bs[i]);
r |= m; // accumulate so JIT can't eliminate the computation
}
! return r;
}
@Benchmark
! public boolean notEqual() {
long[] as = fa.apply(size);
long[] bs = fb.apply(size);
boolean r = false;
for (int i = 0; i < as.length; i++) {
boolean m = (as[i] != bs[i]);
r |= m; // accumulate so JIT can't eliminate the computation
}
! return r;
}
@Benchmark
! public boolean lessThanEq() {
long[] as = fa.apply(size);
long[] bs = fb.apply(size);
boolean r = false;
for (int i = 0; i < as.length; i++) {
boolean m = (as[i] <= bs[i]);
r |= m; // accumulate so JIT can't eliminate the computation
}
! return r;
}
@Benchmark
! public boolean greaterThanEq() {
long[] as = fa.apply(size);
long[] bs = fb.apply(size);
boolean r = false;
for (int i = 0; i < as.length; i++) {
boolean m = (as[i] >= bs[i]);
r |= m; // accumulate so JIT can't eliminate the computation
}
! return r;
}
@Benchmark
! public Object blend() {
long[] as = fa.apply(size);
long[] bs = fb.apply(size);
long[] rs = fr.apply(size);
boolean[] ms = fm.apply(size);
for (int i = 0; i < as.length; i++) {
long a = as[i];
long b = bs[i];
boolean m = ms[i % ms.length];
rs[i] = (m ? b : a);
}
! return rs;
}
! Object rearrangeShared(int window) {
long[] as = fa.apply(size);
int[] order = fs.apply(size);
long[] rs = fr.apply(size);
for (int i = 0; i < as.length; i += window) {
for (int j = 0; j < window; j++) {
long a = as[i+j];
int pos = order[j];
rs[i + pos] = a;
}
}
! return rs;
}
@Benchmark
! public Object rearrange064() {
int window = 64 / Long.SIZE;
! return rearrangeShared(window);
}
@Benchmark
! public Object rearrange128() {
int window = 128 / Long.SIZE;
! return rearrangeShared(window);
}
@Benchmark
! public Object rearrange256() {
int window = 256 / Long.SIZE;
! return rearrangeShared(window);
}
@Benchmark
! public Object rearrange512() {
int window = 512 / Long.SIZE;
! return rearrangeShared(window);
}
--- 573,902 ----
// Scalar baseline for element-wise maximum: rs[i] = Math.max(as[i], bs[i]).
// The outer loop repeats the whole pass INVOC_COUNT times; rs is then passed to bh.consume.
@Benchmark
! public void max(Blackhole bh) {
long[] as = fa.apply(size);
long[] bs = fb.apply(size);
long[] rs = fr.apply(size);
+ for (int ic = 0; ic < INVOC_COUNT; ic++) {
for (int i = 0; i < as.length; i++) {
long a = as[i];
long b = bs[i];
rs[i] = (long)(Math.max(a, b));
}
+ }
! bh.consume(rs);
}
// Scalar baseline for element-wise minimum: rs[i] = Math.min(as[i], bs[i]).
// The outer loop repeats the whole pass INVOC_COUNT times; rs is then passed to bh.consume.
@Benchmark
! public void min(Blackhole bh) {
long[] as = fa.apply(size);
long[] bs = fb.apply(size);
long[] rs = fr.apply(size);
+ for (int ic = 0; ic < INVOC_COUNT; ic++) {
for (int i = 0; i < as.length; i++) {
long a = as[i];
long b = bs[i];
rs[i] = (long)(Math.min(a, b));
}
+ }
! bh.consume(rs);
}
// AND-reduction of every element of as, starting from -1 (all bits set).
// r is reset at the top of each INVOC_COUNT pass, so the consumed value is the
// reduction of a single pass.
@Benchmark
! public void andAll(Blackhole bh) {
long[] as = fa.apply(size);
long r = -1;
+ for (int ic = 0; ic < INVOC_COUNT; ic++) {
+ r = -1;
for (int i = 0; i < as.length; i++) {
r &= as[i];
}
! }
! bh.consume(r);
}
// OR-reduction of every element of as, starting from 0.
// r is reset at the top of each INVOC_COUNT pass, so the consumed value is the
// reduction of a single pass.
@Benchmark
! public void orAll(Blackhole bh) {
long[] as = fa.apply(size);
long r = 0;
+ for (int ic = 0; ic < INVOC_COUNT; ic++) {
+ r = 0;
for (int i = 0; i < as.length; i++) {
r |= as[i];
}
! }
! bh.consume(r);
}
// XOR-reduction of every element of as, starting from 0.
// r is reset at the top of each INVOC_COUNT pass, so the consumed value is the
// reduction of a single pass.
@Benchmark
! public void xorAll(Blackhole bh) {
long[] as = fa.apply(size);
long r = 0;
+ for (int ic = 0; ic < INVOC_COUNT; ic++) {
+ r = 0;
for (int i = 0; i < as.length; i++) {
r ^= as[i];
}
! }
! bh.consume(r);
}
// Sum-reduction of every element of as, starting from 0 (long arithmetic wraps on overflow).
// r is reset at the top of each INVOC_COUNT pass, so the consumed value is the
// reduction of a single pass.
@Benchmark
! public void addAll(Blackhole bh) {
long[] as = fa.apply(size);
long r = 0;
+ for (int ic = 0; ic < INVOC_COUNT; ic++) {
+ r = 0;
for (int i = 0; i < as.length; i++) {
r += as[i];
}
! }
! bh.consume(r);
}
// Product-reduction of every element of as, starting from 1 (long arithmetic wraps on overflow).
// r is reset at the top of each INVOC_COUNT pass, so the consumed value is the
// reduction of a single pass.
@Benchmark
! public void mulAll(Blackhole bh) {
long[] as = fa.apply(size);
long r = 1;
+ for (int ic = 0; ic < INVOC_COUNT; ic++) {
+ r = 1;
for (int i = 0; i < as.length; i++) {
r *= as[i];
}
! }
! bh.consume(r);
}
// Min-reduction of every element of as, starting from Long.MAX_VALUE.
// r is reset at the top of each INVOC_COUNT pass, so the consumed value is the
// reduction of a single pass.
@Benchmark
! public void minAll(Blackhole bh) {
long[] as = fa.apply(size);
long r = Long.MAX_VALUE;
+ for (int ic = 0; ic < INVOC_COUNT; ic++) {
+ r = Long.MAX_VALUE;
for (int i = 0; i < as.length; i++) {
r = (long)Math.min(r, as[i]);
}
! }
! bh.consume(r);
}
// Max-reduction of every element of as, starting from Long.MIN_VALUE.
// r is reset at the top of each INVOC_COUNT pass, so the consumed value is the
// reduction of a single pass.
@Benchmark
! public void maxAll(Blackhole bh) {
long[] as = fa.apply(size);
long r = Long.MIN_VALUE;
+ for (int ic = 0; ic < INVOC_COUNT; ic++) {
+ r = Long.MIN_VALUE;
for (int i = 0; i < as.length; i++) {
r = (long)Math.max(r, as[i]);
}
! }
! bh.consume(r);
}
// OR-reduction over the boolean mask array: r ends up true if any ms[i] is true.
// Uses the non-short-circuit |=, so every element is visited. r is reset at the top of
// each INVOC_COUNT pass.
@Benchmark
! public void anyTrue(Blackhole bh) {
boolean[] ms = fm.apply(size);
boolean r = false;
+ for (int ic = 0; ic < INVOC_COUNT; ic++) {
+ r = false;
for (int i = 0; i < ms.length; i++) {
r |= ms[i];
}
! }
! bh.consume(r);
}
// AND-reduction over the boolean mask array: r stays true only if every ms[i] is true.
// Uses the non-short-circuit &=, so every element is visited. r is reset at the top of
// each INVOC_COUNT pass.
@Benchmark
! public void allTrue(Blackhole bh) {
boolean[] ms = fm.apply(size);
boolean r = true;
+ for (int ic = 0; ic < INVOC_COUNT; ic++) {
+ r = true;
for (int i = 0; i < ms.length; i++) {
r &= ms[i];
}
! }
! bh.consume(r);
}
// Element-wise comparison as[i] < bs[i]; the per-element results are OR-ed into r, so r is
// true if the comparison holds for any index. r is reset at the top of each INVOC_COUNT pass.
@Benchmark
! public void lessThan(Blackhole bh) {
long[] as = fa.apply(size);
long[] bs = fb.apply(size);
boolean r = false;
+ for (int ic = 0; ic < INVOC_COUNT; ic++) {
+ r = false;
for (int i = 0; i < as.length; i++) {
boolean m = (as[i] < bs[i]);
r |= m; // accumulate so JIT can't eliminate the computation
}
+ }
! bh.consume(r);
}
// Element-wise comparison as[i] > bs[i]; the per-element results are OR-ed into r, so r is
// true if the comparison holds for any index. r is reset at the top of each INVOC_COUNT pass.
@Benchmark
! public void greaterThan(Blackhole bh) {
long[] as = fa.apply(size);
long[] bs = fb.apply(size);
boolean r = false;
+ for (int ic = 0; ic < INVOC_COUNT; ic++) {
+ r = false;
for (int i = 0; i < as.length; i++) {
boolean m = (as[i] > bs[i]);
r |= m; // accumulate so JIT can't eliminate the computation
}
+ }
! bh.consume(r);
}
// Element-wise comparison as[i] == bs[i]; the per-element results are OR-ed into r, so r is
// true if the comparison holds for any index. r is reset at the top of each INVOC_COUNT pass.
@Benchmark
! public void equal(Blackhole bh) {
long[] as = fa.apply(size);
long[] bs = fb.apply(size);
boolean r = false;
+ for (int ic = 0; ic < INVOC_COUNT; ic++) {
+ r = false;
for (int i = 0; i < as.length; i++) {
boolean m = (as[i] == bs[i]);
r |= m; // accumulate so JIT can't eliminate the computation
}
+ }
! bh.consume(r);
}
// Element-wise comparison as[i] != bs[i]; the per-element results are OR-ed into r, so r is
// true if the comparison holds for any index. r is reset at the top of each INVOC_COUNT pass.
@Benchmark
! public void notEqual(Blackhole bh) {
long[] as = fa.apply(size);
long[] bs = fb.apply(size);
boolean r = false;
+ for (int ic = 0; ic < INVOC_COUNT; ic++) {
+ r = false;
for (int i = 0; i < as.length; i++) {
boolean m = (as[i] != bs[i]);
r |= m; // accumulate so JIT can't eliminate the computation
}
+ }
! bh.consume(r);
}
// Element-wise comparison as[i] <= bs[i]; the per-element results are OR-ed into r, so r is
// true if the comparison holds for any index. r is reset at the top of each INVOC_COUNT pass.
@Benchmark
! public void lessThanEq(Blackhole bh) {
long[] as = fa.apply(size);
long[] bs = fb.apply(size);
boolean r = false;
+ for (int ic = 0; ic < INVOC_COUNT; ic++) {
+ r = false;
for (int i = 0; i < as.length; i++) {
boolean m = (as[i] <= bs[i]);
r |= m; // accumulate so JIT can't eliminate the computation
}
+ }
! bh.consume(r);
}
// Element-wise comparison as[i] >= bs[i]; the per-element results are OR-ed into r, so r is
// true if the comparison holds for any index. r is reset at the top of each INVOC_COUNT pass.
@Benchmark
! public void greaterThanEq(Blackhole bh) {
long[] as = fa.apply(size);
long[] bs = fb.apply(size);
boolean r = false;
+ for (int ic = 0; ic < INVOC_COUNT; ic++) {
+ r = false;
for (int i = 0; i < as.length; i++) {
boolean m = (as[i] >= bs[i]);
r |= m; // accumulate so JIT can't eliminate the computation
}
+ }
! bh.consume(r);
}
// Scalar baseline for blend: rs[i] takes bs[i] where the mask is set and as[i] otherwise.
// The mask index wraps modulo ms.length. The pass is repeated INVOC_COUNT times.
@Benchmark
! public void blend(Blackhole bh) {
long[] as = fa.apply(size);
long[] bs = fb.apply(size);
long[] rs = fr.apply(size);
boolean[] ms = fm.apply(size);
+ for (int ic = 0; ic < INVOC_COUNT; ic++) {
for (int i = 0; i < as.length; i++) {
long a = as[i];
long b = bs[i];
boolean m = ms[i % ms.length];
rs[i] = (m ? b : a);
}
+ }
! bh.consume(rs);
}
// Shared helper for the rearrangeNNN benchmarks. Walks as in chunks of `window` elements and,
// inside each chunk, stores element j at offset order[j] from the chunk start:
// rs[i + order[j]] = as[i + j]. Only the first `window` entries of order are read.
// NOTE(review): assumes as.length is a multiple of window and that order[0..window) holds
// offsets valid within a chunk; otherwise the array accesses can go out of bounds - confirm
// against how ss is populated.
! void rearrangeShared(int window, Blackhole bh) {
long[] as = fa.apply(size);
int[] order = fs.apply(size);
long[] rs = fr.apply(size);
+ for (int ic = 0; ic < INVOC_COUNT; ic++) {
for (int i = 0; i < as.length; i += window) {
for (int j = 0; j < window; j++) {
long a = as[i+j];
int pos = order[j];
rs[i + pos] = a;
}
}
+ }
! bh.consume(rs);
}
// Rearrange with a 64-bit window: 64 / Long.SIZE = 1 long per chunk. Delegates to rearrangeShared.
@Benchmark
! public void rearrange064(Blackhole bh) {
int window = 64 / Long.SIZE;
! rearrangeShared(window, bh);
}
// Rearrange with a 128-bit window: 128 / Long.SIZE = 2 longs per chunk. Delegates to rearrangeShared.
@Benchmark
! public void rearrange128(Blackhole bh) {
int window = 128 / Long.SIZE;
! rearrangeShared(window, bh);
}
// Rearrange with a 256-bit window: 256 / Long.SIZE = 4 longs per chunk. Delegates to rearrangeShared.
@Benchmark
! public void rearrange256(Blackhole bh) {
int window = 256 / Long.SIZE;
! rearrangeShared(window, bh);
}
// Rearrange with a 512-bit window: 512 / Long.SIZE = 8 longs per chunk. Delegates to rearrangeShared.
@Benchmark
! public void rearrange512(Blackhole bh) {
int window = 512 / Long.SIZE;
! rearrangeShared(window, bh);
}
*** 812,1016 ****
@Benchmark
! public Object neg() {
long[] as = fa.apply(size);
long[] rs = fr.apply(size);
for (int i = 0; i < as.length; i++) {
long a = as[i];
rs[i] = (long)(-((long)a));
}
! return rs;
}
@Benchmark
! public Object negMasked() {
long[] as = fa.apply(size);
long[] rs = fr.apply(size);
boolean[] ms = fm.apply(size);
for (int i = 0; i < as.length; i++) {
long a = as[i];
boolean m = ms[i % ms.length];
rs[i] = (m ? (long)(-((long)a)) : a);
}
! return rs;
}
@Benchmark
! public Object abs() {
long[] as = fa.apply(size);
long[] rs = fr.apply(size);
for (int i = 0; i < as.length; i++) {
long a = as[i];
rs[i] = (long)(Math.abs((long)a));
}
! return rs;
}
@Benchmark
! public Object absMasked() {
long[] as = fa.apply(size);
long[] rs = fr.apply(size);
boolean[] ms = fm.apply(size);
for (int i = 0; i < as.length; i++) {
long a = as[i];
boolean m = ms[i % ms.length];
rs[i] = (m ? (long)(Math.abs((long)a)) : a);
}
! return rs;
}
@Benchmark
! public Object not() {
long[] as = fa.apply(size);
long[] rs = fr.apply(size);
for (int i = 0; i < as.length; i++) {
long a = as[i];
rs[i] = (long)(~((long)a));
}
! return rs;
}
@Benchmark
! public Object notMasked() {
long[] as = fa.apply(size);
long[] rs = fr.apply(size);
boolean[] ms = fm.apply(size);
for (int i = 0; i < as.length; i++) {
long a = as[i];
boolean m = ms[i % ms.length];
rs[i] = (m ? (long)(~((long)a)) : a);
}
! return rs;
}
@Benchmark
! public Object gatherBase0() {
long[] as = fa.apply(size);
int[] is = fs.apply(size);
long[] rs = fr.apply(size);
for (int i = 0; i < as.length; i++) {
int ix = 0 + is[i];
rs[i] = as[ix];
}
! return rs;
}
! Object gather(int window) {
long[] as = fa.apply(size);
int[] is = fs.apply(size);
long[] rs = fr.apply(size);
for (int i = 0; i < as.length; i += window) {
for (int j = 0; j < window; j++) {
int ix = i + is[i + j];
rs[i + j] = as[ix];
}
}
! return rs;
}
@Benchmark
! public Object gather064() {
int window = 64 / Long.SIZE;
! return gather(window);
}
@Benchmark
! public Object gather128() {
int window = 128 / Long.SIZE;
! return gather(window);
}
@Benchmark
! public Object gather256() {
int window = 256 / Long.SIZE;
! return gather(window);
}
@Benchmark
! public Object gather512() {
int window = 512 / Long.SIZE;
! return gather(window);
}
@Benchmark
! public Object scatterBase0() {
long[] as = fa.apply(size);
int[] is = fs.apply(size);
long[] rs = fr.apply(size);
for (int i = 0; i < as.length; i++) {
int ix = 0 + is[i];
rs[ix] = as[i];
}
! return rs;
}
! Object scatter(int window) {
long[] as = fa.apply(size);
int[] is = fs.apply(size);
long[] rs = fr.apply(size);
for (int i = 0; i < as.length; i += window) {
for (int j = 0; j < window; j++) {
int ix = i + is[i + j];
rs[ix] = as[i + j];
}
}
! return rs;
}
@Benchmark
! public Object scatter064() {
int window = 64 / Long.SIZE;
! return scatter(window);
}
@Benchmark
! public Object scatter128() {
int window = 128 / Long.SIZE;
! return scatter(window);
}
@Benchmark
! public Object scatter256() {
int window = 256 / Long.SIZE;
! return scatter(window);
}
@Benchmark
! public Object scatter512() {
int window = 512 / Long.SIZE;
! return scatter(window);
}
}
--- 916,1140 ----
// Scalar baseline for element-wise negation: rs[i] = -as[i].
// The outer loop repeats the whole pass INVOC_COUNT times; rs is then passed to bh.consume.
@Benchmark
! public void neg(Blackhole bh) {
long[] as = fa.apply(size);
long[] rs = fr.apply(size);
+ for (int ic = 0; ic < INVOC_COUNT; ic++) {
for (int i = 0; i < as.length; i++) {
long a = as[i];
rs[i] = (long)(-((long)a));
}
+ }
! bh.consume(rs);
}
// Masked negation: rs[i] = -as[i] where the mask is set, otherwise rs[i] = as[i].
// The mask index wraps modulo ms.length. The pass is repeated INVOC_COUNT times.
@Benchmark
! public void negMasked(Blackhole bh) {
long[] as = fa.apply(size);
long[] rs = fr.apply(size);
boolean[] ms = fm.apply(size);
+ for (int ic = 0; ic < INVOC_COUNT; ic++) {
for (int i = 0; i < as.length; i++) {
long a = as[i];
boolean m = ms[i % ms.length];
rs[i] = (m ? (long)(-((long)a)) : a);
}
+ }
! bh.consume(rs);
}
// Scalar baseline for element-wise absolute value: rs[i] = Math.abs(as[i]).
// Math.abs(Long.MIN_VALUE) returns Long.MIN_VALUE, so that one input stays negative.
// The outer loop repeats the whole pass INVOC_COUNT times; rs is then passed to bh.consume.
@Benchmark
! public void abs(Blackhole bh) {
long[] as = fa.apply(size);
long[] rs = fr.apply(size);
+ for (int ic = 0; ic < INVOC_COUNT; ic++) {
for (int i = 0; i < as.length; i++) {
long a = as[i];
rs[i] = (long)(Math.abs((long)a));
}
+ }
! bh.consume(rs);
}
// Masked absolute value: rs[i] = Math.abs(as[i]) where the mask is set, otherwise rs[i] = as[i].
// The mask index wraps modulo ms.length. The pass is repeated INVOC_COUNT times.
@Benchmark
! public void absMasked(Blackhole bh) {
long[] as = fa.apply(size);
long[] rs = fr.apply(size);
boolean[] ms = fm.apply(size);
+ for (int ic = 0; ic < INVOC_COUNT; ic++) {
for (int i = 0; i < as.length; i++) {
long a = as[i];
boolean m = ms[i % ms.length];
rs[i] = (m ? (long)(Math.abs((long)a)) : a);
}
+ }
! bh.consume(rs);
}
// Scalar baseline for element-wise bitwise complement: rs[i] = ~as[i].
// The outer loop repeats the whole pass INVOC_COUNT times; rs is then passed to bh.consume.
@Benchmark
! public void not(Blackhole bh) {
long[] as = fa.apply(size);
long[] rs = fr.apply(size);
+ for (int ic = 0; ic < INVOC_COUNT; ic++) {
for (int i = 0; i < as.length; i++) {
long a = as[i];
rs[i] = (long)(~((long)a));
}
+ }
! bh.consume(rs);
}
// Masked bitwise complement: rs[i] = ~as[i] where the mask is set, otherwise rs[i] = as[i].
// The mask index wraps modulo ms.length. The pass is repeated INVOC_COUNT times.
@Benchmark
! public void notMasked(Blackhole bh) {
long[] as = fa.apply(size);
long[] rs = fr.apply(size);
boolean[] ms = fm.apply(size);
+ for (int ic = 0; ic < INVOC_COUNT; ic++) {
for (int i = 0; i < as.length; i++) {
long a = as[i];
boolean m = ms[i % ms.length];
rs[i] = (m ? (long)(~((long)a)) : a);
}
+ }
! bh.consume(rs);
}
// Gather with base offset 0: rs[i] = as[is[i]], with the index array taken from fs.
// NOTE(review): assumes every is[i] is a valid index into as - confirm against how ss is populated.
// The outer loop repeats the whole pass INVOC_COUNT times; rs is then passed to bh.consume.
@Benchmark
! public void gatherBase0(Blackhole bh) {
long[] as = fa.apply(size);
int[] is = fs.apply(size);
long[] rs = fr.apply(size);
+ for (int ic = 0; ic < INVOC_COUNT; ic++) {
for (int i = 0; i < as.length; i++) {
int ix = 0 + is[i];
rs[i] = as[ix];
}
+ }
! bh.consume(rs);
}
// Shared helper for the gatherNNN benchmarks. Walks as in chunks of `window` elements; for
// slot j of the chunk starting at i it loads from index i + is[i + j], i.e. the index array
// holds offsets relative to the chunk start: rs[i + j] = as[i + is[i + j]].
// NOTE(review): assumes as.length is a multiple of window and that i + is[i + j] stays within
// as - confirm against how ss is populated.
! void gather(int window, Blackhole bh) {
long[] as = fa.apply(size);
int[] is = fs.apply(size);
long[] rs = fr.apply(size);
+ for (int ic = 0; ic < INVOC_COUNT; ic++) {
for (int i = 0; i < as.length; i += window) {
for (int j = 0; j < window; j++) {
int ix = i + is[i + j];
rs[i + j] = as[ix];
}
}
+ }
! bh.consume(rs);
}
// Gather with a 64-bit window: 64 / Long.SIZE = 1 long per chunk. Delegates to gather.
@Benchmark
! public void gather064(Blackhole bh) {
int window = 64 / Long.SIZE;
! gather(window, bh);
}
// Gather with a 128-bit window: 128 / Long.SIZE = 2 longs per chunk. Delegates to gather.
@Benchmark
! public void gather128(Blackhole bh) {
int window = 128 / Long.SIZE;
! gather(window, bh);
}
// Gather with a 256-bit window: 256 / Long.SIZE = 4 longs per chunk. Delegates to gather.
@Benchmark
! public void gather256(Blackhole bh) {
int window = 256 / Long.SIZE;
! gather(window, bh);
}
// Gather with a 512-bit window: 512 / Long.SIZE = 8 longs per chunk. Delegates to gather.
@Benchmark
! public void gather512(Blackhole bh) {
int window = 512 / Long.SIZE;
! gather(window, bh);
}
// Scatter with base offset 0: rs[is[i]] = as[i], with the index array taken from fs.
// If is contains duplicate indices, the later write wins.
// NOTE(review): assumes every is[i] is a valid index into rs - confirm against how ss is populated.
// The outer loop repeats the whole pass INVOC_COUNT times; rs is then passed to bh.consume.
@Benchmark
! public void scatterBase0(Blackhole bh) {
long[] as = fa.apply(size);
int[] is = fs.apply(size);
long[] rs = fr.apply(size);
+ for (int ic = 0; ic < INVOC_COUNT; ic++) {
for (int i = 0; i < as.length; i++) {
int ix = 0 + is[i];
rs[ix] = as[i];
}
+ }
! bh.consume(rs);
}
// Shared helper for the scatterNNN benchmarks. Walks as in chunks of `window` elements; slot j
// of the chunk starting at i is stored to index i + is[i + j], i.e. the index array holds
// offsets relative to the chunk start: rs[i + is[i + j]] = as[i + j].
// NOTE(review): assumes as.length is a multiple of window and that i + is[i + j] stays within
// rs - confirm against how ss is populated.
! void scatter(int window, Blackhole bh) {
long[] as = fa.apply(size);
int[] is = fs.apply(size);
long[] rs = fr.apply(size);
+ for (int ic = 0; ic < INVOC_COUNT; ic++) {
for (int i = 0; i < as.length; i += window) {
for (int j = 0; j < window; j++) {
int ix = i + is[i + j];
rs[ix] = as[i + j];
}
}
+ }
! bh.consume(rs);
}
// Scatter with a 64-bit window: 64 / Long.SIZE = 1 long per chunk. Delegates to scatter.
@Benchmark
! public void scatter064(Blackhole bh) {
int window = 64 / Long.SIZE;
! scatter(window, bh);
}
// Scatter with a 128-bit window: 128 / Long.SIZE = 2 longs per chunk. Delegates to scatter.
@Benchmark
! public void scatter128(Blackhole bh) {
int window = 128 / Long.SIZE;
! scatter(window, bh);
}
// Scatter with a 256-bit window: 256 / Long.SIZE = 4 longs per chunk. Delegates to scatter.
@Benchmark
! public void scatter256(Blackhole bh) {
int window = 256 / Long.SIZE;
! scatter(window, bh);
}
// Scatter with a 512-bit window: 512 / Long.SIZE = 8 longs per chunk. Delegates to scatter.
@Benchmark
! public void scatter512(Blackhole bh) {
int window = 512 / Long.SIZE;
! scatter(window, bh);
}
}
< prev index next >