/* * Copyright (c) 2017, Oracle and/or its affiliates. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it * under the terms of the GNU General Public License version 2 only, as * published by the Free Software Foundation. Oracle designates this * particular file as subject to the "Classpath" exception as provided * by Oracle in the LICENSE file that accompanied this code. * * This code is distributed in the hope that it will be useful, but WITHOUT * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License * version 2 for more details (a copy is included in the LICENSE file that * accompanied this code). * * You should have received a copy of the GNU General Public License version * 2 along with this work; if not, write to the Free Software Foundation, * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA. * * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA * or visit www.oracle.com if you need additional information or have * questions. 
*/ package jdk.incubator.vector; import java.nio.ByteBuffer; import java.nio.ByteOrder; import java.nio.FloatBuffer; import java.nio.ReadOnlyBufferException; import java.util.Arrays; import java.util.Objects; import java.util.function.IntUnaryOperator; import jdk.internal.misc.Unsafe; import jdk.internal.vm.annotation.ForceInline; import static jdk.incubator.vector.VectorIntrinsics.*; @SuppressWarnings("cast") final class Float64Vector extends FloatVector { static final Float64Species SPECIES = new Float64Species(); static final Float64Vector ZERO = new Float64Vector(); static final int LENGTH = SPECIES.length(); // Index vector species private static final IntVector.IntSpecies INDEX_SPEC; static { int bitSize = Vector.bitSizeForVectorLength(int.class, LENGTH); Vector.Shape shape = Shape.forBitSize(bitSize); INDEX_SPEC = (IntVector.IntSpecies) Species.of(int.class, shape); } private final float[] vec; // Don't access directly, use getElements() instead. private float[] getElements() { return VectorIntrinsics.maybeRebox(this).vec; } Float64Vector() { vec = new float[SPECIES.length()]; } Float64Vector(float[] v) { vec = v; } @Override public int length() { return LENGTH; } // Unary operator @Override Float64Vector uOp(FUnOp f) { float[] vec = getElements(); float[] res = new float[length()]; for (int i = 0; i < length(); i++) { res[i] = f.apply(i, vec[i]); } return new Float64Vector(res); } @Override Float64Vector uOp(Mask o, FUnOp f) { float[] vec = getElements(); float[] res = new float[length()]; boolean[] mbits = ((Float64Mask)o).getBits(); for (int i = 0; i < length(); i++) { res[i] = mbits[i] ? 
f.apply(i, vec[i]) : vec[i]; } return new Float64Vector(res); } // Binary operator @Override Float64Vector bOp(Vector o, FBinOp f) { float[] res = new float[length()]; float[] vec1 = this.getElements(); float[] vec2 = ((Float64Vector)o).getElements(); for (int i = 0; i < length(); i++) { res[i] = f.apply(i, vec1[i], vec2[i]); } return new Float64Vector(res); } @Override Float64Vector bOp(Vector o1, Mask o2, FBinOp f) { float[] res = new float[length()]; float[] vec1 = this.getElements(); float[] vec2 = ((Float64Vector)o1).getElements(); boolean[] mbits = ((Float64Mask)o2).getBits(); for (int i = 0; i < length(); i++) { res[i] = mbits[i] ? f.apply(i, vec1[i], vec2[i]) : vec1[i]; } return new Float64Vector(res); } // Trinary operator @Override Float64Vector tOp(Vector o1, Vector o2, FTriOp f) { float[] res = new float[length()]; float[] vec1 = this.getElements(); float[] vec2 = ((Float64Vector)o1).getElements(); float[] vec3 = ((Float64Vector)o2).getElements(); for (int i = 0; i < length(); i++) { res[i] = f.apply(i, vec1[i], vec2[i], vec3[i]); } return new Float64Vector(res); } @Override Float64Vector tOp(Vector o1, Vector o2, Mask o3, FTriOp f) { float[] res = new float[length()]; float[] vec1 = getElements(); float[] vec2 = ((Float64Vector)o1).getElements(); float[] vec3 = ((Float64Vector)o2).getElements(); boolean[] mbits = ((Float64Mask)o3).getBits(); for (int i = 0; i < length(); i++) { res[i] = mbits[i] ? 
f.apply(i, vec1[i], vec2[i], vec3[i]) : vec1[i]; } return new Float64Vector(res); } @Override float rOp(float v, FBinOp f) { float[] vec = getElements(); for (int i = 0; i < length(); i++) { v = f.apply(i, v, vec[i]); } return v; } @Override @ForceInline public Vector cast(Species s) { Objects.requireNonNull(s); if (s.length() != LENGTH) throw new IllegalArgumentException("Vector length this species length differ"); return VectorIntrinsics.cast( Float64Vector.class, float.class, LENGTH, s.vectorType(), s.elementType(), LENGTH, this, s, (species, vector) -> vector.castDefault(species) ); } @SuppressWarnings("unchecked") @ForceInline private Vector castDefault(Species s) { int limit = s.length(); Class stype = s.elementType(); if (stype == byte.class) { byte[] a = new byte[limit]; for (int i = 0; i < limit; i++) { a[i] = (byte) this.get(i); } return (Vector) ByteVector.fromArray((ByteVector.ByteSpecies) s, a, 0); } else if (stype == short.class) { short[] a = new short[limit]; for (int i = 0; i < limit; i++) { a[i] = (short) this.get(i); } return (Vector) ShortVector.fromArray((ShortVector.ShortSpecies) s, a, 0); } else if (stype == int.class) { int[] a = new int[limit]; for (int i = 0; i < limit; i++) { a[i] = (int) this.get(i); } return (Vector) IntVector.fromArray((IntVector.IntSpecies) s, a, 0); } else if (stype == long.class) { long[] a = new long[limit]; for (int i = 0; i < limit; i++) { a[i] = (long) this.get(i); } return (Vector) LongVector.fromArray((LongVector.LongSpecies) s, a, 0); } else if (stype == float.class) { float[] a = new float[limit]; for (int i = 0; i < limit; i++) { a[i] = (float) this.get(i); } return (Vector) FloatVector.fromArray((FloatVector.FloatSpecies) s, a, 0); } else if (stype == double.class) { double[] a = new double[limit]; for (int i = 0; i < limit; i++) { a[i] = (double) this.get(i); } return (Vector) DoubleVector.fromArray((DoubleVector.DoubleSpecies) s, a, 0); } else { throw new UnsupportedOperationException("Bad lane type for 
casting."); } } @Override @ForceInline @SuppressWarnings("unchecked") public Vector reinterpret(Species s) { Objects.requireNonNull(s); if(s.elementType().equals(float.class)) { return (Vector) reshape((Species)s); } if(s.bitSize() == bitSize()) { return reinterpretType(s); } return defaultReinterpret(s); } @ForceInline private Vector reinterpretType(Species s) { Objects.requireNonNull(s); Class stype = s.elementType(); if (stype == byte.class) { return VectorIntrinsics.reinterpret( Float64Vector.class, float.class, LENGTH, Byte64Vector.class, byte.class, Byte64Vector.LENGTH, this, s, (species, vector) -> vector.defaultReinterpret(species) ); } else if (stype == short.class) { return VectorIntrinsics.reinterpret( Float64Vector.class, float.class, LENGTH, Short64Vector.class, short.class, Short64Vector.LENGTH, this, s, (species, vector) -> vector.defaultReinterpret(species) ); } else if (stype == int.class) { return VectorIntrinsics.reinterpret( Float64Vector.class, float.class, LENGTH, Int64Vector.class, int.class, Int64Vector.LENGTH, this, s, (species, vector) -> vector.defaultReinterpret(species) ); } else if (stype == long.class) { return VectorIntrinsics.reinterpret( Float64Vector.class, float.class, LENGTH, Long64Vector.class, long.class, Long64Vector.LENGTH, this, s, (species, vector) -> vector.defaultReinterpret(species) ); } else if (stype == float.class) { return VectorIntrinsics.reinterpret( Float64Vector.class, float.class, LENGTH, Float64Vector.class, float.class, Float64Vector.LENGTH, this, s, (species, vector) -> vector.defaultReinterpret(species) ); } else if (stype == double.class) { return VectorIntrinsics.reinterpret( Float64Vector.class, float.class, LENGTH, Double64Vector.class, double.class, Double64Vector.LENGTH, this, s, (species, vector) -> vector.defaultReinterpret(species) ); } else { throw new UnsupportedOperationException("Bad lane type for casting."); } } @Override @ForceInline public FloatVector reshape(Species s) { 
Objects.requireNonNull(s); if (s.bitSize() == 64 && (s instanceof Float64Vector.Float64Species)) { Float64Vector.Float64Species ts = (Float64Vector.Float64Species)s; return VectorIntrinsics.reinterpret( Float64Vector.class, float.class, LENGTH, Float64Vector.class, float.class, Float64Vector.LENGTH, this, ts, (species, vector) -> (FloatVector) vector.defaultReinterpret(species) ); } else if (s.bitSize() == 128 && (s instanceof Float128Vector.Float128Species)) { Float128Vector.Float128Species ts = (Float128Vector.Float128Species)s; return VectorIntrinsics.reinterpret( Float64Vector.class, float.class, LENGTH, Float128Vector.class, float.class, Float128Vector.LENGTH, this, ts, (species, vector) -> (FloatVector) vector.defaultReinterpret(species) ); } else if (s.bitSize() == 256 && (s instanceof Float256Vector.Float256Species)) { Float256Vector.Float256Species ts = (Float256Vector.Float256Species)s; return VectorIntrinsics.reinterpret( Float64Vector.class, float.class, LENGTH, Float256Vector.class, float.class, Float256Vector.LENGTH, this, ts, (species, vector) -> (FloatVector) vector.defaultReinterpret(species) ); } else if (s.bitSize() == 512 && (s instanceof Float512Vector.Float512Species)) { Float512Vector.Float512Species ts = (Float512Vector.Float512Species)s; return VectorIntrinsics.reinterpret( Float64Vector.class, float.class, LENGTH, Float512Vector.class, float.class, Float512Vector.LENGTH, this, ts, (species, vector) -> (FloatVector) vector.defaultReinterpret(species) ); } else if ((s.bitSize() > 0) && (s.bitSize() <= 2048) && (s.bitSize() % 128 == 0) && (s instanceof FloatMaxVector.FloatMaxSpecies)) { FloatMaxVector.FloatMaxSpecies ts = (FloatMaxVector.FloatMaxSpecies)s; return VectorIntrinsics.reinterpret( Float64Vector.class, float.class, LENGTH, FloatMaxVector.class, float.class, FloatMaxVector.LENGTH, this, ts, (species, vector) -> (FloatVector) vector.defaultReinterpret(species) ); } else { throw new InternalError("Unimplemented size"); } } // Binary 
operations with scalars @Override @ForceInline public FloatVector add(float o) { return add(SPECIES.broadcast(o)); } @Override @ForceInline public FloatVector add(float o, Mask m) { return add(SPECIES.broadcast(o), m); } @Override @ForceInline public FloatVector sub(float o) { return sub(SPECIES.broadcast(o)); } @Override @ForceInline public FloatVector sub(float o, Mask m) { return sub(SPECIES.broadcast(o), m); } @Override @ForceInline public FloatVector mul(float o) { return mul(SPECIES.broadcast(o)); } @Override @ForceInline public FloatVector mul(float o, Mask m) { return mul(SPECIES.broadcast(o), m); } @Override @ForceInline public FloatVector min(float o) { return min(SPECIES.broadcast(o)); } @Override @ForceInline public FloatVector max(float o) { return max(SPECIES.broadcast(o)); } @Override @ForceInline public Mask equal(float o) { return equal(SPECIES.broadcast(o)); } @Override @ForceInline public Mask notEqual(float o) { return notEqual(SPECIES.broadcast(o)); } @Override @ForceInline public Mask lessThan(float o) { return lessThan(SPECIES.broadcast(o)); } @Override @ForceInline public Mask lessThanEq(float o) { return lessThanEq(SPECIES.broadcast(o)); } @Override @ForceInline public Mask greaterThan(float o) { return greaterThan(SPECIES.broadcast(o)); } @Override @ForceInline public Mask greaterThanEq(float o) { return greaterThanEq(SPECIES.broadcast(o)); } @Override @ForceInline public FloatVector blend(float o, Mask m) { return blend(SPECIES.broadcast(o), m); } @Override @ForceInline public FloatVector div(float o) { return div(SPECIES.broadcast(o)); } @Override @ForceInline public FloatVector div(float o, Mask m) { return div(SPECIES.broadcast(o), m); } @Override @ForceInline public Float64Vector div(Vector v, Mask m) { return blend(div(v), m); } @Override @ForceInline public FloatVector atan2(float o) { return atan2(SPECIES.broadcast(o)); } @Override @ForceInline public FloatVector atan2(float o, Mask m) { return atan2(SPECIES.broadcast(o), m); } 
@Override @ForceInline public FloatVector pow(float o) { return pow(SPECIES.broadcast(o)); } @Override @ForceInline public FloatVector pow(float o, Mask m) { return pow(SPECIES.broadcast(o), m); } @Override @ForceInline public FloatVector fma(float o1, float o2) { return fma(SPECIES.broadcast(o1), SPECIES.broadcast(o2)); } @Override @ForceInline public FloatVector fma(float o1, float o2, Mask m) { return fma(SPECIES.broadcast(o1), SPECIES.broadcast(o2), m); } @Override @ForceInline public FloatVector hypot(float o) { return hypot(SPECIES.broadcast(o)); } @Override @ForceInline public FloatVector hypot(float o, Mask m) { return hypot(SPECIES.broadcast(o), m); } // Unary operations @ForceInline @Override public Float64Vector neg(Mask m) { return blend(neg(), m); } @Override @ForceInline public Float64Vector abs() { return VectorIntrinsics.unaryOp( VECTOR_OP_ABS, Float64Vector.class, float.class, LENGTH, this, v1 -> v1.uOp((i, a) -> (float) Math.abs(a))); } @ForceInline @Override public Float64Vector abs(Mask m) { return blend(abs(), m); } @Override @ForceInline public Float64Vector neg() { return VectorIntrinsics.unaryOp( VECTOR_OP_NEG, Float64Vector.class, float.class, LENGTH, this, v1 -> v1.uOp((i, a) -> (float) -a)); } @Override @ForceInline public Float64Vector div(Vector o) { Objects.requireNonNull(o); Float64Vector v = (Float64Vector)o; return VectorIntrinsics.binaryOp( VECTOR_OP_DIV, Float64Vector.class, float.class, LENGTH, this, v, (v1, v2) -> v1.bOp(v2, (i, a, b) -> (float)(a / b))); } @Override @ForceInline public Float64Vector sqrt() { return VectorIntrinsics.unaryOp( VECTOR_OP_SQRT, Float64Vector.class, float.class, LENGTH, this, v1 -> v1.uOp((i, a) -> (float) Math.sqrt((double) a))); } @Override @ForceInline public Float64Vector exp() { return (Float64Vector) VectorIntrinsics.unaryOp( VECTOR_OP_EXP, Float64Vector.class, float.class, LENGTH, this, v1 -> ((Float64Vector)v1).uOp((i, a) -> (float) Math.exp((double) a))); } @Override @ForceInline public 
Float64Vector log1p() {
        // Lane-wise Math.log1p, narrowed to float.
        return (Float64Vector) VectorIntrinsics.unaryOp(
            VECTOR_OP_LOG1P, Float64Vector.class, float.class, LENGTH,
            this,
            self -> ((Float64Vector)self).uOp((lane, x) -> (float) Math.log1p((double) x)));
    }

    /** Lane-wise {@code Math.log}, narrowed to float. */
    @Override
    @ForceInline
    public Float64Vector log() {
        return (Float64Vector) VectorIntrinsics.unaryOp(
            VECTOR_OP_LOG, Float64Vector.class, float.class, LENGTH,
            this,
            self -> ((Float64Vector)self).uOp((lane, x) -> (float) Math.log((double) x)));
    }

    /** Lane-wise {@code Math.log10}, narrowed to float. */
    @Override
    @ForceInline
    public Float64Vector log10() {
        return (Float64Vector) VectorIntrinsics.unaryOp(
            VECTOR_OP_LOG10, Float64Vector.class, float.class, LENGTH,
            this,
            self -> ((Float64Vector)self).uOp((lane, x) -> (float) Math.log10((double) x)));
    }

    /** Lane-wise {@code Math.expm1}, narrowed to float. */
    @Override
    @ForceInline
    public Float64Vector expm1() {
        return (Float64Vector) VectorIntrinsics.unaryOp(
            VECTOR_OP_EXPM1, Float64Vector.class, float.class, LENGTH,
            this,
            self -> ((Float64Vector)self).uOp((lane, x) -> (float) Math.expm1((double) x)));
    }

    /** Lane-wise {@code Math.cbrt}, narrowed to float. */
    @Override
    @ForceInline
    public Float64Vector cbrt() {
        return (Float64Vector) VectorIntrinsics.unaryOp(
            VECTOR_OP_CBRT, Float64Vector.class, float.class, LENGTH,
            this,
            self -> ((Float64Vector)self).uOp((lane, x) -> (float) Math.cbrt((double) x)));
    }

    /** Lane-wise {@code Math.sin}, narrowed to float. */
    @Override
    @ForceInline
    public Float64Vector sin() {
        return (Float64Vector) VectorIntrinsics.unaryOp(
            VECTOR_OP_SIN, Float64Vector.class, float.class, LENGTH,
            this,
            self -> ((Float64Vector)self).uOp((lane, x) -> (float) Math.sin((double) x)));
    }

    /** Lane-wise {@code Math.cos}, narrowed to float. */
    @Override
    @ForceInline
    public Float64Vector cos() {
        return (Float64Vector) VectorIntrinsics.unaryOp(
            VECTOR_OP_COS, Float64Vector.class, float.class, LENGTH,
            this,
            self -> ((Float64Vector)self).uOp((lane, x) -> (float) Math.cos((double) x)));
    }

    /** Lane-wise {@code Math.tan}, narrowed to float. */
    @Override
    @ForceInline
    public Float64Vector tan() {
        return (Float64Vector) VectorIntrinsics.unaryOp(
            VECTOR_OP_TAN, Float64Vector.class, float.class, LENGTH,
            this,
            self -> ((Float64Vector)self).uOp((lane, x) -> (float) Math.tan((double) x)));
    }

    @Override
    @ForceInline
    public Float64Vector asin() {
        return (Float64Vector) VectorIntrinsics.unaryOp(
VECTOR_OP_ASIN, Float64Vector.class, float.class, LENGTH, this, v1 -> ((Float64Vector)v1).uOp((i, a) -> (float) Math.asin((double) a))); } @Override @ForceInline public Float64Vector acos() { return (Float64Vector) VectorIntrinsics.unaryOp( VECTOR_OP_ACOS, Float64Vector.class, float.class, LENGTH, this, v1 -> ((Float64Vector)v1).uOp((i, a) -> (float) Math.acos((double) a))); } @Override @ForceInline public Float64Vector atan() { return (Float64Vector) VectorIntrinsics.unaryOp( VECTOR_OP_ATAN, Float64Vector.class, float.class, LENGTH, this, v1 -> ((Float64Vector)v1).uOp((i, a) -> (float) Math.atan((double) a))); } @Override @ForceInline public Float64Vector sinh() { return (Float64Vector) VectorIntrinsics.unaryOp( VECTOR_OP_SINH, Float64Vector.class, float.class, LENGTH, this, v1 -> ((Float64Vector)v1).uOp((i, a) -> (float) Math.sinh((double) a))); } @Override @ForceInline public Float64Vector cosh() { return (Float64Vector) VectorIntrinsics.unaryOp( VECTOR_OP_COSH, Float64Vector.class, float.class, LENGTH, this, v1 -> ((Float64Vector)v1).uOp((i, a) -> (float) Math.cosh((double) a))); } @Override @ForceInline public Float64Vector tanh() { return (Float64Vector) VectorIntrinsics.unaryOp( VECTOR_OP_TANH, Float64Vector.class, float.class, LENGTH, this, v1 -> ((Float64Vector)v1).uOp((i, a) -> (float) Math.tanh((double) a))); } @Override @ForceInline public Float64Vector pow(Vector o) { Objects.requireNonNull(o); Float64Vector v = (Float64Vector)o; return (Float64Vector) VectorIntrinsics.binaryOp( VECTOR_OP_POW, Float64Vector.class, float.class, LENGTH, this, v, (v1, v2) -> ((Float64Vector)v1).bOp(v2, (i, a, b) -> (float)(Math.pow(a,b)))); } @Override @ForceInline public Float64Vector hypot(Vector o) { Objects.requireNonNull(o); Float64Vector v = (Float64Vector)o; return (Float64Vector) VectorIntrinsics.binaryOp( VECTOR_OP_HYPOT, Float64Vector.class, float.class, LENGTH, this, v, (v1, v2) -> ((Float64Vector)v1).bOp(v2, (i, a, b) -> (float)(Math.hypot(a,b)))); } @Override 
@ForceInline public Float64Vector atan2(Vector o) { Objects.requireNonNull(o); Float64Vector v = (Float64Vector)o; return (Float64Vector) VectorIntrinsics.binaryOp( VECTOR_OP_ATAN2, Float64Vector.class, float.class, LENGTH, this, v, (v1, v2) -> ((Float64Vector)v1).bOp(v2, (i, a, b) -> (float)(Math.atan2(a,b)))); } // Binary operations @Override @ForceInline public Float64Vector add(Vector o) { Objects.requireNonNull(o); Float64Vector v = (Float64Vector)o; return VectorIntrinsics.binaryOp( VECTOR_OP_ADD, Float64Vector.class, float.class, LENGTH, this, v, (v1, v2) -> v1.bOp(v2, (i, a, b) -> (float)(a + b))); } @Override @ForceInline public Float64Vector add(Vector v, Mask m) { return blend(add(v), m); } @Override @ForceInline public Float64Vector sub(Vector o) { Objects.requireNonNull(o); Float64Vector v = (Float64Vector)o; return VectorIntrinsics.binaryOp( VECTOR_OP_SUB, Float64Vector.class, float.class, LENGTH, this, v, (v1, v2) -> v1.bOp(v2, (i, a, b) -> (float)(a - b))); } @Override @ForceInline public Float64Vector sub(Vector v, Mask m) { return blend(sub(v), m); } @Override @ForceInline public Float64Vector mul(Vector o) { Objects.requireNonNull(o); Float64Vector v = (Float64Vector)o; return VectorIntrinsics.binaryOp( VECTOR_OP_MUL, Float64Vector.class, float.class, LENGTH, this, v, (v1, v2) -> v1.bOp(v2, (i, a, b) -> (float)(a * b))); } @Override @ForceInline public Float64Vector mul(Vector v, Mask m) { return blend(mul(v), m); } @Override @ForceInline public Float64Vector min(Vector o) { Objects.requireNonNull(o); Float64Vector v = (Float64Vector)o; return (Float64Vector) VectorIntrinsics.binaryOp( VECTOR_OP_MIN, Float64Vector.class, float.class, LENGTH, this, v, (v1, v2) -> v1.bOp(v2, (i, a, b) -> (float) Math.min(a, b))); } @Override @ForceInline public Float64Vector min(Vector v, Mask m) { return blend(min(v), m); } @Override @ForceInline public Float64Vector max(Vector o) { Objects.requireNonNull(o); Float64Vector v = (Float64Vector)o; return 
VectorIntrinsics.binaryOp( VECTOR_OP_MAX, Float64Vector.class, float.class, LENGTH, this, v, (v1, v2) -> v1.bOp(v2, (i, a, b) -> (float) Math.max(a, b))); } @Override @ForceInline public Float64Vector max(Vector v, Mask m) { return blend(max(v), m); } // Ternary operations @Override @ForceInline public Float64Vector fma(Vector o1, Vector o2) { Objects.requireNonNull(o1); Objects.requireNonNull(o2); Float64Vector v1 = (Float64Vector)o1; Float64Vector v2 = (Float64Vector)o2; return VectorIntrinsics.ternaryOp( VECTOR_OP_FMA, Float64Vector.class, float.class, LENGTH, this, v1, v2, (w1, w2, w3) -> w1.tOp(w2, w3, (i, a, b, c) -> Math.fma(a, b, c))); } // Type specific horizontal reductions @Override @ForceInline public float addAll() { int bits = (int) VectorIntrinsics.reductionCoerced( VECTOR_OP_ADD, Float64Vector.class, float.class, LENGTH, this, v -> { float r = v.rOp((float) 0, (i, a, b) -> (float) (a + b)); return (long)Float.floatToIntBits(r); }); return Float.intBitsToFloat(bits); } @Override @ForceInline public float mulAll() { int bits = (int) VectorIntrinsics.reductionCoerced( VECTOR_OP_MUL, Float64Vector.class, float.class, LENGTH, this, v -> { float r = v.rOp((float) 1, (i, a, b) -> (float) (a * b)); return (long)Float.floatToIntBits(r); }); return Float.intBitsToFloat(bits); } @Override @ForceInline public float minAll() { int bits = (int) VectorIntrinsics.reductionCoerced( VECTOR_OP_MIN, Float64Vector.class, float.class, LENGTH, this, v -> { float r = v.rOp(Float.MAX_VALUE , (i, a, b) -> (float) Math.min(a, b)); return (long)Float.floatToIntBits(r); }); return Float.intBitsToFloat(bits); } @Override @ForceInline public float maxAll() { int bits = (int) VectorIntrinsics.reductionCoerced( VECTOR_OP_MAX, Float64Vector.class, float.class, LENGTH, this, v -> { float r = v.rOp(Float.MIN_VALUE , (i, a, b) -> (float) Math.max(a, b)); return (long)Float.floatToIntBits(r); }); return Float.intBitsToFloat(bits); } @Override @ForceInline public float addAll(Mask m) { 
return SPECIES.broadcast((float) 0).blend(this, m).addAll(); } @Override @ForceInline public float mulAll(Mask m) { return SPECIES.broadcast((float) 1).blend(this, m).mulAll(); } @Override @ForceInline public float minAll(Mask m) { return SPECIES.broadcast(Float.MAX_VALUE).blend(this, m).minAll(); } @Override @ForceInline public float maxAll(Mask m) { return SPECIES.broadcast(Float.MIN_VALUE).blend(this, m).maxAll(); } @Override @ForceInline public Shuffle toShuffle() { float[] a = toArray(); int[] sa = new int[a.length]; for (int i = 0; i < a.length; i++) { sa[i] = (int) a[i]; } return FloatVector.shuffleFromArray(SPECIES, sa, 0); } // Memory operations private static final int ARRAY_SHIFT = 31 - Integer.numberOfLeadingZeros(Unsafe.ARRAY_FLOAT_INDEX_SCALE); private static final int BOOLEAN_ARRAY_SHIFT = 31 - Integer.numberOfLeadingZeros(Unsafe.ARRAY_BOOLEAN_INDEX_SCALE); @Override @ForceInline public void intoArray(float[] a, int ix) { Objects.requireNonNull(a); ix = VectorIntrinsics.checkIndex(ix, a.length, LENGTH); intoArrayWithoutCheck(a, ix); } @ForceInline private void intoArrayWithoutCheck(float[] a, int ix) { VectorIntrinsics.store(Float64Vector.class, float.class, LENGTH, a, (((long) ix) << ARRAY_SHIFT) + Unsafe.ARRAY_FLOAT_BASE_OFFSET, this, a, ix, (arr, idx, v) -> v.forEach((i, e) -> arr[idx + i] = e)); } @Override @ForceInline public final void intoArray(float[] a, int ax, Mask m) { Objects.requireNonNull(a); if (ax + LENGTH <= a.length) { FloatVector oldVal = FloatVector.fromArrayWithoutCheck(SPECIES, a, ax); FloatVector newVal = oldVal.blend(this, m); ((Float64Vector)newVal).intoArrayWithoutCheck(a, ax); } else { forEach(m, (i, e) -> a[ax + i] = e); } } @Override @ForceInline public void intoArray(float[] a, int ix, int[] b, int iy) { Objects.requireNonNull(a); Objects.requireNonNull(b); // Index vector: vix[0:n] = i -> ix + indexMap[iy + i] IntVector vix = IntVector.fromArray(INDEX_SPEC, b, iy).add(ix); vix = VectorIntrinsics.checkIndex(vix, 
a.length); intoArrayWithoutCheck(a, ix, b, iy, vix); } @ForceInline private void intoArrayWithoutCheck(float[] a, int ix, int[] b, int iy, IntVector vix) { VectorIntrinsics.storeWithMap(Float64Vector.class, float.class, LENGTH, Int64Vector.class, a, Unsafe.ARRAY_FLOAT_BASE_OFFSET, vix, this, a, ix, b, iy, (arr, idx, v, indexMap, idy) -> v.forEach((i, e) -> arr[idx+indexMap[idy+i]] = e)); } @Override @ForceInline public final void intoArray(float[] a, int ax, Mask m, int[] b, int iy) { Objects.requireNonNull(a); Objects.requireNonNull(b); // Index vector: vix[0:n] = i -> ax + b[iy + i] IntVector vix = IntVector.fromArray(INDEX_SPEC, b, iy).add(ax); if(vix.lessThan(0).anyTrue() || vix.greaterThanEq(a.length).anyTrue()) { forEach(m, (i, e) -> a[ax + b[iy+i]] = e); } else { FloatVector oldVal = FloatVector.fromArrayWithoutCheck(SPECIES, a, ax, b, iy, vix); FloatVector newVal = oldVal.blend(this, m); ((Float64Vector)newVal).intoArrayWithoutCheck(a, ax, b, iy, vix); } } @Override @ForceInline public void intoByteArray(byte[] a, int ix) { Objects.requireNonNull(a); ix = VectorIntrinsics.checkIndex(ix, a.length, bitSize() / Byte.SIZE); VectorIntrinsics.store(Float64Vector.class, float.class, LENGTH, a, ((long) ix) + Unsafe.ARRAY_BYTE_BASE_OFFSET, this, a, ix, (c, idx, v) -> { ByteBuffer bbc = ByteBuffer.wrap(c, idx, c.length - idx).order(ByteOrder.nativeOrder()); FloatBuffer tb = bbc.asFloatBuffer(); v.forEach((i, e) -> tb.put(e)); }); } @Override @ForceInline public final void intoByteArray(byte[] a, int ix, Mask m) { Float64Vector oldVal = (Float64Vector) FloatVector.fromByteArray(SPECIES, a, ix); Float64Vector newVal = oldVal.blend(this, m); newVal.intoByteArray(a, ix); } @Override @ForceInline public void intoByteBuffer(ByteBuffer bb, int ix) { if (bb.order() != ByteOrder.nativeOrder()) { throw new IllegalArgumentException(); } if (bb.isReadOnly()) { throw new ReadOnlyBufferException(); } ix = VectorIntrinsics.checkIndex(ix, bb.limit(), bitSize() / Byte.SIZE); 
VectorIntrinsics.store(Float64Vector.class, float.class, LENGTH, U.getReference(bb, BYTE_BUFFER_HB), ix + U.getLong(bb, BUFFER_ADDRESS), this, bb, ix, (c, idx, v) -> { ByteBuffer bbc = c.duplicate().position(idx).order(ByteOrder.nativeOrder()); FloatBuffer tb = bbc.asFloatBuffer(); v.forEach((i, e) -> tb.put(e)); }); } @Override @ForceInline public void intoByteBuffer(ByteBuffer bb, int ix, Mask m) { Float64Vector oldVal = (Float64Vector) FloatVector.fromByteBuffer(SPECIES, bb, ix); Float64Vector newVal = oldVal.blend(this, m); newVal.intoByteBuffer(bb, ix); } // @Override public String toString() { return Arrays.toString(getElements()); } @Override public boolean equals(Object o) { if (this == o) return true; if (o == null || this.getClass() != o.getClass()) return false; Float64Vector that = (Float64Vector) o; return this.equal(that).allTrue(); } @Override public int hashCode() { return Arrays.hashCode(vec); } // Binary test @Override Float64Mask bTest(Vector o, FBinTest f) { float[] vec1 = getElements(); float[] vec2 = ((Float64Vector)o).getElements(); boolean[] bits = new boolean[length()]; for (int i = 0; i < length(); i++){ bits[i] = f.apply(i, vec1[i], vec2[i]); } return new Float64Mask(bits); } // Comparisons @Override @ForceInline public Float64Mask equal(Vector o) { Objects.requireNonNull(o); Float64Vector v = (Float64Vector)o; return VectorIntrinsics.compare( BT_eq, Float64Vector.class, Float64Mask.class, float.class, LENGTH, this, v, (v1, v2) -> v1.bTest(v2, (i, a, b) -> a == b)); } @Override @ForceInline public Float64Mask notEqual(Vector o) { Objects.requireNonNull(o); Float64Vector v = (Float64Vector)o; return VectorIntrinsics.compare( BT_ne, Float64Vector.class, Float64Mask.class, float.class, LENGTH, this, v, (v1, v2) -> v1.bTest(v2, (i, a, b) -> a != b)); } @Override @ForceInline public Float64Mask lessThan(Vector o) { Objects.requireNonNull(o); Float64Vector v = (Float64Vector)o; return VectorIntrinsics.compare( BT_lt, Float64Vector.class, 
Float64Mask.class, float.class, LENGTH, this, v, (v1, v2) -> v1.bTest(v2, (i, a, b) -> a < b)); } @Override @ForceInline public Float64Mask lessThanEq(Vector o) { Objects.requireNonNull(o); Float64Vector v = (Float64Vector)o; return VectorIntrinsics.compare( BT_le, Float64Vector.class, Float64Mask.class, float.class, LENGTH, this, v, (v1, v2) -> v1.bTest(v2, (i, a, b) -> a <= b)); } @Override @ForceInline public Float64Mask greaterThan(Vector o) { Objects.requireNonNull(o); Float64Vector v = (Float64Vector)o; return (Float64Mask) VectorIntrinsics.compare( BT_gt, Float64Vector.class, Float64Mask.class, float.class, LENGTH, this, v, (v1, v2) -> v1.bTest(v2, (i, a, b) -> a > b)); } @Override @ForceInline public Float64Mask greaterThanEq(Vector o) { Objects.requireNonNull(o); Float64Vector v = (Float64Vector)o; return VectorIntrinsics.compare( BT_ge, Float64Vector.class, Float64Mask.class, float.class, LENGTH, this, v, (v1, v2) -> v1.bTest(v2, (i, a, b) -> a >= b)); } // Foreach @Override void forEach(FUnCon f) { float[] vec = getElements(); for (int i = 0; i < length(); i++) { f.apply(i, vec[i]); } } @Override void forEach(Mask o, FUnCon f) { boolean[] mbits = ((Float64Mask)o).getBits(); forEach((i, a) -> { if (mbits[i]) { f.apply(i, a); } }); } Int64Vector toBits() { float[] vec = getElements(); int[] res = new int[this.species().length()]; for(int i = 0; i < this.species().length(); i++){ res[i] = Float.floatToIntBits(vec[i]); } return new Int64Vector(res); } @Override public Float64Vector rotateEL(int j) { float[] vec = getElements(); float[] res = new float[length()]; for (int i = 0; i < length(); i++){ res[(j + i) % length()] = vec[i]; } return new Float64Vector(res); } @Override public Float64Vector rotateER(int j) { float[] vec = getElements(); float[] res = new float[length()]; for (int i = 0; i < length(); i++){ int z = i - j; if(j < 0) { res[length() + z] = vec[i]; } else { res[z] = vec[i]; } } return new Float64Vector(res); } @Override public Float64Vector 
shiftEL(int j) {
        float[] vec = getElements();
        float[] res = new float[length()];
        for (int i = 0; i < length() - j; i++) {
            res[i] = vec[i + j];
        }
        return new Float64Vector(res);
    }

    /**
     * Returns a new vector in which lane {@code i + j} holds this vector's
     * lane {@code i}, for every {@code i} in {@code [0, length() - j)}.
     * Lanes that are not written keep the array default of {@code 0.0f}.
     *
     * @param j the number of lanes to shift by
     * @return the shifted vector
     */
    @Override
    public Float64Vector shiftER(int j) {
        float[] vec = getElements();
        float[] res = new float[length()];
        for (int i = 0; i < length() - j; i++) {
            res[i + j] = vec[i];
        }
        return new Float64Vector(res);
    }

    /**
     * Rearranges both this vector and {@code v} with the shuffle {@code s},
     * then blends the two rearranged vectors under the mask {@code m}.
     *
     * @param v the second input vector
     * @param s the shuffle applied to both vectors
     * @param m the mask passed to {@link #blend(Vector, Mask)}
     * @return the blended result
     */
    @Override
    @ForceInline
    public Float64Vector rearrange(Vector v, Shuffle s, Mask m) {
        return this.rearrange(s).blend(v.rearrange(s), m);
    }

    /**
     * Rearranges the lanes of this vector according to the given shuffle.
     * In the lambda handed to {@code VectorIntrinsics.rearrangeOp}, result
     * lane {@code i} is this vector's lane {@code s.getElement(i)}.
     *
     * @param o1 the shuffle; must be a {@code Float64Shuffle}
     * @return the rearranged vector
     * @throws NullPointerException if {@code o1} is null
     */
    @Override
    @ForceInline
    public Float64Vector rearrange(Shuffle o1) {
        Objects.requireNonNull(o1);
        Float64Shuffle s = (Float64Shuffle)o1;
        return VectorIntrinsics.rearrangeOp(
            Float64Vector.class, Float64Shuffle.class, float.class, LENGTH,
            this, s,
            (v1, s_) -> v1.uOp((i, a) -> {
                int ei = s_.getElement(i);
                return v1.get(ei);
            }));
    }

    /**
     * Blends this vector with {@code o1} under the mask {@code o2}.
     * In the lambda handed to {@code VectorIntrinsics.blend}, a lane whose
     * mask element is set takes the value from the second vector, otherwise
     * the value from the first.
     *
     * @param o1 the other vector; must be a {@code Float64Vector}
     * @param o2 the mask; must be a {@code Float64Mask}
     * @return the blended vector
     * @throws NullPointerException if either argument is null
     */
    @Override
    @ForceInline
    public Float64Vector blend(Vector o1, Mask o2) {
        Objects.requireNonNull(o1);
        Objects.requireNonNull(o2);
        Float64Vector v = (Float64Vector)o1;
        Float64Mask m = (Float64Mask)o2;
        return VectorIntrinsics.blend(
            Float64Vector.class, Float64Mask.class, float.class, LENGTH,
            this, v, m,
            (v1, v2, m_) -> v1.bOp(v2, (i, a, b) -> m_.getElement(i) ? b : a));
    }

    // Accessors

    /**
     * Returns the value of lane {@code i}.
     *
     * @param i the lane index
     * @return the lane value
     * @throws IllegalArgumentException if {@code i < 0} or {@code i >= LENGTH}
     */
    @Override
    public float get(int i) {
        if (i < 0 || i >= LENGTH) {
            throw new IllegalArgumentException("Index " + i + " must be zero or positive, and less than " + LENGTH);
        }
        // The lane travels through the intrinsic as its raw int bits widened
        // to long, and is turned back into a float afterwards.
        int bits = (int) VectorIntrinsics.extract(
            Float64Vector.class, float.class, LENGTH,
            this, i,
            (vec, ix) -> {
                float[] vecarr = vec.getElements();
                return (long)Float.floatToIntBits(vecarr[ix]);
            });
        return Float.intBitsToFloat(bits);
    }

    /**
     * Returns a new vector equal to this one except that lane {@code i}
     * holds {@code e}. The lambda works on a clone of the element array, so
     * this vector's array is not written.
     *
     * @param i the lane index
     * @param e the value to place in lane {@code i}
     * @return the updated vector
     * @throws IllegalArgumentException if {@code i < 0} or {@code i >= LENGTH}
     */
    @Override
    public Float64Vector with(int i, float e) {
        if (i < 0 || i >= LENGTH) {
            throw new IllegalArgumentException("Index " + i + " must be zero or positive, and less than " + LENGTH);
        }
        // The new value is passed as raw int bits widened to long.
        return VectorIntrinsics.insert(
            Float64Vector.class, float.class, LENGTH,
            this, i, (long)Float.floatToIntBits(e),
            (v, ix, bits) -> {
                float[] res = v.getElements().clone();
                res[ix] = Float.intBitsToFloat((int)bits);
                return new Float64Vector(res);
            });
    }

    // Mask

    /**
     * Mask type paired with {@code Float64Vector}; one boolean per lane,
     * stored in a private array that is copied or freshly built on
     * construction.
     */
    static final class Float64Mask extends AbstractMask {
        static final Float64Mask TRUE_MASK = new Float64Mask(true);
        static final Float64Mask FALSE_MASK = new Float64Mask(false);

        private final boolean[] bits; // Don't access directly, use getBits() instead.

        /** Builds a mask from the leading elements of {@code bits}. */
        public Float64Mask(boolean[] bits) {
            this(bits, 0);
        }

        /**
         * Builds a mask by copying {@code species().length()} elements of
         * {@code bits}, starting at index {@code offset}.
         */
        public Float64Mask(boolean[] bits, int offset) {
            boolean[] a = new boolean[species().length()];
            for (int i = 0; i < a.length; i++) {
                a[i] = bits[offset + i];
            }
            this.bits = a;
        }

        /** Builds a mask whose every element equals {@code val}. */
        public Float64Mask(boolean val) {
            boolean[] bits = new boolean[species().length()];
            Arrays.fill(bits, val);
            this.bits = bits;
        }

        /** Returns the backing array, read through {@code VectorIntrinsics.maybeRebox}. */
        boolean[] getBits() {
            return VectorIntrinsics.maybeRebox(this).bits;
        }

        /** Applies {@code f} to every (index, element) pair and returns the resulting mask. */
        @Override
        Float64Mask uOp(MUnOp f) {
            int n = species().length();
            boolean[] res = new boolean[n];
            boolean[] bits = getBits();
            for (int i = 0; i < n; i++) {
                res[i] = f.apply(i, bits[i]);
            }
            return new Float64Mask(res);
        }

        /**
         * Applies {@code f} to every (index, this element, other element)
         * triple and returns the resulting mask. {@code o} must be a
         * {@code Float64Mask}.
         */
        @Override
        Float64Mask bOp(Mask o, MBinOp f) {
            int n = species().length();
            boolean[] res = new boolean[n];
            boolean[] bits = getBits();
            boolean[] mbits = ((Float64Mask)o).getBits();
            for (int i = 0; i < n; i++) {
                res[i] = f.apply(i, bits[i], mbits[i]);
            }
            return new Float64Mask(res);
        }

        @Override
        public Float64Species species() {
            return SPECIES;
        }

        /**
         * Converts this mask to a vector: a set element becomes {@code -1},
         * an unset element becomes {@code 0} (both cast to float).
         */
        @Override
        public Float64Vector toVector() {
            int n = species().length();
            float[] res = new float[n];
            boolean[] bits = getBits();
            for (int i = 0; i < n; i++) {
                // -1 will result in the most significant bit being set in
                // addition to some or all other bits
                res[i] = (float) (bits[i] ? -1 : 0);
            }
            return new Float64Vector(res);
        }

        // Unary operations

        /** Returns the element-wise logical negation of this mask. */
        @Override
        @ForceInline
        public Float64Mask not() {
            return (Float64Mask) VectorIntrinsics.unaryOp(
                VECTOR_OP_NOT, Float64Mask.class, int.class, LENGTH,
                this,
                (m1) -> m1.uOp((i, a) -> !a));
        }

        // Binary operations

        /**
         * Returns the element-wise AND of this mask and {@code o}.
         *
         * @throws NullPointerException if {@code o} is null
         */
        @Override
        @ForceInline
        public Float64Mask and(Mask o) {
            Objects.requireNonNull(o);
            Float64Mask m = (Float64Mask)o;
            return VectorIntrinsics.binaryOp(VECTOR_OP_AND, Float64Mask.class, int.class, LENGTH,
                                             this, m,
                                             (m1, m2) -> m1.bOp(m2, (i, a, b) -> a & b));
        }

        /**
         * Returns the element-wise OR of this mask and {@code o}.
         *
         * @throws NullPointerException if {@code o} is null
         */
        @Override
        @ForceInline
        public Float64Mask or(Mask o) {
            Objects.requireNonNull(o);
            Float64Mask m = (Float64Mask)o;
            return VectorIntrinsics.binaryOp(VECTOR_OP_OR, Float64Mask.class, int.class, LENGTH,
                                             this, m,
                                             (m1, m2) -> m1.bOp(m2, (i, a, b) -> a | b));
        }

        // Reductions

        /** Delegates to {@code VectorIntrinsics.test}; the lambda evaluates {@code anyTrueHelper} on this mask's bits. */
        @Override
        @ForceInline
        public boolean anyTrue() {
            return VectorIntrinsics.test(BT_ne, Float64Mask.class, int.class, LENGTH,
                                         this, this,
                                         (m, __) -> anyTrueHelper(((Float64Mask)m).getBits()));
        }

        /** Delegates to {@code VectorIntrinsics.test}; the lambda evaluates {@code allTrueHelper} on this mask's bits. */
        @Override
        @ForceInline
        public boolean allTrue() {
            return VectorIntrinsics.test(BT_overflow, Float64Mask.class, int.class, LENGTH,
                                         this, FloatVector.maskAllTrue(species()),
                                         (m, __) -> allTrueHelper(((Float64Mask)m).getBits()));
        }
    }

    // Shuffle

    /** Shuffle type paired with {@code Float64Vector}; all constructors forward to {@code AbstractShuffle}. */
    static final class Float64Shuffle extends AbstractShuffle {
        Float64Shuffle(byte[] reorder) {
            super(reorder);
        }

        public Float64Shuffle(int[] reorder) {
            super(reorder);
        }

        public Float64Shuffle(int[] reorder, int i) {
            super(reorder, i);
        }

        public Float64Shuffle(IntUnaryOperator f) {
            super(f);
        }

        @Override
        public Float64Species species() {
            return SPECIES;
        }

        /** Returns a vector whose lane {@code i} is {@code getElement(i)} cast to float. */
        @Override
        public FloatVector toVector() {
            float[] va = new float[SPECIES.length()];
            for (int i = 0; i < va.length; i++) {
                va[i] = (float) getElement(i);
            }
            return FloatVector.fromArray(SPECIES, va, 0);
        }

        /**
         * Composes this shuffle with {@code o}: element {@code i} of the
         * result is {@code reorder[s.reorder[i]]}, where {@code s} is
         * {@code o} cast to {@code Float64Shuffle}.
         */
        @Override
        public Float64Shuffle rearrange(Vector.Shuffle o) {
            Float64Shuffle s = (Float64Shuffle) o;
            byte[] r = new byte[reorder.length];
            for (int i = 0; i < reorder.length; i++) {
                r[i] = reorder[s.reorder[i]];
            }
            return new Float64Shuffle(r);
        }
    }

    // Species

    /** Returns the shared species instance of this vector type. */
    @Override
    public Float64Species species() {
        return SPECIES;
    }

    /** Species describing 64-bit vectors of float lanes, together with the factories for them. */
    static final class Float64Species extends FloatSpecies {
        static final int BIT_SIZE = Shape.S_64_BIT.bitSize();

        static final int LENGTH = BIT_SIZE / Float.SIZE;

        /** Formats as {@code Shape[<bitSize> bits, <length> floats x <elementSize> bits]}. */
        @Override
        public String toString() {
            return "Shape[" + bitSize() + " bits, "
                + length() + " " + float.class.getSimpleName() + "s x "
                + elementSize() + " bits"
                + "]";
        }

        @Override
        @ForceInline
        public int bitSize() {
            return BIT_SIZE;
        }

        @Override
        @ForceInline
        public int length() {
            return LENGTH;
        }

        @Override
        @ForceInline
        public Class elementType() {
            return float.class;
        }

        @Override
        @ForceInline
        public Class boxType() {
            return Float64Vector.class;
        }

        @Override
        @ForceInline
        public Class maskType() {
            return Float64Mask.class;
        }

        @Override
        @ForceInline
        public int elementSize() {
            return Float.SIZE;
        }

        @Override
        @ForceInline
        @SuppressWarnings("unchecked")
        Class vectorType() {
            return Float64Vector.class;
        }

        @Override
        @ForceInline
        public Shape shape() {
            return Shape.S_64_BIT;
        }

        @Override
        IntVector.IntSpecies indexSpecies() {
            return INDEX_SPEC;
        }

        /** Builds a vector whose lane {@code i} is {@code f.apply(i)}. */
        @Override
        Float64Vector op(FOp f) {
            int n = length();
            float[] res = new float[n];
            for (int i = 0; i < n; i++) {
                res[i] = f.apply(i);
            }
            return new Float64Vector(res);
        }

        /**
         * Builds a vector whose lane {@code i} is {@code f.apply(i)} where
         * the mask element is set; other lanes keep the array default of
         * {@code 0.0f}, and {@code f} is not invoked for them.
         */
        @Override
        Float64Vector op(Mask o, FOp f) {
            int n = length();
            float[] res = new float[n];
            boolean[] mbits = ((Float64Mask)o).getBits();
            for (int i = 0; i < n; i++) {
                if (mbits[i]) {
                    res[i] = f.apply(i);
                }
            }
            return new Float64Vector(res);
        }

        /** Builds a mask whose element {@code i} is {@code f.apply(i)}. */
        @Override
        Float64Mask opm(FOpm f) {
            int n = length();
            boolean[] res = new boolean[n];
            for (int i = 0; i < n; i++) {
                res[i] = (boolean)f.apply(i);
            }
            return new Float64Mask(res);
        }

        // Factories

        /** Returns a vector with every lane set to {@code 0.0f}. */
        @Override
        @ForceInline
        public Float64Vector zero() {
            return VectorIntrinsics.broadcastCoerced(Float64Vector.class, float.class, LENGTH,
                                                     Float.floatToIntBits(0.0f), SPECIES,
                                                     ((bits, s) -> ((Float64Species)s).op(i -> Float.intBitsToFloat((int)bits))));
        }

        /** Returns a vector with every lane set to {@code e}; the value is passed as its raw int bits. */
        @Override
        @ForceInline
        public Float64Vector broadcast(float e) {
            return VectorIntrinsics.broadcastCoerced(
                Float64Vector.class, float.class, LENGTH,
                Float.floatToIntBits(e), SPECIES,
                ((bits, s) -> ((Float64Species)s).op(i -> Float.intBitsToFloat((int)bits))));
        }

        /**
         * Returns a vector loaded from the given scalars. In the lambda,
         * lane {@code n} is {@code es[ix + n]}, where {@code ix} is the
         * value returned by {@code VectorIntrinsics.checkIndex(0, es.length, LENGTH)}.
         *
         * @throws NullPointerException if {@code es} is null
         */
        @Override
        @ForceInline
        public Float64Vector scalars(float... es) {
            Objects.requireNonNull(es);
            int ix = VectorIntrinsics.checkIndex(0, es.length, LENGTH);
            return VectorIntrinsics.load(Float64Vector.class, float.class, LENGTH,
                                         es, Unsafe.ARRAY_FLOAT_BASE_OFFSET,
                                         es, ix, SPECIES,
                                         (c, idx, s) -> ((Float64Species)s).op(n -> c[idx + n]));
        }

        /**
         * Converts a mask of any species with the same length into a
         * {@code Float64Mask} by copying its boolean array.
         *
         * @throws IllegalArgumentException if {@code m.length() != LENGTH}
         */
        @Override
        @ForceInline
        public Float64Mask cast(Mask m) {
            if (m.length() != LENGTH) {
                throw new IllegalArgumentException("Mask length and this species length differ");
            }
            return new Float64Mask(m.toArray());
        }

        /**
         * Converts a shuffle of any species with the same length into a
         * {@code Float64Shuffle} built from its array form.
         *
         * @throws IllegalArgumentException if {@code s.length() != LENGTH}
         */
        @Override
        @ForceInline
        public Float64Shuffle cast(Shuffle s) {
            if (s.length() != LENGTH) {
                throw new IllegalArgumentException("Shuffle length and this species length differ");
            }
            return new Float64Shuffle(s.toArray());
        }
    }
}