1 /* 2 * Copyright (c) 2017, Oracle and/or its affiliates. All rights reserved. 3 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. 4 * 5 * This code is free software; you can redistribute it and/or modify it 6 * under the terms of the GNU General Public License version 2 only, as 7 * published by the Free Software Foundation. Oracle designates this 8 * particular file as subject to the "Classpath" exception as provided 9 * by Oracle in the LICENSE file that accompanied this code. 10 * 11 * This code is distributed in the hope that it will be useful, but WITHOUT 12 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or 13 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License 14 * version 2 for more details (a copy is included in the LICENSE file that 15 * accompanied this code). 16 * 17 * You should have received a copy of the GNU General Public License version 18 * 2 along with this work; if not, write to the Free Software Foundation, 19 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA. 20 * 21 * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA 22 * or visit www.oracle.com if you need additional information or have 23 * questions. 24 */ 25 package jdk.incubator.vector; 26 27 import java.nio.ByteBuffer; 28 import java.nio.ByteOrder; 29 import java.nio.FloatBuffer; 30 import java.nio.ReadOnlyBufferException; 31 import java.util.Arrays; 32 import java.util.Objects; 33 import java.util.function.IntUnaryOperator; 34 35 import jdk.internal.misc.Unsafe; 36 import jdk.internal.vm.annotation.ForceInline; 37 import static jdk.incubator.vector.VectorIntrinsics.*; 38 39 @SuppressWarnings("cast") 40 final class Float256Vector extends FloatVector { 41 static final Float256Species SPECIES = new Float256Species(); 42 43 static final Float256Vector ZERO = new Float256Vector(); 44 45 static final int LENGTH = SPECIES.length(); 46 47 // Index vector species 48 private static final IntVector.IntSpecies INDEX_SPEC; 49 static { 50 int bitSize = Vector.bitSizeForVectorLength(int.class, LENGTH); 51 Vector.Shape shape = Shape.forBitSize(bitSize); 52 INDEX_SPEC = (IntVector.IntSpecies) Species.of(int.class, shape); 53 } 54 private final float[] vec; // Don't access directly, use getElements() instead. 55 56 private float[] getElements() { 57 return VectorIntrinsics.maybeRebox(this).vec; 58 } 59 60 Float256Vector() { 61 vec = new float[SPECIES.length()]; 62 } 63 64 Float256Vector(float[] v) { 65 vec = v; 66 } 67 68 @Override 69 public int length() { return LENGTH; } 70 71 // Unary operator 72 73 @Override 74 Float256Vector uOp(FUnOp f) { 75 float[] vec = getElements(); 76 float[] res = new float[length()]; 77 for (int i = 0; i < length(); i++) { 78 res[i] = f.apply(i, vec[i]); 79 } 80 return new Float256Vector(res); 81 } 82 83 @Override 84 Float256Vector uOp(Mask<Float> o, FUnOp f) { 85 float[] vec = getElements(); 86 float[] res = new float[length()]; 87 boolean[] mbits = ((Float256Mask)o).getBits(); 88 for (int i = 0; i < length(); i++) { 89 res[i] = mbits[i] ? f.apply(i, vec[i]) : vec[i]; 90 } 91 return new Float256Vector(res); 92 } 93 94 // Binary operator 95 96 @Override 97 Float256Vector bOp(Vector<Float> o, FBinOp f) { 98 float[] res = new float[length()]; 99 float[] vec1 = this.getElements(); 100 float[] vec2 = ((Float256Vector)o).getElements(); 101 for (int i = 0; i < length(); i++) { 102 res[i] = f.apply(i, vec1[i], vec2[i]); 103 } 104 return new Float256Vector(res); 105 } 106 107 @Override 108 Float256Vector bOp(Vector<Float> o1, Mask<Float> o2, FBinOp f) { 109 float[] res = new float[length()]; 110 float[] vec1 = this.getElements(); 111 float[] vec2 = ((Float256Vector)o1).getElements(); 112 boolean[] mbits = ((Float256Mask)o2).getBits(); 113 for (int i = 0; i < length(); i++) { 114 res[i] = mbits[i] ? f.apply(i, vec1[i], vec2[i]) : vec1[i]; 115 } 116 return new Float256Vector(res); 117 } 118 119 // Trinary operator 120 121 @Override 122 Float256Vector tOp(Vector<Float> o1, Vector<Float> o2, FTriOp f) { 123 float[] res = new float[length()]; 124 float[] vec1 = this.getElements(); 125 float[] vec2 = ((Float256Vector)o1).getElements(); 126 float[] vec3 = ((Float256Vector)o2).getElements(); 127 for (int i = 0; i < length(); i++) { 128 res[i] = f.apply(i, vec1[i], vec2[i], vec3[i]); 129 } 130 return new Float256Vector(res); 131 } 132 133 @Override 134 Float256Vector tOp(Vector<Float> o1, Vector<Float> o2, Mask<Float> o3, FTriOp f) { 135 float[] res = new float[length()]; 136 float[] vec1 = getElements(); 137 float[] vec2 = ((Float256Vector)o1).getElements(); 138 float[] vec3 = ((Float256Vector)o2).getElements(); 139 boolean[] mbits = ((Float256Mask)o3).getBits(); 140 for (int i = 0; i < length(); i++) { 141 res[i] = mbits[i] ? f.apply(i, vec1[i], vec2[i], vec3[i]) : vec1[i]; 142 } 143 return new Float256Vector(res); 144 } 145 146 @Override 147 float rOp(float v, FBinOp f) { 148 float[] vec = getElements(); 149 for (int i = 0; i < length(); i++) { 150 v = f.apply(i, v, vec[i]); 151 } 152 return v; 153 } 154 155 @Override 156 @ForceInline 157 public <F> Vector<F> cast(Species<F> s) { 158 Objects.requireNonNull(s); 159 if (s.length() != LENGTH) 160 throw new IllegalArgumentException("Vector length this species length differ"); 161 162 return VectorIntrinsics.cast( 163 Float256Vector.class, 164 float.class, LENGTH, 165 s.vectorType(), 166 s.elementType(), LENGTH, 167 this, s, 168 (species, vector) -> vector.castDefault(species) 169 ); 170 } 171 172 @SuppressWarnings("unchecked") 173 @ForceInline 174 private <F> Vector<F> castDefault(Species<F> s) { 175 int limit = s.length(); 176 177 Class<?> stype = s.elementType(); 178 if (stype == byte.class) { 179 byte[] a = new byte[limit]; 180 for (int i = 0; i < limit; i++) { 181 a[i] = (byte) this.get(i); 182 } 183 return (Vector) ByteVector.fromArray((ByteVector.ByteSpecies) s, a, 0); 184 } else if (stype == short.class) { 185 short[] a = new short[limit]; 186 for (int i = 0; i < limit; i++) { 187 a[i] = (short) this.get(i); 188 } 189 return (Vector) ShortVector.fromArray((ShortVector.ShortSpecies) s, a, 0); 190 } else if (stype == int.class) { 191 int[] a = new int[limit]; 192 for (int i = 0; i < limit; i++) { 193 a[i] = (int) this.get(i); 194 } 195 return (Vector) IntVector.fromArray((IntVector.IntSpecies) s, a, 0); 196 } else if (stype == long.class) { 197 long[] a = new long[limit]; 198 for (int i = 0; i < limit; i++) { 199 a[i] = (long) this.get(i); 200 } 201 return (Vector) LongVector.fromArray((LongVector.LongSpecies) s, a, 0); 202 } else if (stype == float.class) { 203 float[] a = new float[limit]; 204 for (int i = 0; i < limit; i++) { 205 a[i] = (float) this.get(i); 206 } 207 return (Vector) FloatVector.fromArray((FloatVector.FloatSpecies) s, a, 0); 208 } else if (stype == double.class) { 209 double[] a = new double[limit]; 210 for (int i = 0; i < limit; i++) { 211 a[i] = (double) this.get(i); 212 } 213 return (Vector) DoubleVector.fromArray((DoubleVector.DoubleSpecies) s, a, 0); 214 } else { 215 throw new UnsupportedOperationException("Bad lane type for casting."); 216 } 217 } 218 219 @Override 220 @ForceInline 221 @SuppressWarnings("unchecked") 222 public <F> Vector<F> reinterpret(Species<F> s) { 223 Objects.requireNonNull(s); 224 225 if(s.elementType().equals(float.class)) { 226 return (Vector<F>) reshape((Species<Float>)s); 227 } 228 if(s.bitSize() == bitSize()) { 229 return reinterpretType(s); 230 } 231 232 return defaultReinterpret(s); 233 } 234 235 @ForceInline 236 private <F> Vector<F> reinterpretType(Species<F> s) { 237 Objects.requireNonNull(s); 238 239 Class<?> stype = s.elementType(); 240 if (stype == byte.class) { 241 return VectorIntrinsics.reinterpret( 242 Float256Vector.class, 243 float.class, LENGTH, 244 Byte256Vector.class, 245 byte.class, Byte256Vector.LENGTH, 246 this, s, 247 (species, vector) -> vector.defaultReinterpret(species) 248 ); 249 } else if (stype == short.class) { 250 return VectorIntrinsics.reinterpret( 251 Float256Vector.class, 252 float.class, LENGTH, 253 Short256Vector.class, 254 short.class, Short256Vector.LENGTH, 255 this, s, 256 (species, vector) -> vector.defaultReinterpret(species) 257 ); 258 } else if (stype == int.class) { 259 return VectorIntrinsics.reinterpret( 260 Float256Vector.class, 261 float.class, LENGTH, 262 Int256Vector.class, 263 int.class, Int256Vector.LENGTH, 264 this, s, 265 (species, vector) -> vector.defaultReinterpret(species) 266 ); 267 } else if (stype == long.class) { 268 return VectorIntrinsics.reinterpret( 269 Float256Vector.class, 270 float.class, LENGTH, 271 Long256Vector.class, 272 long.class, Long256Vector.LENGTH, 273 this, s, 274 (species, vector) -> vector.defaultReinterpret(species) 275 ); 276 } else if (stype == float.class) { 277 return VectorIntrinsics.reinterpret( 278 Float256Vector.class, 279 float.class, LENGTH, 280 Float256Vector.class, 281 float.class, Float256Vector.LENGTH, 282 this, s, 283 (species, vector) -> vector.defaultReinterpret(species) 284 ); 285 } else if (stype == double.class) { 286 return VectorIntrinsics.reinterpret( 287 Float256Vector.class, 288 float.class, LENGTH, 289 Double256Vector.class, 290 double.class, Double256Vector.LENGTH, 291 this, s, 292 (species, vector) -> vector.defaultReinterpret(species) 293 ); 294 } else { 295 throw new UnsupportedOperationException("Bad lane type for casting."); 296 } 297 } 298 299 @Override 300 @ForceInline 301 public FloatVector reshape(Species<Float> s) { 302 Objects.requireNonNull(s); 303 if (s.bitSize() == 64 && (s instanceof Float64Vector.Float64Species)) { 304 Float64Vector.Float64Species ts = (Float64Vector.Float64Species)s; 305 return VectorIntrinsics.reinterpret( 306 Float256Vector.class, 307 float.class, LENGTH, 308 Float64Vector.class, 309 float.class, Float64Vector.LENGTH, 310 this, ts, 311 (species, vector) -> (FloatVector) vector.defaultReinterpret(species) 312 ); 313 } else if (s.bitSize() == 128 && (s instanceof Float128Vector.Float128Species)) { 314 Float128Vector.Float128Species ts = (Float128Vector.Float128Species)s; 315 return VectorIntrinsics.reinterpret( 316 Float256Vector.class, 317 float.class, LENGTH, 318 Float128Vector.class, 319 float.class, Float128Vector.LENGTH, 320 this, ts, 321 (species, vector) -> (FloatVector) vector.defaultReinterpret(species) 322 ); 323 } else if (s.bitSize() == 256 && (s instanceof Float256Vector.Float256Species)) { 324 Float256Vector.Float256Species ts = (Float256Vector.Float256Species)s; 325 return VectorIntrinsics.reinterpret( 326 Float256Vector.class, 327 float.class, LENGTH, 328 Float256Vector.class, 329 float.class, Float256Vector.LENGTH, 330 this, ts, 331 (species, vector) -> (FloatVector) vector.defaultReinterpret(species) 332 ); 333 } else if (s.bitSize() == 512 && (s instanceof Float512Vector.Float512Species)) { 334 Float512Vector.Float512Species ts = (Float512Vector.Float512Species)s; 335 return VectorIntrinsics.reinterpret( 336 Float256Vector.class, 337 float.class, LENGTH, 338 Float512Vector.class, 339 float.class, Float512Vector.LENGTH, 340 this, ts, 341 (species, vector) -> (FloatVector) vector.defaultReinterpret(species) 342 ); 343 } else if ((s.bitSize() > 0) && (s.bitSize() <= 2048) 344 && (s.bitSize() % 128 == 0) && (s instanceof FloatMaxVector.FloatMaxSpecies)) { 345 FloatMaxVector.FloatMaxSpecies ts = (FloatMaxVector.FloatMaxSpecies)s; 346 return VectorIntrinsics.reinterpret( 347 Float256Vector.class, 348 float.class, LENGTH, 349 FloatMaxVector.class, 350 float.class, FloatMaxVector.LENGTH, 351 this, ts, 352 (species, vector) -> (FloatVector) vector.defaultReinterpret(species) 353 ); 354 } else { 355 throw new InternalError("Unimplemented size"); 356 } 357 } 358 359 // Binary operations with scalars 360 361 @Override 362 @ForceInline 363 public FloatVector add(float o) { 364 return add(SPECIES.broadcast(o)); 365 } 366 367 @Override 368 @ForceInline 369 public FloatVector add(float o, Mask<Float> m) { 370 return add(SPECIES.broadcast(o), m); 371 } 372 373 @Override 374 @ForceInline 375 public FloatVector sub(float o) { 376 return sub(SPECIES.broadcast(o)); 377 } 378 379 @Override 380 @ForceInline 381 public FloatVector sub(float o, Mask<Float> m) { 382 return sub(SPECIES.broadcast(o), m); 383 } 384 385 @Override 386 @ForceInline 387 public FloatVector mul(float o) { 388 return mul(SPECIES.broadcast(o)); 389 } 390 391 @Override 392 @ForceInline 393 public FloatVector mul(float o, Mask<Float> m) { 394 return mul(SPECIES.broadcast(o), m); 395 } 396 397 @Override 398 @ForceInline 399 public FloatVector min(float o) { 400 return min(SPECIES.broadcast(o)); 401 } 402 403 @Override 404 @ForceInline 405 public FloatVector max(float o) { 406 return max(SPECIES.broadcast(o)); 407 } 408 409 @Override 410 @ForceInline 411 public Mask<Float> equal(float o) { 412 return equal(SPECIES.broadcast(o)); 413 } 414 415 @Override 416 @ForceInline 417 public Mask<Float> notEqual(float o) { 418 return notEqual(SPECIES.broadcast(o)); 419 } 420 421 @Override 422 @ForceInline 423 public Mask<Float> lessThan(float o) { 424 return lessThan(SPECIES.broadcast(o)); 425 } 426 427 @Override 428 @ForceInline 429 public Mask<Float> lessThanEq(float o) { 430 return lessThanEq(SPECIES.broadcast(o)); 431 } 432 433 @Override 434 @ForceInline 435 public Mask<Float> greaterThan(float o) { 436 return greaterThan(SPECIES.broadcast(o)); 437 } 438 439 @Override 440 @ForceInline 441 public Mask<Float> greaterThanEq(float o) { 442 return greaterThanEq(SPECIES.broadcast(o)); 443 } 444 445 @Override 446 @ForceInline 447 public FloatVector blend(float o, Mask<Float> m) { 448 return blend(SPECIES.broadcast(o), m); 449 } 450 451 @Override 452 @ForceInline 453 public FloatVector div(float o) { 454 return div(SPECIES.broadcast(o)); 455 } 456 457 @Override 458 @ForceInline 459 public FloatVector div(float o, Mask<Float> m) { 460 return div(SPECIES.broadcast(o), m); 461 } 462 463 @Override 464 @ForceInline 465 public Float256Vector div(Vector<Float> v, Mask<Float> m) { 466 return blend(div(v), m); 467 } 468 469 @Override 470 @ForceInline 471 public FloatVector atan2(float o) { 472 return atan2(SPECIES.broadcast(o)); 473 } 474 475 @Override 476 @ForceInline 477 public FloatVector atan2(float o, Mask<Float> m) { 478 return atan2(SPECIES.broadcast(o), m); 479 } 480 481 @Override 482 @ForceInline 483 public FloatVector pow(float o) { 484 return pow(SPECIES.broadcast(o)); 485 } 486 487 @Override 488 @ForceInline 489 public FloatVector pow(float o, Mask<Float> m) { 490 return pow(SPECIES.broadcast(o), m); 491 } 492 493 @Override 494 @ForceInline 495 public FloatVector fma(float o1, float o2) { 496 return fma(SPECIES.broadcast(o1), SPECIES.broadcast(o2)); 497 } 498 499 @Override 500 @ForceInline 501 public FloatVector fma(float o1, float o2, Mask<Float> m) { 502 return fma(SPECIES.broadcast(o1), SPECIES.broadcast(o2), m); 503 } 504 505 @Override 506 @ForceInline 507 public FloatVector hypot(float o) { 508 return hypot(SPECIES.broadcast(o)); 509 } 510 511 @Override 512 @ForceInline 513 public FloatVector hypot(float o, Mask<Float> m) { 514 return hypot(SPECIES.broadcast(o), m); 515 } 516 517 518 // Unary operations 519 520 @ForceInline 521 @Override 522 public Float256Vector neg(Mask<Float> m) { 523 return blend(neg(), m); 524 } 525 526 @Override 527 @ForceInline 528 public Float256Vector abs() { 529 return VectorIntrinsics.unaryOp( 530 VECTOR_OP_ABS, Float256Vector.class, float.class, LENGTH, 531 this, 532 v1 -> v1.uOp((i, a) -> (float) Math.abs(a))); 533 } 534 535 @ForceInline 536 @Override 537 public Float256Vector abs(Mask<Float> m) { 538 return blend(abs(), m); 539 } 540 541 @Override 542 @ForceInline 543 public Float256Vector neg() { 544 return VectorIntrinsics.unaryOp( 545 VECTOR_OP_NEG, Float256Vector.class, float.class, LENGTH, 546 this, 547 v1 -> v1.uOp((i, a) -> (float) -a)); 548 } 549 550 @Override 551 @ForceInline 552 public Float256Vector div(Vector<Float> o) { 553 Objects.requireNonNull(o); 554 Float256Vector v = (Float256Vector)o; 555 return VectorIntrinsics.binaryOp( 556 VECTOR_OP_DIV, Float256Vector.class, float.class, LENGTH, 557 this, v, 558 (v1, v2) -> v1.bOp(v2, (i, a, b) -> (float)(a / b))); 559 } 560 561 @Override 562 @ForceInline 563 public Float256Vector sqrt() { 564 return VectorIntrinsics.unaryOp( 565 VECTOR_OP_SQRT, Float256Vector.class, float.class, LENGTH, 566 this, 567 v1 -> v1.uOp((i, a) -> (float) Math.sqrt((double) a))); 568 } 569 570 @Override 571 @ForceInline 572 public Float256Vector exp() { 573 return (Float256Vector) VectorIntrinsics.unaryOp( 574 VECTOR_OP_EXP, Float256Vector.class, float.class, LENGTH, 575 this, 576 v1 -> ((Float256Vector)v1).uOp((i, a) -> (float) Math.exp((double) a))); 577 } 578 579 @Override 580 @ForceInline 581 public Float256Vector log1p() { 582 return (Float256Vector) VectorIntrinsics.unaryOp( 583 VECTOR_OP_LOG1P, Float256Vector.class, float.class, LENGTH, 584 this, 585 v1 -> ((Float256Vector)v1).uOp((i, a) -> (float) Math.log1p((double) a))); 586 } 587 588 @Override 589 @ForceInline 590 public Float256Vector log() { 591 return (Float256Vector) VectorIntrinsics.unaryOp( 592 VECTOR_OP_LOG, Float256Vector.class, float.class, LENGTH, 593 this, 594 v1 -> ((Float256Vector)v1).uOp((i, a) -> (float) Math.log((double) a))); 595 } 596 597 @Override 598 @ForceInline 599 public Float256Vector log10() { 600 return (Float256Vector) VectorIntrinsics.unaryOp( 601 VECTOR_OP_LOG10, Float256Vector.class, float.class, LENGTH, 602 this, 603 v1 -> ((Float256Vector)v1).uOp((i, a) -> (float) Math.log10((double) a))); 604 } 605 606 @Override 607 @ForceInline 608 public Float256Vector expm1() { 609 return (Float256Vector) VectorIntrinsics.unaryOp( 610 VECTOR_OP_EXPM1, Float256Vector.class, float.class, LENGTH, 611 this, 612 v1 -> ((Float256Vector)v1).uOp((i, a) -> (float) Math.expm1((double) a))); 613 } 614 615 @Override 616 @ForceInline 617 public Float256Vector cbrt() { 618 return (Float256Vector) VectorIntrinsics.unaryOp( 619 VECTOR_OP_CBRT, Float256Vector.class, float.class, LENGTH, 620 this, 621 v1 -> ((Float256Vector)v1).uOp((i, a) -> (float) Math.cbrt((double) a))); 622 } 623 624 @Override 625 @ForceInline 626 public Float256Vector sin() { 627 return (Float256Vector) VectorIntrinsics.unaryOp( 628 VECTOR_OP_SIN, Float256Vector.class, float.class, LENGTH, 629 this, 630 v1 -> ((Float256Vector)v1).uOp((i, a) -> (float) Math.sin((double) a))); 631 } 632 633 @Override 634 @ForceInline 635 public Float256Vector cos() { 636 return (Float256Vector) VectorIntrinsics.unaryOp( 637 VECTOR_OP_COS, Float256Vector.class, float.class, LENGTH, 638 this, 639 v1 -> ((Float256Vector)v1).uOp((i, a) -> (float) Math.cos((double) a))); 640 } 641 642 @Override 643 @ForceInline 644 public Float256Vector tan() { 645 return (Float256Vector) VectorIntrinsics.unaryOp( 646 VECTOR_OP_TAN, Float256Vector.class, float.class, LENGTH, 647 this, 648 v1 -> ((Float256Vector)v1).uOp((i, a) -> (float) Math.tan((double) a))); 649 } 650 651 @Override 652 @ForceInline 653 public Float256Vector asin() { 654 return (Float256Vector) VectorIntrinsics.unaryOp( 655 VECTOR_OP_ASIN, Float256Vector.class, float.class, LENGTH, 656 this, 657 v1 -> ((Float256Vector)v1).uOp((i, a) -> (float) Math.asin((double) a))); 658 } 659 660 @Override 661 @ForceInline 662 public Float256Vector acos() { 663 return (Float256Vector) VectorIntrinsics.unaryOp( 664 VECTOR_OP_ACOS, Float256Vector.class, float.class, LENGTH, 665 this, 666 v1 -> ((Float256Vector)v1).uOp((i, a) -> (float) Math.acos((double) a))); 667 } 668 669 @Override 670 @ForceInline 671 public Float256Vector atan() { 672 return (Float256Vector) VectorIntrinsics.unaryOp( 673 VECTOR_OP_ATAN, Float256Vector.class, float.class, LENGTH, 674 this, 675 v1 -> ((Float256Vector)v1).uOp((i, a) -> (float) Math.atan((double) a))); 676 } 677 678 @Override 679 @ForceInline 680 public Float256Vector sinh() { 681 return (Float256Vector) VectorIntrinsics.unaryOp( 682 VECTOR_OP_SINH, Float256Vector.class, float.class, LENGTH, 683 this, 684 v1 -> ((Float256Vector)v1).uOp((i, a) -> (float) Math.sinh((double) a))); 685 } 686 687 @Override 688 @ForceInline 689 public Float256Vector cosh() { 690 return (Float256Vector) VectorIntrinsics.unaryOp( 691 VECTOR_OP_COSH, Float256Vector.class, float.class, LENGTH, 692 this, 693 v1 -> ((Float256Vector)v1).uOp((i, a) -> (float) Math.cosh((double) a))); 694 } 695 696 @Override 697 @ForceInline 698 public Float256Vector tanh() { 699 return (Float256Vector) VectorIntrinsics.unaryOp( 700 VECTOR_OP_TANH, Float256Vector.class, float.class, LENGTH, 701 this, 702 v1 -> ((Float256Vector)v1).uOp((i, a) -> (float) Math.tanh((double) a))); 703 } 704 705 @Override 706 @ForceInline 707 public Float256Vector pow(Vector<Float> o) { 708 Objects.requireNonNull(o); 709 Float256Vector v = (Float256Vector)o; 710 return (Float256Vector) VectorIntrinsics.binaryOp( 711 VECTOR_OP_POW, Float256Vector.class, float.class, LENGTH, 712 this, v, 713 (v1, v2) -> ((Float256Vector)v1).bOp(v2, (i, a, b) -> (float)(Math.pow(a,b)))); 714 } 715 716 @Override 717 @ForceInline 718 public Float256Vector hypot(Vector<Float> o) { 719 Objects.requireNonNull(o); 720 Float256Vector v = (Float256Vector)o; 721 return (Float256Vector) VectorIntrinsics.binaryOp( 722 VECTOR_OP_HYPOT, Float256Vector.class, float.class, LENGTH, 723 this, v, 724 (v1, v2) -> ((Float256Vector)v1).bOp(v2, (i, a, b) -> (float)(Math.hypot(a,b)))); 725 } 726 727 @Override 728 @ForceInline 729 public Float256Vector atan2(Vector<Float> o) { 730 Objects.requireNonNull(o); 731 Float256Vector v = (Float256Vector)o; 732 return (Float256Vector) VectorIntrinsics.binaryOp( 733 VECTOR_OP_ATAN2, Float256Vector.class, float.class, LENGTH, 734 this, v, 735 (v1, v2) -> ((Float256Vector)v1).bOp(v2, (i, a, b) -> (float)(Math.atan2(a,b)))); 736 } 737 738 739 // Binary operations 740 741 @Override 742 @ForceInline 743 public Float256Vector add(Vector<Float> o) { 744 Objects.requireNonNull(o); 745 Float256Vector v = (Float256Vector)o; 746 return VectorIntrinsics.binaryOp( 747 VECTOR_OP_ADD, Float256Vector.class, float.class, LENGTH, 748 this, v, 749 (v1, v2) -> v1.bOp(v2, (i, a, b) -> (float)(a + b))); 750 } 751 752 @Override 753 @ForceInline 754 public Float256Vector add(Vector<Float> v, Mask<Float> m) { 755 return blend(add(v), m); 756 } 757 758 @Override 759 @ForceInline 760 public Float256Vector sub(Vector<Float> o) { 761 Objects.requireNonNull(o); 762 Float256Vector v = (Float256Vector)o; 763 return VectorIntrinsics.binaryOp( 764 VECTOR_OP_SUB, Float256Vector.class, float.class, LENGTH, 765 this, v, 766 (v1, v2) -> v1.bOp(v2, (i, a, b) -> (float)(a - b))); 767 } 768 769 @Override 770 @ForceInline 771 public Float256Vector sub(Vector<Float> v, Mask<Float> m) { 772 return blend(sub(v), m); 773 } 774 775 @Override 776 @ForceInline 777 public Float256Vector mul(Vector<Float> o) { 778 Objects.requireNonNull(o); 779 Float256Vector v = (Float256Vector)o; 780 return VectorIntrinsics.binaryOp( 781 VECTOR_OP_MUL, Float256Vector.class, float.class, LENGTH, 782 this, v, 783 (v1, v2) -> v1.bOp(v2, (i, a, b) -> (float)(a * b))); 784 } 785 786 @Override 787 @ForceInline 788 public Float256Vector mul(Vector<Float> v, Mask<Float> m) { 789 return blend(mul(v), m); 790 } 791 792 @Override 793 @ForceInline 794 public Float256Vector min(Vector<Float> o) { 795 Objects.requireNonNull(o); 796 Float256Vector v = (Float256Vector)o; 797 return (Float256Vector) VectorIntrinsics.binaryOp( 798 VECTOR_OP_MIN, Float256Vector.class, float.class, LENGTH, 799 this, v, 800 (v1, v2) -> v1.bOp(v2, (i, a, b) -> (float) Math.min(a, b))); 801 } 802 803 @Override 804 @ForceInline 805 public Float256Vector min(Vector<Float> v, Mask<Float> m) { 806 return blend(min(v), m); 807 } 808 809 @Override 810 @ForceInline 811 public Float256Vector max(Vector<Float> o) { 812 Objects.requireNonNull(o); 813 Float256Vector v = (Float256Vector)o; 814 return VectorIntrinsics.binaryOp( 815 VECTOR_OP_MAX, Float256Vector.class, float.class, LENGTH, 816 this, v, 817 (v1, v2) -> v1.bOp(v2, (i, a, b) -> (float) Math.max(a, b))); 818 } 819 820 @Override 821 @ForceInline 822 public Float256Vector max(Vector<Float> v, Mask<Float> m) { 823 return blend(max(v), m); 824 } 825 826 827 // Ternary operations 828 829 @Override 830 @ForceInline 831 public Float256Vector fma(Vector<Float> o1, Vector<Float> o2) { 832 Objects.requireNonNull(o1); 833 Objects.requireNonNull(o2); 834 Float256Vector v1 = (Float256Vector)o1; 835 Float256Vector v2 = (Float256Vector)o2; 836 return VectorIntrinsics.ternaryOp( 837 VECTOR_OP_FMA, Float256Vector.class, float.class, LENGTH, 838 this, v1, v2, 839 (w1, w2, w3) -> w1.tOp(w2, w3, (i, a, b, c) -> Math.fma(a, b, c))); 840 } 841 842 // Type specific horizontal reductions 843 844 @Override 845 @ForceInline 846 public float addAll() { 847 int bits = (int) VectorIntrinsics.reductionCoerced( 848 VECTOR_OP_ADD, Float256Vector.class, float.class, LENGTH, 849 this, 850 v -> { 851 float r = v.rOp((float) 0, (i, a, b) -> (float) (a + b)); 852 return (long)Float.floatToIntBits(r); 853 }); 854 return Float.intBitsToFloat(bits); 855 } 856 857 @Override 858 @ForceInline 859 public float subAll() { 860 int bits = (int) VectorIntrinsics.reductionCoerced( 861 VECTOR_OP_SUB, Float256Vector.class, float.class, LENGTH, 862 this, 863 v -> { 864 float r = v.rOp((float) 0, (i, a, b) -> (float) (a - b)); 865 return (long)Float.floatToIntBits(r); 866 }); 867 return Float.intBitsToFloat(bits); 868 } 869 870 @Override 871 @ForceInline 872 public float mulAll() { 873 int bits = (int) VectorIntrinsics.reductionCoerced( 874 VECTOR_OP_MUL, Float256Vector.class, float.class, LENGTH, 875 this, 876 v -> { 877 float r = v.rOp((float) 1, (i, a, b) -> (float) (a * b)); 878 return (long)Float.floatToIntBits(r); 879 }); 880 return Float.intBitsToFloat(bits); 881 } 882 883 @Override 884 @ForceInline 885 public float minAll() { 886 int bits = (int) VectorIntrinsics.reductionCoerced( 887 VECTOR_OP_MIN, Float256Vector.class, float.class, LENGTH, 888 this, 889 v -> { 890 float r = v.rOp(Float.MAX_VALUE , (i, a, b) -> (float) Math.min(a, b)); 891 return (long)Float.floatToIntBits(r); 892 }); 893 return Float.intBitsToFloat(bits); 894 } 895 896 @Override 897 @ForceInline 898 public float maxAll() { 899 int bits = (int) VectorIntrinsics.reductionCoerced( 900 VECTOR_OP_MAX, Float256Vector.class, float.class, LENGTH, 901 this, 902 v -> { 903 float r = v.rOp(Float.MIN_VALUE , (i, a, b) -> (float) Math.max(a, b)); 904 return (long)Float.floatToIntBits(r); 905 }); 906 return Float.intBitsToFloat(bits); 907 } 908 909 910 @Override 911 @ForceInline 912 public float addAll(Mask<Float> m) { 913 return blend(SPECIES.broadcast((float) 0), m).addAll(); 914 } 915 916 @Override 917 @ForceInline 918 public float subAll(Mask<Float> m) { 919 return blend(SPECIES.broadcast((float) 0), m).subAll(); 920 } 921 922 @Override 923 @ForceInline 924 public float mulAll(Mask<Float> m) { 925 return blend(SPECIES.broadcast((float) 1), m).mulAll(); 926 } 927 928 @Override 929 @ForceInline 930 public float minAll(Mask<Float> m) { 931 return blend(SPECIES.broadcast(Float.MAX_VALUE), m).minAll(); 932 } 933 934 @Override 935 @ForceInline 936 public float maxAll(Mask<Float> m) { 937 return blend(SPECIES.broadcast(Float.MIN_VALUE), m).maxAll(); 938 } 939 940 @Override 941 @ForceInline 942 public Shuffle<Float> toShuffle() { 943 float[] a = toArray(); 944 int[] sa = new int[a.length]; 945 for (int i = 0; i < a.length; i++) { 946 sa[i] = (int) a[i]; 947 } 948 return FloatVector.shuffleFromArray(SPECIES, sa, 0); 949 } 950 951 // Memory operations 952 953 private static final int ARRAY_SHIFT = 31 - Integer.numberOfLeadingZeros(Unsafe.ARRAY_FLOAT_INDEX_SCALE); 954 private static final int BOOLEAN_ARRAY_SHIFT = 31 - Integer.numberOfLeadingZeros(Unsafe.ARRAY_BOOLEAN_INDEX_SCALE); 955 956 @Override 957 @ForceInline 958 public void intoArray(float[] a, int ix) { 959 Objects.requireNonNull(a); 960 ix = VectorIntrinsics.checkIndex(ix, a.length, LENGTH); 961 VectorIntrinsics.store(Float256Vector.class, float.class, LENGTH, 962 a, (((long) ix) << ARRAY_SHIFT) + Unsafe.ARRAY_FLOAT_BASE_OFFSET, 963 this, 964 a, ix, 965 (arr, idx, v) -> v.forEach((i, e) -> arr[idx + i] = e)); 966 } 967 968 @Override 969 @ForceInline 970 public final void intoArray(float[] a, int ax, Mask<Float> m) { 971 FloatVector oldVal = FloatVector.fromArray(SPECIES, a, ax); 972 FloatVector newVal = oldVal.blend(this, m); 973 newVal.intoArray(a, ax); 974 } 975 @Override 976 @ForceInline 977 public void intoArray(float[] a, int ix, int[] b, int iy) { 978 Objects.requireNonNull(a); 979 Objects.requireNonNull(b); 980 981 // Index vector: vix[0:n] = i -> ix + indexMap[iy + i] 982 IntVector vix = IntVector.fromArray(INDEX_SPEC, b, iy).add(ix); 983 984 vix = VectorIntrinsics.checkIndex(vix, a.length); 985 986 VectorIntrinsics.storeWithMap(Float256Vector.class, float.class, LENGTH, Int256Vector.class, 987 a, Unsafe.ARRAY_FLOAT_BASE_OFFSET, vix, 988 this, 989 a, ix, b, iy, 990 (arr, idx, v, indexMap, idy) -> v.forEach((i, e) -> arr[idx+indexMap[idy+i]] = e)); 991 } 992 993 @Override 994 @ForceInline 995 public final void intoArray(float[] a, int ax, Mask<Float> m, int[] b, int iy) { 996 // @@@ This can result in out of bounds errors for unset mask lanes 997 FloatVector oldVal = FloatVector.fromArray(SPECIES, a, ax, b, iy); 998 FloatVector newVal = oldVal.blend(this, m); 999 newVal.intoArray(a, ax, b, iy); 1000 } 1001 1002 @Override 1003 @ForceInline 1004 public void intoByteArray(byte[] a, int ix) { 1005 Objects.requireNonNull(a); 1006 ix = VectorIntrinsics.checkIndex(ix, a.length, bitSize() / Byte.SIZE); 1007 VectorIntrinsics.store(Float256Vector.class, float.class, LENGTH, 1008 a, ((long) ix) + Unsafe.ARRAY_BYTE_BASE_OFFSET, 1009 this, 1010 a, ix, 1011 (c, idx, v) -> { 1012 ByteBuffer bbc = ByteBuffer.wrap(c, idx, c.length - idx).order(ByteOrder.nativeOrder()); 1013 FloatBuffer tb = bbc.asFloatBuffer(); 1014 v.forEach((i, e) -> tb.put(e)); 1015 }); 1016 } 1017 1018 @Override 1019 @ForceInline 1020 public final void intoByteArray(byte[] a, int ix, Mask<Float> m) { 1021 Float256Vector oldVal = (Float256Vector) FloatVector.fromByteArray(SPECIES, a, ix); 1022 Float256Vector newVal = oldVal.blend(this, m); 1023 newVal.intoByteArray(a, ix); 1024 } 1025 1026 @Override 1027 @ForceInline 1028 public void intoByteBuffer(ByteBuffer bb, int ix) { 1029 if (bb.order() != ByteOrder.nativeOrder()) { 1030 throw new IllegalArgumentException(); 1031 } 1032 if (bb.isReadOnly()) { 1033 throw new ReadOnlyBufferException(); 1034 } 1035 ix = VectorIntrinsics.checkIndex(ix, bb.limit(), bitSize() / Byte.SIZE); 1036 VectorIntrinsics.store(Float256Vector.class, float.class, LENGTH, 1037 U.getReference(bb, BYTE_BUFFER_HB), ix + U.getLong(bb, BUFFER_ADDRESS), 1038 this, 1039 bb, ix, 1040 (c, idx, v) -> { 1041 ByteBuffer bbc = c.duplicate().position(idx).order(ByteOrder.nativeOrder()); 1042 FloatBuffer tb = bbc.asFloatBuffer(); 1043 v.forEach((i, e) -> tb.put(e)); 1044 }); 1045 } 1046 1047 @Override 1048 @ForceInline 1049 public void intoByteBuffer(ByteBuffer bb, int ix, Mask<Float> m) { 1050 Float256Vector oldVal = (Float256Vector) FloatVector.fromByteBuffer(SPECIES, bb, ix); 1051 Float256Vector newVal = oldVal.blend(this, m); 1052 newVal.intoByteBuffer(bb, ix); 1053 } 1054 1055 // 1056 1057 @Override 1058 public String toString() { 1059 return Arrays.toString(getElements()); 1060 } 1061 1062 @Override 1063 public boolean equals(Object o) { 1064 if (this == o) return true; 1065 if (o == null || this.getClass() != o.getClass()) return false; 1066 1067 Float256Vector that = (Float256Vector) o; 1068 return this.equal(that).allTrue(); 1069 } 1070 1071 @Override 1072 public int hashCode() { 1073 return Arrays.hashCode(vec); 1074 } 1075 1076 // Binary test 1077 1078 @Override 1079 Float256Mask bTest(Vector<Float> o, FBinTest f) { 1080 float[] vec1 = getElements(); 1081 float[] vec2 = ((Float256Vector)o).getElements(); 1082 boolean[] bits = new boolean[length()]; 1083 for (int i = 0; i < length(); i++){ 1084 bits[i] = f.apply(i, vec1[i], vec2[i]); 1085 } 1086 return new Float256Mask(bits); 1087 } 1088 1089 // Comparisons 1090 1091 @Override 1092 @ForceInline 1093 public Float256Mask equal(Vector<Float> o) { 1094 Objects.requireNonNull(o); 1095 Float256Vector v = (Float256Vector)o; 1096 1097 return VectorIntrinsics.compare( 1098 BT_eq, Float256Vector.class, Float256Mask.class, float.class, LENGTH, 1099 this, v, 1100 (v1, v2) -> v1.bTest(v2, (i, a, b) -> a == b)); 1101 } 1102 1103 @Override 1104 @ForceInline 1105 public Float256Mask notEqual(Vector<Float> o) { 1106 Objects.requireNonNull(o); 1107 Float256Vector v = (Float256Vector)o; 1108 1109 return VectorIntrinsics.compare( 1110 BT_ne, Float256Vector.class, Float256Mask.class, float.class, LENGTH, 1111 this, v, 1112 (v1, v2) -> v1.bTest(v2, (i, a, b) -> a != b)); 1113 } 1114 1115 @Override 1116 @ForceInline 1117 public Float256Mask lessThan(Vector<Float> o) { 1118 Objects.requireNonNull(o); 1119 Float256Vector v = (Float256Vector)o; 1120 1121 return VectorIntrinsics.compare( 1122 BT_lt, Float256Vector.class, Float256Mask.class, float.class, LENGTH, 1123 this, v, 1124 (v1, v2) -> v1.bTest(v2, (i, a, b) -> a < b)); 1125 } 1126 1127 @Override 1128 @ForceInline 1129 public Float256Mask lessThanEq(Vector<Float> o) { 1130 Objects.requireNonNull(o); 1131 Float256Vector v = (Float256Vector)o; 1132 1133 return VectorIntrinsics.compare( 1134 BT_le, Float256Vector.class, Float256Mask.class, float.class, LENGTH, 1135 this, v, 1136 (v1, v2) -> v1.bTest(v2, (i, a, b) -> a <= b)); 1137 } 1138 1139 @Override 1140 @ForceInline 1141 public Float256Mask greaterThan(Vector<Float> o) { 1142 Objects.requireNonNull(o); 1143 Float256Vector v = (Float256Vector)o; 1144 1145 return (Float256Mask) VectorIntrinsics.compare( 1146 BT_gt, Float256Vector.class, Float256Mask.class, float.class, LENGTH, 1147 this, v, 1148 (v1, v2) -> v1.bTest(v2, (i, a, b) -> a > b)); 1149 } 1150 1151 @Override 1152 @ForceInline 1153 public Float256Mask greaterThanEq(Vector<Float> o) { 1154 Objects.requireNonNull(o); 1155 Float256Vector v = (Float256Vector)o; 1156 1157 return VectorIntrinsics.compare( 1158 BT_ge, Float256Vector.class, Float256Mask.class, float.class, LENGTH, 1159 this, v, 1160 (v1, v2) -> v1.bTest(v2, (i, a, b) -> a >= b)); 1161 } 1162 1163 // Foreach 1164 1165 @Override 1166 void forEach(FUnCon f) { 1167 float[] vec = getElements(); 1168 for (int i = 0; i < length(); i++) { 1169 f.apply(i, vec[i]); 1170 } 1171 } 1172 1173 @Override 1174 void forEach(Mask<Float> o, FUnCon f) { 1175 boolean[] mbits = ((Float256Mask)o).getBits(); 1176 forEach((i, a) -> { 1177 if (mbits[i]) { f.apply(i, a); } 1178 }); 1179 } 1180 1181 Int256Vector toBits() { 1182 float[] vec = getElements(); 1183 int[] res = new int[this.species().length()]; 1184 for(int i = 0; i < this.species().length(); i++){ 1185 res[i] = Float.floatToIntBits(vec[i]); 1186 } 1187 return new Int256Vector(res); 1188 } 1189 1190 1191 @Override 1192 public Float256Vector rotateEL(int j) { 1193 float[] vec = getElements(); 1194 float[] res = new float[length()]; 1195 for (int i = 0; i < length(); i++){ 1196 res[(j + i) % length()] = vec[i]; 1197 } 1198 return new Float256Vector(res); 1199 } 1200 1201 @Override 1202 public Float256Vector rotateER(int j) { 1203 float[] vec = getElements(); 1204 float[] res = new float[length()]; 1205 for (int i = 0; i < length(); i++){ 1206 int z = i - j; 1207 if(j < 0) { 1208 res[length() + z] = vec[i]; 1209 } else { 1210 res[z] = vec[i]; 1211 } 1212 } 1213 return new Float256Vector(res); 1214 } 1215 1216 @Override 1217 public Float256Vector shiftEL(int j) { 1218 float[] vec = getElements(); 1219 float[] res = new float[length()]; 1220 for (int i = 0; i < length() - j; i++) { 1221 res[i] = vec[i + j]; 1222 } 1223 return new Float256Vector(res); 1224 } 1225 1226 @Override 1227 public Float256Vector shiftER(int j) { 1228 float[] vec = getElements(); 1229 float[] res = new float[length()]; 1230 for (int i = 0; i < length() - j; i++){ 1231 res[i + j] = vec[i]; 1232 } 1233 return new Float256Vector(res); 1234 } 1235 1236 @Override 1237 @ForceInline 1238 public Float256Vector rearrange(Vector<Float> v, 1239 Shuffle<Float> s, Mask<Float> m) { 1240 return this.rearrange(s).blend(v.rearrange(s), m); 1241 } 1242 1243 @Override 1244 @ForceInline 1245 public Float256Vector rearrange(Shuffle<Float> o1) { 1246 Objects.requireNonNull(o1); 1247 Float256Shuffle s = (Float256Shuffle)o1; 1248 1249 return VectorIntrinsics.rearrangeOp( 1250 Float256Vector.class, Float256Shuffle.class, float.class, LENGTH, 1251 this, s, 1252 (v1, s_) -> v1.uOp((i, a) -> { 1253 int ei = s_.getElement(i); 1254 return v1.get(ei); 1255 })); 1256 } 1257 1258 @Override 1259 @ForceInline 1260 public Float256Vector blend(Vector<Float> o1, Mask<Float> o2) { 1261 Objects.requireNonNull(o1); 1262 Objects.requireNonNull(o2); 1263 Float256Vector v = (Float256Vector)o1; 1264 Float256Mask m = (Float256Mask)o2; 1265 1266 return VectorIntrinsics.blend( 1267 Float256Vector.class, Float256Mask.class, float.class, LENGTH, 1268 this, v, m, 1269 (v1, v2, m_) -> v1.bOp(v2, (i, a, b) -> m_.getElement(i) ? b : a)); 1270 } 1271 1272 // Accessors 1273 1274 @Override 1275 public float get(int i) { 1276 if (i < 0 || i >= LENGTH) { 1277 throw new IllegalArgumentException("Index " + i + " must be zero or positive, and less than " + LENGTH); 1278 } 1279 int bits = (int) VectorIntrinsics.extract( 1280 Float256Vector.class, float.class, LENGTH, 1281 this, i, 1282 (vec, ix) -> { 1283 float[] vecarr = vec.getElements(); 1284 return (long)Float.floatToIntBits(vecarr[ix]); 1285 }); 1286 return Float.intBitsToFloat(bits); 1287 } 1288 1289 @Override 1290 public Float256Vector with(int i, float e) { 1291 if (i < 0 || i >= LENGTH) { 1292 throw new IllegalArgumentException("Index " + i + " must be zero or positive, and less than " + LENGTH); 1293 } 1294 return VectorIntrinsics.insert( 1295 Float256Vector.class, float.class, LENGTH, 1296 this, i, (long)Float.floatToIntBits(e), 1297 (v, ix, bits) -> { 1298 float[] res = v.getElements().clone(); 1299 res[ix] = Float.intBitsToFloat((int)bits); 1300 return new Float256Vector(res); 1301 }); 1302 } 1303 1304 // Mask 1305 1306 static final class Float256Mask extends AbstractMask<Float> { 1307 static final Float256Mask TRUE_MASK = new Float256Mask(true); 1308 static final Float256Mask FALSE_MASK = new Float256Mask(false); 1309 1310 private final boolean[] bits; // Don't access directly, use getBits() instead. 1311 1312 public Float256Mask(boolean[] bits) { 1313 this(bits, 0); 1314 } 1315 1316 public Float256Mask(boolean[] bits, int offset) { 1317 boolean[] a = new boolean[species().length()]; 1318 for (int i = 0; i < a.length; i++) { 1319 a[i] = bits[offset + i]; 1320 } 1321 this.bits = a; 1322 } 1323 1324 public Float256Mask(boolean val) { 1325 boolean[] bits = new boolean[species().length()]; 1326 Arrays.fill(bits, val); 1327 this.bits = bits; 1328 } 1329 1330 boolean[] getBits() { 1331 return VectorIntrinsics.maybeRebox(this).bits; 1332 } 1333 1334 @Override 1335 Float256Mask uOp(MUnOp f) { 1336 boolean[] res = new boolean[species().length()]; 1337 boolean[] bits = getBits(); 1338 for (int i = 0; i < species().length(); i++) { 1339 res[i] = f.apply(i, bits[i]); 1340 } 1341 return new Float256Mask(res); 1342 } 1343 1344 @Override 1345 Float256Mask bOp(Mask<Float> o, MBinOp f) { 1346 boolean[] res = new boolean[species().length()]; 1347 boolean[] bits = getBits(); 1348 boolean[] mbits = ((Float256Mask)o).getBits(); 1349 for (int i = 0; i < species().length(); i++) { 1350 res[i] = f.apply(i, bits[i], mbits[i]); 1351 } 1352 return new Float256Mask(res); 1353 } 1354 1355 @Override 1356 public Float256Species species() { 1357 return SPECIES; 1358 } 1359 1360 @Override 1361 public Float256Vector toVector() { 1362 float[] res = new float[species().length()]; 1363 boolean[] bits = getBits(); 1364 for (int i = 0; i < species().length(); i++) { 1365 // -1 will result in the most significant bit being set in 1366 // addition to some or all other bits 1367 res[i] = (float) (bits[i] ? -1 : 0); 1368 } 1369 return new Float256Vector(res); 1370 } 1371 1372 // Unary operations 1373 1374 @Override 1375 @ForceInline 1376 public Float256Mask not() { 1377 return (Float256Mask) VectorIntrinsics.unaryOp( 1378 VECTOR_OP_NOT, Float256Mask.class, int.class, LENGTH, 1379 this, 1380 (m1) -> m1.uOp((i, a) -> !a)); 1381 } 1382 1383 // Binary operations 1384 1385 @Override 1386 @ForceInline 1387 public Float256Mask and(Mask<Float> o) { 1388 Objects.requireNonNull(o); 1389 Float256Mask m = (Float256Mask)o; 1390 return VectorIntrinsics.binaryOp(VECTOR_OP_AND, Float256Mask.class, int.class, LENGTH, 1391 this, m, 1392 (m1, m2) -> m1.bOp(m2, (i, a, b) -> a & b)); 1393 } 1394 1395 @Override 1396 @ForceInline 1397 public Float256Mask or(Mask<Float> o) { 1398 Objects.requireNonNull(o); 1399 Float256Mask m = (Float256Mask)o; 1400 return VectorIntrinsics.binaryOp(VECTOR_OP_OR, Float256Mask.class, int.class, LENGTH, 1401 this, m, 1402 (m1, m2) -> m1.bOp(m2, (i, a, b) -> a | b)); 1403 } 1404 1405 // Reductions 1406 1407 @Override 1408 @ForceInline 1409 public boolean anyTrue() { 1410 return VectorIntrinsics.test(BT_ne, Float256Mask.class, int.class, LENGTH, 1411 this, this, 1412 (m, __) -> anyTrueHelper(((Float256Mask)m).getBits())); 1413 } 1414 1415 @Override 1416 @ForceInline 1417 public boolean allTrue() { 1418 return VectorIntrinsics.test(BT_overflow, Float256Mask.class, int.class, LENGTH, 1419 this, FloatVector.maskAllTrue(species()), 1420 (m, __) -> allTrueHelper(((Float256Mask)m).getBits())); 1421 } 1422 } 1423 1424 // Shuffle 1425 1426 static final class Float256Shuffle extends AbstractShuffle<Float> { 1427 Float256Shuffle(byte[] reorder) { 1428 super(reorder); 1429 } 1430 1431 public Float256Shuffle(int[] reorder) { 1432 super(reorder); 1433 } 1434 1435 public Float256Shuffle(int[] reorder, int i) { 1436 super(reorder, i); 1437 } 1438 1439 public Float256Shuffle(IntUnaryOperator f) { 1440 super(f); 1441 } 1442 1443 @Override 1444 public Float256Species species() { 1445 return SPECIES; 1446 } 1447 1448 @Override 1449 public FloatVector toVector() { 1450 float[] va = new float[SPECIES.length()]; 1451 for (int i = 0; i < va.length; i++) { 1452 va[i] = (float) getElement(i); 1453 } 1454 return FloatVector.fromArray(SPECIES, va, 0); 1455 } 1456 1457 @Override 1458 public Float256Shuffle rearrange(Vector.Shuffle<Float> o) { 1459 Float256Shuffle s = (Float256Shuffle) o; 1460 byte[] r = new byte[reorder.length]; 1461 for (int i = 0; i < reorder.length; i++) { 1462 r[i] = reorder[s.reorder[i]]; 1463 } 1464 return new Float256Shuffle(r); 1465 } 1466 } 1467 1468 // Species 1469 1470 @Override 1471 public Float256Species species() { 1472 return SPECIES; 1473 } 1474 1475 static final class Float256Species extends FloatSpecies { 1476 static final int BIT_SIZE = Shape.S_256_BIT.bitSize(); 1477 1478 static final int LENGTH = BIT_SIZE / Float.SIZE; 1479 1480 @Override 1481 public String toString() { 1482 StringBuilder sb = new StringBuilder("Shape["); 1483 sb.append(bitSize()).append(" bits, "); 1484 sb.append(length()).append(" ").append(float.class.getSimpleName()).append("s x "); 1485 sb.append(elementSize()).append(" bits"); 1486 sb.append("]"); 1487 return sb.toString(); 1488 } 1489 1490 @Override 1491 @ForceInline 1492 public int bitSize() { 1493 return BIT_SIZE; 1494 } 1495 1496 @Override 1497 @ForceInline 1498 public int length() { 1499 return LENGTH; 1500 } 1501 1502 @Override 1503 @ForceInline 1504 public Class<Float> elementType() { 1505 return float.class; 1506 } 1507 1508 @Override 1509 @ForceInline 1510 public Class<?> boxType() { 1511 return Float256Vector.class; 1512 } 1513 1514 @Override 1515 @ForceInline 1516 public Class<?> maskType() { 1517 return Float256Mask.class; 1518 } 1519 1520 @Override 1521 @ForceInline 1522 public int elementSize() { 1523 return Float.SIZE; 1524 } 1525 1526 @Override 1527 @ForceInline 1528 @SuppressWarnings("unchecked") 1529 Class<?> vectorType() { 1530 return Float256Vector.class; 1531 } 1532 1533 @Override 1534 @ForceInline 1535 public Shape shape() { 1536 return Shape.S_256_BIT; 1537 } 1538 1539 @Override 1540 IntVector.IntSpecies indexSpecies() { 1541 return INDEX_SPEC; 1542 } 1543 1544 @Override 1545 Float256Vector op(FOp f) { 1546 float[] res = new float[length()]; 1547 for (int i = 0; i < length(); i++) { 1548 res[i] = f.apply(i); 1549 } 1550 return new Float256Vector(res); 1551 } 1552 1553 @Override 1554 Float256Vector op(Mask<Float> o, FOp f) { 1555 float[] res = new float[length()]; 1556 boolean[] mbits = ((Float256Mask)o).getBits(); 1557 for (int i = 0; i < length(); i++) { 1558 if (mbits[i]) { 1559 res[i] = f.apply(i); 1560 } 1561 } 1562 return new Float256Vector(res); 1563 } 1564 1565 @Override 1566 Float256Mask opm(FOpm f) { 1567 boolean[] res = new boolean[length()]; 1568 for (int i = 0; i < length(); i++) { 1569 res[i] = (boolean)f.apply(i); 1570 } 1571 return new Float256Mask(res); 1572 } 1573 1574 // Factories 1575 1576 @Override 1577 @ForceInline 1578 public Float256Vector zero() { 1579 return VectorIntrinsics.broadcastCoerced(Float256Vector.class, float.class, LENGTH, 1580 Float.floatToIntBits(0.0f), SPECIES, 1581 ((bits, s) -> ((Float256Species)s).op(i -> Float.intBitsToFloat((int)bits)))); 1582 } 1583 1584 @Override 1585 @ForceInline 1586 public Float256Vector broadcast(float e) { 1587 return VectorIntrinsics.broadcastCoerced( 1588 Float256Vector.class, float.class, LENGTH, 1589 Float.floatToIntBits(e), SPECIES, 1590 ((bits, s) -> ((Float256Species)s).op(i -> Float.intBitsToFloat((int)bits)))); 1591 } 1592 1593 @Override 1594 @ForceInline 1595 public Float256Vector scalars(float... es) { 1596 Objects.requireNonNull(es); 1597 int ix = VectorIntrinsics.checkIndex(0, es.length, LENGTH); 1598 return VectorIntrinsics.load(Float256Vector.class, float.class, LENGTH, 1599 es, Unsafe.ARRAY_FLOAT_BASE_OFFSET, 1600 es, ix, SPECIES, 1601 (c, idx, s) -> ((Float256Species)s).op(n -> c[idx + n])); 1602 } 1603 1604 @Override 1605 @ForceInline 1606 public <E> Float256Mask cast(Mask<E> m) { 1607 if (m.length() != LENGTH) 1608 throw new IllegalArgumentException("Mask length this species length differ"); 1609 return new Float256Mask(m.toArray()); 1610 } 1611 1612 @Override 1613 @ForceInline 1614 public <E> Float256Shuffle cast(Shuffle<E> s) { 1615 if (s.length() != LENGTH) 1616 throw new IllegalArgumentException("Shuffle length this species length differ"); 1617 return new Float256Shuffle(s.toArray()); 1618 } 1619 } 1620 }