1 /* 2 * Copyright (c) 2017, Oracle and/or its affiliates. All rights reserved. 3 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. 4 * 5 * This code is free software; you can redistribute it and/or modify it 6 * under the terms of the GNU General Public License version 2 only, as 7 * published by the Free Software Foundation. Oracle designates this 8 * particular file as subject to the "Classpath" exception as provided 9 * by Oracle in the LICENSE file that accompanied this code. 10 * 11 * This code is distributed in the hope that it will be useful, but WITHOUT 12 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or 13 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License 14 * version 2 for more details (a copy is included in the LICENSE file that 15 * accompanied this code). 16 * 17 * You should have received a copy of the GNU General Public License version 18 * 2 along with this work; if not, write to the Free Software Foundation, 19 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA. 20 * 21 * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA 22 * or visit www.oracle.com if you need additional information or have 23 * questions. 24 */ 25 package jdk.incubator.vector; 26 27 import java.nio.ByteBuffer; 28 import java.nio.ByteOrder; 29 import java.nio.FloatBuffer; 30 import java.nio.ReadOnlyBufferException; 31 import java.util.Arrays; 32 import java.util.Objects; 33 import java.util.function.IntUnaryOperator; 34 35 import jdk.internal.misc.Unsafe; 36 import jdk.internal.vm.annotation.ForceInline; 37 import static jdk.incubator.vector.VectorIntrinsics.*; 38 39 @SuppressWarnings("cast") 40 final class Float256Vector extends FloatVector { 41 static final Float256Species SPECIES = new Float256Species(); 42 43 static final Float256Vector ZERO = new Float256Vector(); 44 45 static final int LENGTH = SPECIES.length(); 46 47 // Index vector species 48 private static final IntVector.IntSpecies INDEX_SPEC; 49 static { 50 int bitSize = Vector.bitSizeForVectorLength(int.class, LENGTH); 51 Vector.Shape shape = Shape.forBitSize(bitSize); 52 INDEX_SPEC = (IntVector.IntSpecies) Species.of(int.class, shape); 53 } 54 private final float[] vec; // Don't access directly, use getElements() instead. 55 56 private float[] getElements() { 57 return VectorIntrinsics.maybeRebox(this).vec; 58 } 59 60 Float256Vector() { 61 vec = new float[SPECIES.length()]; 62 } 63 64 Float256Vector(float[] v) { 65 vec = v; 66 } 67 68 @Override 69 public int length() { return LENGTH; } 70 71 // Unary operator 72 73 @Override 74 Float256Vector uOp(FUnOp f) { 75 float[] vec = getElements(); 76 float[] res = new float[length()]; 77 for (int i = 0; i < length(); i++) { 78 res[i] = f.apply(i, vec[i]); 79 } 80 return new Float256Vector(res); 81 } 82 83 @Override 84 Float256Vector uOp(Mask<Float> o, FUnOp f) { 85 float[] vec = getElements(); 86 float[] res = new float[length()]; 87 boolean[] mbits = ((Float256Mask)o).getBits(); 88 for (int i = 0; i < length(); i++) { 89 res[i] = mbits[i] ? f.apply(i, vec[i]) : vec[i]; 90 } 91 return new Float256Vector(res); 92 } 93 94 // Binary operator 95 96 @Override 97 Float256Vector bOp(Vector<Float> o, FBinOp f) { 98 float[] res = new float[length()]; 99 float[] vec1 = this.getElements(); 100 float[] vec2 = ((Float256Vector)o).getElements(); 101 for (int i = 0; i < length(); i++) { 102 res[i] = f.apply(i, vec1[i], vec2[i]); 103 } 104 return new Float256Vector(res); 105 } 106 107 @Override 108 Float256Vector bOp(Vector<Float> o1, Mask<Float> o2, FBinOp f) { 109 float[] res = new float[length()]; 110 float[] vec1 = this.getElements(); 111 float[] vec2 = ((Float256Vector)o1).getElements(); 112 boolean[] mbits = ((Float256Mask)o2).getBits(); 113 for (int i = 0; i < length(); i++) { 114 res[i] = mbits[i] ? f.apply(i, vec1[i], vec2[i]) : vec1[i]; 115 } 116 return new Float256Vector(res); 117 } 118 119 // Trinary operator 120 121 @Override 122 Float256Vector tOp(Vector<Float> o1, Vector<Float> o2, FTriOp f) { 123 float[] res = new float[length()]; 124 float[] vec1 = this.getElements(); 125 float[] vec2 = ((Float256Vector)o1).getElements(); 126 float[] vec3 = ((Float256Vector)o2).getElements(); 127 for (int i = 0; i < length(); i++) { 128 res[i] = f.apply(i, vec1[i], vec2[i], vec3[i]); 129 } 130 return new Float256Vector(res); 131 } 132 133 @Override 134 Float256Vector tOp(Vector<Float> o1, Vector<Float> o2, Mask<Float> o3, FTriOp f) { 135 float[] res = new float[length()]; 136 float[] vec1 = getElements(); 137 float[] vec2 = ((Float256Vector)o1).getElements(); 138 float[] vec3 = ((Float256Vector)o2).getElements(); 139 boolean[] mbits = ((Float256Mask)o3).getBits(); 140 for (int i = 0; i < length(); i++) { 141 res[i] = mbits[i] ? f.apply(i, vec1[i], vec2[i], vec3[i]) : vec1[i]; 142 } 143 return new Float256Vector(res); 144 } 145 146 @Override 147 float rOp(float v, FBinOp f) { 148 float[] vec = getElements(); 149 for (int i = 0; i < length(); i++) { 150 v = f.apply(i, v, vec[i]); 151 } 152 return v; 153 } 154 155 @Override 156 @ForceInline 157 public <F> Vector<F> cast(Species<F> s) { 158 Objects.requireNonNull(s); 159 if (s.length() != LENGTH) 160 throw new IllegalArgumentException("Vector length this species length differ"); 161 162 return VectorIntrinsics.cast( 163 Float256Vector.class, 164 float.class, LENGTH, 165 s.vectorType(), 166 s.elementType(), LENGTH, 167 this, s, 168 (species, vector) -> vector.castDefault(species) 169 ); 170 } 171 172 @SuppressWarnings("unchecked") 173 @ForceInline 174 private <F> Vector<F> castDefault(Species<F> s) { 175 int limit = s.length(); 176 177 Class<?> stype = s.elementType(); 178 if (stype == byte.class) { 179 byte[] a = new byte[limit]; 180 for (int i = 0; i < limit; i++) { 181 a[i] = (byte) this.get(i); 182 } 183 return (Vector) ByteVector.fromArray((ByteVector.ByteSpecies) s, a, 0); 184 } else if (stype == short.class) { 185 short[] a = new short[limit]; 186 for (int i = 0; i < limit; i++) { 187 a[i] = (short) this.get(i); 188 } 189 return (Vector) ShortVector.fromArray((ShortVector.ShortSpecies) s, a, 0); 190 } else if (stype == int.class) { 191 int[] a = new int[limit]; 192 for (int i = 0; i < limit; i++) { 193 a[i] = (int) this.get(i); 194 } 195 return (Vector) IntVector.fromArray((IntVector.IntSpecies) s, a, 0); 196 } else if (stype == long.class) { 197 long[] a = new long[limit]; 198 for (int i = 0; i < limit; i++) { 199 a[i] = (long) this.get(i); 200 } 201 return (Vector) LongVector.fromArray((LongVector.LongSpecies) s, a, 0); 202 } else if (stype == float.class) { 203 float[] a = new float[limit]; 204 for (int i = 0; i < limit; i++) { 205 a[i] = (float) this.get(i); 206 } 207 return (Vector) FloatVector.fromArray((FloatVector.FloatSpecies) s, a, 0); 208 } else if (stype == double.class) { 209 double[] a = new double[limit]; 210 for (int i = 0; i < limit; i++) { 211 a[i] = (double) this.get(i); 212 } 213 return (Vector) DoubleVector.fromArray((DoubleVector.DoubleSpecies) s, a, 0); 214 } else { 215 throw new UnsupportedOperationException("Bad lane type for casting."); 216 } 217 } 218 219 @Override 220 @ForceInline 221 @SuppressWarnings("unchecked") 222 public <F> Vector<F> reinterpret(Species<F> s) { 223 Objects.requireNonNull(s); 224 225 if(s.elementType().equals(float.class)) { 226 return (Vector<F>) reshape((Species<Float>)s); 227 } 228 if(s.bitSize() == bitSize()) { 229 return reinterpretType(s); 230 } 231 232 return defaultReinterpret(s); 233 } 234 235 @ForceInline 236 private <F> Vector<F> reinterpretType(Species<F> s) { 237 Objects.requireNonNull(s); 238 239 Class<?> stype = s.elementType(); 240 if (stype == byte.class) { 241 return VectorIntrinsics.reinterpret( 242 Float256Vector.class, 243 float.class, LENGTH, 244 Byte256Vector.class, 245 byte.class, Byte256Vector.LENGTH, 246 this, s, 247 (species, vector) -> vector.defaultReinterpret(species) 248 ); 249 } else if (stype == short.class) { 250 return VectorIntrinsics.reinterpret( 251 Float256Vector.class, 252 float.class, LENGTH, 253 Short256Vector.class, 254 short.class, Short256Vector.LENGTH, 255 this, s, 256 (species, vector) -> vector.defaultReinterpret(species) 257 ); 258 } else if (stype == int.class) { 259 return VectorIntrinsics.reinterpret( 260 Float256Vector.class, 261 float.class, LENGTH, 262 Int256Vector.class, 263 int.class, Int256Vector.LENGTH, 264 this, s, 265 (species, vector) -> vector.defaultReinterpret(species) 266 ); 267 } else if (stype == long.class) { 268 return VectorIntrinsics.reinterpret( 269 Float256Vector.class, 270 float.class, LENGTH, 271 Long256Vector.class, 272 long.class, Long256Vector.LENGTH, 273 this, s, 274 (species, vector) -> vector.defaultReinterpret(species) 275 ); 276 } else if (stype == float.class) { 277 return VectorIntrinsics.reinterpret( 278 Float256Vector.class, 279 float.class, LENGTH, 280 Float256Vector.class, 281 float.class, Float256Vector.LENGTH, 282 this, s, 283 (species, vector) -> vector.defaultReinterpret(species) 284 ); 285 } else if (stype == double.class) { 286 return VectorIntrinsics.reinterpret( 287 Float256Vector.class, 288 float.class, LENGTH, 289 Double256Vector.class, 290 double.class, Double256Vector.LENGTH, 291 this, s, 292 (species, vector) -> vector.defaultReinterpret(species) 293 ); 294 } else { 295 throw new UnsupportedOperationException("Bad lane type for casting."); 296 } 297 } 298 299 @Override 300 @ForceInline 301 public FloatVector reshape(Species<Float> s) { 302 Objects.requireNonNull(s); 303 if (s.bitSize() == 64 && (s instanceof Float64Vector.Float64Species)) { 304 Float64Vector.Float64Species ts = (Float64Vector.Float64Species)s; 305 return VectorIntrinsics.reinterpret( 306 Float256Vector.class, 307 float.class, LENGTH, 308 Float64Vector.class, 309 float.class, Float64Vector.LENGTH, 310 this, ts, 311 (species, vector) -> (FloatVector) vector.defaultReinterpret(species) 312 ); 313 } else if (s.bitSize() == 128 && (s instanceof Float128Vector.Float128Species)) { 314 Float128Vector.Float128Species ts = (Float128Vector.Float128Species)s; 315 return VectorIntrinsics.reinterpret( 316 Float256Vector.class, 317 float.class, LENGTH, 318 Float128Vector.class, 319 float.class, Float128Vector.LENGTH, 320 this, ts, 321 (species, vector) -> (FloatVector) vector.defaultReinterpret(species) 322 ); 323 } else if (s.bitSize() == 256 && (s instanceof Float256Vector.Float256Species)) { 324 Float256Vector.Float256Species ts = (Float256Vector.Float256Species)s; 325 return VectorIntrinsics.reinterpret( 326 Float256Vector.class, 327 float.class, LENGTH, 328 Float256Vector.class, 329 float.class, Float256Vector.LENGTH, 330 this, ts, 331 (species, vector) -> (FloatVector) vector.defaultReinterpret(species) 332 ); 333 } else if (s.bitSize() == 512 && (s instanceof Float512Vector.Float512Species)) { 334 Float512Vector.Float512Species ts = (Float512Vector.Float512Species)s; 335 return VectorIntrinsics.reinterpret( 336 Float256Vector.class, 337 float.class, LENGTH, 338 Float512Vector.class, 339 float.class, Float512Vector.LENGTH, 340 this, ts, 341 (species, vector) -> (FloatVector) vector.defaultReinterpret(species) 342 ); 343 } else if ((s.bitSize() > 0) && (s.bitSize() <= 2048) 344 && (s.bitSize() % 128 == 0) && (s instanceof FloatMaxVector.FloatMaxSpecies)) { 345 FloatMaxVector.FloatMaxSpecies ts = (FloatMaxVector.FloatMaxSpecies)s; 346 return VectorIntrinsics.reinterpret( 347 Float256Vector.class, 348 float.class, LENGTH, 349 FloatMaxVector.class, 350 float.class, FloatMaxVector.LENGTH, 351 this, ts, 352 (species, vector) -> (FloatVector) vector.defaultReinterpret(species) 353 ); 354 } else { 355 throw new InternalError("Unimplemented size"); 356 } 357 } 358 359 // Binary operations with scalars 360 361 @Override 362 @ForceInline 363 public FloatVector add(float o) { 364 return add(SPECIES.broadcast(o)); 365 } 366 367 @Override 368 @ForceInline 369 public FloatVector add(float o, Mask<Float> m) { 370 return add(SPECIES.broadcast(o), m); 371 } 372 373 @Override 374 @ForceInline 375 public FloatVector sub(float o) { 376 return sub(SPECIES.broadcast(o)); 377 } 378 379 @Override 380 @ForceInline 381 public FloatVector sub(float o, Mask<Float> m) { 382 return sub(SPECIES.broadcast(o), m); 383 } 384 385 @Override 386 @ForceInline 387 public FloatVector mul(float o) { 388 return mul(SPECIES.broadcast(o)); 389 } 390 391 @Override 392 @ForceInline 393 public FloatVector mul(float o, Mask<Float> m) { 394 return mul(SPECIES.broadcast(o), m); 395 } 396 397 @Override 398 @ForceInline 399 public FloatVector min(float o) { 400 return min(SPECIES.broadcast(o)); 401 } 402 403 @Override 404 @ForceInline 405 public FloatVector max(float o) { 406 return max(SPECIES.broadcast(o)); 407 } 408 409 @Override 410 @ForceInline 411 public Mask<Float> equal(float o) { 412 return equal(SPECIES.broadcast(o)); 413 } 414 415 @Override 416 @ForceInline 417 public Mask<Float> notEqual(float o) { 418 return notEqual(SPECIES.broadcast(o)); 419 } 420 421 @Override 422 @ForceInline 423 public Mask<Float> lessThan(float o) { 424 return lessThan(SPECIES.broadcast(o)); 425 } 426 427 @Override 428 @ForceInline 429 public Mask<Float> lessThanEq(float o) { 430 return lessThanEq(SPECIES.broadcast(o)); 431 } 432 433 @Override 434 @ForceInline 435 public Mask<Float> greaterThan(float o) { 436 return greaterThan(SPECIES.broadcast(o)); 437 } 438 439 @Override 440 @ForceInline 441 public Mask<Float> greaterThanEq(float o) { 442 return greaterThanEq(SPECIES.broadcast(o)); 443 } 444 445 @Override 446 @ForceInline 447 public FloatVector blend(float o, Mask<Float> m) { 448 return blend(SPECIES.broadcast(o), m); 449 } 450 451 @Override 452 @ForceInline 453 public FloatVector div(float o) { 454 return div(SPECIES.broadcast(o)); 455 } 456 457 @Override 458 @ForceInline 459 public FloatVector div(float o, Mask<Float> m) { 460 return div(SPECIES.broadcast(o), m); 461 } 462 463 @Override 464 @ForceInline 465 public Float256Vector div(Vector<Float> v, Mask<Float> m) { 466 return blend(div(v), m); 467 } 468 469 @Override 470 @ForceInline 471 public FloatVector atan2(float o) { 472 return atan2(SPECIES.broadcast(o)); 473 } 474 475 @Override 476 @ForceInline 477 public FloatVector atan2(float o, Mask<Float> m) { 478 return atan2(SPECIES.broadcast(o), m); 479 } 480 481 @Override 482 @ForceInline 483 public FloatVector pow(float o) { 484 return pow(SPECIES.broadcast(o)); 485 } 486 487 @Override 488 @ForceInline 489 public FloatVector pow(float o, Mask<Float> m) { 490 return pow(SPECIES.broadcast(o), m); 491 } 492 493 @Override 494 @ForceInline 495 public FloatVector fma(float o1, float o2) { 496 return fma(SPECIES.broadcast(o1), SPECIES.broadcast(o2)); 497 } 498 499 @Override 500 @ForceInline 501 public FloatVector fma(float o1, float o2, Mask<Float> m) { 502 return fma(SPECIES.broadcast(o1), SPECIES.broadcast(o2), m); 503 } 504 505 @Override 506 @ForceInline 507 public FloatVector hypot(float o) { 508 return hypot(SPECIES.broadcast(o)); 509 } 510 511 @Override 512 @ForceInline 513 public FloatVector hypot(float o, Mask<Float> m) { 514 return hypot(SPECIES.broadcast(o), m); 515 } 516 517 518 // Unary operations 519 520 @ForceInline 521 @Override 522 public Float256Vector neg(Mask<Float> m) { 523 return blend(neg(), m); 524 } 525 526 @Override 527 @ForceInline 528 public Float256Vector abs() { 529 return VectorIntrinsics.unaryOp( 530 VECTOR_OP_ABS, Float256Vector.class, float.class, LENGTH, 531 this, 532 v1 -> v1.uOp((i, a) -> (float) Math.abs(a))); 533 } 534 535 @ForceInline 536 @Override 537 public Float256Vector abs(Mask<Float> m) { 538 return blend(abs(), m); 539 } 540 541 @Override 542 @ForceInline 543 public Float256Vector neg() { 544 return VectorIntrinsics.unaryOp( 545 VECTOR_OP_NEG, Float256Vector.class, float.class, LENGTH, 546 this, 547 v1 -> v1.uOp((i, a) -> (float) -a)); 548 } 549 550 @Override 551 @ForceInline 552 public Float256Vector div(Vector<Float> o) { 553 Objects.requireNonNull(o); 554 Float256Vector v = (Float256Vector)o; 555 return VectorIntrinsics.binaryOp( 556 VECTOR_OP_DIV, Float256Vector.class, float.class, LENGTH, 557 this, v, 558 (v1, v2) -> v1.bOp(v2, (i, a, b) -> (float)(a / b))); 559 } 560 561 @Override 562 @ForceInline 563 public Float256Vector sqrt() { 564 return VectorIntrinsics.unaryOp( 565 VECTOR_OP_SQRT, Float256Vector.class, float.class, LENGTH, 566 this, 567 v1 -> v1.uOp((i, a) -> (float) Math.sqrt((double) a))); 568 } 569 570 @Override 571 @ForceInline 572 public Float256Vector exp() { 573 return (Float256Vector) VectorIntrinsics.unaryOp( 574 VECTOR_OP_EXP, Float256Vector.class, float.class, LENGTH, 575 this, 576 v1 -> ((Float256Vector)v1).uOp((i, a) -> (float) Math.exp((double) a))); 577 } 578 579 @Override 580 @ForceInline 581 public Float256Vector log1p() { 582 return (Float256Vector) VectorIntrinsics.unaryOp( 583 VECTOR_OP_LOG1P, Float256Vector.class, float.class, LENGTH, 584 this, 585 v1 -> ((Float256Vector)v1).uOp((i, a) -> (float) Math.log1p((double) a))); 586 } 587 588 @Override 589 @ForceInline 590 public Float256Vector log() { 591 return (Float256Vector) VectorIntrinsics.unaryOp( 592 VECTOR_OP_LOG, Float256Vector.class, float.class, LENGTH, 593 this, 594 v1 -> ((Float256Vector)v1).uOp((i, a) -> (float) Math.log((double) a))); 595 } 596 597 @Override 598 @ForceInline 599 public Float256Vector log10() { 600 return (Float256Vector) VectorIntrinsics.unaryOp( 601 VECTOR_OP_LOG10, Float256Vector.class, float.class, LENGTH, 602 this, 603 v1 -> ((Float256Vector)v1).uOp((i, a) -> (float) Math.log10((double) a))); 604 } 605 606 @Override 607 @ForceInline 608 public Float256Vector expm1() { 609 return (Float256Vector) VectorIntrinsics.unaryOp( 610 VECTOR_OP_EXPM1, Float256Vector.class, float.class, LENGTH, 611 this, 612 v1 -> ((Float256Vector)v1).uOp((i, a) -> (float) Math.expm1((double) a))); 613 } 614 615 @Override 616 @ForceInline 617 public Float256Vector cbrt() { 618 return (Float256Vector) VectorIntrinsics.unaryOp( 619 VECTOR_OP_CBRT, Float256Vector.class, float.class, LENGTH, 620 this, 621 v1 -> ((Float256Vector)v1).uOp((i, a) -> (float) Math.cbrt((double) a))); 622 } 623 624 @Override 625 @ForceInline 626 public Float256Vector sin() { 627 return (Float256Vector) VectorIntrinsics.unaryOp( 628 VECTOR_OP_SIN, Float256Vector.class, float.class, LENGTH, 629 this, 630 v1 -> ((Float256Vector)v1).uOp((i, a) -> (float) Math.sin((double) a))); 631 } 632 633 @Override 634 @ForceInline 635 public Float256Vector cos() { 636 return (Float256Vector) VectorIntrinsics.unaryOp( 637 VECTOR_OP_COS, Float256Vector.class, float.class, LENGTH, 638 this, 639 v1 -> ((Float256Vector)v1).uOp((i, a) -> (float) Math.cos((double) a))); 640 } 641 642 @Override 643 @ForceInline 644 public Float256Vector tan() { 645 return (Float256Vector) VectorIntrinsics.unaryOp( 646 VECTOR_OP_TAN, Float256Vector.class, float.class, LENGTH, 647 this, 648 v1 -> ((Float256Vector)v1).uOp((i, a) -> (float) Math.tan((double) a))); 649 } 650 651 @Override 652 @ForceInline 653 public Float256Vector asin() { 654 return (Float256Vector) VectorIntrinsics.unaryOp( 655 VECTOR_OP_ASIN, Float256Vector.class, float.class, LENGTH, 656 this, 657 v1 -> ((Float256Vector)v1).uOp((i, a) -> (float) Math.asin((double) a))); 658 } 659 660 @Override 661 @ForceInline 662 public Float256Vector acos() { 663 return (Float256Vector) VectorIntrinsics.unaryOp( 664 VECTOR_OP_ACOS, Float256Vector.class, float.class, LENGTH, 665 this, 666 v1 -> ((Float256Vector)v1).uOp((i, a) -> (float) Math.acos((double) a))); 667 } 668 669 @Override 670 @ForceInline 671 public Float256Vector atan() { 672 return (Float256Vector) VectorIntrinsics.unaryOp( 673 VECTOR_OP_ATAN, Float256Vector.class, float.class, LENGTH, 674 this, 675 v1 -> ((Float256Vector)v1).uOp((i, a) -> (float) Math.atan((double) a))); 676 } 677 678 @Override 679 @ForceInline 680 public Float256Vector sinh() { 681 return (Float256Vector) VectorIntrinsics.unaryOp( 682 VECTOR_OP_SINH, Float256Vector.class, float.class, LENGTH, 683 this, 684 v1 -> ((Float256Vector)v1).uOp((i, a) -> (float) Math.sinh((double) a))); 685 } 686 687 @Override 688 @ForceInline 689 public Float256Vector cosh() { 690 return (Float256Vector) VectorIntrinsics.unaryOp( 691 VECTOR_OP_COSH, Float256Vector.class, float.class, LENGTH, 692 this, 693 v1 -> ((Float256Vector)v1).uOp((i, a) -> (float) Math.cosh((double) a))); 694 } 695 696 @Override 697 @ForceInline 698 public Float256Vector tanh() { 699 return (Float256Vector) VectorIntrinsics.unaryOp( 700 VECTOR_OP_TANH, Float256Vector.class, float.class, LENGTH, 701 this, 702 v1 -> ((Float256Vector)v1).uOp((i, a) -> (float) Math.tanh((double) a))); 703 } 704 705 @Override 706 @ForceInline 707 public Float256Vector pow(Vector<Float> o) { 708 Objects.requireNonNull(o); 709 Float256Vector v = (Float256Vector)o; 710 return (Float256Vector) VectorIntrinsics.binaryOp( 711 VECTOR_OP_POW, Float256Vector.class, float.class, LENGTH, 712 this, v, 713 (v1, v2) -> ((Float256Vector)v1).bOp(v2, (i, a, b) -> (float)(Math.pow(a,b)))); 714 } 715 716 @Override 717 @ForceInline 718 public Float256Vector hypot(Vector<Float> o) { 719 Objects.requireNonNull(o); 720 Float256Vector v = (Float256Vector)o; 721 return (Float256Vector) VectorIntrinsics.binaryOp( 722 VECTOR_OP_HYPOT, Float256Vector.class, float.class, LENGTH, 723 this, v, 724 (v1, v2) -> ((Float256Vector)v1).bOp(v2, (i, a, b) -> (float)(Math.hypot(a,b)))); 725 } 726 727 @Override 728 @ForceInline 729 public Float256Vector atan2(Vector<Float> o) { 730 Objects.requireNonNull(o); 731 Float256Vector v = (Float256Vector)o; 732 return (Float256Vector) VectorIntrinsics.binaryOp( 733 VECTOR_OP_ATAN2, Float256Vector.class, float.class, LENGTH, 734 this, v, 735 (v1, v2) -> ((Float256Vector)v1).bOp(v2, (i, a, b) -> (float)(Math.atan2(a,b)))); 736 } 737 738 739 // Binary operations 740 741 @Override 742 @ForceInline 743 public Float256Vector add(Vector<Float> o) { 744 Objects.requireNonNull(o); 745 Float256Vector v = (Float256Vector)o; 746 return VectorIntrinsics.binaryOp( 747 VECTOR_OP_ADD, Float256Vector.class, float.class, LENGTH, 748 this, v, 749 (v1, v2) -> v1.bOp(v2, (i, a, b) -> (float)(a + b))); 750 } 751 752 @Override 753 @ForceInline 754 public Float256Vector add(Vector<Float> v, Mask<Float> m) { 755 return blend(add(v), m); 756 } 757 758 @Override 759 @ForceInline 760 public Float256Vector sub(Vector<Float> o) { 761 Objects.requireNonNull(o); 762 Float256Vector v = (Float256Vector)o; 763 return VectorIntrinsics.binaryOp( 764 VECTOR_OP_SUB, Float256Vector.class, float.class, LENGTH, 765 this, v, 766 (v1, v2) -> v1.bOp(v2, (i, a, b) -> (float)(a - b))); 767 } 768 769 @Override 770 @ForceInline 771 public Float256Vector sub(Vector<Float> v, Mask<Float> m) { 772 return blend(sub(v), m); 773 } 774 775 @Override 776 @ForceInline 777 public Float256Vector mul(Vector<Float> o) { 778 Objects.requireNonNull(o); 779 Float256Vector v = (Float256Vector)o; 780 return VectorIntrinsics.binaryOp( 781 VECTOR_OP_MUL, Float256Vector.class, float.class, LENGTH, 782 this, v, 783 (v1, v2) -> v1.bOp(v2, (i, a, b) -> (float)(a * b))); 784 } 785 786 @Override 787 @ForceInline 788 public Float256Vector mul(Vector<Float> v, Mask<Float> m) { 789 return blend(mul(v), m); 790 } 791 792 @Override 793 @ForceInline 794 public Float256Vector min(Vector<Float> o) { 795 Objects.requireNonNull(o); 796 Float256Vector v = (Float256Vector)o; 797 return (Float256Vector) VectorIntrinsics.binaryOp( 798 VECTOR_OP_MIN, Float256Vector.class, float.class, LENGTH, 799 this, v, 800 (v1, v2) -> v1.bOp(v2, (i, a, b) -> (float) Math.min(a, b))); 801 } 802 803 @Override 804 @ForceInline 805 public Float256Vector min(Vector<Float> v, Mask<Float> m) { 806 return blend(min(v), m); 807 } 808 809 @Override 810 @ForceInline 811 public Float256Vector max(Vector<Float> o) { 812 Objects.requireNonNull(o); 813 Float256Vector v = (Float256Vector)o; 814 return VectorIntrinsics.binaryOp( 815 VECTOR_OP_MAX, Float256Vector.class, float.class, LENGTH, 816 this, v, 817 (v1, v2) -> v1.bOp(v2, (i, a, b) -> (float) Math.max(a, b))); 818 } 819 820 @Override 821 @ForceInline 822 public Float256Vector max(Vector<Float> v, Mask<Float> m) { 823 return blend(max(v), m); 824 } 825 826 827 // Ternary operations 828 829 @Override 830 @ForceInline 831 public Float256Vector fma(Vector<Float> o1, Vector<Float> o2) { 832 Objects.requireNonNull(o1); 833 Objects.requireNonNull(o2); 834 Float256Vector v1 = (Float256Vector)o1; 835 Float256Vector v2 = (Float256Vector)o2; 836 return VectorIntrinsics.ternaryOp( 837 VECTOR_OP_FMA, Float256Vector.class, float.class, LENGTH, 838 this, v1, v2, 839 (w1, w2, w3) -> w1.tOp(w2, w3, (i, a, b, c) -> Math.fma(a, b, c))); 840 } 841 842 // Type specific horizontal reductions 843 844 @Override 845 @ForceInline 846 public float addAll() { 847 int bits = (int) VectorIntrinsics.reductionCoerced( 848 VECTOR_OP_ADD, Float256Vector.class, float.class, LENGTH, 849 this, 850 v -> { 851 float r = v.rOp((float) 0, (i, a, b) -> (float) (a + b)); 852 return (long)Float.floatToIntBits(r); 853 }); 854 return Float.intBitsToFloat(bits); 855 } 856 857 @Override 858 @ForceInline 859 public float mulAll() { 860 int bits = (int) VectorIntrinsics.reductionCoerced( 861 VECTOR_OP_MUL, Float256Vector.class, float.class, LENGTH, 862 this, 863 v -> { 864 float r = v.rOp((float) 1, (i, a, b) -> (float) (a * b)); 865 return (long)Float.floatToIntBits(r); 866 }); 867 return Float.intBitsToFloat(bits); 868 } 869 870 @Override 871 @ForceInline 872 public float minAll() { 873 int bits = (int) VectorIntrinsics.reductionCoerced( 874 VECTOR_OP_MIN, Float256Vector.class, float.class, LENGTH, 875 this, 876 v -> { 877 float r = v.rOp(Float.MAX_VALUE , (i, a, b) -> (float) Math.min(a, b)); 878 return (long)Float.floatToIntBits(r); 879 }); 880 return Float.intBitsToFloat(bits); 881 } 882 883 @Override 884 @ForceInline 885 public float maxAll() { 886 int bits = (int) VectorIntrinsics.reductionCoerced( 887 VECTOR_OP_MAX, Float256Vector.class, float.class, LENGTH, 888 this, 889 v -> { 890 float r = v.rOp(Float.MIN_VALUE , (i, a, b) -> (float) Math.max(a, b)); 891 return (long)Float.floatToIntBits(r); 892 }); 893 return Float.intBitsToFloat(bits); 894 } 895 896 897 @Override 898 @ForceInline 899 public float addAll(Mask<Float> m) { 900 return blend(SPECIES.broadcast((float) 0), m).addAll(); 901 } 902 903 @Override 904 @ForceInline 905 public float mulAll(Mask<Float> m) { 906 return blend(SPECIES.broadcast((float) 1), m).mulAll(); 907 } 908 909 @Override 910 @ForceInline 911 public float minAll(Mask<Float> m) { 912 return blend(SPECIES.broadcast(Float.MAX_VALUE), m).minAll(); 913 } 914 915 @Override 916 @ForceInline 917 public float maxAll(Mask<Float> m) { 918 return blend(SPECIES.broadcast(Float.MIN_VALUE), m).maxAll(); 919 } 920 921 @Override 922 @ForceInline 923 public Shuffle<Float> toShuffle() { 924 float[] a = toArray(); 925 int[] sa = new int[a.length]; 926 for (int i = 0; i < a.length; i++) { 927 sa[i] = (int) a[i]; 928 } 929 return FloatVector.shuffleFromArray(SPECIES, sa, 0); 930 } 931 932 // Memory operations 933 934 private static final int ARRAY_SHIFT = 31 - Integer.numberOfLeadingZeros(Unsafe.ARRAY_FLOAT_INDEX_SCALE); 935 private static final int BOOLEAN_ARRAY_SHIFT = 31 - Integer.numberOfLeadingZeros(Unsafe.ARRAY_BOOLEAN_INDEX_SCALE); 936 937 @Override 938 @ForceInline 939 public void intoArray(float[] a, int ix) { 940 Objects.requireNonNull(a); 941 ix = VectorIntrinsics.checkIndex(ix, a.length, LENGTH); 942 VectorIntrinsics.store(Float256Vector.class, float.class, LENGTH, 943 a, (((long) ix) << ARRAY_SHIFT) + Unsafe.ARRAY_FLOAT_BASE_OFFSET, 944 this, 945 a, ix, 946 (arr, idx, v) -> v.forEach((i, e) -> arr[idx + i] = e)); 947 } 948 949 @Override 950 @ForceInline 951 public final void intoArray(float[] a, int ax, Mask<Float> m) { 952 FloatVector oldVal = FloatVector.fromArray(SPECIES, a, ax); 953 FloatVector newVal = oldVal.blend(this, m); 954 newVal.intoArray(a, ax); 955 } 956 @Override 957 @ForceInline 958 public void intoArray(float[] a, int ix, int[] b, int iy) { 959 Objects.requireNonNull(a); 960 Objects.requireNonNull(b); 961 962 // Index vector: vix[0:n] = i -> ix + indexMap[iy + i] 963 IntVector vix = IntVector.fromArray(INDEX_SPEC, b, iy).add(ix); 964 965 vix = VectorIntrinsics.checkIndex(vix, a.length); 966 967 VectorIntrinsics.storeWithMap(Float256Vector.class, float.class, LENGTH, Int256Vector.class, 968 a, Unsafe.ARRAY_FLOAT_BASE_OFFSET, vix, 969 this, 970 a, ix, b, iy, 971 (arr, idx, v, indexMap, idy) -> v.forEach((i, e) -> arr[idx+indexMap[idy+i]] = e)); 972 } 973 974 @Override 975 @ForceInline 976 public final void intoArray(float[] a, int ax, Mask<Float> m, int[] b, int iy) { 977 // @@@ This can result in out of bounds errors for unset mask lanes 978 FloatVector oldVal = FloatVector.fromArray(SPECIES, a, ax, b, iy); 979 FloatVector newVal = oldVal.blend(this, m); 980 newVal.intoArray(a, ax, b, iy); 981 } 982 983 @Override 984 @ForceInline 985 public void intoByteArray(byte[] a, int ix) { 986 Objects.requireNonNull(a); 987 ix = VectorIntrinsics.checkIndex(ix, a.length, bitSize() / Byte.SIZE); 988 VectorIntrinsics.store(Float256Vector.class, float.class, LENGTH, 989 a, ((long) ix) + Unsafe.ARRAY_BYTE_BASE_OFFSET, 990 this, 991 a, ix, 992 (c, idx, v) -> { 993 ByteBuffer bbc = ByteBuffer.wrap(c, idx, c.length - idx).order(ByteOrder.nativeOrder()); 994 FloatBuffer tb = bbc.asFloatBuffer(); 995 v.forEach((i, e) -> tb.put(e)); 996 }); 997 } 998 999 @Override 1000 @ForceInline 1001 public final void intoByteArray(byte[] a, int ix, Mask<Float> m) { 1002 Float256Vector oldVal = (Float256Vector) FloatVector.fromByteArray(SPECIES, a, ix); 1003 Float256Vector newVal = oldVal.blend(this, m); 1004 newVal.intoByteArray(a, ix); 1005 } 1006 1007 @Override 1008 @ForceInline 1009 public void intoByteBuffer(ByteBuffer bb, int ix) { 1010 if (bb.order() != ByteOrder.nativeOrder()) { 1011 throw new IllegalArgumentException(); 1012 } 1013 if (bb.isReadOnly()) { 1014 throw new ReadOnlyBufferException(); 1015 } 1016 ix = VectorIntrinsics.checkIndex(ix, bb.limit(), bitSize() / Byte.SIZE); 1017 VectorIntrinsics.store(Float256Vector.class, float.class, LENGTH, 1018 U.getReference(bb, BYTE_BUFFER_HB), ix + U.getLong(bb, BUFFER_ADDRESS), 1019 this, 1020 bb, ix, 1021 (c, idx, v) -> { 1022 ByteBuffer bbc = c.duplicate().position(idx).order(ByteOrder.nativeOrder()); 1023 FloatBuffer tb = bbc.asFloatBuffer(); 1024 v.forEach((i, e) -> tb.put(e)); 1025 }); 1026 } 1027 1028 @Override 1029 @ForceInline 1030 public void intoByteBuffer(ByteBuffer bb, int ix, Mask<Float> m) { 1031 Float256Vector oldVal = (Float256Vector) FloatVector.fromByteBuffer(SPECIES, bb, ix); 1032 Float256Vector newVal = oldVal.blend(this, m); 1033 newVal.intoByteBuffer(bb, ix); 1034 } 1035 1036 // 1037 1038 @Override 1039 public String toString() { 1040 return Arrays.toString(getElements()); 1041 } 1042 1043 @Override 1044 public boolean equals(Object o) { 1045 if (this == o) return true; 1046 if (o == null || this.getClass() != o.getClass()) return false; 1047 1048 Float256Vector that = (Float256Vector) o; 1049 return this.equal(that).allTrue(); 1050 } 1051 1052 @Override 1053 public int hashCode() { 1054 return Arrays.hashCode(vec); 1055 } 1056 1057 // Binary test 1058 1059 @Override 1060 Float256Mask bTest(Vector<Float> o, FBinTest f) { 1061 float[] vec1 = getElements(); 1062 float[] vec2 = ((Float256Vector)o).getElements(); 1063 boolean[] bits = new boolean[length()]; 1064 for (int i = 0; i < length(); i++){ 1065 bits[i] = f.apply(i, vec1[i], vec2[i]); 1066 } 1067 return new Float256Mask(bits); 1068 } 1069 1070 // Comparisons 1071 1072 @Override 1073 @ForceInline 1074 public Float256Mask equal(Vector<Float> o) { 1075 Objects.requireNonNull(o); 1076 Float256Vector v = (Float256Vector)o; 1077 1078 return VectorIntrinsics.compare( 1079 BT_eq, Float256Vector.class, Float256Mask.class, float.class, LENGTH, 1080 this, v, 1081 (v1, v2) -> v1.bTest(v2, (i, a, b) -> a == b)); 1082 } 1083 1084 @Override 1085 @ForceInline 1086 public Float256Mask notEqual(Vector<Float> o) { 1087 Objects.requireNonNull(o); 1088 Float256Vector v = (Float256Vector)o; 1089 1090 return VectorIntrinsics.compare( 1091 BT_ne, Float256Vector.class, Float256Mask.class, float.class, LENGTH, 1092 this, v, 1093 (v1, v2) -> v1.bTest(v2, (i, a, b) -> a != b)); 1094 } 1095 1096 @Override 1097 @ForceInline 1098 public Float256Mask lessThan(Vector<Float> o) { 1099 Objects.requireNonNull(o); 1100 Float256Vector v = (Float256Vector)o; 1101 1102 return VectorIntrinsics.compare( 1103 BT_lt, Float256Vector.class, Float256Mask.class, float.class, LENGTH, 1104 this, v, 1105 (v1, v2) -> v1.bTest(v2, (i, a, b) -> a < b)); 1106 } 1107 1108 @Override 1109 @ForceInline 1110 public Float256Mask lessThanEq(Vector<Float> o) { 1111 Objects.requireNonNull(o); 1112 Float256Vector v = (Float256Vector)o; 1113 1114 return VectorIntrinsics.compare( 1115 BT_le, Float256Vector.class, Float256Mask.class, float.class, LENGTH, 1116 this, v, 1117 (v1, v2) -> v1.bTest(v2, (i, a, b) -> a <= b)); 1118 } 1119 1120 @Override 1121 @ForceInline 1122 public Float256Mask greaterThan(Vector<Float> o) { 1123 Objects.requireNonNull(o); 1124 Float256Vector v = (Float256Vector)o; 1125 1126 return (Float256Mask) VectorIntrinsics.compare( 1127 BT_gt, Float256Vector.class, Float256Mask.class, float.class, LENGTH, 1128 this, v, 1129 (v1, v2) -> v1.bTest(v2, (i, a, b) -> a > b)); 1130 } 1131 1132 @Override 1133 @ForceInline 1134 public Float256Mask greaterThanEq(Vector<Float> o) { 1135 Objects.requireNonNull(o); 1136 Float256Vector v = (Float256Vector)o; 1137 1138 return VectorIntrinsics.compare( 1139 BT_ge, Float256Vector.class, Float256Mask.class, float.class, LENGTH, 1140 this, v, 1141 (v1, v2) -> v1.bTest(v2, (i, a, b) -> a >= b)); 1142 } 1143 1144 // Foreach 1145 1146 @Override 1147 void forEach(FUnCon f) { 1148 float[] vec = getElements(); 1149 for (int i = 0; i < length(); i++) { 1150 f.apply(i, vec[i]); 1151 } 1152 } 1153 1154 @Override 1155 void forEach(Mask<Float> o, FUnCon f) { 1156 boolean[] mbits = ((Float256Mask)o).getBits(); 1157 forEach((i, a) -> { 1158 if (mbits[i]) { f.apply(i, a); } 1159 }); 1160 } 1161 1162 Int256Vector toBits() { 1163 float[] vec = getElements(); 1164 int[] res = new int[this.species().length()]; 1165 for(int i = 0; i < this.species().length(); i++){ 1166 res[i] = Float.floatToIntBits(vec[i]); 1167 } 1168 return new Int256Vector(res); 1169 } 1170 1171 1172 @Override 1173 public Float256Vector rotateEL(int j) { 1174 float[] vec = getElements(); 1175 float[] res = new float[length()]; 1176 for (int i = 0; i < length(); i++){ 1177 res[(j + i) % length()] = vec[i]; 1178 } 1179 return new Float256Vector(res); 1180 } 1181 1182 @Override 1183 public Float256Vector rotateER(int j) { 1184 float[] vec = getElements(); 1185 float[] res = new float[length()]; 1186 for (int i = 0; i < length(); i++){ 1187 int z = i - j; 1188 if(j < 0) { 1189 res[length() + z] = vec[i]; 1190 } else { 1191 res[z] = vec[i]; 1192 } 1193 } 1194 return new Float256Vector(res); 1195 } 1196 1197 @Override 1198 public Float256Vector shiftEL(int j) { 1199 float[] vec = getElements(); 1200 float[] res = new float[length()]; 1201 for (int i = 0; i < length() - j; i++) { 1202 res[i] = vec[i + j]; 1203 } 1204 return new Float256Vector(res); 1205 } 1206 1207 @Override 1208 public Float256Vector shiftER(int j) { 1209 float[] vec = getElements(); 1210 float[] res = new float[length()]; 1211 for (int i = 0; i < length() - j; i++){ 1212 res[i + j] = vec[i]; 1213 } 1214 return new Float256Vector(res); 1215 } 1216 1217 @Override 1218 @ForceInline 1219 public Float256Vector rearrange(Vector<Float> v, 1220 Shuffle<Float> s, Mask<Float> m) { 1221 return this.rearrange(s).blend(v.rearrange(s), m); 1222 } 1223 1224 @Override 1225 @ForceInline 1226 public Float256Vector rearrange(Shuffle<Float> o1) { 1227 Objects.requireNonNull(o1); 1228 Float256Shuffle s = (Float256Shuffle)o1; 1229 1230 return VectorIntrinsics.rearrangeOp( 1231 Float256Vector.class, Float256Shuffle.class, float.class, LENGTH, 1232 this, s, 1233 (v1, s_) -> v1.uOp((i, a) -> { 1234 int ei = s_.getElement(i); 1235 return v1.get(ei); 1236 })); 1237 } 1238 1239 @Override 1240 @ForceInline 1241 public Float256Vector blend(Vector<Float> o1, Mask<Float> o2) { 1242 Objects.requireNonNull(o1); 1243 Objects.requireNonNull(o2); 1244 Float256Vector v = (Float256Vector)o1; 1245 Float256Mask m = (Float256Mask)o2; 1246 1247 return VectorIntrinsics.blend( 1248 Float256Vector.class, Float256Mask.class, float.class, LENGTH, 1249 this, v, m, 1250 (v1, v2, m_) -> v1.bOp(v2, (i, a, b) -> m_.getElement(i) ? b : a)); 1251 } 1252 1253 // Accessors 1254 1255 @Override 1256 public float get(int i) { 1257 if (i < 0 || i >= LENGTH) { 1258 throw new IllegalArgumentException("Index " + i + " must be zero or positive, and less than " + LENGTH); 1259 } 1260 int bits = (int) VectorIntrinsics.extract( 1261 Float256Vector.class, float.class, LENGTH, 1262 this, i, 1263 (vec, ix) -> { 1264 float[] vecarr = vec.getElements(); 1265 return (long)Float.floatToIntBits(vecarr[ix]); 1266 }); 1267 return Float.intBitsToFloat(bits); 1268 } 1269 1270 @Override 1271 public Float256Vector with(int i, float e) { 1272 if (i < 0 || i >= LENGTH) { 1273 throw new IllegalArgumentException("Index " + i + " must be zero or positive, and less than " + LENGTH); 1274 } 1275 return VectorIntrinsics.insert( 1276 Float256Vector.class, float.class, LENGTH, 1277 this, i, (long)Float.floatToIntBits(e), 1278 (v, ix, bits) -> { 1279 float[] res = v.getElements().clone(); 1280 res[ix] = Float.intBitsToFloat((int)bits); 1281 return new Float256Vector(res); 1282 }); 1283 } 1284 1285 // Mask 1286 1287 static final class Float256Mask extends AbstractMask<Float> { 1288 static final Float256Mask TRUE_MASK = new Float256Mask(true); 1289 static final Float256Mask FALSE_MASK = new Float256Mask(false); 1290 1291 private final boolean[] bits; // Don't access directly, use getBits() instead. 1292 1293 public Float256Mask(boolean[] bits) { 1294 this(bits, 0); 1295 } 1296 1297 public Float256Mask(boolean[] bits, int offset) { 1298 boolean[] a = new boolean[species().length()]; 1299 for (int i = 0; i < a.length; i++) { 1300 a[i] = bits[offset + i]; 1301 } 1302 this.bits = a; 1303 } 1304 1305 public Float256Mask(boolean val) { 1306 boolean[] bits = new boolean[species().length()]; 1307 Arrays.fill(bits, val); 1308 this.bits = bits; 1309 } 1310 1311 boolean[] getBits() { 1312 return VectorIntrinsics.maybeRebox(this).bits; 1313 } 1314 1315 @Override 1316 Float256Mask uOp(MUnOp f) { 1317 boolean[] res = new boolean[species().length()]; 1318 boolean[] bits = getBits(); 1319 for (int i = 0; i < species().length(); i++) { 1320 res[i] = f.apply(i, bits[i]); 1321 } 1322 return new Float256Mask(res); 1323 } 1324 1325 @Override 1326 Float256Mask bOp(Mask<Float> o, MBinOp f) { 1327 boolean[] res = new boolean[species().length()]; 1328 boolean[] bits = getBits(); 1329 boolean[] mbits = ((Float256Mask)o).getBits(); 1330 for (int i = 0; i < species().length(); i++) { 1331 res[i] = f.apply(i, bits[i], mbits[i]); 1332 } 1333 return new Float256Mask(res); 1334 } 1335 1336 @Override 1337 public Float256Species species() { 1338 return SPECIES; 1339 } 1340 1341 @Override 1342 public Float256Vector toVector() { 1343 float[] res = new float[species().length()]; 1344 boolean[] bits = getBits(); 1345 for (int i = 0; i < species().length(); i++) { 1346 // -1 will result in the most significant bit being set in 1347 // addition to some or all other bits 1348 res[i] = (float) (bits[i] ? -1 : 0); 1349 } 1350 return new Float256Vector(res); 1351 } 1352 1353 // Unary operations 1354 1355 @Override 1356 @ForceInline 1357 public Float256Mask not() { 1358 return (Float256Mask) VectorIntrinsics.unaryOp( 1359 VECTOR_OP_NOT, Float256Mask.class, int.class, LENGTH, 1360 this, 1361 (m1) -> m1.uOp((i, a) -> !a)); 1362 } 1363 1364 // Binary operations 1365 1366 @Override 1367 @ForceInline 1368 public Float256Mask and(Mask<Float> o) { 1369 Objects.requireNonNull(o); 1370 Float256Mask m = (Float256Mask)o; 1371 return VectorIntrinsics.binaryOp(VECTOR_OP_AND, Float256Mask.class, int.class, LENGTH, 1372 this, m, 1373 (m1, m2) -> m1.bOp(m2, (i, a, b) -> a & b)); 1374 } 1375 1376 @Override 1377 @ForceInline 1378 public Float256Mask or(Mask<Float> o) { 1379 Objects.requireNonNull(o); 1380 Float256Mask m = (Float256Mask)o; 1381 return VectorIntrinsics.binaryOp(VECTOR_OP_OR, Float256Mask.class, int.class, LENGTH, 1382 this, m, 1383 (m1, m2) -> m1.bOp(m2, (i, a, b) -> a | b)); 1384 } 1385 1386 // Reductions 1387 1388 @Override 1389 @ForceInline 1390 public boolean anyTrue() { 1391 return VectorIntrinsics.test(BT_ne, Float256Mask.class, int.class, LENGTH, 1392 this, this, 1393 (m, __) -> anyTrueHelper(((Float256Mask)m).getBits())); 1394 } 1395 1396 @Override 1397 @ForceInline 1398 public boolean allTrue() { 1399 return VectorIntrinsics.test(BT_overflow, Float256Mask.class, int.class, LENGTH, 1400 this, FloatVector.maskAllTrue(species()), 1401 (m, __) -> allTrueHelper(((Float256Mask)m).getBits())); 1402 } 1403 } 1404 1405 // Shuffle 1406 1407 static final class Float256Shuffle extends AbstractShuffle<Float> { 1408 Float256Shuffle(byte[] reorder) { 1409 super(reorder); 1410 } 1411 1412 public Float256Shuffle(int[] reorder) { 1413 super(reorder); 1414 } 1415 1416 public Float256Shuffle(int[] reorder, int i) { 1417 super(reorder, i); 1418 } 1419 1420 public Float256Shuffle(IntUnaryOperator f) { 1421 super(f); 1422 } 1423 1424 @Override 1425 public Float256Species species() { 1426 return SPECIES; 1427 } 1428 1429 @Override 1430 public FloatVector toVector() { 1431 float[] va = new float[SPECIES.length()]; 1432 for (int i = 0; i < va.length; i++) { 1433 va[i] = (float) getElement(i); 1434 } 1435 return FloatVector.fromArray(SPECIES, va, 0); 1436 } 1437 1438 @Override 1439 public Float256Shuffle rearrange(Vector.Shuffle<Float> o) { 1440 Float256Shuffle s = (Float256Shuffle) o; 1441 byte[] r = new byte[reorder.length]; 1442 for (int i = 0; i < reorder.length; i++) { 1443 r[i] = reorder[s.reorder[i]]; 1444 } 1445 return new Float256Shuffle(r); 1446 } 1447 } 1448 1449 // Species 1450 1451 @Override 1452 public Float256Species species() { 1453 return SPECIES; 1454 } 1455 1456 static final class Float256Species extends FloatSpecies { 1457 static final int BIT_SIZE = Shape.S_256_BIT.bitSize(); 1458 1459 static final int LENGTH = BIT_SIZE / Float.SIZE; 1460 1461 @Override 1462 public String toString() { 1463 StringBuilder sb = new StringBuilder("Shape["); 1464 sb.append(bitSize()).append(" bits, "); 1465 sb.append(length()).append(" ").append(float.class.getSimpleName()).append("s x "); 1466 sb.append(elementSize()).append(" bits"); 1467 sb.append("]"); 1468 return sb.toString(); 1469 } 1470 1471 @Override 1472 @ForceInline 1473 public int bitSize() { 1474 return BIT_SIZE; 1475 } 1476 1477 @Override 1478 @ForceInline 1479 public int length() { 1480 return LENGTH; 1481 } 1482 1483 @Override 1484 @ForceInline 1485 public Class<Float> elementType() { 1486 return float.class; 1487 } 1488 1489 @Override 1490 @ForceInline 1491 public Class<?> boxType() { 1492 return Float256Vector.class; 1493 } 1494 1495 @Override 1496 @ForceInline 1497 public Class<?> maskType() { 1498 return Float256Mask.class; 1499 } 1500 1501 @Override 1502 @ForceInline 1503 public int elementSize() { 1504 return Float.SIZE; 1505 } 1506 1507 @Override 1508 @ForceInline 1509 @SuppressWarnings("unchecked") 1510 Class<?> vectorType() { 1511 return Float256Vector.class; 1512 } 1513 1514 @Override 1515 @ForceInline 1516 public Shape shape() { 1517 return Shape.S_256_BIT; 1518 } 1519 1520 @Override 1521 IntVector.IntSpecies indexSpecies() { 1522 return INDEX_SPEC; 1523 } 1524 1525 @Override 1526 Float256Vector op(FOp f) { 1527 float[] res = new float[length()]; 1528 for (int i = 0; i < length(); i++) { 1529 res[i] = f.apply(i); 1530 } 1531 return new Float256Vector(res); 1532 } 1533 1534 @Override 1535 Float256Vector op(Mask<Float> o, FOp f) { 1536 float[] res = new float[length()]; 1537 boolean[] mbits = ((Float256Mask)o).getBits(); 1538 for (int i = 0; i < length(); i++) { 1539 if (mbits[i]) { 1540 res[i] = f.apply(i); 1541 } 1542 } 1543 return new Float256Vector(res); 1544 } 1545 1546 @Override 1547 Float256Mask opm(FOpm f) { 1548 boolean[] res = new boolean[length()]; 1549 for (int i = 0; i < length(); i++) { 1550 res[i] = (boolean)f.apply(i); 1551 } 1552 return new Float256Mask(res); 1553 } 1554 1555 // Factories 1556 1557 @Override 1558 @ForceInline 1559 public Float256Vector zero() { 1560 return VectorIntrinsics.broadcastCoerced(Float256Vector.class, float.class, LENGTH, 1561 Float.floatToIntBits(0.0f), SPECIES, 1562 ((bits, s) -> ((Float256Species)s).op(i -> Float.intBitsToFloat((int)bits)))); 1563 } 1564 1565 @Override 1566 @ForceInline 1567 public Float256Vector broadcast(float e) { 1568 return VectorIntrinsics.broadcastCoerced( 1569 Float256Vector.class, float.class, LENGTH, 1570 Float.floatToIntBits(e), SPECIES, 1571 ((bits, s) -> ((Float256Species)s).op(i -> Float.intBitsToFloat((int)bits)))); 1572 } 1573 1574 @Override 1575 @ForceInline 1576 public Float256Vector scalars(float... es) { 1577 Objects.requireNonNull(es); 1578 int ix = VectorIntrinsics.checkIndex(0, es.length, LENGTH); 1579 return VectorIntrinsics.load(Float256Vector.class, float.class, LENGTH, 1580 es, Unsafe.ARRAY_FLOAT_BASE_OFFSET, 1581 es, ix, SPECIES, 1582 (c, idx, s) -> ((Float256Species)s).op(n -> c[idx + n])); 1583 } 1584 1585 @Override 1586 @ForceInline 1587 public <E> Float256Mask cast(Mask<E> m) { 1588 if (m.length() != LENGTH) 1589 throw new IllegalArgumentException("Mask length this species length differ"); 1590 return new Float256Mask(m.toArray()); 1591 } 1592 1593 @Override 1594 @ForceInline 1595 public <E> Float256Shuffle cast(Shuffle<E> s) { 1596 if (s.length() != LENGTH) 1597 throw new IllegalArgumentException("Shuffle length this species length differ"); 1598 return new Float256Shuffle(s.toArray()); 1599 } 1600 } 1601 }