--- old/src/hotspot/cpu/x86/stubGenerator_x86_64.cpp 2020-04-02 18:03:47.144854101 -0700 +++ new/src/hotspot/cpu/x86/stubGenerator_x86_64.cpp 2020-04-02 18:03:46.980854101 -0700 @@ -973,6 +973,21 @@ return start; } + /* Aligns to CodeEntryAlignment, then emits eight 64-bit constants whose bytes, read low byte first, run 0x00, 0x01, ... 0x3F. Returns the pc captured before the first constant. NOTE(review): this presumably yields an ascending byte-index table in memory on little-endian x86 - confirm against emit_data64. */ address generate_iota_indices(const char *stub_name) { + __ align(CodeEntryAlignment); + StubCodeMark mark(this, "StubRoutines", stub_name); + address start = __ pc(); + __ emit_data64(0x0706050403020100, relocInfo::none); + __ emit_data64(0x0F0E0D0C0B0A0908, relocInfo::none); + __ emit_data64(0x1716151413121110, relocInfo::none); + __ emit_data64(0x1F1E1D1C1B1A1918, relocInfo::none); + __ emit_data64(0x2726252423222120, relocInfo::none); + __ emit_data64(0x2F2E2D2C2B2A2928, relocInfo::none); + __ emit_data64(0x3736353433323130, relocInfo::none); + __ emit_data64(0x3F3E3D3C3B3A3938, relocInfo::none); + return start; + } + address generate_fp_mask(const char *stub_name, int64_t mask) { __ align(CodeEntryAlignment); StubCodeMark mark(this, "StubRoutines", stub_name); @@ -1018,6 +1033,57 @@ return start; } + /* Aligns to CodeEntryAlignment, then emits the 64-bit 'mask' eight times in a row via emit_data64. Returns the pc captured before the first copy. */ address generate_vector_fp_mask(const char *stub_name, int64_t mask) { + __ align(CodeEntryAlignment); + StubCodeMark mark(this, "StubRoutines", stub_name); + address start = __ pc(); + + __ emit_data64(mask, relocInfo::none); + __ emit_data64(mask, relocInfo::none); + __ emit_data64(mask, relocInfo::none); + __ emit_data64(mask, relocInfo::none); + __ emit_data64(mask, relocInfo::none); + __ emit_data64(mask, relocInfo::none); + __ emit_data64(mask, relocInfo::none); + __ emit_data64(mask, relocInfo::none); + + return start; + } + + /* Emits a caller-specified sequence of int32_t values, one emit_data call each: val0..val3 always, val4..val7 additionally when len >= AVX_256bit, and val8..val15 additionally when len >= AVX_512bit. Values the caller omits default to 0. len must not be AVX_NoVec (asserted). Returns the pc captured before the first value. */ address generate_vector_custom_i32(const char *stub_name, Assembler::AvxVectorLen len, + int32_t val0, int32_t val1, int32_t val2, int32_t val3, + int32_t val4 = 0, int32_t val5 = 0, int32_t val6 = 0, int32_t val7 = 0, + int32_t val8 = 0, int32_t val9 = 0, int32_t val10 = 0, int32_t val11 = 0, + int32_t val12 = 0, int32_t val13 = 0, int32_t val14 = 0, int32_t val15 = 0) { + __ align(CodeEntryAlignment); + StubCodeMark 
mark(this, "StubRoutines", stub_name); + address start = __ pc(); + + assert(len != Assembler::AVX_NoVec, "vector len must be specified"); + __ emit_data(val0, relocInfo::none, 0); + __ emit_data(val1, relocInfo::none, 0); + __ emit_data(val2, relocInfo::none, 0); + __ emit_data(val3, relocInfo::none, 0); + /* second group of four values: only for 256-bit and wider lengths */ if (len >= Assembler::AVX_256bit) { + __ emit_data(val4, relocInfo::none, 0); + __ emit_data(val5, relocInfo::none, 0); + __ emit_data(val6, relocInfo::none, 0); + __ emit_data(val7, relocInfo::none, 0); + /* nested inside the 256-bit branch, so val8..val15 are only ever emitted after val0..val7 */ if (len >= Assembler::AVX_512bit) { + __ emit_data(val8, relocInfo::none, 0); + __ emit_data(val9, relocInfo::none, 0); + __ emit_data(val10, relocInfo::none, 0); + __ emit_data(val11, relocInfo::none, 0); + __ emit_data(val12, relocInfo::none, 0); + __ emit_data(val13, relocInfo::none, 0); + __ emit_data(val14, relocInfo::none, 0); + __ emit_data(val15, relocInfo::none, 0); + } + } + + return start; + } + // Non-destructive plausibility checks for oops // // Arguments: @@ -6446,9 +6512,20 @@ StubRoutines::x86::_vector_float_sign_flip = generate_vector_mask("vector_float_sign_flip", 0x8000000080000000); StubRoutines::x86::_vector_double_sign_mask = generate_vector_mask("vector_double_sign_mask", 0x7FFFFFFFFFFFFFFF); StubRoutines::x86::_vector_double_sign_flip = generate_vector_mask("vector_double_sign_flip", 0x8000000000000000); + StubRoutines::x86::_vector_all_bits_set = generate_vector_mask("vector_all_bits_set", 0xFFFFFFFFFFFFFFFF); StubRoutines::x86::_vector_short_to_byte_mask = generate_vector_mask("vector_short_to_byte_mask", 0x00ff00ff00ff00ff); StubRoutines::x86::_vector_byte_perm_mask = generate_vector_byte_perm_mask("vector_byte_perm_mask"); + StubRoutines::x86::_vector_int_to_byte_mask = generate_vector_mask("vector_int_to_byte_mask", 0x000000ff000000ff); + StubRoutines::x86::_vector_int_to_short_mask = generate_vector_mask("vector_int_to_short_mask", 0x0000ffff0000ffff); + StubRoutines::x86::_vector_32_bit_mask = 
generate_vector_custom_i32("vector_32_bit_mask", Assembler::AVX_512bit, + 0xFFFFFFFF, 0, 0, 0); /* AVX_512bit makes all 16 values get emitted: only the first is non-zero, val4..val15 take their default 0. NOTE(review): 0xFFFFFFFF is converted to the int32_t parameter here, presumably as -1 (all bits set) - confirm. */ + StubRoutines::x86::_vector_64_bit_mask = generate_vector_custom_i32("vector_64_bit_mask", Assembler::AVX_512bit, + 0xFFFFFFFF, 0xFFFFFFFF, 0, 0); /* as above, but the first two 32-bit values are non-zero and the remaining 14 are 0 */ + StubRoutines::x86::_vector_int_shuffle_mask = generate_vector_mask("vector_int_shuffle_mask", 0x0302010003020100); + StubRoutines::x86::_vector_short_shuffle_mask = generate_vector_mask("vector_short_shuffle_mask", 0x0100010001000100); + StubRoutines::x86::_vector_long_shuffle_mask = generate_vector_mask("vector_long_shuffle_mask", 0x0000000100000000); StubRoutines::x86::_vector_long_sign_mask = generate_vector_mask("vector_long_sign_mask", 0x8000000000000000); + StubRoutines::x86::_vector_iota_indices = generate_iota_indices("iota_indices"); // support for verify_oop (must happen after universe_init) StubRoutines::_verify_oop_subroutine_entry = generate_verify_oop();