1 /*
   2  * Copyright (c) 1997, 2017, Oracle and/or its affiliates. All rights reserved.
   3  * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
   4  *
   5  * This code is free software; you can redistribute it and/or modify it
   6  * under the terms of the GNU General Public License version 2 only, as
   7  * published by the Free Software Foundation.
   8  *
   9  * This code is distributed in the hope that it will be useful, but WITHOUT
  10  * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
  11  * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
  12  * version 2 for more details (a copy is included in the LICENSE file that
  13  * accompanied this code).
  14  *
  15  * You should have received a copy of the GNU General Public License version
  16  * 2 along with this work; if not, write to the Free Software Foundation,
  17  * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
  18  *
  19  * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
  20  * or visit www.oracle.com if you need additional information or have any
  21  * questions.
  22  *
  23  */
  24 
  25 #include "precompiled.hpp"
  26 #include "asm/macroAssembler.inline.hpp"
  27 #include "logging/log.hpp"
  28 #include "memory/resourceArea.hpp"
  29 #include "prims/jvm.h"
  30 #include "runtime/java.hpp"
  31 #include "runtime/os.hpp"
  32 #include "runtime/stubCodeGenerator.hpp"
  33 #include "vm_version_sparc.hpp"
  34 
  35 #include <sys/mman.h>
  36 
  37 uint VM_Version::_L2_data_cache_line_size = 0;
  38 
  39 void VM_Version::initialize() {
  40   assert(_features != 0, "System pre-initialization is not complete.");
  41   guarantee(VM_Version::has_v9(), "only SPARC v9 is supported");
  42 
  43   PrefetchCopyIntervalInBytes = prefetch_copy_interval_in_bytes();
  44   PrefetchScanIntervalInBytes = prefetch_scan_interval_in_bytes();
  45   PrefetchFieldsAhead         = prefetch_fields_ahead();
  46 
  47   // Allocation prefetch settings
  48 
  49   AllocatePrefetchDistance = allocate_prefetch_distance();
  50   AllocatePrefetchStyle    = allocate_prefetch_style();
  51 
  52   intx cache_line_size = prefetch_data_size();
  53 
  54   if (FLAG_IS_DEFAULT(AllocatePrefetchStepSize)) {
  55     AllocatePrefetchStepSize = MAX2(AllocatePrefetchStepSize, cache_line_size);
  56   }
  57 
  58   if (AllocatePrefetchInstr == 1) {
  59     if (!has_blk_init()) {
  60       warning("BIS instructions required for AllocatePrefetchInstr 1 unavailable");
  61       FLAG_SET_DEFAULT(AllocatePrefetchInstr, 0);
  62     }
  63     if (cache_line_size <= 0) {
  64       warning("Cache-line size must be known for AllocatePrefetchInstr 1 to work");
  65       FLAG_SET_DEFAULT(AllocatePrefetchInstr, 0);
  66     }
  67   }
  68 
  69   UseSSE = false;                   // Only used on x86 and x64.
  70 
  71   _supports_cx8 = true;             // All SPARC V9 implementations.
  72   _supports_atomic_getset4 = true;  // Using the 'swap' instruction.
  73 
  74   if (has_fast_ind_br() && FLAG_IS_DEFAULT(UseInlineCaches)) {
  75     // Indirect and direct branches are cost equivalent.
  76     FLAG_SET_DEFAULT(UseInlineCaches, false);
  77   }
  78   // Align loops on the proper instruction boundary to fill the instruction
  79   // fetch buffer.
  80   if (FLAG_IS_DEFAULT(OptoLoopAlignment)) {
  81     FLAG_SET_DEFAULT(OptoLoopAlignment, VM_Version::insn_fetch_alignment);
  82   }
  83 
  84   // 32-bit oops don't make sense for the 64-bit VM on SPARC since the 32-bit
  85   // VM has the same registers and smaller objects.
  86   Universe::set_narrow_oop_shift(LogMinObjAlignmentInBytes);
  87   Universe::set_narrow_klass_shift(LogKlassAlignmentInBytes);
  88 
  89 #ifdef COMPILER2
  90   if (has_fast_ind_br() && FLAG_IS_DEFAULT(UseJumpTables)) {
  91     // Indirect and direct branches are cost equivalent.
  92     FLAG_SET_DEFAULT(UseJumpTables, true);
  93   }
  94   // Entry and loop tops are aligned to fill the instruction fetch buffer.
  95   if (FLAG_IS_DEFAULT(InteriorEntryAlignment)) {
  96     FLAG_SET_DEFAULT(InteriorEntryAlignment, VM_Version::insn_fetch_alignment);
  97   }
  98   if (UseTLAB && cache_line_size > 0 &&
  99       FLAG_IS_DEFAULT(AllocatePrefetchInstr)) {
 100     if (has_fast_bis()) {
 101       // Use BIS instruction for TLAB allocation prefetch.
 102       FLAG_SET_DEFAULT(AllocatePrefetchInstr, 1);
 103     }
 104     else if (has_sparc5()) {
 105       // Use prefetch instruction to avoid partial RAW issue on Core S4 processors,
 106       // also use prefetch style 3.
 107       FLAG_SET_DEFAULT(AllocatePrefetchInstr, 0);
 108       if (FLAG_IS_DEFAULT(AllocatePrefetchStyle)) {
 109         FLAG_SET_DEFAULT(AllocatePrefetchStyle, 3);
 110       }
 111     }
 112   }
 113   if (AllocatePrefetchInstr == 1) {
 114     // Use allocation prefetch style 3 because BIS instructions require
 115     // aligned memory addresses.
 116     FLAG_SET_DEFAULT(AllocatePrefetchStyle, 3);
 117   }
 118   if (FLAG_IS_DEFAULT(AllocatePrefetchDistance)) {
 119     if (AllocatePrefetchInstr == 0) {
 120       // Use different prefetch distance without BIS
 121       FLAG_SET_DEFAULT(AllocatePrefetchDistance, 256);
 122     } else {
 123       // Use smaller prefetch distance with BIS
 124       FLAG_SET_DEFAULT(AllocatePrefetchDistance, 64);
 125     }
 126   }
 127 
 128   // We increase the number of prefetched cache lines, to use just a bit more
 129   // aggressive approach, when the L2-cache line size is small (32 bytes), or
 130   // when running on newer processor implementations, such as the Core S4.
 131   bool inc_prefetch = cache_line_size > 0 && (cache_line_size < 64 || has_sparc5());
 132 
 133   if (inc_prefetch) {
 134     // We use a factor two for small cache line sizes (as before) but a slightly
 135     // more conservative increase when running on more recent hardware that will
 136     // benefit from just a bit more aggressive prefetching.
 137     if (FLAG_IS_DEFAULT(AllocatePrefetchLines)) {
 138       const int ap_lns = AllocatePrefetchLines;
 139       const int ap_inc = cache_line_size < 64 ? ap_lns : (ap_lns + 1) / 2;
 140       FLAG_SET_ERGO(intx, AllocatePrefetchLines, ap_lns + ap_inc);
 141     }
 142     if (FLAG_IS_DEFAULT(AllocateInstancePrefetchLines)) {
 143       const int ip_lns = AllocateInstancePrefetchLines;
 144       const int ip_inc = cache_line_size < 64 ? ip_lns : (ip_lns + 1) / 2;
 145       FLAG_SET_ERGO(intx, AllocateInstancePrefetchLines, ip_lns + ip_inc);
 146     }
 147   }
 148 #endif /* COMPILER2 */
 149 
 150   // Use hardware population count instruction if available.
 151   if (has_popc()) {
 152     if (FLAG_IS_DEFAULT(UsePopCountInstruction)) {
 153       FLAG_SET_DEFAULT(UsePopCountInstruction, true);
 154     }
 155   } else if (UsePopCountInstruction) {
 156     warning("POPC instruction is not available on this CPU");
 157     FLAG_SET_DEFAULT(UsePopCountInstruction, false);
 158   }
 159 
 160   // Use compare and branch instructions if available.
 161   if (has_cbcond()) {
 162     if (FLAG_IS_DEFAULT(UseCBCond)) {
 163       FLAG_SET_DEFAULT(UseCBCond, true);
 164     }
 165   } else if (UseCBCond) {
 166     warning("CBCOND instruction is not available on this CPU");
 167     FLAG_SET_DEFAULT(UseCBCond, false);
 168   }
 169 
 170   assert(BlockZeroingLowLimit > 0, "invalid value");
 171 
 172   if (has_blk_zeroing() && cache_line_size > 0) {
 173     if (FLAG_IS_DEFAULT(UseBlockZeroing)) {
 174       FLAG_SET_DEFAULT(UseBlockZeroing, true);
 175     }
 176   } else if (UseBlockZeroing) {
 177     warning("BIS zeroing instructions are not available on this CPU");
 178     FLAG_SET_DEFAULT(UseBlockZeroing, false);
 179   }
 180 
 181   assert(BlockCopyLowLimit > 0, "invalid value");
 182 
 183   if (has_blk_zeroing() && cache_line_size > 0) {
 184     if (FLAG_IS_DEFAULT(UseBlockCopy)) {
 185       FLAG_SET_DEFAULT(UseBlockCopy, true);
 186     }
 187   } else if (UseBlockCopy) {
 188     warning("BIS instructions are not available or expensive on this CPU");
 189     FLAG_SET_DEFAULT(UseBlockCopy, false);
 190   }
 191 
 192 #ifdef COMPILER2
 193   if (has_fast_rdpc() && FLAG_IS_DEFAULT(UseRDPCForConstantTableBase)) {
 194     FLAG_SET_DEFAULT(UseRDPCForConstantTableBase, true);
 195   }
 196 
 197   // Currently not supported anywhere.
 198   FLAG_SET_DEFAULT(UseFPUForSpilling, false);
 199 
 200   MaxVectorSize = 8;
 201 
 202   assert((InteriorEntryAlignment % relocInfo::addr_unit()) == 0, "alignment is not a multiple of NOP size");
 203 #endif
 204 
 205   assert((CodeEntryAlignment % relocInfo::addr_unit()) == 0, "alignment is not a multiple of NOP size");
 206   assert((OptoLoopAlignment % relocInfo::addr_unit()) == 0, "alignment is not a multiple of NOP size");
 207 
 208   char buf[512];
 209   jio_snprintf(buf, sizeof(buf),
 210                "%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s",
 211                (has_v9()          ? "v9" : ""),
 212                (has_popc()        ? ", popc" : ""),
 213                (has_vis1()        ? ", vis1" : ""),
 214                (has_vis2()        ? ", vis2" : ""),
 215                (has_blk_init()    ? ", blk_init" : ""),
 216                (has_fmaf()        ? ", fmaf" : ""),
 217                (has_hpc()         ? ", hpc" : ""),
 218                (has_ima()         ? ", ima" : ""),
 219                (has_aes()         ? ", aes" : ""),
 220                (has_des()         ? ", des" : ""),
 221                (has_kasumi()      ? ", kas" : ""),
 222                (has_camellia()    ? ", cam" : ""),
 223                (has_md5()         ? ", md5" : ""),
 224                (has_sha1()        ? ", sha1" : ""),
 225                (has_sha256()      ? ", sha256" : ""),
 226                (has_sha512()      ? ", sha512" : ""),
 227                (has_mpmul()       ? ", mpmul" : ""),
 228                (has_mont()        ? ", mont" : ""),
 229                (has_pause()       ? ", pause" : ""),
 230                (has_cbcond()      ? ", cbcond" : ""),
 231                (has_crc32c()      ? ", crc32c" : ""),
 232 
 233                (has_athena_plus() ? ", athena_plus" : ""),
 234                (has_vis3b()       ? ", vis3b" : ""),
 235                (has_adi()         ? ", adi" : ""),
 236                (has_sparc5()      ? ", sparc5" : ""),
 237                (has_mwait()       ? ", mwait" : ""),
 238                (has_xmpmul()      ? ", xmpmul" : ""),
 239                (has_xmont()       ? ", xmont" : ""),
 240                (has_pause_nsec()  ? ", pause_nsec" : ""),
 241                (has_vamask()      ? ", vamask" : ""),
 242 
 243                (has_fast_idiv()   ? ", *idiv" : ""),
 244                (has_fast_rdpc()   ? ", *rdpc" : ""),
 245                (has_fast_bis()    ? ", *bis" : ""),
 246                (has_fast_ld()     ? ", *ld" : ""),
 247                (has_fast_cmove()  ? ", *cmove" : ""),
 248                (has_fast_ind_br() ? ", *ind_br" : ""),
 249                (has_blk_zeroing() ? ", *blk_zeroing" : ""));
 250 
 251   assert(strlen(buf) >= 2, "must be");
 252 
 253   _features_string = os::strdup(buf);
 254 
 255   log_info(os, cpu)("SPARC features detected: %s", _features_string);
 256 
 257   // UseVIS is set to the smallest of what hardware supports and what the command
 258   // line requires, i.e. you cannot set UseVIS to 3 on older UltraSparc which do
 259   // not support it.
 260 
 261   if (UseVIS > 3) UseVIS = 3;
 262   if (UseVIS < 0) UseVIS = 0;
 263   if (!has_vis3()) // Drop to 2 if no VIS3 support
 264     UseVIS = MIN2((intx)2, UseVIS);
 265   if (!has_vis2()) // Drop to 1 if no VIS2 support
 266     UseVIS = MIN2((intx)1, UseVIS);
 267   if (!has_vis1()) // Drop to 0 if no VIS1 support
 268     UseVIS = 0;
 269 
 270   if (has_aes()) {
 271     if (FLAG_IS_DEFAULT(UseAES)) {
 272       FLAG_SET_DEFAULT(UseAES, true);
 273     }
 274     if (!UseAES) {
 275       if (UseAESIntrinsics && !FLAG_IS_DEFAULT(UseAESIntrinsics)) {
 276         warning("AES intrinsics require UseAES flag to be enabled. Intrinsics will be disabled.");
 277       }
 278       FLAG_SET_DEFAULT(UseAESIntrinsics, false);
 279     } else {
 280       // The AES intrinsic stubs require AES instruction support (of course)
 281       // but also require VIS3 mode or higher for instructions it use.
 282       if (UseVIS > 2) {
 283         if (FLAG_IS_DEFAULT(UseAESIntrinsics)) {
 284           FLAG_SET_DEFAULT(UseAESIntrinsics, true);
 285         }
 286       } else {
 287         if (UseAESIntrinsics && !FLAG_IS_DEFAULT(UseAESIntrinsics)) {
 288           warning("SPARC AES intrinsics require VIS3 instructions. Intrinsics will be disabled.");
 289         }
 290         FLAG_SET_DEFAULT(UseAESIntrinsics, false);
 291       }
 292     }
 293   } else if (UseAES || UseAESIntrinsics) {
 294     if (UseAES && !FLAG_IS_DEFAULT(UseAES)) {
 295       warning("AES instructions are not available on this CPU");
 296       FLAG_SET_DEFAULT(UseAES, false);
 297     }
 298     if (UseAESIntrinsics && !FLAG_IS_DEFAULT(UseAESIntrinsics)) {
 299       warning("AES intrinsics are not available on this CPU");
 300       FLAG_SET_DEFAULT(UseAESIntrinsics, false);
 301     }
 302   }
 303 
 304   if (UseAESCTRIntrinsics) {
 305     warning("AES/CTR intrinsics are not available on this CPU");
 306     FLAG_SET_DEFAULT(UseAESCTRIntrinsics, false);
 307   }
 308 
 309   // GHASH/GCM intrinsics
 310   if (has_vis3() && (UseVIS > 2)) {
 311     if (FLAG_IS_DEFAULT(UseGHASHIntrinsics)) {
 312       UseGHASHIntrinsics = true;
 313     }
 314   } else if (UseGHASHIntrinsics) {
 315     if (!FLAG_IS_DEFAULT(UseGHASHIntrinsics))
 316       warning("GHASH intrinsics require VIS3 instruction support. Intrinsics will be disabled");
 317     FLAG_SET_DEFAULT(UseGHASHIntrinsics, false);
 318   }
 319 
 320   if (has_fmaf()) {
 321     if (FLAG_IS_DEFAULT(UseFMA)) {
 322       UseFMA = true;
 323     }
 324   } else if (UseFMA) {
 325     warning("FMA instructions are not available on this CPU");
 326     FLAG_SET_DEFAULT(UseFMA, false);
 327   }
 328 
 329   // SHA1, SHA256, and SHA512 instructions were added to SPARC at different times
 330   if (has_sha1() || has_sha256() || has_sha512()) {
 331     if (UseVIS > 0) { // SHA intrinsics use VIS1 instructions
 332       if (FLAG_IS_DEFAULT(UseSHA)) {
 333         FLAG_SET_DEFAULT(UseSHA, true);
 334       }
 335     } else {
 336       if (UseSHA) {
 337         warning("SPARC SHA intrinsics require VIS1 instruction support. Intrinsics will be disabled.");
 338         FLAG_SET_DEFAULT(UseSHA, false);
 339       }
 340     }
 341   } else if (UseSHA) {
 342     warning("SHA instructions are not available on this CPU");
 343     FLAG_SET_DEFAULT(UseSHA, false);
 344   }
 345 
 346   if (UseSHA && has_sha1()) {
 347     if (FLAG_IS_DEFAULT(UseSHA1Intrinsics)) {
 348       FLAG_SET_DEFAULT(UseSHA1Intrinsics, true);
 349     }
 350   } else if (UseSHA1Intrinsics) {
 351     warning("Intrinsics for SHA-1 crypto hash functions not available on this CPU.");
 352     FLAG_SET_DEFAULT(UseSHA1Intrinsics, false);
 353   }
 354 
 355   if (UseSHA && has_sha256()) {
 356     if (FLAG_IS_DEFAULT(UseSHA256Intrinsics)) {
 357       FLAG_SET_DEFAULT(UseSHA256Intrinsics, true);
 358     }
 359   } else if (UseSHA256Intrinsics) {
 360     warning("Intrinsics for SHA-224 and SHA-256 crypto hash functions not available on this CPU.");
 361     FLAG_SET_DEFAULT(UseSHA256Intrinsics, false);
 362   }
 363 
 364   if (UseSHA && has_sha512()) {
 365     if (FLAG_IS_DEFAULT(UseSHA512Intrinsics)) {
 366       FLAG_SET_DEFAULT(UseSHA512Intrinsics, true);
 367     }
 368   } else if (UseSHA512Intrinsics) {
 369     warning("Intrinsics for SHA-384 and SHA-512 crypto hash functions not available on this CPU.");
 370     FLAG_SET_DEFAULT(UseSHA512Intrinsics, false);
 371   }
 372 
 373   if (!(UseSHA1Intrinsics || UseSHA256Intrinsics || UseSHA512Intrinsics)) {
 374     FLAG_SET_DEFAULT(UseSHA, false);
 375   }
 376 
 377   if (has_crc32c()) {
 378     if (UseVIS > 2) { // CRC32C intrinsics use VIS3 instructions
 379       if (FLAG_IS_DEFAULT(UseCRC32CIntrinsics)) {
 380         FLAG_SET_DEFAULT(UseCRC32CIntrinsics, true);
 381       }
 382     } else {
 383       if (UseCRC32CIntrinsics) {
 384         warning("SPARC CRC32C intrinsics require VIS3 instruction support. Intrinsics will be disabled.");
 385         FLAG_SET_DEFAULT(UseCRC32CIntrinsics, false);
 386       }
 387     }
 388   } else if (UseCRC32CIntrinsics) {
 389     warning("CRC32C instruction is not available on this CPU");
 390     FLAG_SET_DEFAULT(UseCRC32CIntrinsics, false);
 391   }
 392 
 393   if (UseVIS > 2) {
 394     if (FLAG_IS_DEFAULT(UseAdler32Intrinsics)) {
 395       FLAG_SET_DEFAULT(UseAdler32Intrinsics, true);
 396     }
 397   } else if (UseAdler32Intrinsics) {
 398     warning("SPARC Adler32 intrinsics require VIS3 instruction support. Intrinsics will be disabled.");
 399     FLAG_SET_DEFAULT(UseAdler32Intrinsics, false);
 400   }
 401 
 402   if (UseVIS > 2) {
 403     if (FLAG_IS_DEFAULT(UseCRC32Intrinsics)) {
 404       FLAG_SET_DEFAULT(UseCRC32Intrinsics, true);
 405     }
 406   } else if (UseCRC32Intrinsics) {
 407     warning("SPARC CRC32 intrinsics require VIS3 instructions support. Intrinsics will be disabled");
 408     FLAG_SET_DEFAULT(UseCRC32Intrinsics, false);
 409   }
 410 
 411   if (UseVectorizedMismatchIntrinsic) {
 412     warning("UseVectorizedMismatchIntrinsic specified, but not available on this CPU.");
 413     FLAG_SET_DEFAULT(UseVectorizedMismatchIntrinsic, false);
 414   }
 415 
 416   if (FLAG_IS_DEFAULT(ContendedPaddingWidth) &&
 417     (cache_line_size > ContendedPaddingWidth))
 418     ContendedPaddingWidth = cache_line_size;
 419 
 420   // This machine does not allow unaligned memory accesses
 421   if (UseUnalignedAccesses) {
 422     if (!FLAG_IS_DEFAULT(UseUnalignedAccesses))
 423       warning("Unaligned memory access is not available on this CPU");
 424     FLAG_SET_DEFAULT(UseUnalignedAccesses, false);
 425   }
 426 
 427   if (log_is_enabled(Info, os, cpu)) {
 428     ResourceMark rm;
 429     outputStream* log = Log(os, cpu)::info_stream();
 430     log->print_cr("L1 data cache line size: %u", L1_data_cache_line_size());
 431     log->print_cr("L2 data cache line size: %u", L2_data_cache_line_size());
 432     log->print("Allocation");
 433     if (AllocatePrefetchStyle <= 0) {
 434       log->print(": no prefetching");
 435     } else {
 436       log->print(" prefetching: ");
 437       if (AllocatePrefetchInstr == 0) {
 438           log->print("PREFETCH");
 439       } else if (AllocatePrefetchInstr == 1) {
 440           log->print("BIS");
 441       }
 442       if (AllocatePrefetchLines > 1) {
 443         log->print_cr(" at distance %d, %d lines of %d bytes", (int) AllocatePrefetchDistance, (int) AllocatePrefetchLines, (int) AllocatePrefetchStepSize);
 444       } else {
 445         log->print_cr(" at distance %d, one line of %d bytes", (int) AllocatePrefetchDistance, (int) AllocatePrefetchStepSize);
 446       }
 447     }
 448     if (PrefetchCopyIntervalInBytes > 0) {
 449       log->print_cr("PrefetchCopyIntervalInBytes %d", (int) PrefetchCopyIntervalInBytes);
 450     }
 451     if (PrefetchScanIntervalInBytes > 0) {
 452       log->print_cr("PrefetchScanIntervalInBytes %d", (int) PrefetchScanIntervalInBytes);
 453     }
 454     if (PrefetchFieldsAhead > 0) {
 455       log->print_cr("PrefetchFieldsAhead %d", (int) PrefetchFieldsAhead);
 456     }
 457     if (ContendedPaddingWidth > 0) {
 458       log->print_cr("ContendedPaddingWidth %d", (int) ContendedPaddingWidth);
 459     }
 460   }
 461 }
 462 
 463 void VM_Version::print_features() {
 464   tty->print("ISA features [0x%0" PRIx64 "]:", _features);
 465   if (_features_string != NULL) {
 466     tty->print(" %s", _features_string);
 467   }
 468   tty->cr();
 469 }
 470 
 471 void VM_Version::determine_features() {
 472   platform_features();      // platform_features() is os_arch specific.
 473 
 474   assert(has_v9(), "must be");
 475 
 476   if (UseNiagaraInstrs) {   // Limit code generation to Niagara.
 477     _features &= niagara1_msk;
 478   }
 479 }
 480 
 481 static uint64_t saved_features = 0;
 482 
 483 void VM_Version::allow_all() {
 484   saved_features = _features;
 485   _features      = full_feature_msk;
 486 }
 487 
 488 void VM_Version::revert() {
 489   _features = saved_features;
 490 }
 491 
 492 /* Determine a suitable number of threads on this particular machine.
 493  *
 494  * FIXME: Simply checking the processor family is insufficient.
 495  */
 496 unsigned int VM_Version::calc_parallel_worker_threads() {
 497   const int num = 5;
 498   const int den = is_post_niagara() ? 16 : 8;
 499   const int threshold = 8;
 500 
 501   return nof_parallel_worker_threads(num, den, threshold);
 502 }