/*
 * Copyright (c) 1999, 2017, Oracle and/or its affiliates. All rights reserved.
 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
 *
 * This code is free software; you can redistribute it and/or modify it
 * under the terms of the GNU General Public License version 2 only, as
 * published by the Free Software Foundation.
 *
 * This code is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
 * version 2 for more details (a copy is included in the LICENSE file that
 * accompanied this code).
 *
 * You should have received a copy of the GNU General Public License version
 * 2 along with this work; if not, write to the Free Software Foundation,
 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
 *
 * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
 * or visit www.oracle.com if you need additional information or have any
 * questions.
 *
 */

#ifndef SHARE_VM_RUNTIME_ATOMIC_HPP
#define SHARE_VM_RUNTIME_ATOMIC_HPP

#include "memory/allocation.hpp"
#include "metaprogramming/enableIf.hpp"
#include "metaprogramming/isIntegral.hpp"
#include "metaprogramming/isRegisteredEnum.hpp"
#include "metaprogramming/isSame.hpp"
#include "metaprogramming/primitiveConversions.hpp"
#include "metaprogramming/removeCV.hpp"
#include "utilities/align.hpp"
#include "utilities/macros.hpp"

enum cmpxchg_memory_order {
  memory_order_relaxed,
  // Use a value which doesn't interfere with C++2011 memory_order values.
  // We need to be more conservative.
  memory_order_conservative = 8
};

class Atomic : AllStatic {
 public:
  // Atomic operations on jlong types are not available on all 32-bit
  // platforms. If atomic ops on jlongs are defined here they must only
  // be used from code that verifies they are available at runtime and
  // can provide an alternative action if not - see supports_cx8() for
  // a means to test availability.

  // The memory operations that are mentioned with each of the atomic
  // function families come from src/share/vm/runtime/orderAccess.hpp,
  // e.g., <fence> is described in that file and is implemented by the
  // OrderAccess::fence() function. See that file for the gory details
  // on the Memory Access Ordering Model.

  // All of the atomic operations that imply a read-modify-write action
  // guarantee a two-way memory barrier across that operation. Historically
  // these semantics reflect the strength of atomic operations that are
  // provided on SPARC/X86. We assume that strength is necessary unless
  // we can prove that a weaker form is sufficiently safe.
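
  // For example (an illustrative sketch only; "_field" and "Some_lock"
  // are hypothetical names, not part of this interface), a caller can
  // guard 64-bit atomics on a 32-bit platform like this:
  //
  //   if (VM_Version::supports_cx8()) {
  //     Atomic::store(new_value, &_field);   // lock-free 64-bit store
  //   } else {
  //     MutexLockerEx ml(Some_lock);         // alternative action: take a lock
  //     _field = new_value;
  //   }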
  // Atomically store to a location
  inline static void store    (jbyte    store_value, jbyte*    dest);
  inline static void store    (jshort   store_value, jshort*   dest);
  inline static void store    (jint     store_value, jint*     dest);
  // See comment above about using jlong atomics on 32-bit platforms
  inline static void store    (jlong    store_value, jlong*    dest);
  inline static void store_ptr(intptr_t store_value, intptr_t* dest);
  inline static void store_ptr(void*    store_value, void*     dest);

  inline static void store    (jbyte    store_value, volatile jbyte*    dest);
  inline static void store    (jshort   store_value, volatile jshort*   dest);
  inline static void store    (jint     store_value, volatile jint*     dest);
  // See comment above about using jlong atomics on 32-bit platforms
  inline static void store    (jlong    store_value, volatile jlong*    dest);
  inline static void store_ptr(intptr_t store_value, volatile intptr_t* dest);
  inline static void store_ptr(void*    store_value, volatile void*     dest);

  // See comment above about using jlong atomics on 32-bit platforms
  inline static jlong load(const volatile jlong* src);

  // Atomically add to a location. Returns updated value. add*() provide:
  // <fence> add-value-to-dest <membar StoreLoad|StoreStore>
  inline static jshort   add    (jshort   add_value, volatile jshort*   dest);
  inline static jint     add    (jint     add_value, volatile jint*     dest);
  inline static size_t   add    (size_t   add_value, volatile size_t*   dest);
  inline static intptr_t add_ptr(intptr_t add_value, volatile intptr_t* dest);
  inline static void*    add_ptr(intptr_t add_value, volatile void*     dest);

  // Atomically increment location. inc*() provide:
  // <fence> increment-dest <membar StoreLoad|StoreStore>
  inline static void inc    (volatile jint*     dest);
  inline static void inc    (volatile jshort*   dest);
  inline static void inc    (volatile size_t*   dest);
  inline static void inc_ptr(volatile intptr_t* dest);
  inline static void inc_ptr(volatile void*     dest);

  // Atomically decrement a location. dec*() provide:
  // <fence> decrement-dest <membar StoreLoad|StoreStore>
  inline static void dec    (volatile jint*     dest);
  inline static void dec    (volatile jshort*   dest);
  inline static void dec    (volatile size_t*   dest);
  inline static void dec_ptr(volatile intptr_t* dest);
  inline static void dec_ptr(volatile void*     dest);

  // Performs atomic exchange of *dest with exchange_value. Returns the
  // prior value of *dest. xchg*() provide:
  // <fence> exchange-value-with-dest <membar StoreLoad|StoreStore>
  inline static jint         xchg    (jint         exchange_value, volatile jint*         dest);
  inline static unsigned int xchg    (unsigned int exchange_value, volatile unsigned int* dest);
  inline static intptr_t     xchg_ptr(intptr_t     exchange_value, volatile intptr_t*     dest);
  inline static void*        xchg_ptr(void*        exchange_value, volatile void*         dest);

  // Performs atomic compare of *dest and compare_value, and exchanges
  // *dest with exchange_value if the comparison succeeded. Returns prior
  // value of *dest. cmpxchg*() provide:
  // <fence> compare-and-exchange <membar StoreLoad|StoreStore>

  template<typename T, typename D, typename U>
  inline static D cmpxchg(T exchange_value,
                          D volatile* dest,
                          U compare_value,
                          cmpxchg_memory_order order = memory_order_conservative);
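
  // Example (an illustrative sketch; "_bits" and "FLAG_BIT" are
  // hypothetical names): the usual retry loop for an arbitrary
  // read-modify-write built on cmpxchg, here setting a flag bit:
  //
  //   jint old_value = _bits;
  //   while (true) {
  //     jint new_value = old_value | FLAG_BIT;
  //     jint prev = Atomic::cmpxchg(new_value, &_bits, old_value);
  //     if (prev == old_value) break;  // exchange succeeded
  //     old_value = prev;              // lost a race; retry with the fresh value
  //   }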
  // Performs atomic compare of *dest and NULL, and replaces *dest
  // with exchange_value if the comparison succeeded. Returns true if
  // the comparison succeeded and the exchange occurred. This is
  // often used as part of lazy initialization, as a lock-free
  // alternative to the Double-Checked Locking Pattern.
  template<typename T, typename D>
  inline static bool replace_if_null(T* value, D* volatile* dest,
                                     cmpxchg_memory_order order = memory_order_conservative);

  inline static intptr_t cmpxchg_ptr(intptr_t exchange_value,
                                     volatile intptr_t* dest,
                                     intptr_t compare_value,
                                     cmpxchg_memory_order order = memory_order_conservative) {
    return cmpxchg(exchange_value, dest, compare_value, order);
  }

  inline static void* cmpxchg_ptr(void* exchange_value,
                                  volatile void* dest,
                                  void* compare_value,
                                  cmpxchg_memory_order order = memory_order_conservative) {
    return cmpxchg(exchange_value,
                   reinterpret_cast<void* volatile*>(dest),
                   compare_value,
                   order);
  }

 private:
  // Test whether From is implicitly convertible to To.
  // From and To must be pointer types.
  // Note: Provides the limited subset of C++11 std::is_convertible
  // that is needed here.
  template<typename From, typename To> struct IsPointerConvertible;

  // Dispatch handler for cmpxchg. Provides type-based validity
  // checking and limited conversions around calls to the
  // platform-specific implementation layer provided by
  // PlatformCmpxchg.
  template<typename T, typename D, typename U, typename Enable = void>
  struct CmpxchgImpl;

  // Platform-specific implementation of cmpxchg. Support for sizes
  // of 1, 4, and 8 is required. The class is a function object that
  // must be default constructible, with these requirements:
  //
  // - dest is of type T*.
  // - exchange_value and compare_value are of type T.
  // - order is of type cmpxchg_memory_order.
  // - platform_cmpxchg is an object of type PlatformCmpxchg<sizeof(T)>.
  //
  // Then
  //   platform_cmpxchg(exchange_value, dest, compare_value, order)
  // must be a valid expression, returning a result convertible to T.
  //
  // A default definition is provided, which declares a function template
  //   T operator()(T, T volatile*, T, cmpxchg_memory_order) const
  //
  // For each required size, a platform must either provide an
  // appropriate definition of that function, or must entirely
  // specialize the class template for that size.
  template<size_t byte_size> struct PlatformCmpxchg;

  // Support for platforms that implement some variants of cmpxchg
  // using a (typically out of line) non-template helper function.
  // The generic arguments passed to PlatformCmpxchg need to be
  // translated to the appropriate type for the helper function, the
  // helper invoked on the translated arguments, and the result
  // translated back. Type is the parameter / return type of the
  // helper function.
  template<typename Type, typename Fn, typename T>
  static T cmpxchg_using_helper(Fn fn,
                                T exchange_value,
                                T volatile* dest,
                                T compare_value);
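
  // Example (a sketch under assumptions: "os_atomic_cmpxchg8" is a
  // hypothetical out-of-line helper; real platform files follow this
  // shape in their os_cpu headers). A platform can define the 8-byte
  // case by delegating to such a helper:
  //
  //   template<>
  //   template<typename T>
  //   inline T Atomic::PlatformCmpxchg<8>::operator()(T exchange_value,
  //                                                   T volatile* dest,
  //                                                   T compare_value,
  //                                                   cmpxchg_memory_order order) const {
  //     STATIC_ASSERT(8 == sizeof(T));
  //     return cmpxchg_using_helper<int64_t>(os_atomic_cmpxchg8,
  //                                          exchange_value, dest, compare_value);
  //   }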
  // Support platforms that do not provide Read-Modify-Write
  // byte-level atomic access. To use, derive PlatformCmpxchg<1> from
  // this class.
 public: // Temporary, can't be private: C++03 11.4/2. Fixed by C++11.
  struct CmpxchgByteUsingInt;
 private:
};

template<typename From, typename To>
struct Atomic::IsPointerConvertible<From*, To*> : AllStatic {
  // Determine whether From* is implicitly convertible to To*, using
  // the "sizeof trick".
  typedef char yes;
  typedef char (&no)[2];

  static yes test(To*);
  static no test(...);
  static From* test_value;

  static const bool value = (sizeof(yes) == sizeof(test(test_value)));
};

// Define the class before including platform file, which may specialize
// the operator definition. No generic definition of specializations
// of the operator template is provided, nor are there any generic
// specializations of the class. The platform file is responsible for
// providing those.
template<size_t byte_size>
struct Atomic::PlatformCmpxchg VALUE_OBJ_CLASS_SPEC {
  template<typename T>
  T operator()(T exchange_value,
               T volatile* dest,
               T compare_value,
               cmpxchg_memory_order order) const;
};

// Define the class before including platform file, which may use this
// as a base class, requiring it be complete. The definition is later
// in this file, near the other definitions related to cmpxchg.
struct Atomic::CmpxchgByteUsingInt VALUE_OBJ_CLASS_SPEC {
  template<typename T>
  T operator()(T exchange_value,
               T volatile* dest,
               T compare_value,
               cmpxchg_memory_order order) const;
};

// platform specific in-line definitions - must come before shared definitions

#include OS_CPU_HEADER(atomic)

// shared in-line definitions

// size_t casts...
#if (SIZE_MAX != UINTPTR_MAX)
#error size_t is not WORD_SIZE, interesting platform, but missing implementation here
#endif

inline size_t Atomic::add(size_t add_value, volatile size_t* dest) {
  return (size_t) add_ptr((intptr_t) add_value, (volatile intptr_t*) dest);
}

inline void Atomic::inc(volatile size_t* dest) {
  inc_ptr((volatile intptr_t*) dest);
}

inline void Atomic::dec(volatile size_t* dest) {
  dec_ptr((volatile intptr_t*) dest);
}

template<typename T, typename D, typename U>
inline D Atomic::cmpxchg(T exchange_value,
                         D volatile* dest,
                         U compare_value,
                         cmpxchg_memory_order order) {
  return CmpxchgImpl<T, D, U>()(exchange_value, dest, compare_value, order);
}

template<typename T, typename D>
inline bool Atomic::replace_if_null(T* value, D* volatile* dest,
                                    cmpxchg_memory_order order) {
  // Presently using a trivial implementation in terms of cmpxchg.
  // Consider adding platform support, to permit the use of compiler
  // intrinsics like gcc's __sync_bool_compare_and_swap.
  D* expected_null = NULL;
  return expected_null == cmpxchg(value, dest, expected_null, order);
}
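
// Example (an illustrative sketch; "Foo" and "_cached_foo" are
// hypothetical names): lock-free lazy publication of a lazily-created
// object, in the style described at the replace_if_null declaration:
//
//   static Foo* volatile _cached_foo = NULL;
//
//   Foo* foo = _cached_foo;
//   if (foo == NULL) {
//     foo = new Foo();
//     if (!Atomic::replace_if_null(foo, &_cached_foo)) {
//       delete foo;            // lost the race; use the winner's object
//       foo = _cached_foo;
//     }
//   }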
// Handle cmpxchg for integral and enum types.
//
// All the involved types must be identical.
template<typename T>
struct Atomic::CmpxchgImpl<
  T, T, T,
  typename EnableIf<IsIntegral<T>::value || IsRegisteredEnum<T>::value>::type>
  VALUE_OBJ_CLASS_SPEC
{
  T operator()(T exchange_value, T volatile* dest, T compare_value,
               cmpxchg_memory_order order) const {
    // Forward to the platform handler for the size of T.
    return PlatformCmpxchg<sizeof(T)>()(exchange_value,
                                        dest,
                                        compare_value,
                                        order);
  }
};

// Handle cmpxchg for pointer types.
//
// The destination's type and the compare_value type must be the same,
// ignoring cv-qualifiers; we don't care about the cv-qualifiers of
// the compare_value.
//
// The exchange_value must be implicitly convertible to the
// destination's type; it must be type-correct to store the
// exchange_value in the destination.
template<typename T, typename D, typename U>
struct Atomic::CmpxchgImpl<
  T*, D*, U*,
  typename EnableIf<Atomic::IsPointerConvertible<T*, D*>::value &&
                    IsSame<typename RemoveCV<D>::type,
                           typename RemoveCV<U>::type>::value>::type>
  VALUE_OBJ_CLASS_SPEC
{
  D* operator()(T* exchange_value, D* volatile* dest, U* compare_value,
                cmpxchg_memory_order order) const {
    // Allow derived to base conversion, and adding cv-qualifiers.
    D* new_value = exchange_value;
    // Don't care what the CV qualifiers for compare_value are,
    // but we need to match D* when calling platform support.
    D* old_value = const_cast<D*>(compare_value);
    return PlatformCmpxchg<sizeof(D*)>()(new_value, dest, old_value, order);
  }
};

// Handle cmpxchg for types that have a translator.
//
// All the involved types must be identical.
//
// This translates the original call into a call on the decayed
// arguments, and returns the recovered result of that translated
// call.
template<typename T>
struct Atomic::CmpxchgImpl<
  T, T, T,
  typename EnableIf<PrimitiveConversions::Translate<T>::value>::type>
  VALUE_OBJ_CLASS_SPEC
{
  T operator()(T exchange_value, T volatile* dest, T compare_value,
               cmpxchg_memory_order order) const {
    typedef PrimitiveConversions::Translate<T> Translator;
    typedef typename Translator::Decayed Decayed;
    STATIC_ASSERT(sizeof(T) == sizeof(Decayed));
    return Translator::recover(
      cmpxchg(Translator::decay(exchange_value),
              reinterpret_cast<Decayed volatile*>(dest),
              Translator::decay(compare_value),
              order));
  }
};
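
// Example (a sketch under assumptions: "Ticket" is a hypothetical class
// wrapping a uint32_t): a type opts in to the translator handling above
// by specializing PrimitiveConversions::Translate, following the
// protocol described in metaprogramming/primitiveConversions.hpp:
//
//   class Ticket {
//     uint32_t _value;
//    public:
//     explicit Ticket(uint32_t value) : _value(value) {}
//     uint32_t value() const { return _value; }
//   };
//
//   template<>
//   struct PrimitiveConversions::Translate<Ticket> : public TrueType {
//     typedef Ticket Value;
//     typedef uint32_t Decayed;
//     static Decayed decay(Value x) { return x.value(); }
//     static Value recover(Decayed x) { return Ticket(x); }
//   };
//
// Atomic::cmpxchg on a Ticket then decays to a uint32_t cmpxchg and
// recovers a Ticket from the result.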
template<typename Type, typename Fn, typename T>
inline T Atomic::cmpxchg_using_helper(Fn fn,
                                      T exchange_value,
                                      T volatile* dest,
                                      T compare_value) {
  STATIC_ASSERT(sizeof(Type) == sizeof(T));
  return PrimitiveConversions::cast<T>(
    fn(PrimitiveConversions::cast<Type>(exchange_value),
       reinterpret_cast<Type volatile*>(dest),
       PrimitiveConversions::cast<Type>(compare_value)));
}

template<typename T>
inline T Atomic::CmpxchgByteUsingInt::operator()(T exchange_value,
                                                 T volatile* dest,
                                                 T compare_value,
                                                 cmpxchg_memory_order order) const {
  STATIC_ASSERT(sizeof(T) == sizeof(uint8_t));
  uint8_t canon_exchange_value = exchange_value;
  uint8_t canon_compare_value = compare_value;
  volatile uint32_t* aligned_dest
    = reinterpret_cast<volatile uint32_t*>(align_down(dest, sizeof(uint32_t)));
  size_t offset = pointer_delta(dest, aligned_dest, 1);
  uint32_t cur = *aligned_dest;
  uint8_t* cur_as_bytes = reinterpret_cast<uint8_t*>(&cur);

  // current value may not be what we are looking for, so force it
  // to that value so the initial cmpxchg will fail if it is different
  cur_as_bytes[offset] = canon_compare_value;

  // always execute a real cmpxchg so that we get the required memory
  // barriers even on initial failure
  do {
    // value to swap in matches current value ...
    uint32_t new_value = cur;
    // ... except for the one byte we want to update
    reinterpret_cast<uint8_t*>(&new_value)[offset] = canon_exchange_value;

    uint32_t res = cmpxchg(new_value, aligned_dest, cur, order);
    if (res == cur) break;      // success

    // at least one byte in the int changed value, so update
    // our view of the current int
    cur = res;
    // if our byte still matches the compare value we loop and try again
  } while (cur_as_bytes[offset] == canon_compare_value);

  return PrimitiveConversions::cast<T>(cur_as_bytes[offset]);
}

inline unsigned Atomic::xchg(unsigned int exchange_value, volatile unsigned int* dest) {
  assert(sizeof(unsigned int) == sizeof(jint), "more work to do");
  return (unsigned int)Atomic::xchg((jint)exchange_value, (volatile jint*)dest);
}

inline jshort Atomic::add(jshort add_value, volatile jshort* dest) {
  // Most platforms do not support atomic add on a 2-byte value. However,
  // if the value occupies the most significant 16 bits of an aligned 32-bit
  // word, then we can do this with an atomic add of (add_value << 16)
  // to the 32-bit word.
  //
  // The least significant parts of this 32-bit word will never be affected, even
  // in case of overflow/underflow.
  //
  // Use the ATOMIC_SHORT_PAIR macro (see macros.hpp) to get the desired
  // alignment, e.g.
  //   ATOMIC_SHORT_PAIR(volatile short _refcount, unsigned short _length);
#ifdef VM_LITTLE_ENDIAN
  assert((intx(dest) & 0x03) == 0x02, "wrong alignment");
  jint new_value = Atomic::add(add_value << 16, (volatile jint*)(dest-1));
#else
  assert((intx(dest) & 0x03) == 0x00, "wrong alignment");
  jint new_value = Atomic::add(add_value << 16, (volatile jint*)(dest));
#endif
  return (jshort)(new_value >> 16); // preserves sign
}

inline void Atomic::inc(volatile jshort* dest) {
  (void)add(1, dest);
}

inline void Atomic::dec(volatile jshort* dest) {
  (void)add(-1, dest);
}

#endif // SHARE_VM_RUNTIME_ATOMIC_HPP