/*
 * Copyright (c) 2001, 2019, Oracle and/or its affiliates. All rights reserved.
 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
 *
 * This code is free software; you can redistribute it and/or modify it
 * under the terms of the GNU General Public License version 2 only, as
 * published by the Free Software Foundation.
 *
 * This code is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
 * version 2 for more details (a copy is included in the LICENSE file that
 * accompanied this code).
 *
 * You should have received a copy of the GNU General Public License version
 * 2 along with this work; if not, write to the Free Software Foundation,
 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
 *
 * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
 * or visit www.oracle.com if you need additional information or have any
 * questions.
 *
 */

#ifndef SHARE_GC_SHARED_PTRQUEUE_HPP
#define SHARE_GC_SHARED_PTRQUEUE_HPP

#include "memory/padded.hpp"
#include "utilities/align.hpp"
#include "utilities/debug.hpp"
#include "utilities/lockFreeStack.hpp"
#include "utilities/sizes.hpp"

class Mutex;
class Monitor;

// There are various techniques that require threads to be able to log
// addresses. For example, a generational write barrier might log
// the addresses of modified old-generation objects. This type supports
// this operation.

class BufferNode;
class PtrQueueSet;
class PtrQueue {
  friend class VMStructs;

  // Noncopyable - not defined.
  PtrQueue(const PtrQueue&);
  PtrQueue& operator=(const PtrQueue&);

  // The ptr queue set to which this queue belongs.
  PtrQueueSet* const _qset;

  // Whether updates should be logged.
  bool _active;

  // The (byte) index at which an object was last enqueued. Starts at
  // capacity_in_bytes (indicating an empty buffer) and goes towards zero.
  // Value is always pointer-size aligned.
  size_t _index;

  // Size of the current buffer, in bytes.
  // Value is always pointer-size aligned.
  size_t _capacity_in_bytes;

  static const size_t _element_size = sizeof(void*);

  // Get the capacity, in bytes. The capacity must have been set.
  size_t capacity_in_bytes() const {
    assert(_capacity_in_bytes > 0, "capacity not set");
    return _capacity_in_bytes;
  }

  void set_capacity(size_t entries) {
    size_t byte_capacity = index_to_byte_index(entries);
    assert(_capacity_in_bytes == 0 || _capacity_in_bytes == byte_capacity,
           "changing capacity " SIZE_FORMAT " -> " SIZE_FORMAT,
           _capacity_in_bytes, byte_capacity);
    _capacity_in_bytes = byte_capacity;
  }

  static size_t byte_index_to_index(size_t ind) {
    assert(is_aligned(ind, _element_size), "precondition");
    return ind / _element_size;
  }

  static size_t index_to_byte_index(size_t ind) {
    return ind * _element_size;
  }

protected:
  // The buffer.
  void** _buf;

  size_t index() const {
    return byte_index_to_index(_index);
  }

  void set_index(size_t new_index) {
    size_t byte_index = index_to_byte_index(new_index);
    assert(byte_index <= capacity_in_bytes(), "precondition");
    _index = byte_index;
  }

  size_t capacity() const {
    return byte_index_to_index(capacity_in_bytes());
  }

  PtrQueueSet* qset() { return _qset; }

  // Process queue entries and release resources.
  void flush_impl();

  // Initialize this queue to contain a null buffer, and be part of the
  // given PtrQueueSet.
  PtrQueue(PtrQueueSet* qset, bool active = false);

  // Requires queue flushed.
  ~PtrQueue();

public:

  // Forcibly set empty.
  void reset() {
    if (_buf != NULL) {
      _index = capacity_in_bytes();
    }
  }

  void enqueue(volatile void* ptr) {
    enqueue((void*)(ptr));
  }

  // Enqueues the given "ptr".
  void enqueue(void* ptr) {
    if (!_active) return;
    else enqueue_known_active(ptr);
  }

  // This method is called when we're doing the zero index handling
  // and gives the queue a chance to do any pre-enqueueing
  // processing it might want to do on the buffer. It should return
  // true if the buffer should be enqueued, or false if enough
  // entries were cleared from it so that it can be re-used. It should
  // not return false if the buffer is still full (otherwise we can
  // get into an infinite loop).
  virtual bool should_enqueue_buffer() { return true; }
  void handle_zero_index();

  void enqueue_known_active(void* ptr);

  // Return the size of the in-use region.
  size_t size() const {
    size_t result = 0;
    if (_buf != NULL) {
      assert(_index <= capacity_in_bytes(), "Invariant");
      result = byte_index_to_index(capacity_in_bytes() - _index);
    }
    return result;
  }

  bool is_empty() const {
    return _buf == NULL || capacity_in_bytes() == _index;
  }

  // Set the "active" property of the queue to "b". An enqueue to an
  // inactive queue is a no-op. Setting a queue to inactive resets its
  // log to the empty state.
  void set_active(bool b) {
    _active = b;
    if (!b && _buf != NULL) {
      reset();
    } else if (b && _buf != NULL) {
      assert(index() == capacity(),
             "invariant: queues are empty when activated.");
    }
  }

  bool is_active() const { return _active; }

  // Support for the JIT compiler: offsets and widths of the fields
  // accessed by compiler-generated barrier code.

protected:
  template<typename Derived>
  static ByteSize byte_offset_of_index() {
    return byte_offset_of(Derived, _index);
  }

  static ByteSize byte_width_of_index() { return in_ByteSize(sizeof(size_t)); }

  template<typename Derived>
  static ByteSize byte_offset_of_buf() {
    return byte_offset_of(Derived, _buf);
  }

  static ByteSize byte_width_of_buf() { return in_ByteSize(_element_size); }

  template<typename Derived>
  static ByteSize byte_offset_of_active() {
    return byte_offset_of(Derived, _active);
  }

  static ByteSize byte_width_of_active() { return in_ByteSize(sizeof(bool)); }

};
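
// Illustrative sketch only, not part of this header: a client queue is
// typically a thin PtrQueue subclass constructed against a shared set.
// MyQueue and my_qset are hypothetical names.
//
//   class MyQueue : public PtrQueue {
//   public:
//     MyQueue(PtrQueueSet* qset) : PtrQueue(qset, true /* active */) { }
//   };
//
//   MyQueue q(my_qset);
//   q.enqueue(addr);  // No-op while the queue is inactive; otherwise
//                     // stores addr into _buf at the decreasing _index,
//                     // and calls handle_zero_index() once the buffer
//                     // fills (index reaches zero).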

class BufferNode {
  size_t _index;
  BufferNode* volatile _next;
  void* _buffer[1]; // Pseudo flexible array member.

  BufferNode() : _index(0), _next(NULL) { }
  ~BufferNode() { }

  static size_t buffer_offset() {
    return offset_of(BufferNode, _buffer);
  }

  static BufferNode* volatile* next_ptr(BufferNode& bn) { return &bn._next; }

AIX_ONLY(public:)               // xlC 12 on AIX doesn't implement C++ DR45.
  // Allocate a new BufferNode with the "buffer" having size elements.
  static BufferNode* allocate(size_t size);

  // Free a BufferNode.
  static void deallocate(BufferNode* node);

public:
  typedef LockFreeStack<BufferNode, &next_ptr> Stack;

  BufferNode* next() const { return _next; }
  void set_next(BufferNode* n) { _next = n; }
  size_t index() const { return _index; }
  void set_index(size_t i) { _index = i; }

  // Return the BufferNode containing the buffer, after setting its index.
  static BufferNode* make_node_from_buffer(void** buffer, size_t index) {
    BufferNode* node =
      reinterpret_cast<BufferNode*>(
        reinterpret_cast<char*>(buffer) - buffer_offset());
    node->set_index(index);
    return node;
  }

  // Return the buffer for node.
  static void** make_buffer_from_node(BufferNode *node) {
    // &_buffer[0] might lead to index out of bounds warnings.
    return reinterpret_cast<void**>(
      reinterpret_cast<char*>(node) + buffer_offset());
  }

  class Allocator; // Free-list based allocator.
  class TestSupport; // Unit test support.
};
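
// Illustrative sketch only: because the node header and its buffer share
// a single allocation, converting between them is pure pointer arithmetic,
// so the following round trip (for a node obtained from the allocator, and
// some valid index i) is an identity:
//
//   void** buf = BufferNode::make_buffer_from_node(node);
//   BufferNode* same = BufferNode::make_node_from_buffer(buf, i);
//   assert(same == node, "conversions must round-trip");
//   assert(node->index() == i, "make_node_from_buffer sets the index");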

// Allocation is based on a lock-free free list of nodes, linked through
// BufferNode::_next (see BufferNode::Stack). To solve the ABA problem,
// popping a node from the free list is performed within a GlobalCounter
// critical section, and pushing nodes onto the free list is done after
// a GlobalCounter synchronization associated with the nodes to be pushed.
// This is documented behavior so that other parts of the node life-cycle
// can depend on and make use of it too.
class BufferNode::Allocator {
  friend class TestSupport;

  // Since we don't expect many instances, and measured >15% speedup
  // on stress gtest, padding seems like a good tradeoff here.
#define DECLARE_PADDED_MEMBER(Id, Type, Name) \
  Type Name; DEFINE_PAD_MINUS_SIZE(Id, DEFAULT_CACHE_LINE_SIZE, sizeof(Type))

  const size_t _buffer_size;
  char _name[DEFAULT_CACHE_LINE_SIZE - sizeof(size_t)]; // Use name as padding.
  DECLARE_PADDED_MEMBER(1, Stack, _pending_list);
  DECLARE_PADDED_MEMBER(2, Stack, _free_list);
  DECLARE_PADDED_MEMBER(3, volatile size_t, _pending_count);
  DECLARE_PADDED_MEMBER(4, volatile size_t, _free_count);
  DECLARE_PADDED_MEMBER(5, volatile bool, _transfer_lock);

#undef DECLARE_PADDED_MEMBER

  void delete_list(BufferNode* list);
  bool try_transfer_pending();

public:
  Allocator(const char* name, size_t buffer_size);
  ~Allocator();

  const char* name() const { return _name; }
  size_t buffer_size() const { return _buffer_size; }
  size_t free_count() const;
  BufferNode* allocate();
  void release(BufferNode* node);

  // Deallocate some of the available buffers. remove_goal is the target
  // number to remove. Returns the number actually deallocated, which may
  // be less than the goal if there were fewer available.
  size_t reduce_free_list(size_t remove_goal);
};
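
// Illustrative usage sketch only (names are hypothetical): an Allocator is
// normally a long-lived object shared by one queue set.
//
//   static BufferNode::Allocator buffer_allocator("My Buffer Allocator", 1024);
//
//   BufferNode* node = buffer_allocator.allocate(); // Reuses a node from
//                                                   // _free_list if one is
//                                                   // available.
//   // ... fill the node's buffer, process it, then return it:
//   buffer_allocator.release(node); // Pushed onto _pending_list; moved to
//                                   // _free_list only after the required
//                                   // GlobalCounter synchronization.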
// A PtrQueueSet represents resources common to a set of pointer queues.
// In particular, the individual queues allocate buffers from this shared
// set, and return completed buffers to the set.
class PtrQueueSet {
  BufferNode::Allocator* _allocator;

  Monitor* _cbl_mon; // Protects the fields below.
  BufferNode* _completed_buffers_head;
  BufferNode* _completed_buffers_tail;
  size_t _n_completed_buffers;

  size_t _process_completed_buffers_threshold;
  volatile bool _process_completed_buffers;

  // If true, notify_all on _cbl_mon when the threshold is reached.
  bool _notify_when_complete;

  // Maximum number of elements allowed on completed queue: after that,
  // enqueuer does the work itself.
  size_t _max_completed_buffers;
  size_t _completed_buffers_padding;

  void assert_completed_buffers_list_len_correct_locked() NOT_DEBUG_RETURN;

protected:
  bool _all_active;

  // A mutator thread does the work of processing a buffer.
  // Returns "true" iff the work is complete (and the buffer may be
  // deallocated).
  virtual bool mut_process_buffer(BufferNode* node) {
    ShouldNotReachHere();
    return false;
  }

  // Create an empty ptr queue set.
  PtrQueueSet(bool notify_when_complete = false);
  ~PtrQueueSet();

  // Because of init-order concerns, we can't pass these as constructor
  // arguments.
  void initialize(Monitor* cbl_mon, BufferNode::Allocator* allocator);

  // For (unlocked!) iteration over the completed buffers.
  BufferNode* completed_buffers_head() const { return _completed_buffers_head; }

  // Deallocate all of the completed buffers.
  void abandon_completed_buffers();

public:

  // Return the buffer for a BufferNode of size buffer_size().
  void** allocate_buffer();

  // Return an empty buffer to the free list. The node is required
  // to have been allocated with a size of buffer_size().
  void deallocate_buffer(BufferNode* node);

  // A completed buffer is a buffer the mutator is finished with, and
  // is ready to be processed by the collector. It need not be full.

  // Adds node to the completed buffer list.
  void enqueue_completed_buffer(BufferNode* node);

  // If the number of completed buffers is > stop_at, then remove and
  // return a completed buffer from the list. Otherwise, return NULL.
  BufferNode* get_completed_buffer(size_t stop_at = 0);

  // To be invoked by the mutator.
  bool process_or_enqueue_completed_buffer(BufferNode* node);

  bool process_completed_buffers() { return _process_completed_buffers; }
  void set_process_completed_buffers(bool x) { _process_completed_buffers = x; }

  bool is_active() { return _all_active; }

  size_t buffer_size() const {
    return _allocator->buffer_size();
  }

  // Get/Set the number of completed buffers that triggers log processing.
  // Log processing should be done when the number of buffers exceeds the
  // threshold.
  void set_process_completed_buffers_threshold(size_t sz) {
    _process_completed_buffers_threshold = sz;
  }
  size_t process_completed_buffers_threshold() const {
    return _process_completed_buffers_threshold;
  }
  static const size_t ProcessCompletedBuffersThresholdNever = ~size_t(0);

  size_t completed_buffers_num() const { return _n_completed_buffers; }

  void merge_bufferlists(PtrQueueSet* src);

  void set_max_completed_buffers(size_t m) {
    _max_completed_buffers = m;
  }
  size_t max_completed_buffers() const {
    return _max_completed_buffers;
  }
  static const size_t MaxCompletedBuffersUnlimited = ~size_t(0);

  void set_completed_buffers_padding(size_t padding) {
    _completed_buffers_padding = padding;
  }
  size_t completed_buffers_padding() const {
    return _completed_buffers_padding;
  }

  // Notify the consumer if the number of buffers has crossed the threshold.
  void notify_if_necessary();
};
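
// Illustrative lifecycle sketch only; the hand-off below is a plausible
// shape for the enqueue side, not a quote of the implementation. When a
// queue's buffer fills, the mutator wraps it in its BufferNode and offers
// it to the set:
//
//   BufferNode* node = BufferNode::make_node_from_buffer(_buf, index());
//   if (qset()->process_or_enqueue_completed_buffer(node)) {
//     reset(); // The mutator processed the buffer itself; reuse it.
//   } else {
//     // node is now on the completed-buffer list; a collector thread
//     // claims it later via get_completed_buffer().
//   }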

#endif // SHARE_GC_SHARED_PTRQUEUE_HPP