1 /*
   2  * Copyright (c) 2014, 2015, Oracle and/or its affiliates. All rights reserved.
   3  * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
   4  *
   5  * This code is free software; you can redistribute it and/or modify it
   6  * under the terms of the GNU General Public License version 2 only, as
   7  * published by the Free Software Foundation.
   8  *
   9  * This code is distributed in the hope that it will be useful, but WITHOUT
  10  * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
  11  * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
  12  * version 2 for more details (a copy is included in the LICENSE file that
  13  * accompanied this code).
  14  *
  15  * You should have received a copy of the GNU General Public License version
  16  * 2 along with this work; if not, write to the Free Software Foundation,
  17  * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
  18  *
  19  * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
  20  * or visit www.oracle.com if you need additional information or have any
  21  * questions.
  22  *
  23  */
  24 
  25 #ifndef SHARE_VM_GC_G1_G1STRINGDEDUPTABLE_HPP
  26 #define SHARE_VM_GC_G1_G1STRINGDEDUPTABLE_HPP
  27 
  28 #include "gc/g1/g1StringDedupStat.hpp"
  29 #include "runtime/mutexLocker.hpp"
  30 
  31 class G1StringDedupEntryCache;
  32 class G1StringDedupUnlinkOrOopsDoClosure;
  33 
  34 //
  35 // Table entry in the deduplication hashtable. Points weakly to the
  36 // character array. Can be chained in a linked list in case of hash
  37 // collisions or when placed in a freelist in the entry cache.
  38 //
  39 class G1StringDedupEntry : public CHeapObj<mtGC> {
  40 private:
  41   // Link to the following entry when this entry is chained in a hash
  42   // bucket or placed in a freelist.
  43   G1StringDedupEntry* _next;
  44   // Hash code recorded for this entry.
  45   unsigned int        _hash;
  46   // The character array tracked by this entry. The entry only points
  47   // weakly to it.
  48   typeArrayOop        _obj;
  49 
  50 public:
  51   // Builds an unlinked entry: no successor, a zero hash code and no
  52   // character array.
  53   G1StringDedupEntry()
  54     : _next(NULL), _hash(0), _obj(NULL) {}
  55 
  56   // Current successor of this entry; NULL for a freshly constructed
  57   // entry.
  58   G1StringDedupEntry* next() { return this->_next; }
  59 
  60   // Address of the successor link itself, i.e. of the field rather
  61   // than of the entry it points to.
  62   G1StringDedupEntry** next_addr() { return &this->_next; }
  63 
  64   // Replaces the successor link.
  65   void set_next(G1StringDedupEntry* next) { this->_next = next; }
  66 
  67   // Hash code last stored with set_hash(); zero for a freshly
  68   // constructed entry.
  69   unsigned int hash() { return this->_hash; }
  70 
  71   // Overwrites the stored hash code.
  72   void set_hash(unsigned int hash) { this->_hash = hash; }
  73 
  74   // The character array currently referenced by this entry.
  75   typeArrayOop obj() { return this->_obj; }
  76 
  77   // Address of the character array reference itself, i.e. of the
  78   // field rather than of the array.
  79   typeArrayOop* obj_addr() { return &this->_obj; }
  80 
  81   // Replaces the referenced character array.
  82   void set_obj(typeArrayOop obj) { this->_obj = obj; }
  83 };
  84 
  85 //
  86 // The deduplication hashtable keeps track of all unique character arrays used
  87 // by String objects. Each table entry weakly points to a character array, allowing
  88 // otherwise unreachable character arrays to be declared dead and pruned from the
  89 // table.
  90 //
  91 // The table is dynamically resized to accommodate the current number of table entries.
  92 // The table has hash buckets with chains for hash collision. If the average chain
  93 // length goes above or below given thresholds the table grows or shrinks accordingly.
  94 //
  95 // The table is also dynamically rehashed (using a new hash seed) if it becomes severely
  96 // unbalanced, i.e., a hash chain is significantly longer than average.
  97 //
  98 // All access to the table is protected by the StringDedupTable_lock, except under
  99 // safepoints in which case GC workers are allowed to access the table partitions they
 100 // have claimed without first acquiring the lock. Note, however, that this applies only
 101 // to the table partition (i.e. a range of elements in _buckets), not other parts of the
 102 // table such as the _entries field, statistics counters, etc.
 103 //
 104 class G1StringDedupTable : public CHeapObj<mtGC> {
 105 private:
 106   // The hashtable instance that is active right now. It is only
 107   // replaced when the table gets resized or rehashed.
 108   static G1StringDedupTable* _table;
 109 
 110   // Entry cache, allowing table entries to be reused and quickly allocated/freed.
 111   static G1StringDedupEntryCache* _entry_cache;
 112 
 113   G1StringDedupEntry** _buckets;  // Bucket array, indexed through bucket()
 114   size_t _size;                   // _size - 1 is the index mask in hash_to_index()
 115   uintx _entries;
 116   uintx _shrink_threshold;
 117   uintx _grow_threshold;
 118   bool _rehash_needed;
 119 
 120   // Selects the hash function as well as seeding it: with a zero
 121   // seed the Java compatible hash function (which takes no seed)
 122   // is used, while any non-zero seed means the murmur3 hash
 123   // function is used.
 124   jint _hash_seed;
 125 
 126   // Tuning constants for resizing, rehashing and the entry cache.
 127   static const size_t _min_size;
 128   static const size_t _max_size;
 129   static const double _grow_load_factor;
 130   static const double _shrink_load_factor;
 131   static const uintx _rehash_multiple;
 132   static const uintx _rehash_threshold;
 133   static const double _max_cache_factor;
 134 
 135   // Statistics about the table. These are used for logging only.
 136   static uintx _entries_added;
 137   static uintx _entries_removed;
 138   static uintx _resize_count;
 139   static uintx _rehash_count;
 140 
 141   G1StringDedupTable(size_t size, jint hash_seed = 0);
 142   ~G1StringDedupTable();
 143 
 144   // Gives the address of the hash bucket found at the given index.
 145   G1StringDedupEntry** bucket(size_t index) {
 146     return &_buckets[index];
 147   }
 148 
 149   // Maps the given hash code to its hash bucket index.
 150   size_t hash_to_index(unsigned int hash) {
 151     return (_size - 1) & static_cast<size_t>(hash);
 152   }
 153 
 154   // Inserts a new table entry into the given hash bucket.
 155   void add(typeArrayOop value, unsigned int hash, G1StringDedupEntry** list);
 156 
 157   // Takes the given table entry out of the table.
 158   void remove(G1StringDedupEntry** pentry, uint worker_id);
 159 
 160   // Moves a table entry out of this table and into the destination table.
 161   void transfer(G1StringDedupEntry** pentry, G1StringDedupTable* dest);
 162 
 163   // Searches the given hash bucket for a matching character array and
 164   // returns it, or returns NULL when the bucket holds no match.
 165   typeArrayOop lookup(typeArrayOop value, unsigned int hash,
 166                       G1StringDedupEntry** list, uintx &count);
 167 
 168   // Looks the character array up in the table and returns the existing
 169   // match; when there is none, a new table entry is inserted instead.
 170   typeArrayOop lookup_or_add_inner(typeArrayOop value, unsigned int hash);
 171 
 172   // Lookup or add of a table entry that is safe to use from several threads
 173   static typeArrayOop lookup_or_add(typeArrayOop value, unsigned int hash) {
 174     // Guards the table against concurrent access. The lock doubles as a fence for
 175     // _table, which a resize or rehash may have replaced by a new instance.
 176     MutexLockerEx locker(StringDedupTable_lock, Mutex::_no_safepoint_check_flag);
 177     G1StringDedupTable* const active = _table;
 178     return active->lookup_or_add_inner(value, hash);
 179   }
 180 
 181   // Tells whether the Java compatible hash function is the one the
 182   // hashtable is currently using.
 183   static bool use_java_hash() {
 184     return 0 == _table->_hash_seed;
 185   }
 186 
 187   static bool equals(typeArrayOop value1, typeArrayOop value2);
 188 
 189   // Hashes the given character array with whichever hash function
 190   // and hash seed are currently active.
 191   static unsigned int hash_code(typeArrayOop value);
 192 
 193   static uintx unlink_or_oops_do(G1StringDedupUnlinkOrOopsDoClosure* cl,
 194                                  size_t partition_begin,
 195                                  size_t partition_end,
 196                                  uint worker_id);
 197 
 198 public:
 199   static void create();
 200 
 201   // Either deduplicates the given String object, or adds its backing
 202   // character array to the deduplication hashtable.
 203   static void deduplicate(oop java_string, G1StringDedupStat& stat);
 204 
 205   // When the table needs resizing, returns a freshly allocated, empty
 206   // hashtable of the proper size.
 207   static G1StringDedupTable* prepare_resize();
 208 
 209   // Makes the newly resized table the currently active table and
 210   // deletes the table that was active before.
 211   static void finish_resize(G1StringDedupTable* resized_table);
 212 
 213   // When the table needs rehashing, returns a freshly allocated, empty
 214   // hashtable and updates the hash seed.
 215   static G1StringDedupTable* prepare_rehash();
 216 
 217   // Moves the rehashed entries out of the currently active table and
 218   // into the new table, makes the new table the currently active
 219   // table and deletes the table that was active before.
 220   static void finish_rehash(G1StringDedupTable* rehashed_table);
 221 
 222   // Trims the table entry cache down according to policy if it has grown too large
 223   static void trim_entry_cache();
 224 
 225   static void unlink_or_oops_do(G1StringDedupUnlinkOrOopsDoClosure* cl, uint worker_id);
 226 
 227   static void print_statistics();
 228   static void verify();
 229 };
 230 
 231 #endif // SHARE_VM_GC_G1_G1STRINGDEDUPTABLE_HPP