src/share/vm/classfile/symbolTable.hpp

Mon, 25 Jun 2012 21:33:35 -0400

author
coleenp
date
Mon, 25 Jun 2012 21:33:35 -0400
changeset 3875
246d977b51f2
parent 3865
e9140bf80b4a
child 3900
d2a62e0f25eb
permissions
-rw-r--r--

7178670: runtime/7158800/BadUtf8.java fails in SymbolTable::rehash_table
Summary: Cannot delete _buckets and HashtableEntries in shared space (CDS)
Reviewed-by: acorn, kvn, dlong, dcubed, kamg

duke@435 1 /*
coleenp@3682 2 * Copyright (c) 1997, 2012, Oracle and/or its affiliates. All rights reserved.
duke@435 3 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
duke@435 4 *
duke@435 5 * This code is free software; you can redistribute it and/or modify it
duke@435 6 * under the terms of the GNU General Public License version 2 only, as
duke@435 7 * published by the Free Software Foundation.
duke@435 8 *
duke@435 9 * This code is distributed in the hope that it will be useful, but WITHOUT
duke@435 10 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
duke@435 11 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
duke@435 12 * version 2 for more details (a copy is included in the LICENSE file that
duke@435 13 * accompanied this code).
duke@435 14 *
duke@435 15 * You should have received a copy of the GNU General Public License version
duke@435 16 * 2 along with this work; if not, write to the Free Software Foundation,
duke@435 17 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
duke@435 18 *
trims@1907 19 * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
trims@1907 20 * or visit www.oracle.com if you need additional information or have any
trims@1907 21 * questions.
duke@435 22 *
duke@435 23 */
duke@435 24
stefank@2314 25 #ifndef SHARE_VM_CLASSFILE_SYMBOLTABLE_HPP
stefank@2314 26 #define SHARE_VM_CLASSFILE_SYMBOLTABLE_HPP
stefank@2314 27
stefank@2314 28 #include "memory/allocation.inline.hpp"
coleenp@2497 29 #include "oops/symbol.hpp"
stefank@2314 30 #include "utilities/hashtable.hpp"
stefank@2314 31
coleenp@2497 32 // The symbol table holds all Symbol*s and corresponding interned strings.
coleenp@2497 33 // Symbol*s and literal strings should be canonicalized.
duke@435 34 //
duke@435 35 // The interned strings are created lazily.
duke@435 36 //
duke@435 37 // It is implemented as an open hash table with a fixed number of buckets.
duke@435 38 //
duke@435 39 // %note:
duke@435 40 // - symbolTableEntrys are allocated in blocks to reduce the space overhead.
duke@435 41
duke@435 42 class BoolObjectClosure;
coleenp@3865 43 class outputStream;
duke@435 44
duke@435 45
coleenp@2497 46 // Class to hold a newly created or referenced Symbol* temporarily in scope.
coleenp@2497 47 // new_symbol() and lookup() will create a Symbol* if not already in the
coleenp@2497 48 // symbol table and add to the symbol's reference count.
coleenp@2497 49 // probe() and lookup_only() will increment the refcount if symbol is found.
coleenp@2497 50 class TempNewSymbol : public StackObj {
coleenp@2497 51 Symbol* _temp;
coleenp@2497 52
coleenp@2497 53 public:
coleenp@2497 54 TempNewSymbol() : _temp(NULL) {}
coleenp@2497 55 // Creating or looking up a symbol increments the symbol's reference count
coleenp@2497 56 TempNewSymbol(Symbol *s) : _temp(s) {}
coleenp@2497 57
coleenp@2497 58 // Operator= increments reference count.
coleenp@2497 59 void operator=(const TempNewSymbol &s) {
coleenp@2497 60 _temp = s._temp;
coleenp@2497 61 if (_temp !=NULL) _temp->increment_refcount();
coleenp@2497 62 }
coleenp@2497 63
coleenp@2497 64 // Decrement reference counter so it can go away if it's unique
coleenp@2497 65 ~TempNewSymbol() { if (_temp != NULL) _temp->decrement_refcount(); }
coleenp@2497 66
coleenp@2497 67 // Operators so they can be used like Symbols
coleenp@2497 68 Symbol* operator -> () const { return _temp; }
coleenp@2497 69 bool operator == (Symbol* o) const { return _temp == o; }
coleenp@2497 70 // Sneaky conversion function
coleenp@2497 71 operator Symbol*() { return _temp; }
coleenp@2497 72 };
coleenp@2497 73
// Hashtable of Symbol* with a static facade: the public entry points are
// static and the private constructors are only used by create_table().
coleenp@2497 74 class SymbolTable : public Hashtable<Symbol*> {
duke@435 75 friend class VMStructs;
coleenp@2497 76 friend class ClassFileParser;
duke@435 77
duke@435 78 private:
duke@435 79 // The symbol table instance; create_table() asserts it is still NULL before setting it
duke@435 80 static SymbolTable* _the_table;
duke@435 81
coleenp@3865 82 // Set if one bucket is out of balance due to hash algorithm deficiency
coleenp@3865 83 static bool _needs_rehashing;
// A non-zero seed means the alternate hashcode is in use
// (see use_alternate_hashcode() below).
coleenp@3865 84 static jint _seed;
coleenp@3865 85
coleenp@2497 86 // For statistics
coleenp@2497 87 static int symbols_removed;
coleenp@2497 88 static int symbols_counted;
coleenp@2497 89
coleenp@3682 90 Symbol* allocate_symbol(const u1* name, int len, bool c_heap, TRAPS); // Assumes no characters larger than 0x7F
coleenp@2497 91
duke@435 92 // Adding elements
coleenp@3682 93 Symbol* basic_add(int index, u1* name, int len, unsigned int hashValue,
coleenp@3682 94 bool c_heap, TRAPS);
coleenp@3682 95
coleenp@3682 96 bool basic_add(Handle class_loader, constantPoolHandle cp, int names_count,
duke@435 97 const char** names, int* lengths, int* cp_indices,
duke@435 98 unsigned int* hashValues, TRAPS);
duke@435 99
// Private wrapper that forwards every argument unchanged to the public add();
// being private, it is reachable only from members and the friend classes
// declared above.
coleenp@3682 100 static void new_symbols(Handle class_loader, constantPoolHandle cp,
coleenp@3682 101 int names_count,
coleenp@2497 102 const char** name, int* lengths,
coleenp@2497 103 int* cp_indices, unsigned int* hashValues,
coleenp@2497 104 TRAPS) {
coleenp@3682 105 add(class_loader, cp, names_count, name, lengths, cp_indices, hashValues, THREAD);
coleenp@2497 106 }
coleenp@2497 107
duke@435 108 // Table size: passed to the Hashtable constructor and checked against the shared table length in create_table()
duke@435 109 enum {
duke@435 110 symbol_table_size = 20011
duke@435 111 };
duke@435 112
// NOTE(review): presumably searches the bucket selected by 'index' for a
// symbol matching name/len/hash -- confirm against symbolTable.cpp.
coleenp@2497 113 Symbol* lookup(int index, const char* name, int len, unsigned int hash);
duke@435 114
// Constructs a table of symbol_table_size buckets.
duke@435 115 SymbolTable()
coleenp@2497 116 : Hashtable<Symbol*>(symbol_table_size, sizeof (HashtableEntry<Symbol*>)) {}
duke@435 117
// Constructs a table over the caller-supplied buckets 't'; used by
// create_table(t, length, number_of_entries).
duke@435 118 SymbolTable(HashtableBucket* t, int number_of_entries)
coleenp@2497 119 : Hashtable<Symbol*>(symbol_table_size, sizeof (HashtableEntry<Symbol*>), t,
duke@435 120 number_of_entries) {}
duke@435 121
coleenp@3682 122 // Arena for permanent symbols (null class loader) that are never unloaded
coleenp@3682 123 static Arena* _arena;
coleenp@3682 124 static Arena* arena() { return _arena; } // called for statistics
duke@435 125
// Called from both create_table() overloads; an argument of 0 (the default)
// is used for the CDS case.
coleenp@3682 126 static void initialize_symbols(int arena_alloc_size = 0);
coleenp@3865 127
// True once a non-zero seed has been installed.
coleenp@3865 128 static bool use_alternate_hashcode() { return _seed != 0; }
coleenp@3865 129 static jint seed() { return _seed; }
coleenp@3865 130
coleenp@3865 131 unsigned int new_hash(Symbol* sym);
duke@435 132 public:
duke@435 133 enum {
coleenp@3682 134 symbol_alloc_batch_size = 8,
coleenp@3682 135 // Pick initial size based on java -version size measurements
coleenp@3682 136 symbol_alloc_arena_size = 360*K
duke@435 137 };
duke@435 138
duke@435 139 // Accessor for the symbol table instance
duke@435 140 static SymbolTable* the_table() { return _the_table; }
duke@435 141
// Creates the one symbol table and initializes symbol allocation with
// symbol_alloc_arena_size. Asserts that no table has been created yet.
duke@435 142 static void create_table() {
duke@435 143 assert(_the_table == NULL, "One symbol table allowed.");
duke@435 144 _the_table = new SymbolTable();
coleenp@3682 145 initialize_symbols(symbol_alloc_arena_size);
duke@435 146 }
duke@435 147
// Creates the one symbol table over the existing buckets 't'. 'length' is
// the size of that bucket array in bytes and must equal
// symbol_table_size * sizeof(HashtableBucket).
duke@435 148 static void create_table(HashtableBucket* t, int length,
duke@435 149 int number_of_entries) {
duke@435 150 assert(_the_table == NULL, "One symbol table allowed.");
duke@435 151 assert(length == symbol_table_size * sizeof(HashtableBucket),
duke@435 152 "bad shared symbol size.");
duke@435 153 _the_table = new SymbolTable(t, number_of_entries);
coleenp@3682 154 // if CDS give symbol table a default arena size since most symbols
coleenp@3682 155 // are already allocated in the shared misc section.
coleenp@3682 156 initialize_symbols();
duke@435 157 }
duke@435 158
// Hash code for the name 's' of length 'len'.
coleenp@3875 159 static unsigned int hash_symbol(const char* s, int len);
coleenp@3865 160
coleenp@2497 161 static Symbol* lookup(const char* name, int len, TRAPS);
duke@435 162 // lookup only, won't add. Also calculate hash.
coleenp@2497 163 static Symbol* lookup_only(const char* name, int len, unsigned int& hash);
duke@435 164 // Only copy to C string to be added if lookup failed.
coleenp@2497 165 static Symbol* lookup(const Symbol* sym, int begin, int end, TRAPS);
coleenp@2497 166
coleenp@2497 167 static void release(Symbol* sym);
duke@435 168
phh@3427 169 // Look up the address of the literal in the SymbolTable for this Symbol*
phh@3427 170 static Symbol** lookup_symbol_addr(Symbol* sym);
phh@3427 171
jrose@1100 172 // jchar (utf16) version of lookups
coleenp@2497 173 static Symbol* lookup_unicode(const jchar* name, int len, TRAPS);
coleenp@2497 174 static Symbol* lookup_only_unicode(const jchar* name, int len, unsigned int& hash);
jrose@1100 175
coleenp@3682 176 static void add(Handle class_loader, constantPoolHandle cp, int names_count,
duke@435 177 const char** names, int* lengths, int* cp_indices,
duke@435 178 unsigned int* hashValues, TRAPS);
duke@435 179
coleenp@2497 180 // Release any dead symbols
coleenp@2497 181 static void unlink();
coleenp@2497 182
coleenp@2497 183 // iterate over symbols
coleenp@2497 184 static void symbols_do(SymbolClosure *cl);
coleenp@2497 185
coleenp@2497 186 // Symbol creation: the overloads below are thin wrappers around lookup()
coleenp@2497 187 static Symbol* new_symbol(const char* utf8_buffer, int length, TRAPS) {
coleenp@2497 188 assert(utf8_buffer != NULL, "just checking");
coleenp@2497 189 return lookup(utf8_buffer, length, THREAD);
duke@435 190 }
// 'name' must be NUL-terminated: its length is taken with strlen().
coleenp@2497 191 static Symbol* new_symbol(const char* name, TRAPS) {
coleenp@2497 192 return new_symbol(name, (int)strlen(name), THREAD);
coleenp@2497 193 }
// Requires begin <= end <= sym->utf8_length() (asserted).
coleenp@2497 194 static Symbol* new_symbol(const Symbol* sym, int begin, int end, TRAPS) {
coleenp@2497 195 assert(begin <= end && end <= sym->utf8_length(), "just checking");
coleenp@2497 196 return lookup(sym, begin, end, THREAD);
duke@435 197 }
duke@435 198
coleenp@3682 199 // Create a symbol in the arena for symbols that are not deleted
coleenp@3682 200 static Symbol* new_permanent_symbol(const char* name, TRAPS);
coleenp@3682 201
duke@435 202 // Symbol lookup
coleenp@2497 203 static Symbol* lookup(int index, const char* name, int len, TRAPS);
duke@435 204
duke@435 205 // Needed for preloading classes in signatures when compiling.
duke@435 206 // Returns the symbol if it is already present in the symbol table,
duke@435 207 // otherwise NULL. NO ALLOCATION IS GUARANTEED!
// Both probes delegate to the lookup_only variants and discard the hash.
coleenp@2497 208 static Symbol* probe(const char* name, int len) {
jrose@1100 209 unsigned int ignore_hash;
jrose@1100 210 return lookup_only(name, len, ignore_hash);
jrose@1100 211 }
coleenp@2497 212 static Symbol* probe_unicode(const jchar* name, int len) {
jrose@1100 213 unsigned int ignore_hash;
jrose@1100 214 return lookup_only_unicode(name, len, ignore_hash);
jrose@1100 215 }
duke@435 216
duke@435 217 // Histogram
duke@435 218 static void print_histogram() PRODUCT_RETURN;
coleenp@2497 219 static void print() PRODUCT_RETURN;
duke@435 220
duke@435 221 // Debugging
duke@435 222 static void verify();
coleenp@3865 223 static void dump(outputStream* st);
duke@435 224
duke@435 225 // Sharing: static forwarders to the Hashtable<Symbol*> implementation on the_table()
duke@435 226 static void copy_buckets(char** top, char*end) {
coleenp@2497 227 the_table()->Hashtable<Symbol*>::copy_buckets(top, end);
duke@435 228 }
duke@435 229 static void copy_table(char** top, char*end) {
coleenp@2497 230 the_table()->Hashtable<Symbol*>::copy_table(top, end);
duke@435 231 }
duke@435 232 static void reverse(void* boundary = NULL) {
coleenp@2497 233 the_table()->Hashtable<Symbol*>::reverse(boundary);
duke@435 234 }
coleenp@3865 235
coleenp@3865 236 // Rehash the symbol table if it gets out of balance
coleenp@3865 237 static void rehash_table();
coleenp@3865 238 static bool needs_rehashing() { return _needs_rehashing; }
duke@435 239 };
duke@435 240
coleenp@3865 241
// Hashtable of oop with a static facade: the public entry points are static
// and the private constructors are only used by create_table().
coleenp@2497 242 class StringTable : public Hashtable<oop> {
duke@435 243 friend class VMStructs;
duke@435 244
duke@435 245 private:
duke@435 246 // The string table instance; create_table() asserts it is still NULL before setting it
duke@435 247 static StringTable* _the_table;
duke@435 248
coleenp@3865 249 // Set if one bucket is out of balance due to hash algorithm deficiency
coleenp@3865 250 static bool _needs_rehashing;
// A non-zero seed means the alternate hashcode is in use
// (see use_alternate_hashcode() below).
coleenp@3865 251 static jint _seed;
coleenp@3865 252
// NOTE(review): presumably the shared implementation behind the public
// intern() overloads -- confirm against symbolTable.cpp.
duke@435 253 static oop intern(Handle string_or_null, jchar* chars, int length, TRAPS);
duke@435 254 oop basic_add(int index, Handle string_or_null, jchar* name, int len,
duke@435 255 unsigned int hashValue, TRAPS);
duke@435 256
duke@435 257 oop lookup(int index, jchar* chars, int length, unsigned int hashValue);
duke@435 258
// Constructs a table sized by StringTableSize (narrowed to int for the
// Hashtable constructor).
jcoomes@2660 259 StringTable() : Hashtable<oop>((int)StringTableSize,
jcoomes@2660 260 sizeof (HashtableEntry<oop>)) {}
duke@435 261
// Constructs a table over the caller-supplied buckets 't'; used by
// create_table(t, length, number_of_entries).
duke@435 262 StringTable(HashtableBucket* t, int number_of_entries)
jcoomes@2660 263 : Hashtable<oop>((int)StringTableSize, sizeof (HashtableEntry<oop>), t,
jcoomes@2660 264 number_of_entries) {}
duke@435 265
// True once a non-zero seed has been installed.
coleenp@3865 266 static bool use_alternate_hashcode() { return _seed != 0; }
coleenp@3865 267 static jint seed() { return _seed; }
coleenp@3865 268
coleenp@3865 269 unsigned int new_hash(oop s);
duke@435 270 public:
duke@435 271 // Accessor for the string table instance
duke@435 272 static StringTable* the_table() { return _the_table; }
duke@435 273
// Creates the one string table. Asserts that no table has been created yet.
duke@435 274 static void create_table() {
duke@435 275 assert(_the_table == NULL, "One string table allowed.");
duke@435 276 _the_table = new StringTable();
duke@435 277 }
duke@435 278
// Creates the one string table over the existing buckets 't'. 'length' is
// the size of that bucket array in bytes and must equal
// StringTableSize * sizeof(HashtableBucket).
duke@435 279 static void create_table(HashtableBucket* t, int length,
duke@435 280 int number_of_entries) {
duke@435 281 assert(_the_table == NULL, "One string table allowed.");
jcoomes@2660 282 assert((size_t)length == StringTableSize * sizeof(HashtableBucket),
duke@435 283 "bad shared string size.");
duke@435 284 _the_table = new StringTable(t, number_of_entries);
duke@435 285 }
duke@435 286
duke@435 287 // GC support
duke@435 288 // Delete pointers to otherwise-unreachable objects.
coleenp@2497 289 static void unlink(BoolObjectClosure* cl);
duke@435 290
duke@435 291 // Invoke "f->do_oop" on the locations of all oops in the table.
coleenp@2497 292 static void oops_do(OopClosure* f);
duke@435 293
coleenp@3865 294 // Hashing algorithm, used as the hash value used by the
coleenp@3865 295 // StringTable for bucket selection and comparison (stored in the
coleenp@3865 296 // HashtableEntry structures). This is used in the String.intern() method.
coleenp@3875 297 static unsigned int hash_string(const jchar* s, int len);
coleenp@3865 298
coleenp@3865 299 // Internal test.
coleenp@3865 300 static void test_alt_hash() PRODUCT_RETURN;
coleenp@3865 301
duke@435 302 // Probing
coleenp@2497 303 static oop lookup(Symbol* symbol);
duke@435 304
duke@435 305 // Interning
coleenp@2497 306 static oop intern(Symbol* symbol, TRAPS);
duke@435 307 static oop intern(oop string, TRAPS);
duke@435 308 static oop intern(const char *utf8_string, TRAPS);
duke@435 309
duke@435 310 // Debugging
duke@435 311 static void verify();
coleenp@3865 312 static void dump(outputStream* st);
duke@435 313
duke@435 314 // Sharing: static forwarders to the Hashtable<oop> implementation on the_table()
duke@435 315 static void copy_buckets(char** top, char*end) {
coleenp@2497 316 the_table()->Hashtable<oop>::copy_buckets(top, end);
duke@435 317 }
duke@435 318 static void copy_table(char** top, char*end) {
coleenp@2497 319 the_table()->Hashtable<oop>::copy_table(top, end);
duke@435 320 }
duke@435 321 static void reverse() {
coleenp@2497 322 the_table()->Hashtable<oop>::reverse();
duke@435 323 }
coleenp@3865 324
coleenp@3865 325 // Rehash the string table if it gets out of balance
coleenp@3865 326 static void rehash_table();
coleenp@3865 327 static bool needs_rehashing() { return _needs_rehashing; }
duke@435 328 };
stefank@2314 329 #endif // SHARE_VM_CLASSFILE_SYMBOLTABLE_HPP

mercurial