src/share/vm/classfile/symbolTable.cpp

Sat, 01 Dec 2007 00:00:00 +0000

author
duke
date
Sat, 01 Dec 2007 00:00:00 +0000
changeset 435
a61af66fc99e
child 1040
98cb887364d3
permissions
-rw-r--r--

Initial load

duke@435 1 /*
duke@435 2 * Copyright 1997-2006 Sun Microsystems, Inc. All Rights Reserved.
duke@435 3 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
duke@435 4 *
duke@435 5 * This code is free software; you can redistribute it and/or modify it
duke@435 6 * under the terms of the GNU General Public License version 2 only, as
duke@435 7 * published by the Free Software Foundation.
duke@435 8 *
duke@435 9 * This code is distributed in the hope that it will be useful, but WITHOUT
duke@435 10 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
duke@435 11 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
duke@435 12 * version 2 for more details (a copy is included in the LICENSE file that
duke@435 13 * accompanied this code).
duke@435 14 *
duke@435 15 * You should have received a copy of the GNU General Public License version
duke@435 16 * 2 along with this work; if not, write to the Free Software Foundation,
duke@435 17 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
duke@435 18 *
duke@435 19 * Please contact Sun Microsystems, Inc., 4150 Network Circle, Santa Clara,
duke@435 20 * CA 95054 USA or visit www.sun.com if you need additional information or
duke@435 21 * have any questions.
duke@435 22 *
duke@435 23 */
duke@435 24
duke@435 25 # include "incls/_precompiled.incl"
duke@435 26 # include "incls/_symbolTable.cpp.incl"
duke@435 27
duke@435 28 // --------------------------------------------------------------------------
duke@435 29
// Definition of the static table pointer that the_table() callers in this
// file go through; it starts out NULL here and is assigned elsewhere.
duke@435 30 SymbolTable* SymbolTable::_the_table = NULL;
duke@435 31
duke@435 32 // Lookup a symbol in a bucket.
duke@435 33
duke@435 34 symbolOop SymbolTable::lookup(int index, const char* name,
duke@435 35 int len, unsigned int hash) {
duke@435 36 for (HashtableEntry* e = bucket(index); e != NULL; e = e->next()) {
duke@435 37 if (e->hash() == hash) {
duke@435 38 symbolOop sym = symbolOop(e->literal());
duke@435 39 if (sym->equals(name, len)) {
duke@435 40 return sym;
duke@435 41 }
duke@435 42 }
duke@435 43 }
duke@435 44 return NULL;
duke@435 45 }
duke@435 46
duke@435 47
duke@435 48 // We take care not to block while holding the
duke@435 49 // SymbolTable_lock. Otherwise, the system might deadlock, since the
duke@435 50 // symbol table is used during compilation (VM_thread). The lock-free
duke@435 51 // synchronization is simplified by the fact that we do not delete
duke@435 52 // entries in the symbol table during normal execution (only during
duke@435 53 // safepoints).
duke@435 54
duke@435 55 symbolOop SymbolTable::lookup(const char* name, int len, TRAPS) {
duke@435 56 unsigned int hashValue = hash_symbol(name, len);
duke@435 57 int index = the_table()->hash_to_index(hashValue);
duke@435 58
duke@435 59 symbolOop s = the_table()->lookup(index, name, len, hashValue);
duke@435 60
duke@435 61 // Found
duke@435 62 if (s != NULL) return s;
duke@435 63
duke@435 64 // Otherwise, add to symbol to table
duke@435 65 return the_table()->basic_add(index, (u1*)name, len, hashValue, CHECK_NULL);
duke@435 66 }
duke@435 67
duke@435 68 symbolOop SymbolTable::lookup(symbolHandle sym, int begin, int end, TRAPS) {
duke@435 69 char* buffer;
duke@435 70 int index, len;
duke@435 71 unsigned int hashValue;
duke@435 72 char* name;
duke@435 73 {
duke@435 74 debug_only(No_Safepoint_Verifier nsv;)
duke@435 75
duke@435 76 name = (char*)sym->base() + begin;
duke@435 77 len = end - begin;
duke@435 78 hashValue = hash_symbol(name, len);
duke@435 79 index = the_table()->hash_to_index(hashValue);
duke@435 80 symbolOop s = the_table()->lookup(index, name, len, hashValue);
duke@435 81
duke@435 82 // Found
duke@435 83 if (s != NULL) return s;
duke@435 84 }
duke@435 85
duke@435 86 // Otherwise, add to symbol to table. Copy to a C string first.
duke@435 87 char stack_buf[128];
duke@435 88 ResourceMark rm(THREAD);
duke@435 89 if (len <= 128) {
duke@435 90 buffer = stack_buf;
duke@435 91 } else {
duke@435 92 buffer = NEW_RESOURCE_ARRAY_IN_THREAD(THREAD, char, len);
duke@435 93 }
duke@435 94 for (int i=0; i<len; i++) {
duke@435 95 buffer[i] = name[i];
duke@435 96 }
duke@435 97 // Make sure there is no safepoint in the code above since name can't move.
duke@435 98 // We can't include the code in No_Safepoint_Verifier because of the
duke@435 99 // ResourceMark.
duke@435 100
duke@435 101 return the_table()->basic_add(index, (u1*)buffer, len, hashValue, CHECK_NULL);
duke@435 102 }
duke@435 103
duke@435 104 symbolOop SymbolTable::lookup_only(const char* name, int len,
duke@435 105 unsigned int& hash) {
duke@435 106 hash = hash_symbol(name, len);
duke@435 107 int index = the_table()->hash_to_index(hash);
duke@435 108
duke@435 109 return the_table()->lookup(index, name, len, hash);
duke@435 110 }
duke@435 111
duke@435 112 void SymbolTable::add(constantPoolHandle cp, int names_count,
duke@435 113 const char** names, int* lengths, int* cp_indices,
duke@435 114 unsigned int* hashValues, TRAPS) {
duke@435 115 SymbolTable* table = the_table();
duke@435 116 bool added = table->basic_add(cp, names_count, names, lengths,
duke@435 117 cp_indices, hashValues, CHECK);
duke@435 118 if (!added) {
duke@435 119 // do it the hard way
duke@435 120 for (int i=0; i<names_count; i++) {
duke@435 121 int index = table->hash_to_index(hashValues[i]);
duke@435 122 symbolOop sym = table->basic_add(index, (u1*)names[i], lengths[i],
duke@435 123 hashValues[i], CHECK);
duke@435 124 cp->symbol_at_put(cp_indices[i], sym);
duke@435 125 }
duke@435 126 }
duke@435 127 }
duke@435 128
duke@435 129 // Needed for preloading classes in signatures when compiling.
duke@435 130
duke@435 131 symbolOop SymbolTable::probe(const char* name, int len) {
duke@435 132 unsigned int hashValue = hash_symbol(name, len);
duke@435 133 int index = the_table()->hash_to_index(hashValue);
duke@435 134 return the_table()->lookup(index, name, len, hashValue);
duke@435 135 }
duke@435 136
duke@435 137
duke@435 138 symbolOop SymbolTable::basic_add(int index, u1 *name, int len,
duke@435 139 unsigned int hashValue, TRAPS) {
duke@435 140 assert(!Universe::heap()->is_in_reserved(name) || GC_locker::is_active(),
duke@435 141 "proposed name of symbol must be stable");
duke@435 142
duke@435 143 // We assume that lookup() has been called already, that it failed,
duke@435 144 // and symbol was not found. We create the symbol here.
duke@435 145 symbolKlass* sk = (symbolKlass*) Universe::symbolKlassObj()->klass_part();
duke@435 146 symbolOop s_oop = sk->allocate_symbol(name, len, CHECK_NULL);
duke@435 147 symbolHandle sym (THREAD, s_oop);
duke@435 148
duke@435 149 // Allocation must be done before grapping the SymbolTable_lock lock
duke@435 150 MutexLocker ml(SymbolTable_lock, THREAD);
duke@435 151
duke@435 152 assert(sym->equals((char*)name, len), "symbol must be properly initialized");
duke@435 153
duke@435 154 // Since look-up was done lock-free, we need to check if another
duke@435 155 // thread beat us in the race to insert the symbol.
duke@435 156
duke@435 157 symbolOop test = lookup(index, (char*)name, len, hashValue);
duke@435 158 if (test != NULL) {
duke@435 159 // A race occured and another thread introduced the symbol, this one
duke@435 160 // will be dropped and collected.
duke@435 161 return test;
duke@435 162 }
duke@435 163
duke@435 164 HashtableEntry* entry = new_entry(hashValue, sym());
duke@435 165 add_entry(index, entry);
duke@435 166 return sym();
duke@435 167 }
duke@435 168
duke@435 169 bool SymbolTable::basic_add(constantPoolHandle cp, int names_count,
duke@435 170 const char** names, int* lengths,
duke@435 171 int* cp_indices, unsigned int* hashValues,
duke@435 172 TRAPS) {
duke@435 173 symbolKlass* sk = (symbolKlass*) Universe::symbolKlassObj()->klass_part();
duke@435 174 symbolOop sym_oops[symbol_alloc_batch_size];
duke@435 175 bool allocated = sk->allocate_symbols(names_count, names, lengths,
duke@435 176 sym_oops, CHECK_false);
duke@435 177 if (!allocated) {
duke@435 178 return false;
duke@435 179 }
duke@435 180 symbolHandle syms[symbol_alloc_batch_size];
duke@435 181 int i;
duke@435 182 for (i=0; i<names_count; i++) {
duke@435 183 syms[i] = symbolHandle(THREAD, sym_oops[i]);
duke@435 184 }
duke@435 185
duke@435 186 // Allocation must be done before grabbing the SymbolTable_lock lock
duke@435 187 MutexLocker ml(SymbolTable_lock, THREAD);
duke@435 188
duke@435 189 for (i=0; i<names_count; i++) {
duke@435 190 assert(syms[i]->equals(names[i], lengths[i]), "symbol must be properly initialized");
duke@435 191 // Since look-up was done lock-free, we need to check if another
duke@435 192 // thread beat us in the race to insert the symbol.
duke@435 193 int index = hash_to_index(hashValues[i]);
duke@435 194 symbolOop test = lookup(index, names[i], lengths[i], hashValues[i]);
duke@435 195 if (test != NULL) {
duke@435 196 // A race occured and another thread introduced the symbol, this one
duke@435 197 // will be dropped and collected. Use test instead.
duke@435 198 cp->symbol_at_put(cp_indices[i], test);
duke@435 199 } else {
duke@435 200 symbolOop sym = syms[i]();
duke@435 201 HashtableEntry* entry = new_entry(hashValues[i], sym);
duke@435 202 add_entry(index, entry);
duke@435 203 cp->symbol_at_put(cp_indices[i], sym);
duke@435 204 }
duke@435 205 }
duke@435 206
duke@435 207 return true;
duke@435 208 }
duke@435 209
duke@435 210
duke@435 211 void SymbolTable::verify() {
duke@435 212 for (int i = 0; i < the_table()->table_size(); ++i) {
duke@435 213 HashtableEntry* p = the_table()->bucket(i);
duke@435 214 for ( ; p != NULL; p = p->next()) {
duke@435 215 symbolOop s = symbolOop(p->literal());
duke@435 216 guarantee(s != NULL, "symbol is NULL");
duke@435 217 s->verify();
duke@435 218 guarantee(s->is_perm(), "symbol not in permspace");
duke@435 219 unsigned int h = hash_symbol((char*)s->bytes(), s->utf8_length());
duke@435 220 guarantee(p->hash() == h, "broken hash in symbol table entry");
duke@435 221 guarantee(the_table()->hash_to_index(h) == i,
duke@435 222 "wrong index in symbol table");
duke@435 223 }
duke@435 224 }
duke@435 225 }
duke@435 226
duke@435 227
duke@435 228 //---------------------------------------------------------------------------
duke@435 229 // Non-product code
duke@435 230
duke@435 231 #ifndef PRODUCT
duke@435 232
duke@435 233 void SymbolTable::print_histogram() {
duke@435 234 MutexLocker ml(SymbolTable_lock);
duke@435 235 const int results_length = 100;
duke@435 236 int results[results_length];
duke@435 237 int i,j;
duke@435 238
duke@435 239 // initialize results to zero
duke@435 240 for (j = 0; j < results_length; j++) {
duke@435 241 results[j] = 0;
duke@435 242 }
duke@435 243
duke@435 244 int total = 0;
duke@435 245 int max_symbols = 0;
duke@435 246 int out_of_range = 0;
duke@435 247 for (i = 0; i < the_table()->table_size(); i++) {
duke@435 248 HashtableEntry* p = the_table()->bucket(i);
duke@435 249 for ( ; p != NULL; p = p->next()) {
duke@435 250 int counter = symbolOop(p->literal())->utf8_length();
duke@435 251 total += counter;
duke@435 252 if (counter < results_length) {
duke@435 253 results[counter]++;
duke@435 254 } else {
duke@435 255 out_of_range++;
duke@435 256 }
duke@435 257 max_symbols = MAX2(max_symbols, counter);
duke@435 258 }
duke@435 259 }
duke@435 260 tty->print_cr("Symbol Table:");
duke@435 261 tty->print_cr("%8s %5d", "Total ", total);
duke@435 262 tty->print_cr("%8s %5d", "Maximum", max_symbols);
duke@435 263 tty->print_cr("%8s %3.2f", "Average",
duke@435 264 ((float) total / (float) the_table()->table_size()));
duke@435 265 tty->print_cr("%s", "Histogram:");
duke@435 266 tty->print_cr(" %s %29s", "Length", "Number chains that length");
duke@435 267 for (i = 0; i < results_length; i++) {
duke@435 268 if (results[i] > 0) {
duke@435 269 tty->print_cr("%6d %10d", i, results[i]);
duke@435 270 }
duke@435 271 }
duke@435 272 int line_length = 70;
duke@435 273 tty->print_cr("%s %30s", " Length", "Number chains that length");
duke@435 274 for (i = 0; i < results_length; i++) {
duke@435 275 if (results[i] > 0) {
duke@435 276 tty->print("%4d", i);
duke@435 277 for (j = 0; (j < results[i]) && (j < line_length); j++) {
duke@435 278 tty->print("%1s", "*");
duke@435 279 }
duke@435 280 if (j == line_length) {
duke@435 281 tty->print("%1s", "+");
duke@435 282 }
duke@435 283 tty->cr();
duke@435 284 }
duke@435 285 }
duke@435 286 tty->print_cr(" %s %d: %d\n", "Number chains longer than",
duke@435 287 results_length, out_of_range);
duke@435 288 }
duke@435 289
duke@435 290 #endif // PRODUCT
duke@435 291
duke@435 292 // --------------------------------------------------------------------------
duke@435 293
duke@435 294 #ifdef ASSERT
duke@435 295 class StableMemoryChecker : public StackObj {
duke@435 296 enum { _bufsize = wordSize*4 };
duke@435 297
duke@435 298 address _region;
duke@435 299 jint _size;
duke@435 300 u1 _save_buf[_bufsize];
duke@435 301
duke@435 302 int sample(u1* save_buf) {
duke@435 303 if (_size <= _bufsize) {
duke@435 304 memcpy(save_buf, _region, _size);
duke@435 305 return _size;
duke@435 306 } else {
duke@435 307 // copy head and tail
duke@435 308 memcpy(&save_buf[0], _region, _bufsize/2);
duke@435 309 memcpy(&save_buf[_bufsize/2], _region + _size - _bufsize/2, _bufsize/2);
duke@435 310 return (_bufsize/2)*2;
duke@435 311 }
duke@435 312 }
duke@435 313
duke@435 314 public:
duke@435 315 StableMemoryChecker(const void* region, jint size) {
duke@435 316 _region = (address) region;
duke@435 317 _size = size;
duke@435 318 sample(_save_buf);
duke@435 319 }
duke@435 320
duke@435 321 bool verify() {
duke@435 322 u1 check_buf[sizeof(_save_buf)];
duke@435 323 int check_size = sample(check_buf);
duke@435 324 return (0 == memcmp(_save_buf, check_buf, check_size));
duke@435 325 }
duke@435 326
duke@435 327 void set_region(const void* region) { _region = (address) region; }
duke@435 328 };
duke@435 329 #endif
duke@435 330
duke@435 331
duke@435 332 // --------------------------------------------------------------------------
duke@435 333
duke@435 334
duke@435 335 // Compute the hash value for a java.lang.String object which would
duke@435 336 // contain the characters passed in. This hash value is used for at
duke@435 337 // least two purposes.
duke@435 338 //
duke@435 339 // (a) As the hash value used by the StringTable for bucket selection
duke@435 340 // and comparison (stored in the HashtableEntry structures). This
duke@435 341 // is used in the String.intern() method.
duke@435 342 //
duke@435 343 // (b) As the hash value used by the String object itself, in
duke@435 344 // String.hashCode(). This value is normally calculated in Java code
duke@435 345 // in the String.hashCode() method, but is precomputed for String
duke@435 346 // objects in the shared archive file.
duke@435 347 //
duke@435 348 // For this reason, THIS ALGORITHM MUST MATCH String.hashCode().
duke@435 349
duke@435 350 int StringTable::hash_string(jchar* s, int len) {
duke@435 351 unsigned h = 0;
duke@435 352 while (len-- > 0) {
duke@435 353 h = 31*h + (unsigned) *s;
duke@435 354 s++;
duke@435 355 }
duke@435 356 return h;
duke@435 357 }
duke@435 358
duke@435 359
// Definition of the static table pointer that the_table() callers in this
// file go through; it starts out NULL here and is assigned elsewhere.
duke@435 360 StringTable* StringTable::_the_table = NULL;
duke@435 361
duke@435 362 oop StringTable::lookup(int index, jchar* name,
duke@435 363 int len, unsigned int hash) {
duke@435 364 for (HashtableEntry* l = bucket(index); l != NULL; l = l->next()) {
duke@435 365 if (l->hash() == hash) {
duke@435 366 if (java_lang_String::equals(l->literal(), name, len)) {
duke@435 367 return l->literal();
duke@435 368 }
duke@435 369 }
duke@435 370 }
duke@435 371 return NULL;
duke@435 372 }
duke@435 373
duke@435 374
duke@435 375 oop StringTable::basic_add(int index, Handle string_or_null, jchar* name,
duke@435 376 int len, unsigned int hashValue, TRAPS) {
duke@435 377 debug_only(StableMemoryChecker smc(name, len * sizeof(name[0])));
duke@435 378 assert(!Universe::heap()->is_in_reserved(name) || GC_locker::is_active(),
duke@435 379 "proposed name of symbol must be stable");
duke@435 380
duke@435 381 Handle string;
duke@435 382 // try to reuse the string if possible
duke@435 383 if (!string_or_null.is_null() && string_or_null()->is_perm()) {
duke@435 384 string = string_or_null;
duke@435 385 } else {
duke@435 386 string = java_lang_String::create_tenured_from_unicode(name, len, CHECK_NULL);
duke@435 387 }
duke@435 388
duke@435 389 // Allocation must be done before grapping the SymbolTable_lock lock
duke@435 390 MutexLocker ml(StringTable_lock, THREAD);
duke@435 391
duke@435 392 assert(java_lang_String::equals(string(), name, len),
duke@435 393 "string must be properly initialized");
duke@435 394
duke@435 395 // Since look-up was done lock-free, we need to check if another
duke@435 396 // thread beat us in the race to insert the symbol.
duke@435 397
duke@435 398 oop test = lookup(index, name, len, hashValue); // calls lookup(u1*, int)
duke@435 399 if (test != NULL) {
duke@435 400 // Entry already added
duke@435 401 return test;
duke@435 402 }
duke@435 403
duke@435 404 HashtableEntry* entry = new_entry(hashValue, string());
duke@435 405 add_entry(index, entry);
duke@435 406 return string();
duke@435 407 }
duke@435 408
duke@435 409
duke@435 410 oop StringTable::lookup(symbolOop symbol) {
duke@435 411 ResourceMark rm;
duke@435 412 int length;
duke@435 413 jchar* chars = symbol->as_unicode(length);
duke@435 414 unsigned int hashValue = hash_string(chars, length);
duke@435 415 int index = the_table()->hash_to_index(hashValue);
duke@435 416 return the_table()->lookup(index, chars, length, hashValue);
duke@435 417 }
duke@435 418
duke@435 419
duke@435 420 oop StringTable::intern(Handle string_or_null, jchar* name,
duke@435 421 int len, TRAPS) {
duke@435 422 unsigned int hashValue = hash_string(name, len);
duke@435 423 int index = the_table()->hash_to_index(hashValue);
duke@435 424 oop string = the_table()->lookup(index, name, len, hashValue);
duke@435 425
duke@435 426 // Found
duke@435 427 if (string != NULL) return string;
duke@435 428
duke@435 429 // Otherwise, add to symbol to table
duke@435 430 return the_table()->basic_add(index, string_or_null, name, len,
duke@435 431 hashValue, CHECK_NULL);
duke@435 432 }
duke@435 433
duke@435 434 oop StringTable::intern(symbolOop symbol, TRAPS) {
duke@435 435 if (symbol == NULL) return NULL;
duke@435 436 ResourceMark rm(THREAD);
duke@435 437 int length;
duke@435 438 jchar* chars = symbol->as_unicode(length);
duke@435 439 Handle string;
duke@435 440 oop result = intern(string, chars, length, CHECK_NULL);
duke@435 441 return result;
duke@435 442 }
duke@435 443
duke@435 444
duke@435 445 oop StringTable::intern(oop string, TRAPS)
duke@435 446 {
duke@435 447 if (string == NULL) return NULL;
duke@435 448 ResourceMark rm(THREAD);
duke@435 449 int length;
duke@435 450 Handle h_string (THREAD, string);
duke@435 451 jchar* chars = java_lang_String::as_unicode_string(string, length);
duke@435 452 oop result = intern(h_string, chars, length, CHECK_NULL);
duke@435 453 return result;
duke@435 454 }
duke@435 455
duke@435 456
duke@435 457 oop StringTable::intern(const char* utf8_string, TRAPS) {
duke@435 458 if (utf8_string == NULL) return NULL;
duke@435 459 ResourceMark rm(THREAD);
duke@435 460 int length = UTF8::unicode_length(utf8_string);
duke@435 461 jchar* chars = NEW_RESOURCE_ARRAY(jchar, length);
duke@435 462 UTF8::convert_to_unicode(utf8_string, chars, length);
duke@435 463 Handle string;
duke@435 464 oop result = intern(string, chars, length, CHECK_NULL);
duke@435 465 return result;
duke@435 466 }
duke@435 467
duke@435 468 void StringTable::verify() {
duke@435 469 for (int i = 0; i < the_table()->table_size(); ++i) {
duke@435 470 HashtableEntry* p = the_table()->bucket(i);
duke@435 471 for ( ; p != NULL; p = p->next()) {
duke@435 472 oop s = p->literal();
duke@435 473 guarantee(s != NULL, "interned string is NULL");
duke@435 474 guarantee(s->is_perm(), "interned string not in permspace");
duke@435 475
duke@435 476 int length;
duke@435 477 jchar* chars = java_lang_String::as_unicode_string(s, length);
duke@435 478 unsigned int h = hash_string(chars, length);
duke@435 479 guarantee(p->hash() == h, "broken hash in string table entry");
duke@435 480 guarantee(the_table()->hash_to_index(h) == i,
duke@435 481 "wrong index in string table");
duke@435 482 }
duke@435 483 }
duke@435 484 }

mercurial