blob: d35b1c10b6c3ad820581f83d732830dcdb2ff6ae [file] [log] [blame]
// Copyright (c) 2012, the Dart project authors. Please see the AUTHORS file
// for details. All rights reserved. Use of this source code is governed by a
// BSD-style license that can be found in the LICENSE file.
#include "vm/symbols.h"
#include "vm/handles.h"
#include "vm/handles_impl.h"
#include "vm/isolate.h"
#include "vm/object.h"
#include "vm/object_store.h"
#include "vm/raw_object.h"
#include "vm/snapshot_ids.h"
#include "vm/unicode.h"
#include "vm/visitor.h"
namespace dart {
RawString* Symbols::predefined_[Symbols::kNumberOfOneCharCodeSymbols];
String* Symbols::symbol_handles_[Symbols::kMaxPredefinedId];
static const char* names[] = {
NULL,
#define DEFINE_SYMBOL_LITERAL(symbol, literal) \
literal,
PREDEFINED_SYMBOLS_LIST(DEFINE_SYMBOL_LITERAL)
#undef DEFINE_SYMBOL_LITERAL
};
intptr_t Symbols::num_of_grows_;
intptr_t Symbols::collision_count_[kMaxCollisionBuckets];
DEFINE_FLAG(bool, dump_symbol_stats, false, "Dump symbol table statistics");
const char* Symbols::Name(SymbolId symbol) {
ASSERT((symbol > kIllegal) && (symbol < kNullCharId));
return names[symbol];
}
void Symbols::InitOnce(Isolate* isolate) {
// Should only be run by the vm isolate.
ASSERT(isolate == Dart::vm_isolate());
if (FLAG_dump_symbol_stats) {
num_of_grows_ = 0;
for (intptr_t i = 0; i < kMaxCollisionBuckets; i++) {
collision_count_[i] = 0;
}
}
// Create and setup a symbol table in the vm isolate.
SetupSymbolTable(isolate);
// Create all predefined symbols.
ASSERT((sizeof(names) / sizeof(const char*)) == Symbols::kNullCharId);
ObjectStore* object_store = isolate->object_store();
Array& symbol_table = Array::Handle();
// First set up all the predefined string symbols.
for (intptr_t i = 1; i < Symbols::kNullCharId; i++) {
// The symbol_table needs to be reloaded as it might have grown in the
// previous iteration.
symbol_table = object_store->symbol_table();
String* str = String::ReadOnlyHandle();
*str = OneByteString::New(names[i], Heap::kOld);
Add(symbol_table, *str);
symbol_handles_[i] = str;
}
Object::RegisterSingletonClassNames();
// Add Latin1 characters as Symbols, so that Symbols::FromCharCode is fast.
for (intptr_t c = 0; c < kNumberOfOneCharCodeSymbols; c++) {
// The symbol_table needs to be reloaded as it might have grown in the
// previous iteration.
symbol_table = object_store->symbol_table();
intptr_t idx = (kNullCharId + c);
ASSERT(idx < kMaxPredefinedId);
ASSERT(Utf::IsLatin1(c));
uint8_t ch = static_cast<uint8_t>(c);
String* str = String::ReadOnlyHandle();
*str = OneByteString::New(&ch, 1, Heap::kOld);
Add(symbol_table, *str);
predefined_[c] = str->raw();
symbol_handles_[idx] = str;
}
}
void Symbols::SetupSymbolTable(Isolate* isolate) {
ASSERT(isolate != NULL);
// Setup the symbol table used within the String class.
const int initial_size = (isolate == Dart::vm_isolate()) ?
kInitialVMIsolateSymtabSize : kInitialSymtabSize;
const Array& array = Array::Handle(Array::New(initial_size + 1));
// Last element contains the count of used slots.
array.SetAt(initial_size, Smi::Handle(Smi::New(0)));
isolate->object_store()->set_symbol_table(array);
}
intptr_t Symbols::Size(Isolate* isolate) {
ASSERT(isolate != NULL);
Array& symbol_table = Array::Handle(isolate,
isolate->object_store()->symbol_table());
intptr_t table_size_index = symbol_table.Length() - 1;
dart::Smi& used = Smi::Handle();
used ^= symbol_table.At(table_size_index);
return used.Value();
}
void Symbols::Add(const Array& symbol_table, const String& str) {
// Should only be run by the vm isolate.
ASSERT(Isolate::Current() == Dart::vm_isolate());
intptr_t hash = str.Hash();
intptr_t index = FindIndex(symbol_table, str, 0, str.Length(), hash);
ASSERT(symbol_table.At(index) == String::null());
InsertIntoSymbolTable(symbol_table, str, index);
}
RawString* Symbols::New(const char* cstr) {
ASSERT(cstr != NULL);
intptr_t array_len = strlen(cstr);
const uint8_t* utf8_array = reinterpret_cast<const uint8_t*>(cstr);
return Symbols::FromUTF8(utf8_array, array_len);
}
RawString* Symbols::FromUTF8(const uint8_t* utf8_array, intptr_t array_len) {
if (array_len == 0 || utf8_array == NULL) {
return FromLatin1(reinterpret_cast<uint8_t*>(NULL), 0);
}
Utf8::Type type;
intptr_t len = Utf8::CodeUnitCount(utf8_array, array_len, &type);
ASSERT(len != 0);
Zone* zone = Isolate::Current()->current_zone();
if (type == Utf8::kLatin1) {
uint8_t* characters = zone->Alloc<uint8_t>(len);
Utf8::DecodeToLatin1(utf8_array, array_len, characters, len);
return FromLatin1(characters, len);
}
ASSERT((type == Utf8::kBMP) || (type == Utf8::kSupplementary));
uint16_t* characters = zone->Alloc<uint16_t>(len);
Utf8::DecodeToUTF16(utf8_array, array_len, characters, len);
return FromUTF16(characters, len);
}
RawString* Symbols::FromLatin1(const uint8_t* latin1_array, intptr_t len) {
return NewSymbol(latin1_array, len, String::FromLatin1);
}
RawString* Symbols::FromUTF16(const uint16_t* utf16_array, intptr_t len) {
return NewSymbol(utf16_array, len, String::FromUTF16);
}
RawString* Symbols::FromUTF32(const int32_t* utf32_array, intptr_t len) {
return NewSymbol(utf32_array, len, String::FromUTF32);
}
template<typename CharacterType, typename CallbackType>
RawString* Symbols::NewSymbol(const CharacterType* characters,
intptr_t len,
CallbackType new_string) {
Isolate* isolate = Isolate::Current();
String& symbol = String::Handle(isolate, String::null());
Array& symbol_table = Array::Handle(isolate, Array::null());
// Calculate the String hash for this sequence of characters.
intptr_t hash = String::Hash(characters, len);
// First check if a symbol exists in the vm isolate for these characters.
symbol_table = Dart::vm_isolate()->object_store()->symbol_table();
intptr_t index = FindIndex(symbol_table, characters, len, hash);
symbol ^= symbol_table.At(index);
if (symbol.IsNull()) {
// Now try in the symbol table of the current isolate.
symbol_table = isolate->object_store()->symbol_table();
index = FindIndex(symbol_table, characters, len, hash);
// Since we leave enough room in the table to guarantee, that we find an
// empty spot, index is the insertion point if symbol is null.
symbol ^= symbol_table.At(index);
if (symbol.IsNull()) {
// Allocate new result string.
symbol = (*new_string)(characters, len, Heap::kOld);
symbol.SetHash(hash); // Remember the calculated hash value.
InsertIntoSymbolTable(symbol_table, symbol, index);
}
}
ASSERT(symbol.IsSymbol());
return symbol.raw();
}
template RawString* Symbols::NewSymbol(const uint8_t* characters,
intptr_t len,
RawString* (*new_string)(const uint8_t*,
intptr_t,
Heap::Space));
template RawString* Symbols::NewSymbol(const uint16_t* characters,
intptr_t len,
RawString* (*new_string)(const uint16_t*,
intptr_t,
Heap::Space));
template RawString* Symbols::NewSymbol(const int32_t* characters,
intptr_t len,
RawString* (*new_string)(const int32_t*,
intptr_t,
Heap::Space));
RawString* Symbols::New(const String& str) {
if (str.IsSymbol()) {
return str.raw();
}
return New(str, 0, str.Length());
}
RawString* Symbols::New(const String& str, intptr_t begin_index, intptr_t len) {
ASSERT(begin_index >= 0);
ASSERT(len >= 0);
ASSERT((begin_index + len) <= str.Length());
Isolate* isolate = Isolate::Current();
ASSERT(isolate != Dart::vm_isolate());
String& symbol = String::Handle(isolate, String::null());
Array& symbol_table = Array::Handle(isolate, Array::null());
// Calculate the String hash for this sequence of characters.
intptr_t hash = (begin_index == 0 && len == str.Length()) ? str.Hash() :
String::Hash(str, begin_index, len);
// First check if a symbol exists in the vm isolate for these characters.
symbol_table = Dart::vm_isolate()->object_store()->symbol_table();
intptr_t index = FindIndex(symbol_table, str, begin_index, len, hash);
symbol ^= symbol_table.At(index);
if (symbol.IsNull()) {
// Now try in the symbol table of the current isolate.
symbol_table = isolate->object_store()->symbol_table();
index = FindIndex(symbol_table, str, begin_index, len, hash);
// Since we leave enough room in the table to guarantee, that we find an
// empty spot, index is the insertion point if symbol is null.
symbol ^= symbol_table.At(index);
if (symbol.IsNull()) {
if (str.IsOld() && begin_index == 0 && len == str.Length()) {
// Reuse the incoming str as the symbol value.
symbol = str.raw();
} else {
// Allocate a copy in old space.
symbol = String::SubString(str, begin_index, len, Heap::kOld);
symbol.SetHash(hash);
}
InsertIntoSymbolTable(symbol_table, symbol, index);
}
}
ASSERT(symbol.IsSymbol());
return symbol.raw();
}
RawString* Symbols::FromCharCode(int32_t char_code) {
if (char_code > kMaxOneCharCodeSymbol) {
return FromUTF32(&char_code, 1);
}
return predefined_[char_code];
}
void Symbols::DumpStats() {
if (FLAG_dump_symbol_stats) {
intptr_t table_size = 0;
dart::Smi& used = Smi::Handle();
Array& symbol_table = Array::Handle(Array::null());
// First dump VM symbol table stats.
symbol_table = Dart::vm_isolate()->object_store()->symbol_table();
table_size = symbol_table.Length() - 1;
used ^= symbol_table.At(table_size);
OS::Print("VM Isolate: Number of symbols : %"Pd"\n", used.Value());
OS::Print("VM Isolate: Symbol table capacity : %"Pd"\n", table_size);
// Now dump regular isolate symbol table stats.
symbol_table = Isolate::Current()->object_store()->symbol_table();
table_size = symbol_table.Length() - 1;
used ^= symbol_table.At(table_size);
OS::Print("Isolate: Number of symbols : %"Pd"\n", used.Value());
OS::Print("Isolate: Symbol table capacity : %"Pd"\n", table_size);
// Dump overall collision and growth counts.
OS::Print("Number of symbol table grows = %"Pd"\n", num_of_grows_);
OS::Print("Collision counts on add and lookup :\n");
intptr_t i = 0;
for (i = 0; i < (kMaxCollisionBuckets - 1); i++) {
OS::Print(" %"Pd" collisions => %"Pd"\n", i, collision_count_[i]);
}
OS::Print(" > %"Pd" collisions => %"Pd"\n", i, collision_count_[i]);
}
}
void Symbols::GrowSymbolTable(const Array& symbol_table) {
// TODO(iposva): Avoid exponential growth.
num_of_grows_ += 1;
intptr_t table_size = symbol_table.Length() - 1;
intptr_t new_table_size = table_size * 2;
Array& new_symbol_table = Array::Handle(Array::New(new_table_size + 1));
// Copy all elements from the original symbol table to the newly allocated
// array.
String& element = String::Handle();
dart::Object& new_element = Object::Handle();
for (intptr_t i = 0; i < table_size; i++) {
element ^= symbol_table.At(i);
if (!element.IsNull()) {
intptr_t hash = element.Hash();
intptr_t index = hash % new_table_size;
new_element = new_symbol_table.At(index);
intptr_t num_collisions = 0;
while (!new_element.IsNull()) {
index = (index + 1) % new_table_size; // Move to next element.
new_element = new_symbol_table.At(index);
num_collisions += 1;
}
if (FLAG_dump_symbol_stats) {
if (num_collisions >= kMaxCollisionBuckets) {
num_collisions = (kMaxCollisionBuckets - 1);
}
collision_count_[num_collisions] += 1;
}
new_symbol_table.SetAt(index, element);
}
}
// Copy used count.
new_element = symbol_table.At(table_size);
new_symbol_table.SetAt(new_table_size, new_element);
// Remember the new symbol table now.
Isolate::Current()->object_store()->set_symbol_table(new_symbol_table);
}
void Symbols::InsertIntoSymbolTable(const Array& symbol_table,
const String& symbol,
intptr_t index) {
intptr_t table_size = symbol_table.Length() - 1;
symbol.SetCanonical(); // Mark object as being canonical.
symbol_table.SetAt(index, symbol); // Remember the new symbol.
dart::Smi& used = Smi::Handle();
used ^= symbol_table.At(table_size);
intptr_t used_elements = used.Value() + 1; // One more element added.
used = Smi::New(used_elements);
symbol_table.SetAt(table_size, used); // Update used count.
// Rehash if symbol_table is 75% full.
if (used_elements > ((table_size / 4) * 3)) {
GrowSymbolTable(symbol_table);
}
}
template<typename T>
intptr_t Symbols::FindIndex(const Array& symbol_table,
const T* characters,
intptr_t len,
intptr_t hash) {
// Last element of the array is the number of used elements.
intptr_t table_size = symbol_table.Length() - 1;
intptr_t index = hash % table_size;
intptr_t num_collisions = 0;
String& symbol = String::Handle();
symbol ^= symbol_table.At(index);
while (!symbol.IsNull() && !symbol.Equals(characters, len)) {
index = (index + 1) % table_size; // Move to next element.
symbol ^= symbol_table.At(index);
num_collisions += 1;
}
if (FLAG_dump_symbol_stats) {
if (num_collisions >= kMaxCollisionBuckets) {
num_collisions = (kMaxCollisionBuckets - 1);
}
collision_count_[num_collisions] += 1;
}
return index; // Index of symbol if found or slot into which to add symbol.
}
template intptr_t Symbols::FindIndex(const Array& symbol_table,
const uint8_t* characters,
intptr_t len,
intptr_t hash);
template intptr_t Symbols::FindIndex(const Array& symbol_table,
const uint16_t* characters,
intptr_t len,
intptr_t hash);
template intptr_t Symbols::FindIndex(const Array& symbol_table,
const int32_t* characters,
intptr_t len,
intptr_t hash);
intptr_t Symbols::FindIndex(const Array& symbol_table,
const String& str,
intptr_t begin_index,
intptr_t len,
intptr_t hash) {
// Last element of the array is the number of used elements.
intptr_t table_size = symbol_table.Length() - 1;
intptr_t index = hash % table_size;
intptr_t num_collisions = 0;
String& symbol = String::Handle();
symbol ^= symbol_table.At(index);
while (!symbol.IsNull() && !symbol.Equals(str, begin_index, len)) {
index = (index + 1) % table_size; // Move to next element.
symbol ^= symbol_table.At(index);
num_collisions += 1;
}
if (FLAG_dump_symbol_stats) {
if (num_collisions >= kMaxCollisionBuckets) {
num_collisions = (kMaxCollisionBuckets - 1);
}
collision_count_[num_collisions] += 1;
}
return index; // Index of symbol if found or slot into which to add symbol.
}
intptr_t Symbols::LookupVMSymbol(RawObject* obj) {
for (intptr_t i = 1; i < Symbols::kMaxPredefinedId; i++) {
if (symbol_handles_[i]->raw() == obj) {
return (i + kMaxPredefinedObjectIds);
}
}
return kInvalidIndex;
}
RawObject* Symbols::GetVMSymbol(intptr_t object_id) {
ASSERT(IsVMSymbolId(object_id));
intptr_t i = (object_id - kMaxPredefinedObjectIds);
if ((i > kIllegal) && (i < Symbols::kMaxPredefinedId)) {
return symbol_handles_[i]->raw();
}
return Object::null();
}
} // namespace dart