// -*- mode: c++; c-basic-offset: 4 -*- /* * This file is part of the KDE libraries * Copyright (C) 2005, 2006 Apple Computer, Inc. * * This library is free software; you can redistribute it and/or * modify it under the terms of the GNU Library General Public * License as published by the Free Software Foundation; either * version 2 of the License, or (at your option) any later version. * * This library is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU * Library General Public License for more details. * * You should have received a copy of the GNU Library General Public License * along with this library; see the file COPYING.LIB. If not, write to * the Free Software Foundation, Inc., 51 Franklin Street, Fifth Floor, * Boston, MA 02110-1301, USA. * */ #ifndef WTF_HashTable_h #define WTF_HashTable_h #include "FastMalloc.h" #include "HashTraits.h" #include namespace WTF { #define DUMP_HASHTABLE_STATS 0 #define CHECK_HASHTABLE_CONSISTENCY 0 #ifdef NDEBUG #define CHECK_HASHTABLE_ITERATORS 0 #else #define CHECK_HASHTABLE_ITERATORS 1 #endif #if DUMP_HASHTABLE_STATS struct HashTableStats { ~HashTableStats(); static int numAccesses; static int numCollisions; static int collisionGraph[4096]; static int maxCollisions; static int numRehashes; static int numRemoves; static int numReinserts; static void recordCollisionAtCount(int count); }; #endif template class HashTable; template class HashTableIterator; template class HashTableConstIterator; #if CHECK_HASHTABLE_ITERATORS template void addIterator(const HashTable*, HashTableConstIterator*); template void removeIterator(HashTableConstIterator*); #else template inline void addIterator(const HashTable*, HashTableConstIterator*) { } template inline void removeIterator(HashTableConstIterator*) { } #endif template class HashTableConstIterator { private: typedef HashTable HashTableType; typedef HashTableIterator iterator; typedef HashTableConstIterator const_iterator; typedef Value ValueType; typedef const ValueType& ReferenceType; typedef const ValueType* PointerType; friend class HashTable; friend class HashTableIterator; void skipEmptyBuckets() { while (m_position != m_endPosition && HashTableType::isEmptyOrDeletedBucket(*m_position)) ++m_position; } HashTableConstIterator(const HashTableType* table, PointerType position, PointerType endPosition) : m_position(position), m_endPosition(endPosition) { addIterator(table, this); skipEmptyBuckets(); } public: HashTableConstIterator() { addIterator(0, this); } // default copy, assignment and destructor are OK if CHECK_HASHTABLE_ITERATORS is 0 #if CHECK_HASHTABLE_ITERATORS ~HashTableConstIterator() { removeIterator(this); } HashTableConstIterator(const const_iterator& other) : m_position(other.m_position), m_endPosition(other.m_endPosition) { addIterator(other.m_table, this); } const_iterator& operator=(const const_iterator& other) { m_position = other.m_position; m_endPosition = other.m_endPosition; removeIterator(this); addIterator(other.m_table, this); return *this; } #endif PointerType get() const { checkValidity(); return m_position; } ReferenceType operator*() const { return *get(); } PointerType operator->() const { return get(); } const_iterator& operator++() { checkValidity(); assert(m_position != m_endPosition); ++m_position; skipEmptyBuckets(); return *this; } // postfix ++ intentionally omitted // Comparison. bool operator==(const const_iterator& other) const { checkValidity(other); return m_position == other.m_position; } bool operator!=(const const_iterator& other) const { checkValidity(other); return m_position != other.m_position; } private: void checkValidity() const { #if CHECK_HASHTABLE_ITERATORS assert(m_table); #endif } #if CHECK_HASHTABLE_ITERATORS void checkValidity(const const_iterator& other) const { assert(m_table); assert(other.m_table); assert(m_table == other.m_table); } #else void checkValidity(const const_iterator&) const { } #endif PointerType m_position; PointerType m_endPosition; #if CHECK_HASHTABLE_ITERATORS public: mutable const HashTableType* m_table; mutable const_iterator* m_next; mutable const_iterator* m_previous; #endif }; template class HashTableIterator { private: typedef HashTable HashTableType; typedef HashTableIterator iterator; typedef HashTableConstIterator const_iterator; typedef Value ValueType; typedef ValueType& ReferenceType; typedef ValueType* PointerType; friend class HashTable; HashTableIterator(HashTableType* table, PointerType pos, PointerType end) : m_iterator(table, pos, end) { } public: HashTableIterator() { } // default copy, assignment and destructor are OK PointerType get() const { return const_cast(m_iterator.get()); } ReferenceType operator*() const { return *get(); } PointerType operator->() const { return get(); } iterator& operator++() { ++m_iterator; return *this; } // postfix ++ intentionally omitted // Comparison. bool operator==(const iterator& other) const { return m_iterator == other.m_iterator; } bool operator!=(const iterator& other) const { return m_iterator != other.m_iterator; } operator const_iterator() const { return m_iterator; } private: const_iterator m_iterator; }; using std::swap; #if !COMPILER(MSVC) // Visual C++ has a swap for pairs defined. // swap pairs by component, in case of pair members that specialize swap template inline void swap(pair& a, pair& b) { swap(a.first, b.first); swap(a.second, b.second); } #endif template struct Mover; template struct Mover { static void move(T& from, T& to) { swap(from, to); } }; template struct Mover { static void move(T& from, T& to) { to = from; } }; template class IdentityHashTranslator { public: static unsigned hash(const Key& key) { return HashFunctions::hash(key); } static bool equal(const Key& a, const Key& b) { return HashFunctions::equal(a, b); } static void translate(Value& location, const Key&, const Value& value, unsigned) { location = value; } }; template class HashTable { public: typedef HashTableIterator iterator; typedef HashTableConstIterator const_iterator; typedef Traits ValueTraits; typedef Key KeyType; typedef Value ValueType; typedef IdentityHashTranslator IdentityTranslatorType; HashTable(); ~HashTable() { invalidateIterators(); deallocateTable(m_table, m_tableSize); } HashTable(const HashTable&); void swap(HashTable&); HashTable& operator=(const HashTable&); iterator begin() { return makeIterator(m_table); } iterator end() { return makeIterator(m_table + m_tableSize); } const_iterator begin() const { return makeConstIterator(m_table); } const_iterator end() const { return makeConstIterator(m_table + m_tableSize); } int size() const { return m_keyCount; } int capacity() const { return m_tableSize; } bool isEmpty() const { return !m_keyCount; } pair add(const ValueType& value) { return add(Extractor::extract(value), value); } // A special version of add() that finds the object by hashing and comparing // with some other type, to avoid the cost of type conversion if the object is already // in the table. template pair add(const T& key, const Extra&); iterator find(const KeyType& key) { return find(key); } const_iterator find(const KeyType& key) const { return find(key); } bool contains(const KeyType& key) const { return contains(key); } template iterator find(const T&); template const_iterator find(const T&) const; template bool contains(const T&) const; void remove(const KeyType&); void remove(iterator); void clear(); static bool isEmptyBucket(const ValueType& value) { return Extractor::extract(value) == KeyTraits::emptyValue(); } static bool isDeletedBucket(const ValueType& value) { return Extractor::extract(value) == KeyTraits::deletedValue(); } static bool isEmptyOrDeletedBucket(const ValueType& value) { return isEmptyBucket(value) || isDeletedBucket(value); } private: static ValueType* allocateTable(int size); static void deallocateTable(ValueType* table, int size); typedef pair LookupType; typedef pair FullLookupType; LookupType lookup(const Key& key) { return lookup(key).first; } template FullLookupType lookup(const T&); void remove(ValueType*); bool shouldExpand() const { return (m_keyCount + m_deletedCount) * m_maxLoad >= m_tableSize; } bool mustRehashInPlace() const { return m_keyCount * m_minLoad < m_tableSize * 2; } bool shouldShrink() const { return m_keyCount * m_minLoad < m_tableSize && m_tableSize > m_minTableSize; } void expand(); void shrink() { rehash(m_tableSize / 2); } void rehash(int newTableSize); void reinsert(ValueType&); static void initializeBucket(ValueType& bucket) { new (&bucket) ValueType(Traits::emptyValue()); } static void deleteBucket(ValueType& bucket) { assignDeleted(bucket); } FullLookupType makeLookupResult(ValueType* position, bool found, unsigned hash) { return FullLookupType(LookupType(position, found), hash); } iterator makeIterator(ValueType* pos) { return iterator(this, pos, m_table + m_tableSize); } const_iterator makeConstIterator(ValueType* pos) const { return const_iterator(this, pos, m_table + m_tableSize); } #if CHECK_HASHTABLE_CONSISTENCY void checkTableConsistency() const; void checkTableConsistencyExceptSize() const; #else static void checkTableConsistency() { } static void checkTableConsistencyExceptSize() { } #endif #if CHECK_HASHTABLE_ITERATORS void invalidateIterators(); #else static void invalidateIterators() { } #endif static const int m_minTableSize = 64; static const int m_maxLoad = 2; static const int m_minLoad = 6; ValueType* m_table; int m_tableSize; int m_tableSizeMask; int m_keyCount; int m_deletedCount; #if CHECK_HASHTABLE_ITERATORS public: mutable const_iterator* m_iterators; #endif }; template inline HashTable::HashTable() : m_table(0) , m_tableSize(0) , m_tableSizeMask(0) , m_keyCount(0) , m_deletedCount(0) #if CHECK_HASHTABLE_ITERATORS , m_iterators(0) #endif { } template template inline typename HashTable::FullLookupType HashTable::lookup(const T& key) { assert(m_table); unsigned h = HashTranslator::hash(key); int sizeMask = m_tableSizeMask; int i = h & sizeMask; int k = 0; #if DUMP_HASHTABLE_STATS ++HashTableStats::numAccesses; int probeCount = 0; #endif ValueType *table = m_table; ValueType *entry; ValueType *deletedEntry = 0; while (!isEmptyBucket(*(entry = table + i))) { if (isDeletedBucket(*entry)) deletedEntry = entry; else if (HashTranslator::equal(Extractor::extract(*entry), key)) return makeLookupResult(entry, true, h); #if DUMP_HASHTABLE_STATS ++probeCount; HashTableStats::recordCollisionAtCount(probeCount); #endif if (k == 0) k = 1 | (h % sizeMask); i = (i + k) & sizeMask; } return makeLookupResult(deletedEntry ? deletedEntry : entry, false, h); } template template inline pair::iterator, bool> HashTable::add(const T& key, const Extra &extra) { invalidateIterators(); if (!m_table) expand(); checkTableConsistency(); FullLookupType lookupResult = lookup(key); ValueType *entry = lookupResult.first.first; bool found = lookupResult.first.second; unsigned h = lookupResult.second; if (found) return std::make_pair(makeIterator(entry), false); if (isDeletedBucket(*entry)) --m_deletedCount; HashTranslator::translate(*entry, key, extra, h); ++m_keyCount; if (shouldExpand()) { // FIXME: this makes an extra copy on expand. Probably not that bad since // expand is rare, but would be better to have a version of expand that can // follow a pivot entry and return the new position KeyType enteredKey = Extractor::extract(*entry); expand(); return std::make_pair(find(enteredKey), true); } checkTableConsistency(); return std::make_pair(makeIterator(entry), true); } template inline void HashTable::reinsert(ValueType& entry) { assert(m_table); assert(!lookup(Extractor::extract(entry)).second); assert(!isDeletedBucket(*(lookup(Extractor::extract(entry)).first))); #if DUMP_HASHTABLE_STATS ++HashTableStats::numReinserts; #endif Mover::move(entry, *(lookup(Extractor::extract(entry)).first)); } template template typename HashTable::iterator HashTable::find(const T& key) { if (!m_table) return end(); LookupType result = lookup(key).first; if (!result.second) return end(); return makeIterator(result.first); } template template typename HashTable::const_iterator HashTable::find(const T& key) const { if (!m_table) return end(); LookupType result = const_cast(this)->lookup(key).first; if (!result.second) return end(); return makeConstIterator(result.first); } template template bool HashTable::contains(const T& key) const { if (!m_table) return false; return const_cast(this)->lookup(key).first.second; } template void HashTable::remove(ValueType* pos) { invalidateIterators(); checkTableConsistency(); #if DUMP_HASHTABLE_STATS ++HashTableStats::numRemoves; #endif deleteBucket(*pos); ++m_deletedCount; --m_keyCount; if (shouldShrink()) shrink(); checkTableConsistency(); } template inline void HashTable::remove(iterator it) { if (it == end()) return; remove(const_cast(it.m_iterator.m_position)); } template inline void HashTable::remove(const KeyType& key) { remove(find(key)); } template Value *HashTable::allocateTable(int size) { // would use a template member function with explicit specializations here, but // gcc doesn't appear to support that if (Traits::emptyValueIsZero) return static_cast(fastCalloc(size, sizeof(ValueType))); ValueType* result = static_cast(fastMalloc(size * sizeof(ValueType))); for (int i = 0; i < size; i++) initializeBucket(result[i]); return result; } template void HashTable::deallocateTable(ValueType *table, int size) { if (Traits::needsDestruction) for (int i = 0; i < size; ++i) table[i].~ValueType(); fastFree(table); } template void HashTable::expand() { int newSize; if (m_tableSize == 0) newSize = m_minTableSize; else if (mustRehashInPlace()) newSize = m_tableSize; else newSize = m_tableSize * 2; rehash(newSize); } template void HashTable::rehash(int newTableSize) { checkTableConsistencyExceptSize(); int oldTableSize = m_tableSize; ValueType *oldTable = m_table; #if DUMP_HASHTABLE_STATS if (oldTableSize != 0) ++HashTableStats::numRehashes; #endif m_tableSize = newTableSize; m_tableSizeMask = newTableSize - 1; m_table = allocateTable(newTableSize); for (int i = 0; i != oldTableSize; ++i) if (!isEmptyOrDeletedBucket(oldTable[i])) reinsert(oldTable[i]); m_deletedCount = 0; deallocateTable(oldTable, oldTableSize); checkTableConsistency(); } template void HashTable::clear() { invalidateIterators(); deallocateTable(m_table, m_tableSize); m_table = 0; m_tableSize = 0; m_tableSizeMask = 0; m_keyCount = 0; } template HashTable::HashTable(const HashTable& other) : m_table(0) , m_tableSize(0) , m_tableSizeMask(0) , m_keyCount(0) , m_deletedCount(0) #if CHECK_HASHTABLE_ITERATORS , m_iterators(0) #endif { // Copy the hash table the dumb way, by adding each element to the new table. // It might be more efficient to copy the table slots, but it's not clear that efficiency is needed. const_iterator end = other.end(); for (const_iterator it = other.begin(); it != end; ++it) add(*it); } template void HashTable::swap(HashTable& other) { invalidateIterators(); other.invalidateIterators(); ValueType *tmp_table = m_table; m_table = other.m_table; other.m_table = tmp_table; int tmp_tableSize = m_tableSize; m_tableSize = other.m_tableSize; other.m_tableSize = tmp_tableSize; int tmp_tableSizeMask = m_tableSizeMask; m_tableSizeMask = other.m_tableSizeMask; other.m_tableSizeMask = tmp_tableSizeMask; int tmp_keyCount = m_keyCount; m_keyCount = other.m_keyCount; other.m_keyCount = tmp_keyCount; int tmp_deletedCount = m_deletedCount; m_deletedCount = other.m_deletedCount; other.m_deletedCount = tmp_deletedCount; } template HashTable& HashTable::operator=(const HashTable& other) { HashTable tmp(other); swap(tmp); return *this; } #if CHECK_HASHTABLE_CONSISTENCY template void HashTable::checkTableConsistency() const { checkTableConsistencyExceptSize(); assert(!shouldExpand()); assert(!shouldShrink()); } template void HashTable::checkTableConsistencyExceptSize() const { if (!m_table) return; int count = 0; int deletedCount = 0; for (int j = 0; j < m_tableSize; ++j) { ValueType *entry = m_table + j; if (isEmptyBucket(*entry)) continue; if (isDeletedBucket(*entry)) { ++deletedCount; continue; } const_iterator it = find(Extractor::extract(*entry)); assert(entry == it.m_position); ++count; } assert(count == m_keyCount); assert(deletedCount == m_deletedCount); assert(m_tableSize >= m_minTableSize); assert(m_tableSizeMask); assert(m_tableSize == m_tableSizeMask + 1); } #endif // CHECK_HASHTABLE_CONSISTENCY #if CHECK_HASHTABLE_ITERATORS template void HashTable::invalidateIterators() { const_iterator* next; for (const_iterator* p = m_iterators; p; p = next) { next = p->m_next; p->m_table = 0; p->m_next = 0; p->m_previous = 0; } m_iterators = 0; } template void addIterator(const HashTable* table, HashTableConstIterator* it) { it->m_table = table; it->m_previous = 0; // Insert iterator at head of doubly-linked list of iterators. if (!table) { it->m_next = 0; } else { assert(table->m_iterators != it); it->m_next = table->m_iterators; table->m_iterators = it; if (it->m_next) { assert(!it->m_next->m_previous); it->m_next->m_previous = it; } } } template void removeIterator(HashTableConstIterator* it) { typedef HashTable HashTableType; typedef HashTableConstIterator const_iterator; // Delete iterator from doubly-linked list of iterators. if (!it->m_table) { assert(!it->m_next); assert(!it->m_previous); } else { if (it->m_next) { assert(it->m_next->m_previous == it); it->m_next->m_previous = it->m_previous; } if (it->m_previous) { assert(it->m_table->m_iterators != it); assert(it->m_previous->m_next == it); it->m_previous->m_next = it->m_next; } else { assert(it->m_table->m_iterators == it); it->m_table->m_iterators = it->m_next; } } it->m_table = 0; it->m_next = 0; it->m_previous = 0; } #endif // CHECK_HASHTABLE_ITERATORS // iterator adapters template struct HashTableConstIteratorAdapter { HashTableConstIteratorAdapter(const typename HashTableType::const_iterator& impl) : m_impl(impl) {} const ValueType* get() const { return (const ValueType*)m_impl.get(); } const ValueType& operator*() const { return *get(); } const ValueType* operator->() const { return get(); } HashTableConstIteratorAdapter& operator++() { ++m_impl; return *this; } // postfix ++ intentionally omitted typename HashTableType::const_iterator m_impl; }; template struct HashTableIteratorAdapter { HashTableIteratorAdapter(const typename HashTableType::iterator& impl) : m_impl(impl) {} ValueType* get() const { return (ValueType*)m_impl.get(); } ValueType& operator*() const { return *get(); } ValueType* operator->() const { return get(); } HashTableIteratorAdapter& operator++() { ++m_impl; return *this; } // postfix ++ intentionally omitted operator HashTableConstIteratorAdapter() { typename HashTableType::const_iterator i = m_impl; return i; } typename HashTableType::iterator m_impl; }; template inline bool operator==(const HashTableConstIteratorAdapter& a, const HashTableConstIteratorAdapter& b) { return a.m_impl == b.m_impl; } template inline bool operator!=(const HashTableConstIteratorAdapter& a, const HashTableConstIteratorAdapter& b) { return a.m_impl != b.m_impl; } template inline bool operator==(const HashTableIteratorAdapter& a, const HashTableIteratorAdapter& b) { return a.m_impl == b.m_impl; } template inline bool operator!=(const HashTableIteratorAdapter& a, const HashTableIteratorAdapter& b) { return a.m_impl != b.m_impl; } // reference count manager template struct NeedsRef { static const bool value = ValueTraits::needsRef && !ValueStorageTraits::needsRef; }; template struct NeedsRef, ValueStorageTraits> { typedef typename ValueStorageTraits::FirstTraits FirstStorageTraits; typedef typename ValueStorageTraits::SecondTraits SecondStorageTraits; static const bool firstNeedsRef = NeedsRef::value; static const bool secondNeedsRef = NeedsRef::value; static const bool value = firstNeedsRef || secondNeedsRef; }; template struct RefCounterBase; template struct RefCounterBase { typedef typename ValueStorageTraits::TraitType ValueStorageType; static void ref(const ValueStorageType&) { } static void deref(const ValueStorageType&) { } }; template struct RefCounterBase { typedef typename ValueStorageTraits::TraitType ValueStorageType; static void ref(const ValueStorageType& v) { ValueTraits::ref(v); } static void deref(const ValueStorageType& v) { ValueTraits::deref(v); } }; template struct RefCounter { typedef typename ValueTraits::TraitType ValueType; typedef typename ValueStorageTraits::TraitType ValueStorageType; static const bool needsRef = NeedsRef::value; typedef RefCounterBase Base; static void ref(const ValueStorageType& v) { Base::ref(v); } static void deref(const ValueStorageType& v) { Base::deref(v); } }; template struct RefCounter, ValueStorageTraits> { typedef typename FirstTraits::TraitType FirstType; typedef typename SecondTraits::TraitType SecondType; typedef typename ValueStorageTraits::FirstTraits FirstStorageTraits; typedef typename ValueStorageTraits::SecondTraits SecondStorageTraits; typedef typename ValueStorageTraits::TraitType ValueStorageType; static const bool firstNeedsRef = NeedsRef::value; static const bool secondNeedsRef = NeedsRef::value; typedef RefCounterBase FirstBase; typedef RefCounterBase SecondBase; static void ref(const ValueStorageType& v) { FirstBase::ref(v.first); SecondBase::ref(v.second); } static void deref(const ValueStorageType& v) { FirstBase::deref(v.first); SecondBase::deref(v.second); } }; template struct HashTableRefCounterBase; template struct HashTableRefCounterBase { static void refAll(HashTableType&) { } static void derefAll(HashTableType&) { } }; template struct HashTableRefCounterBase { typedef typename HashTableType::iterator iterator; typedef RefCounter ValueRefCounter; static void refAll(HashTableType&); static void derefAll(HashTableType&); }; template void HashTableRefCounterBase::refAll(HashTableType& table) { iterator end = table.end(); for (iterator it = table.begin(); it != end; ++it) ValueRefCounter::ref(*it); } template void HashTableRefCounterBase::derefAll(HashTableType& table) { iterator end = table.end(); for (iterator it = table.begin(); it != end; ++it) ValueRefCounter::deref(*it); } template struct HashTableRefCounter { static const bool needsRef = NeedsRef::value; typedef HashTableRefCounterBase Base; static void refAll(HashTableType& table) { Base::refAll(table); } static void derefAll(HashTableType& table) { Base::derefAll(table); } }; // helper template for HashMap and HashSet. template struct Assigner; template struct Assigner { typedef union { FromType m_from; ToType m_to; } UnionType; static void assign(const FromType& from, ToType& to) { reinterpret_cast(&to)->m_from = from; } }; template struct Assigner { static void assign(const FromType& from, ToType& to) { ToType oldTo = to; memcpy(&to, &from, sizeof(FromType)); FromTraits::ref(to); FromTraits::deref(oldTo); } }; template struct Assigner { static void assign(const FromType& from, FromType& to) { to = from; } }; template struct Assigner { static void assign(const FromType& from, FromType& to) { to = from; } }; } // namespace WTF #endif // WTF_HashTable_h