include/mcld/ADT/HashBase.tcc - platform/frameworks/compile/mclinker - Git at Google

 //===- HashBase.tcc -------------------------------------------------------===//
 //
 //                     The MCLinker Project
 //
 // This file is distributed under the University of Illinois Open Source
 // License. See LICENSE.TXT for details.
 //
 //===----------------------------------------------------------------------===//

 //===----------------------------------------------------------------------===//
 // internal non-member functions
 //===----------------------------------------------------------------------===//
 inline static unsigned int compute_bucket_count(unsigned int pNumOfBuckets) {
   static const unsigned int bucket_size[] = {
       1,     3,     17,    37,    67,    97,     197,
       419,   977,   2593,  4099,  8209,  12289,  16411,
       20483, 32771, 49157, 65537, 98317, 131101, 196613};

   const unsigned int buckets_count =
       sizeof(bucket_size) / sizeof(bucket_size[0]);
   unsigned int idx = 0;
   do {
     if (pNumOfBuckets < bucket_size[idx]) {
       return bucket_size[idx];
     }
     ++idx;
   } while (idx < buckets_count);

   return (pNumOfBuckets + 131101);  // rare case. increase constantly
 }

 //===----------------------------------------------------------------------===//
 // template implementation of HashBucket
 //===----------------------------------------------------------------------===//
 template <typename DataType>
 typename HashBucket<DataType>::entry_type*
 HashBucket<DataType>::getEmptyBucket() {
   static entry_type* empty_bucket = reinterpret_cast<entry_type*>(0x0);
   return empty_bucket;
 }

 template <typename DataType>
 typename HashBucket<DataType>::entry_type*
 HashBucket<DataType>::getTombstone() {
   static entry_type* tombstone = reinterpret_cast<entry_type*>(0x1);
   return tombstone;
 }

 //===----------------------------------------------------------------------===//
 // template implementation of HashTableImpl
 //===----------------------------------------------------------------------===//
 template <typename HashEntryTy, typename HashFunctionTy>
 HashTableImpl<HashEntryTy, HashFunctionTy>::HashTableImpl()
     : m_Buckets(0),
       m_NumOfBuckets(0),
       m_NumOfEntries(0),
       m_NumOfTombstones(0),
       m_Hasher() {
 }

 template <typename HashEntryTy, typename HashFunctionTy>
 HashTableImpl<HashEntryTy, HashFunctionTy>::HashTableImpl(
     unsigned int pInitSize)
     : m_Hasher() {
   if (pInitSize) {
     init(pInitSize);
     return;
   }

   m_Buckets = 0;
   m_NumOfBuckets = 0;
   m_NumOfEntries = 0;
   m_NumOfTombstones = 0;
 }

 template <typename HashEntryTy, typename HashFunctionTy>
 HashTableImpl<HashEntryTy, HashFunctionTy>::~HashTableImpl() {
   clear();
 }

 /// empty - check if the hash table is empty
 template <typename HashEntryTy, typename HashFunctionTy>
 bool HashTableImpl<HashEntryTy, HashFunctionTy>::empty() const {
   return (m_NumOfEntries == 0);
 }

 /// init - initialize the hash table.
 template <typename HashEntryTy, typename HashFunctionTy>
 void HashTableImpl<HashEntryTy, HashFunctionTy>::init(unsigned int pInitSize) {
   m_NumOfBuckets =
       pInitSize ? compute_bucket_count(pInitSize) : NumOfInitBuckets;

   m_NumOfEntries = 0;
   m_NumOfTombstones = 0;

   /** calloc also set bucket.Item = bucket_type::getEmptyStone() **/
   m_Buckets = (bucket_type*)calloc(m_NumOfBuckets, sizeof(bucket_type));
 }

 /// clear - clear the hash table.
 template <typename HashEntryTy, typename HashFunctionTy>
 void HashTableImpl<HashEntryTy, HashFunctionTy>::clear() {
   free(m_Buckets);

   m_Buckets = 0;
   m_NumOfBuckets = 0;
   m_NumOfEntries = 0;
   m_NumOfTombstones = 0;
 }

 /// lookUpBucketFor - look up the bucket whose key is pKey
 template <typename HashEntryTy, typename HashFunctionTy>
 unsigned int HashTableImpl<HashEntryTy, HashFunctionTy>::lookUpBucketFor(
     const typename HashTableImpl<HashEntryTy, HashFunctionTy>::key_type& pKey) {
   if (m_NumOfBuckets == 0) {
     // NumOfBuckets is changed after init(pInitSize)
     init(NumOfInitBuckets);
   }

   unsigned int full_hash = m_Hasher(pKey);
   unsigned int index = full_hash % m_NumOfBuckets;

   const unsigned int probe = 1;
   int firstTombstone = -1;

   // linear probing
   while (true) {
     bucket_type& bucket = m_Buckets[index];
     // If we found an empty bucket, this key isn't in the table yet, return it.
     if (bucket_type::getEmptyBucket() == bucket.Entry) {
       if (firstTombstone != -1) {
         m_Buckets[firstTombstone].FullHashValue = full_hash;
         return firstTombstone;
       }

       bucket.FullHashValue = full_hash;
       return index;
     }

     if (bucket_type::getTombstone() == bucket.Entry) {
       if (firstTombstone == -1) {
         firstTombstone = index;
       }
     } else if (bucket.FullHashValue == full_hash) {
       if (bucket.Entry->compare(pKey)) {
         return index;
       }
     }

     index += probe;
     if (index == m_NumOfBuckets)
       index = 0;
   }
 }

 template <typename HashEntryTy, typename HashFunctionTy>
 int HashTableImpl<HashEntryTy, HashFunctionTy>::findKey(
     const typename HashTableImpl<HashEntryTy, HashFunctionTy>::key_type& pKey)
     const {
   if (m_NumOfBuckets == 0)
     return -1;

   unsigned int full_hash = m_Hasher(pKey);
   unsigned int index = full_hash % m_NumOfBuckets;

   const unsigned int probe = 1;
   // linear probing
   while (true) {
     bucket_type& bucket = m_Buckets[index];

     if (bucket_type::getEmptyBucket() == bucket.Entry)
       return -1;

     if (bucket_type::getTombstone() == bucket.Entry) {
       // Ignore tombstones.
     } else if (full_hash == bucket.FullHashValue) {
       // get string, compare, if match, return index
       if (bucket.Entry->compare(pKey))
         return index;
     }
     index += probe;
     if (index == m_NumOfBuckets)
       index = 0;
   }
 }

 template <typename HashEntryTy, typename HashFunctionTy>
 void HashTableImpl<HashEntryTy, HashFunctionTy>::mayRehash() {
   unsigned int new_size;
   // If the hash table is now more than 3/4 full, or if fewer than 1/8 of
   // the buckets are empty (meaning that many are filled with tombstones),
   // grow/rehash the table.
   if ((m_NumOfEntries << 2) > m_NumOfBuckets * 3)
     new_size = compute_bucket_count(m_NumOfBuckets);
   else if (((m_NumOfBuckets - (m_NumOfEntries + m_NumOfTombstones)) << 3) <
            m_NumOfBuckets)
     new_size = m_NumOfBuckets;
   else
     return;

   doRehash(new_size);
 }

 template <typename HashEntryTy, typename HashFunctionTy>
 void HashTableImpl<HashEntryTy, HashFunctionTy>::doRehash(
     unsigned int pNewSize) {
   bucket_type* new_table = (bucket_type*)calloc(pNewSize, sizeof(bucket_type));

   // Rehash all the items into their new buckets.  Luckily :) we already have
   // the hash values available, so we don't have to recall hash function again.
   for (bucket_type* IB = m_Buckets, * E = m_Buckets + m_NumOfBuckets; IB != E;
        ++IB) {
     if (IB->Entry != bucket_type::getEmptyBucket() &&
         IB->Entry != bucket_type::getTombstone()) {
       // Fast case, bucket available.
       unsigned full_hash = IB->FullHashValue;
       unsigned new_bucket = full_hash % pNewSize;
       if (bucket_type::getEmptyBucket() == new_table[new_bucket].Entry) {
         new_table[new_bucket].Entry = IB->Entry;
         new_table[new_bucket].FullHashValue = full_hash;
         continue;
       }

       // Otherwise probe for a spot.
       const unsigned int probe = 1;
       do {
         new_bucket += probe;
         if (new_bucket == pNewSize)
           new_bucket = 0;
       } while (new_table[new_bucket].Entry != bucket_type::getEmptyBucket());

       // Finally found a slot.  Fill it in.
       new_table[new_bucket].Entry = IB->Entry;
       new_table[new_bucket].FullHashValue = full_hash;
     }
   }

   free(m_Buckets);

   m_Buckets = new_table;
   m_NumOfBuckets = pNewSize;
   m_NumOfTombstones = 0;
 }
	//===- HashBase.tcc -------------------------------------------------------===//
	//
	// The MCLinker Project
	//
	// This file is distributed under the University of Illinois Open Source
	// License. See LICENSE.TXT for details.
	//
	//===----------------------------------------------------------------------===//

	//===----------------------------------------------------------------------===//
	// internal non-member functions
	//===----------------------------------------------------------------------===//
	inline static unsigned int compute_bucket_count(unsigned int pNumOfBuckets) {
	static const unsigned int bucket_size[] = {
	1, 3, 17, 37, 67, 97, 197,
	419, 977, 2593, 4099, 8209, 12289, 16411,
	20483, 32771, 49157, 65537, 98317, 131101, 196613};

	const unsigned int buckets_count =
	sizeof(bucket_size) / sizeof(bucket_size[0]);
	unsigned int idx = 0;
	do {
	if (pNumOfBuckets < bucket_size[idx]) {
	return bucket_size[idx];
	}
	++idx;
	} while (idx < buckets_count);

	return (pNumOfBuckets + 131101); // rare case. increase constantly
	}

	//===----------------------------------------------------------------------===//
	// template implementation of HashBucket
	//===----------------------------------------------------------------------===//
	template <typename DataType>
	typename HashBucket<DataType>::entry_type*
	HashBucket<DataType>::getEmptyBucket() {
	static entry_type* empty_bucket = reinterpret_cast<entry_type*>(0x0);
	return empty_bucket;
	}

	template <typename DataType>
	typename HashBucket<DataType>::entry_type*
	HashBucket<DataType>::getTombstone() {
	static entry_type* tombstone = reinterpret_cast<entry_type*>(0x1);
	return tombstone;
	}

	//===----------------------------------------------------------------------===//
	// template implementation of HashTableImpl
	//===----------------------------------------------------------------------===//
	template <typename HashEntryTy, typename HashFunctionTy>
	HashTableImpl<HashEntryTy, HashFunctionTy>::HashTableImpl()
	: m_Buckets(0),
	m_NumOfBuckets(0),
	m_NumOfEntries(0),
	m_NumOfTombstones(0),
	m_Hasher() {
	}

	template <typename HashEntryTy, typename HashFunctionTy>
	HashTableImpl<HashEntryTy, HashFunctionTy>::HashTableImpl(
	unsigned int pInitSize)
	: m_Hasher() {
	if (pInitSize) {
	init(pInitSize);
	return;
	}

	m_Buckets = 0;
	m_NumOfBuckets = 0;
	m_NumOfEntries = 0;
	m_NumOfTombstones = 0;
	}

	template <typename HashEntryTy, typename HashFunctionTy>
	HashTableImpl<HashEntryTy, HashFunctionTy>::~HashTableImpl() {
	clear();
	}

	/// empty - check if the hash table is empty
	template <typename HashEntryTy, typename HashFunctionTy>
	bool HashTableImpl<HashEntryTy, HashFunctionTy>::empty() const {
	return (m_NumOfEntries == 0);
	}

	/// init - initialize the hash table.
	template <typename HashEntryTy, typename HashFunctionTy>
	void HashTableImpl<HashEntryTy, HashFunctionTy>::init(unsigned int pInitSize) {
	m_NumOfBuckets =
	pInitSize ? compute_bucket_count(pInitSize) : NumOfInitBuckets;

	m_NumOfEntries = 0;
	m_NumOfTombstones = 0;

	/ calloc also set bucket.Item = bucket_type::getEmptyStone() /
	m_Buckets = (bucket_type*)calloc(m_NumOfBuckets, sizeof(bucket_type));
	}

	/// clear - clear the hash table.
	template <typename HashEntryTy, typename HashFunctionTy>
	void HashTableImpl<HashEntryTy, HashFunctionTy>::clear() {
	free(m_Buckets);

	m_Buckets = 0;
	m_NumOfBuckets = 0;
	m_NumOfEntries = 0;
	m_NumOfTombstones = 0;
	}

	/// lookUpBucketFor - look up the bucket whose key is pKey
	template <typename HashEntryTy, typename HashFunctionTy>
	unsigned int HashTableImpl<HashEntryTy, HashFunctionTy>::lookUpBucketFor(
	const typename HashTableImpl<HashEntryTy, HashFunctionTy>::key_type& pKey) {
	if (m_NumOfBuckets == 0) {
	// NumOfBuckets is changed after init(pInitSize)
	init(NumOfInitBuckets);
	}

	unsigned int full_hash = m_Hasher(pKey);
	unsigned int index = full_hash % m_NumOfBuckets;

	const unsigned int probe = 1;
	int firstTombstone = -1;

	// linear probing
	while (true) {
	bucket_type& bucket = m_Buckets[index];
	// If we found an empty bucket, this key isn't in the table yet, return it.
	if (bucket_type::getEmptyBucket() == bucket.Entry) {
	if (firstTombstone != -1) {
	m_Buckets[firstTombstone].FullHashValue = full_hash;
	return firstTombstone;
	}

	bucket.FullHashValue = full_hash;
	return index;
	}

	if (bucket_type::getTombstone() == bucket.Entry) {
	if (firstTombstone == -1) {
	firstTombstone = index;
	}
	} else if (bucket.FullHashValue == full_hash) {
	if (bucket.Entry->compare(pKey)) {
	return index;
	}
	}

	index += probe;
	if (index == m_NumOfBuckets)
	index = 0;
	}
	}

	template <typename HashEntryTy, typename HashFunctionTy>
	int HashTableImpl<HashEntryTy, HashFunctionTy>::findKey(
	const typename HashTableImpl<HashEntryTy, HashFunctionTy>::key_type& pKey)
	const {
	if (m_NumOfBuckets == 0)
	return -1;

	unsigned int full_hash = m_Hasher(pKey);
	unsigned int index = full_hash % m_NumOfBuckets;

	const unsigned int probe = 1;
	// linear probing
	while (true) {
	bucket_type& bucket = m_Buckets[index];

	if (bucket_type::getEmptyBucket() == bucket.Entry)
	return -1;

	if (bucket_type::getTombstone() == bucket.Entry) {
	// Ignore tombstones.
	} else if (full_hash == bucket.FullHashValue) {
	// get string, compare, if match, return index
	if (bucket.Entry->compare(pKey))
	return index;
	}
	index += probe;
	if (index == m_NumOfBuckets)
	index = 0;
	}
	}

	template <typename HashEntryTy, typename HashFunctionTy>
	void HashTableImpl<HashEntryTy, HashFunctionTy>::mayRehash() {
	unsigned int new_size;
	// If the hash table is now more than 3/4 full, or if fewer than 1/8 of
	// the buckets are empty (meaning that many are filled with tombstones),
	// grow/rehash the table.
	if ((m_NumOfEntries << 2) > m_NumOfBuckets * 3)
	new_size = compute_bucket_count(m_NumOfBuckets);
	else if (((m_NumOfBuckets - (m_NumOfEntries + m_NumOfTombstones)) << 3) <
	m_NumOfBuckets)
	new_size = m_NumOfBuckets;
	else
	return;

	doRehash(new_size);
	}

	template <typename HashEntryTy, typename HashFunctionTy>
	void HashTableImpl<HashEntryTy, HashFunctionTy>::doRehash(
	unsigned int pNewSize) {
	bucket_type* new_table = (bucket_type*)calloc(pNewSize, sizeof(bucket_type));

	// Rehash all the items into their new buckets. Luckily :) we already have
	// the hash values available, so we don't have to recall hash function again.
	for (bucket_type* IB = m_Buckets, * E = m_Buckets + m_NumOfBuckets; IB != E;
	++IB) {
	if (IB->Entry != bucket_type::getEmptyBucket() &&
	IB->Entry != bucket_type::getTombstone()) {
	// Fast case, bucket available.
	unsigned full_hash = IB->FullHashValue;
	unsigned new_bucket = full_hash % pNewSize;
	if (bucket_type::getEmptyBucket() == new_table[new_bucket].Entry) {
	new_table[new_bucket].Entry = IB->Entry;
	new_table[new_bucket].FullHashValue = full_hash;
	continue;
	}

	// Otherwise probe for a spot.
	const unsigned int probe = 1;
	do {
	new_bucket += probe;
	if (new_bucket == pNewSize)
	new_bucket = 0;
	} while (new_table[new_bucket].Entry != bucket_type::getEmptyBucket());

	// Finally found a slot. Fill it in.
	new_table[new_bucket].Entry = IB->Entry;
	new_table[new_bucket].FullHashValue = full_hash;
	}
	}

	free(m_Buckets);

	m_Buckets = new_table;
	m_NumOfBuckets = pNewSize;
	m_NumOfTombstones = 0;
	}