mirror of
https://github.com/pocoproject/poco.git
synced 2024-12-15 03:21:09 +01:00
420 lines
10 KiB
C
420 lines
10 KiB
C
|
//
|
||
|
// SimpleHashTable.h
|
||
|
//
|
||
|
// $Id: //poco/1.4/Foundation/include/Poco/SimpleHashTable.h#1 $
|
||
|
//
|
||
|
// Library: Foundation
|
||
|
// Package: Hashing
|
||
|
// Module: SimpleHashTable
|
||
|
//
|
||
|
// Definition of the SimpleHashTable class.
|
||
|
//
|
||
|
// Copyright (c) 2006, Applied Informatics Software Engineering GmbH.
|
||
|
// and Contributors.
|
||
|
//
|
||
|
// Permission is hereby granted, free of charge, to any person or organization
|
||
|
// obtaining a copy of the software and accompanying documentation covered by
|
||
|
// this license (the "Software") to use, reproduce, display, distribute,
|
||
|
// execute, and transmit the Software, and to prepare derivative works of the
|
||
|
// Software, and to permit third-parties to whom the Software is furnished to
|
||
|
// do so, all subject to the following:
|
||
|
//
|
||
|
// The copyright notices in the Software and this entire statement, including
|
||
|
// the above license grant, this restriction and the following disclaimer,
|
||
|
// must be included in all copies of the Software, in whole or in part, and
|
||
|
// all derivative works of the Software, unless such copies or derivative
|
||
|
// works are solely in the form of machine-executable object code generated by
|
||
|
// a source language processor.
|
||
|
//
|
||
|
// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
||
|
// IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
||
|
// FITNESS FOR A PARTICULAR PURPOSE, TITLE AND NON-INFRINGEMENT. IN NO EVENT
|
||
|
// SHALL THE COPYRIGHT HOLDERS OR ANYONE DISTRIBUTING THE SOFTWARE BE LIABLE
|
||
|
// FOR ANY DAMAGES OR OTHER LIABILITY, WHETHER IN CONTRACT, TORT OR OTHERWISE,
|
||
|
// ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
|
||
|
// DEALINGS IN THE SOFTWARE.
|
||
|
//
|
||
|
|
||
|
|
||
|
#ifndef Foundation_SimpleHashTable_INCLUDED
|
||
|
#define Foundation_SimpleHashTable_INCLUDED
|
||
|
|
||
|
|
||
|
#include "Poco/Foundation.h"
|
||
|
#include "Poco/Exception.h"
|
||
|
#include "Poco/HashFunction.h"
|
||
|
#include "Poco/HashStatistic.h"
|
||
|
#include <vector>
|
||
|
#include <map>
|
||
|
#include <cstddef>
|
||
|
#include <algorithm>
|
||
|
|
||
|
|
||
|
namespace Poco {
|
||
|
|
||
|
|
||
|
//@ deprecated
|
||
|
template <class Key, class Value, class KeyHashFunction = HashFunction<Key> >
|
||
|
class SimpleHashTable
|
||
|
/// A SimpleHashTable stores a key value pair that can be looked up via a hashed key.
|
||
|
///
|
||
|
/// In comparision to a HashTable, this class handles collisions by sequentially searching the next
|
||
|
/// free location. This also means that the maximum size of this table is limited, i.e. if the hash table
|
||
|
/// is full, it will throw an exception and that this class does not support remove operations.
|
||
|
/// On the plus side it is faster than the HashTable.
|
||
|
///
|
||
|
/// This class is NOT thread safe.
|
||
|
{
|
||
|
public:
|
||
|
class HashEntry
|
||
|
{
|
||
|
public:
|
||
|
Key key;
|
||
|
Value value;
|
||
|
HashEntry(const Key k, const Value v): key(k), value(v)
|
||
|
{
|
||
|
}
|
||
|
};
|
||
|
|
||
|
typedef std::vector<HashEntry*> HashTableVector;
|
||
|
|
||
|
SimpleHashTable(UInt32 capacity = 251): _entries(capacity, 0), _size(0), _capacity(capacity)
|
||
|
/// Creates the SimpleHashTable.
|
||
|
{
|
||
|
}
|
||
|
|
||
|
SimpleHashTable(const SimpleHashTable& ht):
|
||
|
_size(ht._size),
|
||
|
_capacity(ht._capacity)
|
||
|
{
|
||
|
_entries.reserve(ht._capacity);
|
||
|
for (typename HashTableVector::iterator it = ht._entries.begin(); it != ht._entries.end(); ++it)
|
||
|
{
|
||
|
if (*it)
|
||
|
_entries.push_back(new HashEntry(*it));
|
||
|
else
|
||
|
_entries.push_back(0);
|
||
|
}
|
||
|
}
|
||
|
|
||
|
~SimpleHashTable()
|
||
|
/// Destroys the SimpleHashTable.
|
||
|
{
|
||
|
clear();
|
||
|
}
|
||
|
|
||
|
SimpleHashTable& operator = (const SimpleHashTable& ht)
|
||
|
{
|
||
|
if (this != &ht)
|
||
|
{
|
||
|
SimpleHashTable tmp(ht);
|
||
|
swap(tmp);
|
||
|
}
|
||
|
return *this;
|
||
|
}
|
||
|
|
||
|
void swap(SimpleHashTable& ht)
|
||
|
{
|
||
|
using std::swap;
|
||
|
swap(_entries, ht._entries);
|
||
|
swap(_size, ht._size);
|
||
|
swap(_capacity, ht._capacity);
|
||
|
}
|
||
|
|
||
|
void clear()
|
||
|
{
|
||
|
for (typename HashTableVector::iterator it = _entries.begin(); it != _entries.end(); ++it)
|
||
|
{
|
||
|
delete *it;
|
||
|
*it = 0;
|
||
|
}
|
||
|
_size = 0;
|
||
|
}
|
||
|
|
||
|
UInt32 insert(const Key& key, const Value& value)
|
||
|
/// Returns the hash value of the inserted item.
|
||
|
/// Throws an exception if the entry was already inserted
|
||
|
{
|
||
|
UInt32 hsh = hash(key);
|
||
|
insertRaw(key, hsh, value);
|
||
|
return hsh;
|
||
|
}
|
||
|
|
||
|
Value& insertRaw(const Key& key, UInt32 hsh, const Value& value)
|
||
|
/// Returns the hash value of the inserted item.
|
||
|
/// Throws an exception if the entry was already inserted
|
||
|
{
|
||
|
UInt32 pos = hsh;
|
||
|
if (!_entries[pos])
|
||
|
_entries[pos] = new HashEntry(key, value);
|
||
|
else
|
||
|
{
|
||
|
UInt32 origHash = hsh;
|
||
|
while (_entries[hsh % _capacity])
|
||
|
{
|
||
|
if (_entries[hsh % _capacity]->key == key)
|
||
|
throw ExistsException();
|
||
|
if (hsh - origHash > _capacity)
|
||
|
throw PoolOverflowException("SimpleHashTable full");
|
||
|
hsh++;
|
||
|
}
|
||
|
pos = hsh % _capacity;
|
||
|
_entries[pos] = new HashEntry(key, value);
|
||
|
}
|
||
|
_size++;
|
||
|
return _entries[pos]->value;
|
||
|
}
|
||
|
|
||
|
UInt32 update(const Key& key, const Value& value)
|
||
|
/// Returns the hash value of the inserted item.
|
||
|
/// Replaces an existing entry if it finds one
|
||
|
{
|
||
|
UInt32 hsh = hash(key);
|
||
|
updateRaw(key, hsh, value);
|
||
|
return hsh;
|
||
|
}
|
||
|
|
||
|
void updateRaw(const Key& key, UInt32 hsh, const Value& value)
|
||
|
/// Returns the hash value of the inserted item.
|
||
|
/// Replaces an existing entry if it finds one
|
||
|
{
|
||
|
if (!_entries[hsh])
|
||
|
_entries[hsh] = new HashEntry(key, value);
|
||
|
else
|
||
|
{
|
||
|
UInt32 origHash = hsh;
|
||
|
while (_entries[hsh % _capacity])
|
||
|
{
|
||
|
if (_entries[hsh % _capacity]->key == key)
|
||
|
{
|
||
|
_entries[hsh % _capacity]->value = value;
|
||
|
return;
|
||
|
}
|
||
|
if (hsh - origHash > _capacity)
|
||
|
throw PoolOverflowException("SimpleHashTable full");
|
||
|
hsh++;
|
||
|
}
|
||
|
_entries[hsh % _capacity] = new HashEntry(key, value);
|
||
|
}
|
||
|
_size++;
|
||
|
}
|
||
|
|
||
|
UInt32 hash(const Key& key) const
|
||
|
{
|
||
|
return _hash(key, _capacity);
|
||
|
}
|
||
|
|
||
|
const Value& get(const Key& key) const
|
||
|
/// Throws an exception if the value does not exist
|
||
|
{
|
||
|
UInt32 hsh = hash(key);
|
||
|
return getRaw(key, hsh);
|
||
|
}
|
||
|
|
||
|
const Value& getRaw(const Key& key, UInt32 hsh) const
|
||
|
/// Throws an exception if the value does not exist
|
||
|
{
|
||
|
UInt32 origHash = hsh;
|
||
|
while (true)
|
||
|
{
|
||
|
if (_entries[hsh % _capacity])
|
||
|
{
|
||
|
if (_entries[hsh % _capacity]->key == key)
|
||
|
{
|
||
|
return _entries[hsh % _capacity]->value;
|
||
|
}
|
||
|
}
|
||
|
else
|
||
|
throw InvalidArgumentException("value not found");
|
||
|
if (hsh - origHash > _capacity)
|
||
|
throw InvalidArgumentException("value not found");
|
||
|
hsh++;
|
||
|
}
|
||
|
}
|
||
|
|
||
|
Value& get(const Key& key)
|
||
|
/// Throws an exception if the value does not exist
|
||
|
{
|
||
|
UInt32 hsh = hash(key);
|
||
|
return const_cast<Value&>(getRaw(key, hsh));
|
||
|
}
|
||
|
|
||
|
const Value& operator [] (const Key& key) const
|
||
|
{
|
||
|
return get(key);
|
||
|
}
|
||
|
|
||
|
Value& operator [] (const Key& key)
|
||
|
{
|
||
|
UInt32 hsh = hash(key);
|
||
|
UInt32 origHash = hsh;
|
||
|
while (true)
|
||
|
{
|
||
|
if (_entries[hsh % _capacity])
|
||
|
{
|
||
|
if (_entries[hsh % _capacity]->key == key)
|
||
|
{
|
||
|
return _entries[hsh % _capacity]->value;
|
||
|
}
|
||
|
}
|
||
|
else return insertRaw(key, hsh, Value());
|
||
|
if (hsh - origHash > _capacity)
|
||
|
return insertRaw(key, hsh, Value());
|
||
|
hsh++;
|
||
|
}
|
||
|
}
|
||
|
|
||
|
const Key& getKeyRaw(const Key& key, UInt32 hsh)
|
||
|
/// Throws an exception if the key does not exist. returns a reference to the internally
|
||
|
/// stored key. Useful when someone does an insert and wants for performance reason only to store
|
||
|
/// a pointer to the key in another collection
|
||
|
{
|
||
|
UInt32 origHash = hsh;
|
||
|
while (true)
|
||
|
{
|
||
|
if (_entries[hsh % _capacity])
|
||
|
{
|
||
|
if (_entries[hsh % _capacity]->key == key)
|
||
|
{
|
||
|
return _entries[hsh % _capacity]->key;
|
||
|
}
|
||
|
}
|
||
|
else
|
||
|
throw InvalidArgumentException("key not found");
|
||
|
|
||
|
if (hsh - origHash > _capacity)
|
||
|
throw InvalidArgumentException("key not found");
|
||
|
hsh++;
|
||
|
}
|
||
|
}
|
||
|
|
||
|
bool get(const Key& key, Value& v) const
|
||
|
/// Sets v to the found value, returns false if no value was found
|
||
|
{
|
||
|
UInt32 hsh = hash(key);
|
||
|
return getRaw(key, hsh, v);
|
||
|
}
|
||
|
|
||
|
bool getRaw(const Key& key, UInt32 hsh, Value& v) const
|
||
|
/// Sets v to the found value, returns false if no value was found
|
||
|
{
|
||
|
UInt32 origHash = hsh;
|
||
|
while (true)
|
||
|
{
|
||
|
if (_entries[hsh % _capacity])
|
||
|
{
|
||
|
if (_entries[hsh % _capacity]->key == key)
|
||
|
{
|
||
|
v = _entries[hsh % _capacity]->value;
|
||
|
return true;
|
||
|
}
|
||
|
}
|
||
|
else
|
||
|
return false;
|
||
|
if (hsh - origHash > _capacity)
|
||
|
return false;
|
||
|
hsh++;
|
||
|
}
|
||
|
}
|
||
|
|
||
|
bool exists(const Key& key) const
|
||
|
{
|
||
|
UInt32 hsh = hash(key);
|
||
|
return existsRaw(key, hsh);
|
||
|
}
|
||
|
|
||
|
bool existsRaw(const Key& key, UInt32 hsh) const
|
||
|
{
|
||
|
UInt32 origHash = hsh;
|
||
|
while (true)
|
||
|
{
|
||
|
if (_entries[hsh % _capacity])
|
||
|
{
|
||
|
if (_entries[hsh % _capacity]->key == key)
|
||
|
{
|
||
|
return true;
|
||
|
}
|
||
|
}
|
||
|
else
|
||
|
return false;
|
||
|
if (hsh - origHash > _capacity)
|
||
|
return false;
|
||
|
hsh++;
|
||
|
}
|
||
|
}
|
||
|
|
||
|
std::size_t size() const
|
||
|
/// Returns the number of elements already inserted into the SimpleHashTable
|
||
|
{
|
||
|
return _size;
|
||
|
}
|
||
|
|
||
|
UInt32 capacity() const
|
||
|
{
|
||
|
return _capacity;
|
||
|
}
|
||
|
|
||
|
void resize(UInt32 newSize)
|
||
|
/// Resizes the hashtable, rehashes all existing entries. Expensive!
|
||
|
{
|
||
|
if (_capacity != newSize)
|
||
|
{
|
||
|
SimpleHashTable tmp(newSize);
|
||
|
swap(tmp);
|
||
|
for (typename HashTableVector::const_iterator it = tmp._entries.begin(); it != tmp._entries.end(); ++it)
|
||
|
{
|
||
|
if (*it)
|
||
|
{
|
||
|
insertRaw((*it)->key, hash((*it)->key), (*it)->value);
|
||
|
}
|
||
|
}
|
||
|
}
|
||
|
}
|
||
|
|
||
|
HashStatistic currentState(bool details = false) const
|
||
|
/// Returns the current internal state
|
||
|
{
|
||
|
UInt32 numberOfEntries = (UInt32)_size;
|
||
|
UInt32 numZeroEntries = 0;
|
||
|
UInt32 maxEntriesPerHash = 0;
|
||
|
std::vector<UInt32> detailedEntriesPerHash;
|
||
|
#ifdef _DEBUG
|
||
|
UInt32 totalSize = 0;
|
||
|
#endif
|
||
|
for (int i=0; i < _capacity; ++i)
|
||
|
{
|
||
|
if (_entries[i])
|
||
|
{
|
||
|
maxEntriesPerHash = 1;
|
||
|
UInt32 size = 1;
|
||
|
if (details)
|
||
|
detailedEntriesPerHash.push_back(size);
|
||
|
#ifdef DEBUG
|
||
|
totalSize += size;
|
||
|
#endif
|
||
|
}
|
||
|
else
|
||
|
{
|
||
|
numZeroEntries++;
|
||
|
if (details)
|
||
|
detailedEntriesPerHash.push_back(0);
|
||
|
}
|
||
|
}
|
||
|
poco_assert_dbg(totalSize == numberOfEntries);
|
||
|
|
||
|
return HashStatistic(_capacity, numberOfEntries, numZeroEntries, maxEntriesPerHash, detailedEntriesPerHash);
|
||
|
}
|
||
|
|
||
|
private:
|
||
|
HashTableVector _entries;
|
||
|
std::size_t _size;
|
||
|
UInt32 _capacity;
|
||
|
KeyHashFunction _hash;
|
||
|
};
|
||
|
|
||
|
|
||
|
} // namespace Poco
|
||
|
|
||
|
|
||
|
#endif // Foundation_HashTable_INCLUDED
|