/*
 * Copyright (c) 2018-2020, Andreas Kling <kling@serenityos.org>
 * All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions are met:
 *
 * 1. Redistributions of source code must retain the above copyright notice, this
 *    list of conditions and the following disclaimer.
 *
 * 2. Redistributions in binary form must reproduce the above copyright notice,
 *    this list of conditions and the following disclaimer in the documentation
 *    and/or other materials provided with the distribution.
 *
 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
 * DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE
 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
 * SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
 * CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
 * OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 */
|
|
|
|
|
2018-10-10 11:53:07 +02:00
|
|
|
#pragma once
|
|
|
|
|
2019-06-27 16:36:31 +02:00
|
|
|
#include <AK/Assertions.h>
|
|
|
|
#include <AK/SinglyLinkedList.h>
|
|
|
|
#include <AK/StdLibExtras.h>
|
2019-07-31 10:12:45 +02:00
|
|
|
#include <AK/TemporaryChange.h>
|
2019-06-27 16:36:31 +02:00
|
|
|
#include <AK/Traits.h>
|
2018-10-10 11:53:07 +02:00
|
|
|
|
|
|
|
namespace AK {
|
|
|
|
|
2020-02-16 02:01:18 +01:00
|
|
|
template<typename T, typename>
|
2019-05-28 11:53:16 +02:00
|
|
|
class HashTable;
|
2018-10-10 11:53:07 +02:00
|
|
|
|
2019-06-27 15:57:49 +02:00
|
|
|
template<typename HashTableType, typename ElementType, typename BucketIteratorType>
|
|
|
|
class HashTableIterator {
|
|
|
|
public:
|
|
|
|
bool operator!=(const HashTableIterator& other) const
|
|
|
|
{
|
|
|
|
if (m_is_end && other.m_is_end)
|
|
|
|
return false;
|
|
|
|
return &m_table != &other.m_table
|
|
|
|
|| m_is_end != other.m_is_end
|
|
|
|
|| m_bucket_index != other.m_bucket_index
|
|
|
|
|| m_bucket_iterator != other.m_bucket_iterator;
|
|
|
|
}
|
|
|
|
bool operator==(const HashTableIterator& other) const { return !(*this != other); }
|
|
|
|
ElementType& operator*() { return *m_bucket_iterator; }
|
|
|
|
ElementType* operator->() { return m_bucket_iterator.operator->(); }
|
|
|
|
HashTableIterator& operator++()
|
|
|
|
{
|
|
|
|
skip_to_next();
|
|
|
|
return *this;
|
|
|
|
}
|
|
|
|
|
|
|
|
void skip_to_next()
|
|
|
|
{
|
|
|
|
while (!m_is_end) {
|
|
|
|
if (m_bucket_iterator.is_end()) {
|
|
|
|
++m_bucket_index;
|
|
|
|
if (m_bucket_index >= m_table.capacity()) {
|
|
|
|
m_is_end = true;
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
m_bucket_iterator = m_table.bucket(m_bucket_index).begin();
|
|
|
|
} else {
|
|
|
|
++m_bucket_iterator;
|
|
|
|
}
|
|
|
|
if (!m_bucket_iterator.is_end())
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
private:
|
|
|
|
friend HashTableType;
|
|
|
|
|
2020-02-26 23:49:58 +11:00
|
|
|
explicit HashTableIterator(HashTableType& table, bool is_end, BucketIteratorType bucket_iterator = {}, size_t bucket_index = 0)
|
2019-06-27 15:57:49 +02:00
|
|
|
: m_table(table)
|
|
|
|
, m_bucket_index(bucket_index)
|
|
|
|
, m_is_end(is_end)
|
|
|
|
, m_bucket_iterator(bucket_iterator)
|
|
|
|
{
|
2019-07-31 10:12:45 +02:00
|
|
|
ASSERT(!table.m_clearing);
|
|
|
|
ASSERT(!table.m_rehashing);
|
2020-02-26 23:49:58 +11:00
|
|
|
if (!is_end && !m_table.is_empty() && m_bucket_iterator.is_end()) {
|
2019-06-27 15:57:49 +02:00
|
|
|
m_bucket_iterator = m_table.bucket(0).begin();
|
|
|
|
if (m_bucket_iterator.is_end())
|
|
|
|
skip_to_next();
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
HashTableType& m_table;
|
2020-02-24 09:42:52 +01:00
|
|
|
size_t m_bucket_index { 0 };
|
2019-06-27 15:57:49 +02:00
|
|
|
bool m_is_end { false };
|
|
|
|
BucketIteratorType m_bucket_iterator;
|
|
|
|
};
|
|
|
|
|
2018-10-10 11:53:07 +02:00
|
|
|
template<typename T, typename TraitsForT>
|
|
|
|
class HashTable {
|
|
|
|
private:
|
2019-06-27 16:36:31 +02:00
|
|
|
using Bucket = SinglyLinkedList<T>;
|
2018-10-10 11:53:07 +02:00
|
|
|
|
|
|
|
public:
|
2019-05-28 11:53:16 +02:00
|
|
|
HashTable() {}
|
2019-06-24 11:57:54 +02:00
|
|
|
HashTable(const HashTable& other)
|
|
|
|
{
|
|
|
|
ensure_capacity(other.size());
|
|
|
|
for (auto& it : other)
|
|
|
|
set(it);
|
|
|
|
}
|
|
|
|
HashTable& operator=(const HashTable& other)
|
|
|
|
{
|
|
|
|
if (this != &other) {
|
|
|
|
clear();
|
|
|
|
ensure_capacity(other.size());
|
|
|
|
for (auto& it : other)
|
|
|
|
set(it);
|
|
|
|
}
|
|
|
|
return *this;
|
|
|
|
}
|
|
|
|
HashTable(HashTable&& other)
|
2018-10-10 11:53:07 +02:00
|
|
|
: m_buckets(other.m_buckets)
|
|
|
|
, m_size(other.m_size)
|
|
|
|
, m_capacity(other.m_capacity)
|
|
|
|
{
|
|
|
|
other.m_size = 0;
|
|
|
|
other.m_capacity = 0;
|
|
|
|
other.m_buckets = nullptr;
|
|
|
|
}
|
|
|
|
HashTable& operator=(HashTable&& other)
|
|
|
|
{
|
|
|
|
if (this != &other) {
|
2019-02-04 08:53:12 +01:00
|
|
|
clear();
|
2018-10-10 11:53:07 +02:00
|
|
|
m_buckets = other.m_buckets;
|
|
|
|
m_size = other.m_size;
|
|
|
|
m_capacity = other.m_capacity;
|
|
|
|
other.m_size = 0;
|
|
|
|
other.m_capacity = 0;
|
|
|
|
other.m_buckets = nullptr;
|
|
|
|
}
|
|
|
|
return *this;
|
|
|
|
}
|
|
|
|
|
|
|
|
~HashTable() { clear(); }
|
2018-12-21 02:10:45 +01:00
|
|
|
bool is_empty() const { return !m_size; }
|
2020-02-24 09:42:52 +01:00
|
|
|
size_t size() const { return m_size; }
|
|
|
|
size_t capacity() const { return m_capacity; }
|
2018-10-10 11:53:07 +02:00
|
|
|
|
2020-02-24 09:42:52 +01:00
|
|
|
void ensure_capacity(size_t capacity)
|
2019-05-27 13:07:20 +02:00
|
|
|
{
|
|
|
|
ASSERT(capacity >= size());
|
|
|
|
rehash(capacity);
|
|
|
|
}
|
|
|
|
|
2018-11-07 01:38:51 +01:00
|
|
|
void set(const T&);
|
2018-10-10 11:53:07 +02:00
|
|
|
void set(T&&);
|
|
|
|
bool contains(const T&) const;
|
|
|
|
void clear();
|
|
|
|
|
2019-08-04 19:20:20 +02:00
|
|
|
using Iterator = HashTableIterator<HashTable, T, typename Bucket::Iterator>;
|
2019-06-27 15:57:49 +02:00
|
|
|
friend Iterator;
|
2018-12-21 02:10:45 +01:00
|
|
|
Iterator begin() { return Iterator(*this, is_empty()); }
|
2018-10-10 11:53:07 +02:00
|
|
|
Iterator end() { return Iterator(*this, true); }
|
|
|
|
|
2019-08-04 19:20:20 +02:00
|
|
|
using ConstIterator = HashTableIterator<const HashTable, const T, typename Bucket::ConstIterator>;
|
2019-06-27 15:57:49 +02:00
|
|
|
friend ConstIterator;
|
2018-12-21 02:10:45 +01:00
|
|
|
ConstIterator begin() const { return ConstIterator(*this, is_empty()); }
|
2018-10-10 11:53:07 +02:00
|
|
|
ConstIterator end() const { return ConstIterator(*this, true); }
|
|
|
|
|
2019-06-29 21:09:40 +02:00
|
|
|
template<typename Finder>
|
|
|
|
Iterator find(unsigned hash, Finder finder)
|
|
|
|
{
|
|
|
|
if (is_empty())
|
|
|
|
return end();
|
2020-02-24 09:42:52 +01:00
|
|
|
size_t bucket_index;
|
2019-06-29 21:09:40 +02:00
|
|
|
auto& bucket = lookup_with_hash(hash, &bucket_index);
|
|
|
|
auto bucket_iterator = bucket.find(finder);
|
|
|
|
if (bucket_iterator != bucket.end())
|
|
|
|
return Iterator(*this, false, bucket_iterator, bucket_index);
|
|
|
|
return end();
|
|
|
|
}
|
|
|
|
|
|
|
|
template<typename Finder>
|
|
|
|
ConstIterator find(unsigned hash, Finder finder) const
|
|
|
|
{
|
|
|
|
if (is_empty())
|
|
|
|
return end();
|
2020-02-24 09:42:52 +01:00
|
|
|
size_t bucket_index;
|
2019-06-29 21:09:40 +02:00
|
|
|
auto& bucket = lookup_with_hash(hash, &bucket_index);
|
|
|
|
auto bucket_iterator = bucket.find(finder);
|
|
|
|
if (bucket_iterator != bucket.end())
|
|
|
|
return ConstIterator(*this, false, bucket_iterator, bucket_index);
|
|
|
|
return end();
|
|
|
|
}
|
|
|
|
|
|
|
|
Iterator find(const T& value)
|
|
|
|
{
|
|
|
|
return find(TraitsForT::hash(value), [&](auto& other) { return TraitsForT::equals(value, other); });
|
|
|
|
}
|
|
|
|
|
|
|
|
ConstIterator find(const T& value) const
|
|
|
|
{
|
|
|
|
return find(TraitsForT::hash(value), [&](auto& other) { return TraitsForT::equals(value, other); });
|
|
|
|
}
|
2018-10-10 11:53:07 +02:00
|
|
|
|
2018-10-13 14:22:09 +02:00
|
|
|
void remove(const T& value)
|
|
|
|
{
|
|
|
|
auto it = find(value);
|
|
|
|
if (it != end())
|
|
|
|
remove(it);
|
|
|
|
}
|
|
|
|
|
2018-10-25 12:35:49 +02:00
|
|
|
void remove(Iterator);
|
2018-10-13 14:22:09 +02:00
|
|
|
|
2018-10-10 11:53:07 +02:00
|
|
|
private:
|
2020-02-24 09:42:52 +01:00
|
|
|
Bucket& lookup(const T&, size_t* bucket_index = nullptr);
|
|
|
|
const Bucket& lookup(const T&, size_t* bucket_index = nullptr) const;
|
2019-06-29 21:09:40 +02:00
|
|
|
|
2020-02-24 09:42:52 +01:00
|
|
|
Bucket& lookup_with_hash(unsigned hash, size_t* bucket_index)
|
2019-06-29 21:09:40 +02:00
|
|
|
{
|
|
|
|
if (bucket_index)
|
|
|
|
*bucket_index = hash % m_capacity;
|
|
|
|
return m_buckets[hash % m_capacity];
|
|
|
|
}
|
|
|
|
|
2020-02-24 09:42:52 +01:00
|
|
|
const Bucket& lookup_with_hash(unsigned hash, size_t* bucket_index) const
|
2019-06-29 21:09:40 +02:00
|
|
|
{
|
|
|
|
if (bucket_index)
|
|
|
|
*bucket_index = hash % m_capacity;
|
|
|
|
return m_buckets[hash % m_capacity];
|
|
|
|
}
|
|
|
|
|
2020-02-24 09:42:52 +01:00
|
|
|
void rehash(size_t capacity);
|
2018-11-07 01:38:51 +01:00
|
|
|
void insert(const T&);
|
2018-10-10 11:53:07 +02:00
|
|
|
void insert(T&&);
|
|
|
|
|
2020-02-24 09:42:52 +01:00
|
|
|
Bucket& bucket(size_t index) { return m_buckets[index]; }
|
|
|
|
const Bucket& bucket(size_t index) const { return m_buckets[index]; }
|
2019-06-27 15:57:49 +02:00
|
|
|
|
2018-10-10 11:53:07 +02:00
|
|
|
Bucket* m_buckets { nullptr };
|
|
|
|
|
2020-02-24 09:42:52 +01:00
|
|
|
size_t m_size { 0 };
|
|
|
|
size_t m_capacity { 0 };
|
2019-07-31 10:12:45 +02:00
|
|
|
bool m_clearing { false };
|
|
|
|
bool m_rehashing { false };
|
2018-10-10 11:53:07 +02:00
|
|
|
};
|
|
|
|
|
|
|
|
template<typename T, typename TraitsForT>
|
|
|
|
void HashTable<T, TraitsForT>::set(T&& value)
|
|
|
|
{
|
|
|
|
if (!m_capacity)
|
|
|
|
rehash(1);
|
|
|
|
auto& bucket = lookup(value);
|
2019-06-27 15:57:49 +02:00
|
|
|
for (auto& e : bucket) {
|
2019-06-29 19:14:03 +02:00
|
|
|
if (TraitsForT::equals(e, value)) {
|
2019-03-25 04:23:17 +01:00
|
|
|
e = move(value);
|
2018-10-10 11:53:07 +02:00
|
|
|
return;
|
2019-03-25 04:23:17 +01:00
|
|
|
}
|
2018-10-10 11:53:07 +02:00
|
|
|
}
|
|
|
|
if (size() >= capacity()) {
|
|
|
|
rehash(size() + 1);
|
2018-10-17 10:55:43 +02:00
|
|
|
insert(move(value));
|
2018-10-10 11:53:07 +02:00
|
|
|
} else {
|
2019-06-27 15:57:49 +02:00
|
|
|
bucket.append(move(value));
|
2018-10-10 11:53:07 +02:00
|
|
|
}
|
|
|
|
m_size++;
|
|
|
|
}
|
|
|
|
|
2018-11-07 01:38:51 +01:00
|
|
|
template<typename T, typename TraitsForT>
|
|
|
|
void HashTable<T, TraitsForT>::set(const T& value)
|
|
|
|
{
|
|
|
|
if (!m_capacity)
|
|
|
|
rehash(1);
|
|
|
|
auto& bucket = lookup(value);
|
2019-06-27 15:57:49 +02:00
|
|
|
for (auto& e : bucket) {
|
2019-06-29 19:14:03 +02:00
|
|
|
if (TraitsForT::equals(e, value)) {
|
2019-06-29 12:02:52 +02:00
|
|
|
e = value;
|
2018-11-07 01:38:51 +01:00
|
|
|
return;
|
2019-03-25 04:23:17 +01:00
|
|
|
}
|
2018-11-07 01:38:51 +01:00
|
|
|
}
|
|
|
|
if (size() >= capacity()) {
|
|
|
|
rehash(size() + 1);
|
|
|
|
insert(value);
|
|
|
|
} else {
|
2019-06-27 15:57:49 +02:00
|
|
|
bucket.append(value);
|
2018-11-07 01:38:51 +01:00
|
|
|
}
|
|
|
|
m_size++;
|
|
|
|
}
|
|
|
|
|
2018-10-10 11:53:07 +02:00
|
|
|
template<typename T, typename TraitsForT>
|
2020-02-24 09:42:52 +01:00
|
|
|
void HashTable<T, TraitsForT>::rehash(size_t new_capacity)
|
2018-10-10 11:53:07 +02:00
|
|
|
{
|
2019-08-25 17:47:32 +02:00
|
|
|
TemporaryChange<bool> change(m_rehashing, true);
|
2019-01-19 22:53:05 +01:00
|
|
|
new_capacity *= 2;
|
|
|
|
auto* new_buckets = new Bucket[new_capacity];
|
|
|
|
auto* old_buckets = m_buckets;
|
2020-02-24 09:42:52 +01:00
|
|
|
size_t old_capacity = m_capacity;
|
2019-01-19 22:53:05 +01:00
|
|
|
m_buckets = new_buckets;
|
|
|
|
m_capacity = new_capacity;
|
2018-10-10 11:53:07 +02:00
|
|
|
|
2020-02-24 09:42:52 +01:00
|
|
|
for (size_t i = 0; i < old_capacity; ++i) {
|
2019-06-27 15:57:49 +02:00
|
|
|
for (auto& value : old_buckets[i]) {
|
2018-10-17 10:55:43 +02:00
|
|
|
insert(move(value));
|
2018-10-10 11:53:07 +02:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2019-05-28 11:53:16 +02:00
|
|
|
delete[] old_buckets;
|
2018-10-10 11:53:07 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
template<typename T, typename TraitsForT>
|
|
|
|
void HashTable<T, TraitsForT>::clear()
|
|
|
|
{
|
2019-08-25 17:47:32 +02:00
|
|
|
TemporaryChange<bool> change(m_clearing, true);
|
2019-01-30 19:32:54 +01:00
|
|
|
if (m_buckets) {
|
2019-05-28 11:53:16 +02:00
|
|
|
delete[] m_buckets;
|
2019-01-30 19:32:54 +01:00
|
|
|
m_buckets = nullptr;
|
|
|
|
}
|
2018-10-10 11:53:07 +02:00
|
|
|
m_capacity = 0;
|
|
|
|
m_size = 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
template<typename T, typename TraitsForT>
|
|
|
|
void HashTable<T, TraitsForT>::insert(T&& value)
|
|
|
|
{
|
|
|
|
auto& bucket = lookup(value);
|
2019-06-27 15:57:49 +02:00
|
|
|
bucket.append(move(value));
|
2018-10-10 11:53:07 +02:00
|
|
|
}
|
|
|
|
|
2018-11-07 01:38:51 +01:00
|
|
|
template<typename T, typename TraitsForT>
|
|
|
|
void HashTable<T, TraitsForT>::insert(const T& value)
|
|
|
|
{
|
|
|
|
auto& bucket = lookup(value);
|
2019-06-27 15:57:49 +02:00
|
|
|
bucket.append(value);
|
2018-11-07 01:38:51 +01:00
|
|
|
}
|
|
|
|
|
2018-10-10 11:53:07 +02:00
|
|
|
template<typename T, typename TraitsForT>
|
|
|
|
bool HashTable<T, TraitsForT>::contains(const T& value) const
|
|
|
|
{
|
2018-12-21 02:10:45 +01:00
|
|
|
if (is_empty())
|
2018-10-10 11:53:07 +02:00
|
|
|
return false;
|
|
|
|
auto& bucket = lookup(value);
|
2019-06-27 15:57:49 +02:00
|
|
|
for (auto& e : bucket) {
|
2019-06-29 19:14:03 +02:00
|
|
|
if (TraitsForT::equals(e, value))
|
2018-10-10 11:53:07 +02:00
|
|
|
return true;
|
|
|
|
}
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
2018-10-13 14:22:09 +02:00
|
|
|
template<typename T, typename TraitsForT>
|
2018-10-25 12:35:49 +02:00
|
|
|
void HashTable<T, TraitsForT>::remove(Iterator it)
|
2018-10-13 14:22:09 +02:00
|
|
|
{
|
2018-12-21 02:10:45 +01:00
|
|
|
ASSERT(!is_empty());
|
2019-06-27 15:57:49 +02:00
|
|
|
m_buckets[it.m_bucket_index].remove(it.m_bucket_iterator);
|
2018-10-13 14:22:09 +02:00
|
|
|
--m_size;
|
|
|
|
}
|
|
|
|
|
2018-10-10 11:53:07 +02:00
|
|
|
template<typename T, typename TraitsForT>
|
2020-02-24 09:42:52 +01:00
|
|
|
auto HashTable<T, TraitsForT>::lookup(const T& value, size_t* bucket_index) -> Bucket&
|
2018-10-10 11:53:07 +02:00
|
|
|
{
|
|
|
|
unsigned hash = TraitsForT::hash(value);
|
2019-01-19 22:53:05 +01:00
|
|
|
if (bucket_index)
|
|
|
|
*bucket_index = hash % m_capacity;
|
2018-10-10 11:53:07 +02:00
|
|
|
return m_buckets[hash % m_capacity];
|
|
|
|
}
|
|
|
|
|
|
|
|
template<typename T, typename TraitsForT>
|
2020-02-24 09:42:52 +01:00
|
|
|
auto HashTable<T, TraitsForT>::lookup(const T& value, size_t* bucket_index) const -> const Bucket&
|
2018-10-10 11:53:07 +02:00
|
|
|
{
|
|
|
|
unsigned hash = TraitsForT::hash(value);
|
2019-01-19 22:53:05 +01:00
|
|
|
if (bucket_index)
|
|
|
|
*bucket_index = hash % m_capacity;
|
2018-10-10 11:53:07 +02:00
|
|
|
return m_buckets[hash % m_capacity];
|
|
|
|
}
|
|
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
using AK::HashTable;
|