2020-01-18 08:38:21 +00:00
|
|
|
/*
|
|
|
|
* Copyright (c) 2018-2020, Andreas Kling <kling@serenityos.org>
|
|
|
|
*
|
2021-04-22 08:24:48 +00:00
|
|
|
* SPDX-License-Identifier: BSD-2-Clause
|
2020-01-18 08:38:21 +00:00
|
|
|
*/
|
|
|
|
|
2018-10-10 09:53:07 +00:00
|
|
|
#pragma once
|
|
|
|
|
2021-11-07 13:52:20 +00:00
|
|
|
#include <AK/Concepts.h>
|
2021-11-10 22:00:21 +00:00
|
|
|
#include <AK/Error.h>
|
2021-06-13 14:26:08 +00:00
|
|
|
#include <AK/Forward.h>
|
2020-10-15 21:34:07 +00:00
|
|
|
#include <AK/HashFunctions.h>
|
2019-06-27 14:36:31 +00:00
|
|
|
#include <AK/StdLibExtras.h>
|
2021-09-15 22:00:33 +00:00
|
|
|
#include <AK/Traits.h>
|
2020-10-15 21:34:07 +00:00
|
|
|
#include <AK/Types.h>
|
|
|
|
#include <AK/kmalloc.h>
|
2018-10-10 09:53:07 +00:00
|
|
|
|
|
|
|
namespace AK {
|
|
|
|
|
2020-07-06 21:44:33 +00:00
|
|
|
enum class HashSetResult {
|
|
|
|
InsertedNewEntry,
|
2021-06-08 20:42:07 +00:00
|
|
|
ReplacedExistingEntry,
|
|
|
|
KeptExistingEntry
|
|
|
|
};
|
|
|
|
|
|
|
|
enum class HashSetExistingEntryBehavior {
|
|
|
|
Keep,
|
|
|
|
Replace
|
2020-07-06 21:44:33 +00:00
|
|
|
};
|
|
|
|
|
2022-03-07 14:10:10 +00:00
|
|
|
// FIXME: Choose specific values so that we can do bit-based checks for various classes of state.
|
|
|
|
enum class BucketState : u8 {
|
|
|
|
Free = 0,
|
|
|
|
Used,
|
|
|
|
Deleted,
|
|
|
|
Rehashed,
|
|
|
|
End,
|
|
|
|
};
|
|
|
|
|
2020-10-15 21:34:07 +00:00
|
|
|
template<typename HashTableType, typename T, typename BucketType>
|
2019-06-27 13:57:49 +00:00
|
|
|
class HashTableIterator {
|
2020-10-15 21:34:07 +00:00
|
|
|
friend HashTableType;
|
|
|
|
|
2019-06-27 13:57:49 +00:00
|
|
|
public:
|
2020-10-15 21:34:07 +00:00
|
|
|
bool operator==(const HashTableIterator& other) const { return m_bucket == other.m_bucket; }
|
|
|
|
bool operator!=(const HashTableIterator& other) const { return m_bucket != other.m_bucket; }
|
|
|
|
T& operator*() { return *m_bucket->slot(); }
|
|
|
|
T* operator->() { return m_bucket->slot(); }
|
|
|
|
void operator++() { skip_to_next(); }
|
2019-06-27 13:57:49 +00:00
|
|
|
|
2020-10-15 21:34:07 +00:00
|
|
|
private:
|
2019-06-27 13:57:49 +00:00
|
|
|
void skip_to_next()
|
|
|
|
{
|
2020-10-15 21:34:07 +00:00
|
|
|
if (!m_bucket)
|
|
|
|
return;
|
|
|
|
do {
|
|
|
|
++m_bucket;
|
2022-03-07 14:10:10 +00:00
|
|
|
if (m_bucket->state == BucketState::Used)
|
2019-06-27 13:57:49 +00:00
|
|
|
return;
|
2022-03-07 14:10:10 +00:00
|
|
|
} while (m_bucket->state != BucketState::End);
|
|
|
|
if (m_bucket->state == BucketState::End)
|
2020-10-15 21:34:07 +00:00
|
|
|
m_bucket = nullptr;
|
2019-06-27 13:57:49 +00:00
|
|
|
}
|
|
|
|
|
2020-10-15 21:34:07 +00:00
|
|
|
explicit HashTableIterator(BucketType* bucket)
|
|
|
|
: m_bucket(bucket)
|
2019-06-27 13:57:49 +00:00
|
|
|
{
|
|
|
|
}
|
|
|
|
|
2020-10-15 21:34:07 +00:00
|
|
|
BucketType* m_bucket { nullptr };
|
2019-06-27 13:57:49 +00:00
|
|
|
};
|
|
|
|
|
2021-06-13 14:26:08 +00:00
|
|
|
template<typename OrderedHashTableType, typename T, typename BucketType>
|
|
|
|
class OrderedHashTableIterator {
|
|
|
|
friend OrderedHashTableType;
|
|
|
|
|
|
|
|
public:
|
|
|
|
bool operator==(const OrderedHashTableIterator& other) const { return m_bucket == other.m_bucket; }
|
|
|
|
bool operator!=(const OrderedHashTableIterator& other) const { return m_bucket != other.m_bucket; }
|
|
|
|
T& operator*() { return *m_bucket->slot(); }
|
|
|
|
T* operator->() { return m_bucket->slot(); }
|
|
|
|
void operator++() { m_bucket = m_bucket->next; }
|
|
|
|
void operator--() { m_bucket = m_bucket->previous; }
|
|
|
|
|
|
|
|
private:
|
|
|
|
explicit OrderedHashTableIterator(BucketType* bucket)
|
|
|
|
: m_bucket(bucket)
|
|
|
|
{
|
|
|
|
}
|
|
|
|
|
|
|
|
BucketType* m_bucket { nullptr };
|
|
|
|
};
|
|
|
|
|
|
|
|
template<typename T, typename TraitsForT, bool IsOrdered>
|
2018-10-10 09:53:07 +00:00
|
|
|
class HashTable {
|
2020-10-16 06:32:35 +00:00
|
|
|
static constexpr size_t load_factor_in_percent = 60;
|
|
|
|
|
2020-10-15 21:34:07 +00:00
|
|
|
struct Bucket {
|
2022-03-07 14:10:10 +00:00
|
|
|
BucketState state;
|
2020-10-15 21:34:07 +00:00
|
|
|
alignas(T) u8 storage[sizeof(T)];
|
|
|
|
|
|
|
|
T* slot() { return reinterpret_cast<T*>(storage); }
|
|
|
|
const T* slot() const { return reinterpret_cast<const T*>(storage); }
|
|
|
|
};
|
2018-10-10 09:53:07 +00:00
|
|
|
|
2021-06-13 14:26:08 +00:00
|
|
|
struct OrderedBucket {
|
|
|
|
OrderedBucket* previous;
|
|
|
|
OrderedBucket* next;
|
2022-03-07 14:10:10 +00:00
|
|
|
BucketState state;
|
2021-06-13 14:26:08 +00:00
|
|
|
alignas(T) u8 storage[sizeof(T)];
|
|
|
|
T* slot() { return reinterpret_cast<T*>(storage); }
|
|
|
|
const T* slot() const { return reinterpret_cast<const T*>(storage); }
|
|
|
|
};
|
|
|
|
|
|
|
|
using BucketType = Conditional<IsOrdered, OrderedBucket, Bucket>;
|
|
|
|
|
|
|
|
struct CollectionData {
|
|
|
|
};
|
|
|
|
|
|
|
|
struct OrderedCollectionData {
|
|
|
|
BucketType* head { nullptr };
|
|
|
|
BucketType* tail { nullptr };
|
|
|
|
};
|
|
|
|
|
|
|
|
using CollectionDataType = Conditional<IsOrdered, OrderedCollectionData, CollectionData>;
|
|
|
|
|
2018-10-10 09:53:07 +00:00
|
|
|
public:
|
2021-01-10 23:29:28 +00:00
|
|
|
HashTable() = default;
|
2021-04-11 08:24:35 +00:00
|
|
|
explicit HashTable(size_t capacity) { rehash(capacity); }
|
2020-10-17 13:44:43 +00:00
|
|
|
|
|
|
|
~HashTable()
|
|
|
|
{
|
|
|
|
if (!m_buckets)
|
|
|
|
return;
|
|
|
|
|
|
|
|
for (size_t i = 0; i < m_capacity; ++i) {
|
2022-03-07 14:10:10 +00:00
|
|
|
if (m_buckets[i].state == BucketState::Used)
|
2020-10-17 13:44:43 +00:00
|
|
|
m_buckets[i].slot()->~T();
|
|
|
|
}
|
|
|
|
|
2021-07-11 11:22:58 +00:00
|
|
|
kfree_sized(m_buckets, size_in_bytes(m_capacity));
|
2020-10-17 13:44:43 +00:00
|
|
|
}
|
2020-10-15 21:34:07 +00:00
|
|
|
|
2019-06-24 09:57:54 +00:00
|
|
|
HashTable(const HashTable& other)
|
|
|
|
{
|
2020-10-15 21:34:07 +00:00
|
|
|
rehash(other.capacity());
|
2019-06-24 09:57:54 +00:00
|
|
|
for (auto& it : other)
|
|
|
|
set(it);
|
|
|
|
}
|
2020-10-15 21:34:07 +00:00
|
|
|
|
2019-06-24 09:57:54 +00:00
|
|
|
HashTable& operator=(const HashTable& other)
|
|
|
|
{
|
2020-10-17 13:08:09 +00:00
|
|
|
HashTable temporary(other);
|
|
|
|
swap(*this, temporary);
|
2019-06-24 09:57:54 +00:00
|
|
|
return *this;
|
|
|
|
}
|
2020-10-15 21:34:07 +00:00
|
|
|
|
2020-10-17 13:08:09 +00:00
|
|
|
HashTable(HashTable&& other) noexcept
|
2018-10-10 09:53:07 +00:00
|
|
|
: m_buckets(other.m_buckets)
|
2021-06-13 14:26:08 +00:00
|
|
|
, m_collection_data(other.m_collection_data)
|
2018-10-10 09:53:07 +00:00
|
|
|
, m_size(other.m_size)
|
|
|
|
, m_capacity(other.m_capacity)
|
2020-10-15 21:34:07 +00:00
|
|
|
, m_deleted_count(other.m_deleted_count)
|
2018-10-10 09:53:07 +00:00
|
|
|
{
|
|
|
|
other.m_size = 0;
|
|
|
|
other.m_capacity = 0;
|
2020-10-15 21:34:07 +00:00
|
|
|
other.m_deleted_count = 0;
|
2018-10-10 09:53:07 +00:00
|
|
|
other.m_buckets = nullptr;
|
2021-06-13 14:26:08 +00:00
|
|
|
if constexpr (IsOrdered)
|
|
|
|
other.m_collection_data = { nullptr, nullptr };
|
2018-10-10 09:53:07 +00:00
|
|
|
}
|
2020-10-15 21:34:07 +00:00
|
|
|
|
2020-10-17 13:08:09 +00:00
|
|
|
HashTable& operator=(HashTable&& other) noexcept
|
2018-10-10 09:53:07 +00:00
|
|
|
{
|
2021-05-30 12:23:23 +00:00
|
|
|
HashTable temporary { move(other) };
|
|
|
|
swap(*this, temporary);
|
2018-10-10 09:53:07 +00:00
|
|
|
return *this;
|
|
|
|
}
|
|
|
|
|
2020-10-17 12:44:59 +00:00
|
|
|
friend void swap(HashTable& a, HashTable& b) noexcept
|
|
|
|
{
|
|
|
|
swap(a.m_buckets, b.m_buckets);
|
|
|
|
swap(a.m_size, b.m_size);
|
|
|
|
swap(a.m_capacity, b.m_capacity);
|
|
|
|
swap(a.m_deleted_count, b.m_deleted_count);
|
2021-06-13 14:26:08 +00:00
|
|
|
|
|
|
|
if constexpr (IsOrdered)
|
|
|
|
swap(a.m_collection_data, b.m_collection_data);
|
2020-10-17 12:44:59 +00:00
|
|
|
}
|
|
|
|
|
2021-11-06 20:12:16 +00:00
|
|
|
[[nodiscard]] bool is_empty() const { return m_size == 0; }
|
2021-04-11 08:25:22 +00:00
|
|
|
[[nodiscard]] size_t size() const { return m_size; }
|
|
|
|
[[nodiscard]] size_t capacity() const { return m_capacity; }
|
2018-10-10 09:53:07 +00:00
|
|
|
|
2020-10-15 21:34:07 +00:00
|
|
|
template<typename U, size_t N>
|
2021-11-10 22:00:21 +00:00
|
|
|
ErrorOr<void> try_set_from(U (&from_array)[N])
|
2020-10-15 21:34:07 +00:00
|
|
|
{
|
2021-11-10 22:00:21 +00:00
|
|
|
for (size_t i = 0; i < N; ++i)
|
|
|
|
TRY(try_set(from_array[i]));
|
|
|
|
return {};
|
2021-08-14 00:07:39 +00:00
|
|
|
}
|
|
|
|
template<typename U, size_t N>
|
|
|
|
void set_from(U (&from_array)[N])
|
|
|
|
{
|
2021-11-10 22:00:21 +00:00
|
|
|
MUST(try_set_from(from_array));
|
2020-10-15 21:34:07 +00:00
|
|
|
}
|
|
|
|
|
2020-02-24 08:42:52 +00:00
|
|
|
void ensure_capacity(size_t capacity)
|
2019-05-27 11:07:20 +00:00
|
|
|
{
|
2021-02-23 19:42:32 +00:00
|
|
|
VERIFY(capacity >= size());
|
2020-10-15 21:34:07 +00:00
|
|
|
rehash(capacity * 2);
|
2019-05-27 11:07:20 +00:00
|
|
|
}
|
|
|
|
|
2022-01-25 00:31:20 +00:00
|
|
|
ErrorOr<void> try_ensure_capacity(size_t capacity)
|
|
|
|
{
|
|
|
|
VERIFY(capacity >= size());
|
|
|
|
return try_rehash(capacity * 2);
|
|
|
|
}
|
|
|
|
|
2021-07-21 16:18:29 +00:00
|
|
|
[[nodiscard]] bool contains(T const& value) const
|
2020-10-15 21:34:07 +00:00
|
|
|
{
|
|
|
|
return find(value) != end();
|
|
|
|
}
|
2020-08-16 09:04:00 +00:00
|
|
|
|
2021-11-07 13:52:20 +00:00
|
|
|
template<Concepts::HashCompatible<T> K>
|
|
|
|
requires(IsSame<TraitsForT, Traits<T>>) [[nodiscard]] bool contains(K const& value) const
|
|
|
|
{
|
|
|
|
return find(value) != end();
|
|
|
|
}
|
|
|
|
|
2021-06-13 14:26:08 +00:00
|
|
|
using Iterator = Conditional<IsOrdered,
|
|
|
|
OrderedHashTableIterator<HashTable, T, BucketType>,
|
|
|
|
HashTableIterator<HashTable, T, BucketType>>;
|
2020-10-15 21:34:07 +00:00
|
|
|
|
2021-07-21 16:18:29 +00:00
|
|
|
[[nodiscard]] Iterator begin()
|
2020-08-16 09:04:00 +00:00
|
|
|
{
|
2021-06-13 14:26:08 +00:00
|
|
|
if constexpr (IsOrdered)
|
|
|
|
return Iterator(m_collection_data.head);
|
|
|
|
|
2020-10-15 21:34:07 +00:00
|
|
|
for (size_t i = 0; i < m_capacity; ++i) {
|
2022-03-07 14:10:10 +00:00
|
|
|
if (m_buckets[i].state == BucketState::Used)
|
2020-10-15 21:34:07 +00:00
|
|
|
return Iterator(&m_buckets[i]);
|
2020-08-16 09:04:00 +00:00
|
|
|
}
|
2020-10-15 21:34:07 +00:00
|
|
|
return end();
|
2020-08-16 09:04:00 +00:00
|
|
|
}
|
|
|
|
|
2021-07-21 16:18:29 +00:00
|
|
|
[[nodiscard]] Iterator end()
|
2020-10-15 21:34:07 +00:00
|
|
|
{
|
|
|
|
return Iterator(nullptr);
|
|
|
|
}
|
2018-10-10 09:53:07 +00:00
|
|
|
|
2021-06-13 14:26:08 +00:00
|
|
|
using ConstIterator = Conditional<IsOrdered,
|
|
|
|
OrderedHashTableIterator<const HashTable, const T, const BucketType>,
|
|
|
|
HashTableIterator<const HashTable, const T, const BucketType>>;
|
2018-10-10 09:53:07 +00:00
|
|
|
|
2021-07-21 16:18:29 +00:00
|
|
|
[[nodiscard]] ConstIterator begin() const
|
2019-06-29 19:09:40 +00:00
|
|
|
{
|
2021-06-13 14:26:08 +00:00
|
|
|
if constexpr (IsOrdered)
|
|
|
|
return ConstIterator(m_collection_data.head);
|
|
|
|
|
2020-10-15 21:34:07 +00:00
|
|
|
for (size_t i = 0; i < m_capacity; ++i) {
|
2022-03-07 14:10:10 +00:00
|
|
|
if (m_buckets[i].state == BucketState::Used)
|
2020-10-15 21:34:07 +00:00
|
|
|
return ConstIterator(&m_buckets[i]);
|
|
|
|
}
|
2019-06-29 19:09:40 +00:00
|
|
|
return end();
|
|
|
|
}
|
|
|
|
|
2021-07-21 16:18:29 +00:00
|
|
|
[[nodiscard]] ConstIterator end() const
|
2020-10-15 21:34:07 +00:00
|
|
|
{
|
|
|
|
return ConstIterator(nullptr);
|
|
|
|
}
|
|
|
|
|
|
|
|
void clear()
|
|
|
|
{
|
2020-10-17 13:44:43 +00:00
|
|
|
*this = HashTable();
|
2020-10-15 21:34:07 +00:00
|
|
|
}
|
2021-09-20 21:43:52 +00:00
|
|
|
void clear_with_capacity()
|
|
|
|
{
|
|
|
|
if constexpr (!Detail::IsTriviallyDestructible<T>) {
|
|
|
|
for (auto* bucket : *this)
|
|
|
|
bucket->~T();
|
|
|
|
}
|
|
|
|
__builtin_memset(m_buckets, 0, size_in_bytes(capacity()));
|
|
|
|
m_size = 0;
|
|
|
|
m_deleted_count = 0;
|
|
|
|
|
|
|
|
if constexpr (IsOrdered)
|
|
|
|
m_collection_data = { nullptr, nullptr };
|
|
|
|
else
|
2022-03-07 14:10:10 +00:00
|
|
|
m_buckets[m_capacity].state = BucketState::End;
|
2021-09-20 21:43:52 +00:00
|
|
|
}
|
2020-10-15 21:34:07 +00:00
|
|
|
|
2021-01-15 22:59:55 +00:00
|
|
|
template<typename U = T>
|
2021-11-10 22:00:21 +00:00
|
|
|
ErrorOr<HashSetResult> try_set(U&& value, HashSetExistingEntryBehavior existing_entry_behavior = HashSetExistingEntryBehavior::Replace)
|
2020-10-15 21:34:07 +00:00
|
|
|
{
|
2021-11-10 22:00:21 +00:00
|
|
|
auto* bucket = TRY(try_lookup_for_writing(value));
|
2022-03-07 14:10:10 +00:00
|
|
|
if (bucket->state == BucketState::Used) {
|
2021-09-07 10:56:50 +00:00
|
|
|
if (existing_entry_behavior == HashSetExistingEntryBehavior::Keep)
|
2021-06-08 20:42:07 +00:00
|
|
|
return HashSetResult::KeptExistingEntry;
|
2021-08-14 00:07:39 +00:00
|
|
|
(*bucket->slot()) = forward<U>(value);
|
2020-10-15 21:34:07 +00:00
|
|
|
return HashSetResult::ReplacedExistingEntry;
|
|
|
|
}
|
|
|
|
|
2021-08-14 00:07:39 +00:00
|
|
|
new (bucket->slot()) T(forward<U>(value));
|
2022-03-07 14:10:10 +00:00
|
|
|
if (bucket->state == BucketState::Deleted)
|
2020-10-15 21:34:07 +00:00
|
|
|
--m_deleted_count;
|
2022-03-07 14:10:10 +00:00
|
|
|
bucket->state = BucketState::Used;
|
2021-06-13 14:26:08 +00:00
|
|
|
|
|
|
|
if constexpr (IsOrdered) {
|
|
|
|
if (!m_collection_data.head) [[unlikely]] {
|
2021-08-14 00:07:39 +00:00
|
|
|
m_collection_data.head = bucket;
|
2021-06-13 14:26:08 +00:00
|
|
|
} else {
|
2021-08-14 00:07:39 +00:00
|
|
|
bucket->previous = m_collection_data.tail;
|
|
|
|
m_collection_data.tail->next = bucket;
|
2021-06-13 14:26:08 +00:00
|
|
|
}
|
2021-08-14 00:07:39 +00:00
|
|
|
m_collection_data.tail = bucket;
|
2021-06-13 14:26:08 +00:00
|
|
|
}
|
|
|
|
|
2020-10-15 21:34:07 +00:00
|
|
|
++m_size;
|
|
|
|
return HashSetResult::InsertedNewEntry;
|
|
|
|
}
|
2021-08-14 00:07:39 +00:00
|
|
|
template<typename U = T>
|
|
|
|
HashSetResult set(U&& value, HashSetExistingEntryBehavior existing_entry_behaviour = HashSetExistingEntryBehavior::Replace)
|
|
|
|
{
|
2021-11-10 22:00:21 +00:00
|
|
|
return MUST(try_set(forward<U>(value), existing_entry_behaviour));
|
2021-08-14 00:07:39 +00:00
|
|
|
}
|
2020-10-15 21:34:07 +00:00
|
|
|
|
2021-07-12 21:23:08 +00:00
|
|
|
template<typename TUnaryPredicate>
|
2021-07-21 16:18:29 +00:00
|
|
|
[[nodiscard]] Iterator find(unsigned hash, TUnaryPredicate predicate)
|
2019-06-29 19:09:40 +00:00
|
|
|
{
|
2021-07-12 21:23:08 +00:00
|
|
|
return Iterator(lookup_with_hash(hash, move(predicate)));
|
2019-06-29 19:09:40 +00:00
|
|
|
}
|
|
|
|
|
2021-07-21 16:18:29 +00:00
|
|
|
[[nodiscard]] Iterator find(T const& value)
|
2019-06-29 19:09:40 +00:00
|
|
|
{
|
|
|
|
return find(TraitsForT::hash(value), [&](auto& other) { return TraitsForT::equals(value, other); });
|
|
|
|
}
|
|
|
|
|
2021-07-12 21:23:08 +00:00
|
|
|
template<typename TUnaryPredicate>
|
2021-07-21 16:18:29 +00:00
|
|
|
[[nodiscard]] ConstIterator find(unsigned hash, TUnaryPredicate predicate) const
|
2020-10-15 21:34:07 +00:00
|
|
|
{
|
2021-07-12 21:23:08 +00:00
|
|
|
return ConstIterator(lookup_with_hash(hash, move(predicate)));
|
2020-10-15 21:34:07 +00:00
|
|
|
}
|
|
|
|
|
2021-07-21 16:18:29 +00:00
|
|
|
[[nodiscard]] ConstIterator find(T const& value) const
|
2019-06-29 19:09:40 +00:00
|
|
|
{
|
|
|
|
return find(TraitsForT::hash(value), [&](auto& other) { return TraitsForT::equals(value, other); });
|
|
|
|
}
|
2021-11-07 13:52:20 +00:00
|
|
|
// FIXME: Support for predicates, while guaranteeing that the predicate call
|
|
|
|
// does not call a non trivial constructor each time invoked
|
|
|
|
template<Concepts::HashCompatible<T> K>
|
|
|
|
requires(IsSame<TraitsForT, Traits<T>>) [[nodiscard]] Iterator find(K const& value)
|
|
|
|
{
|
2022-01-29 18:01:35 +00:00
|
|
|
return find(Traits<K>::hash(value), [&](auto& other) { return Traits<T>::equals(other, value); });
|
2021-11-07 13:52:20 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
template<Concepts::HashCompatible<T> K, typename TUnaryPredicate>
|
|
|
|
requires(IsSame<TraitsForT, Traits<T>>) [[nodiscard]] Iterator find(K const& value, TUnaryPredicate predicate)
|
|
|
|
{
|
|
|
|
return find(Traits<K>::hash(value), move(predicate));
|
|
|
|
}
|
|
|
|
|
|
|
|
template<Concepts::HashCompatible<T> K>
|
|
|
|
requires(IsSame<TraitsForT, Traits<T>>) [[nodiscard]] ConstIterator find(K const& value) const
|
|
|
|
{
|
2022-01-29 18:01:35 +00:00
|
|
|
return find(Traits<K>::hash(value), [&](auto& other) { return Traits<T>::equals(other, value); });
|
2021-11-07 13:52:20 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
template<Concepts::HashCompatible<T> K, typename TUnaryPredicate>
|
|
|
|
requires(IsSame<TraitsForT, Traits<T>>) [[nodiscard]] ConstIterator find(K const& value, TUnaryPredicate predicate) const
|
|
|
|
{
|
|
|
|
return find(Traits<K>::hash(value), move(predicate));
|
|
|
|
}
|
2018-10-10 09:53:07 +00:00
|
|
|
|
2020-07-06 21:44:33 +00:00
|
|
|
bool remove(const T& value)
|
2018-10-13 12:22:09 +00:00
|
|
|
{
|
|
|
|
auto it = find(value);
|
2020-07-06 21:44:33 +00:00
|
|
|
if (it != end()) {
|
2018-10-13 12:22:09 +00:00
|
|
|
remove(it);
|
2020-07-06 21:44:33 +00:00
|
|
|
return true;
|
|
|
|
}
|
|
|
|
return false;
|
2018-10-13 12:22:09 +00:00
|
|
|
}
|
|
|
|
|
2021-12-15 14:18:30 +00:00
|
|
|
template<Concepts::HashCompatible<T> K>
|
|
|
|
requires(IsSame<TraitsForT, Traits<T>>) bool remove(K const& value)
|
|
|
|
{
|
|
|
|
auto it = find(value);
|
|
|
|
if (it != end()) {
|
|
|
|
remove(it);
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
2022-03-06 18:14:29 +00:00
|
|
|
void remove(Iterator iterator)
|
2020-10-15 21:34:07 +00:00
|
|
|
{
|
2021-02-23 19:42:32 +00:00
|
|
|
VERIFY(iterator.m_bucket);
|
2020-10-15 21:34:07 +00:00
|
|
|
auto& bucket = *iterator.m_bucket;
|
2022-03-07 14:10:10 +00:00
|
|
|
VERIFY(bucket.state == BucketState::Used);
|
2021-06-13 14:26:08 +00:00
|
|
|
|
2022-03-06 18:11:17 +00:00
|
|
|
delete_bucket(bucket);
|
2020-10-15 21:34:07 +00:00
|
|
|
--m_size;
|
|
|
|
++m_deleted_count;
|
2022-03-06 18:26:04 +00:00
|
|
|
|
|
|
|
shrink_if_needed();
|
2022-01-05 15:45:42 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
template<typename TUnaryPredicate>
|
2022-01-05 15:57:45 +00:00
|
|
|
bool remove_all_matching(TUnaryPredicate predicate)
|
2022-01-05 15:45:42 +00:00
|
|
|
{
|
2022-03-06 18:11:17 +00:00
|
|
|
size_t removed_count = 0;
|
|
|
|
for (size_t i = 0; i < m_capacity; ++i) {
|
|
|
|
auto& bucket = m_buckets[i];
|
2022-03-07 14:10:10 +00:00
|
|
|
if (bucket.state == BucketState::Used && predicate(*bucket.slot())) {
|
2022-03-06 18:11:17 +00:00
|
|
|
delete_bucket(bucket);
|
|
|
|
++removed_count;
|
2022-01-05 15:57:45 +00:00
|
|
|
}
|
2022-01-05 15:45:42 +00:00
|
|
|
}
|
2022-03-06 18:11:17 +00:00
|
|
|
if (removed_count) {
|
|
|
|
m_deleted_count += removed_count;
|
|
|
|
m_size -= removed_count;
|
|
|
|
}
|
2022-03-06 18:26:04 +00:00
|
|
|
shrink_if_needed();
|
|
|
|
return removed_count;
|
2020-10-15 21:34:07 +00:00
|
|
|
}
|
2018-10-13 12:22:09 +00:00
|
|
|
|
2018-10-10 09:53:07 +00:00
|
|
|
private:
|
2020-10-15 21:34:07 +00:00
|
|
|
void insert_during_rehash(T&& value)
|
2019-06-29 19:09:40 +00:00
|
|
|
{
|
2020-10-15 21:34:07 +00:00
|
|
|
auto& bucket = lookup_for_writing(value);
|
|
|
|
new (bucket.slot()) T(move(value));
|
2022-03-07 14:10:10 +00:00
|
|
|
bucket.state = BucketState::Used;
|
2021-06-13 14:26:08 +00:00
|
|
|
|
|
|
|
if constexpr (IsOrdered) {
|
|
|
|
if (!m_collection_data.head) [[unlikely]] {
|
|
|
|
m_collection_data.head = &bucket;
|
|
|
|
} else {
|
|
|
|
bucket.previous = m_collection_data.tail;
|
|
|
|
m_collection_data.tail->next = &bucket;
|
|
|
|
}
|
|
|
|
m_collection_data.tail = &bucket;
|
|
|
|
}
|
2019-06-29 19:09:40 +00:00
|
|
|
}
|
|
|
|
|
2021-08-15 20:20:37 +00:00
|
|
|
[[nodiscard]] static constexpr size_t size_in_bytes(size_t capacity)
|
2021-07-11 11:22:58 +00:00
|
|
|
{
|
|
|
|
if constexpr (IsOrdered) {
|
|
|
|
return sizeof(BucketType) * capacity;
|
|
|
|
} else {
|
|
|
|
return sizeof(BucketType) * (capacity + 1);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2021-11-10 22:00:21 +00:00
|
|
|
ErrorOr<void> try_rehash(size_t new_capacity)
|
2019-06-29 19:09:40 +00:00
|
|
|
{
|
2020-10-15 21:34:07 +00:00
|
|
|
new_capacity = max(new_capacity, static_cast<size_t>(4));
|
2021-06-13 14:26:08 +00:00
|
|
|
new_capacity = kmalloc_good_size(new_capacity * sizeof(BucketType)) / sizeof(BucketType);
|
2019-06-29 19:09:40 +00:00
|
|
|
|
2020-10-15 21:34:07 +00:00
|
|
|
auto* old_buckets = m_buckets;
|
2021-07-11 11:22:58 +00:00
|
|
|
auto old_capacity = m_capacity;
|
2021-06-13 14:26:08 +00:00
|
|
|
Iterator old_iter = begin();
|
|
|
|
|
2022-03-14 22:59:16 +00:00
|
|
|
auto* new_buckets = kcalloc(1, size_in_bytes(new_capacity));
|
2021-08-14 00:07:39 +00:00
|
|
|
if (!new_buckets)
|
2021-11-10 22:00:21 +00:00
|
|
|
return Error::from_errno(ENOMEM);
|
2021-06-13 14:26:08 +00:00
|
|
|
|
2021-08-14 00:07:39 +00:00
|
|
|
m_buckets = (BucketType*)new_buckets;
|
2018-10-10 09:53:07 +00:00
|
|
|
|
2020-10-15 21:34:07 +00:00
|
|
|
m_capacity = new_capacity;
|
|
|
|
m_deleted_count = 0;
|
2019-06-27 13:57:49 +00:00
|
|
|
|
2021-08-14 00:07:39 +00:00
|
|
|
if constexpr (IsOrdered)
|
|
|
|
m_collection_data = { nullptr, nullptr };
|
|
|
|
else
|
2022-03-07 14:10:10 +00:00
|
|
|
m_buckets[m_capacity].state = BucketState::End;
|
2018-10-10 09:53:07 +00:00
|
|
|
|
2020-10-15 21:34:07 +00:00
|
|
|
if (!old_buckets)
|
2021-11-10 22:00:21 +00:00
|
|
|
return {};
|
2018-10-10 09:53:07 +00:00
|
|
|
|
2021-06-13 14:26:08 +00:00
|
|
|
for (auto it = move(old_iter); it != end(); ++it) {
|
|
|
|
insert_during_rehash(move(*it));
|
|
|
|
it->~T();
|
2019-03-25 03:23:17 +00:00
|
|
|
}
|
2018-10-10 09:53:07 +00:00
|
|
|
|
2021-07-11 11:22:58 +00:00
|
|
|
kfree_sized(old_buckets, size_in_bytes(old_capacity));
|
2021-11-10 22:00:21 +00:00
|
|
|
return {};
|
2021-08-14 00:07:39 +00:00
|
|
|
}
|
|
|
|
void rehash(size_t new_capacity)
|
|
|
|
{
|
2021-11-10 22:00:21 +00:00
|
|
|
MUST(try_rehash(new_capacity));
|
2018-11-07 00:38:51 +00:00
|
|
|
}
|
|
|
|
|
2021-07-12 21:23:08 +00:00
|
|
|
template<typename TUnaryPredicate>
|
2021-07-21 16:18:29 +00:00
|
|
|
[[nodiscard]] BucketType* lookup_with_hash(unsigned hash, TUnaryPredicate predicate) const
|
2020-10-15 21:34:07 +00:00
|
|
|
{
|
|
|
|
if (is_empty())
|
|
|
|
return nullptr;
|
2021-04-02 01:52:32 +00:00
|
|
|
|
2020-10-15 21:34:07 +00:00
|
|
|
for (;;) {
|
2021-04-02 01:52:32 +00:00
|
|
|
auto& bucket = m_buckets[hash % m_capacity];
|
2020-10-15 21:34:07 +00:00
|
|
|
|
2022-03-07 14:10:10 +00:00
|
|
|
if (bucket.state == BucketState::Used && predicate(*bucket.slot()))
|
2020-10-15 21:34:07 +00:00
|
|
|
return &bucket;
|
|
|
|
|
2022-03-07 14:10:10 +00:00
|
|
|
if (bucket.state != BucketState::Used && bucket.state != BucketState::Deleted)
|
2020-10-15 21:34:07 +00:00
|
|
|
return nullptr;
|
|
|
|
|
|
|
|
hash = double_hash(hash);
|
2018-10-10 09:53:07 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2021-11-10 22:00:21 +00:00
|
|
|
ErrorOr<BucketType*> try_lookup_for_writing(T const& value)
|
2020-10-15 21:34:07 +00:00
|
|
|
{
|
2021-08-14 00:07:39 +00:00
|
|
|
// FIXME: Maybe overrun the "allowed" load factor to avoid OOM
|
|
|
|
// If we are allowed to do that, separate that logic from
|
|
|
|
// the normal lookup_for_writing
|
2021-11-10 22:00:21 +00:00
|
|
|
if (should_grow())
|
|
|
|
TRY(try_rehash(capacity() * 2));
|
2021-04-02 02:02:33 +00:00
|
|
|
auto hash = TraitsForT::hash(value);
|
2021-06-13 14:26:08 +00:00
|
|
|
BucketType* first_empty_bucket = nullptr;
|
2020-10-15 21:34:07 +00:00
|
|
|
for (;;) {
|
2021-04-02 01:52:32 +00:00
|
|
|
auto& bucket = m_buckets[hash % m_capacity];
|
2021-04-02 02:02:33 +00:00
|
|
|
|
2022-03-07 14:10:10 +00:00
|
|
|
if (bucket.state == BucketState::Used && TraitsForT::equals(*bucket.slot(), value))
|
2021-08-14 00:07:39 +00:00
|
|
|
return &bucket;
|
2021-04-02 02:02:33 +00:00
|
|
|
|
2022-03-07 14:10:10 +00:00
|
|
|
if (bucket.state != BucketState::Used) {
|
2021-04-02 02:02:33 +00:00
|
|
|
if (!first_empty_bucket)
|
|
|
|
first_empty_bucket = &bucket;
|
|
|
|
|
2022-03-07 14:10:10 +00:00
|
|
|
if (bucket.state != BucketState::Deleted)
|
2021-08-14 00:07:39 +00:00
|
|
|
return const_cast<BucketType*>(first_empty_bucket);
|
2021-04-02 02:02:33 +00:00
|
|
|
}
|
|
|
|
|
2020-10-15 21:34:07 +00:00
|
|
|
hash = double_hash(hash);
|
|
|
|
}
|
|
|
|
}
|
2021-08-14 00:07:39 +00:00
|
|
|
[[nodiscard]] BucketType& lookup_for_writing(T const& value)
|
|
|
|
{
|
2021-11-10 22:00:21 +00:00
|
|
|
return *MUST(try_lookup_for_writing(value));
|
2021-08-14 00:07:39 +00:00
|
|
|
}
|
2018-10-13 12:22:09 +00:00
|
|
|
|
2021-04-11 08:25:22 +00:00
|
|
|
[[nodiscard]] size_t used_bucket_count() const { return m_size + m_deleted_count; }
|
|
|
|
[[nodiscard]] bool should_grow() const { return ((used_bucket_count() + 1) * 100) >= (m_capacity * load_factor_in_percent); }
|
2018-10-10 09:53:07 +00:00
|
|
|
|
2022-03-06 18:26:04 +00:00
|
|
|
void shrink_if_needed()
|
|
|
|
{
|
|
|
|
// Shrink if less than 20% of buckets are used, but never going below 16.
|
|
|
|
// These limits are totally arbitrary and can probably be improved.
|
|
|
|
bool should_shrink = m_size * 5 < m_capacity && m_capacity > 16;
|
|
|
|
if (!should_shrink)
|
|
|
|
return;
|
|
|
|
|
|
|
|
// NOTE: We ignore memory allocation failure here, since we can continue
|
|
|
|
// just fine with an oversized table.
|
|
|
|
(void)try_rehash(m_size * 2);
|
|
|
|
}
|
|
|
|
|
2022-03-06 18:11:17 +00:00
|
|
|
void delete_bucket(auto& bucket)
|
|
|
|
{
|
|
|
|
bucket.slot()->~T();
|
2022-03-07 14:10:10 +00:00
|
|
|
bucket.state = BucketState::Deleted;
|
2022-03-06 18:11:17 +00:00
|
|
|
|
|
|
|
if constexpr (IsOrdered) {
|
|
|
|
if (bucket.previous)
|
|
|
|
bucket.previous->next = bucket.next;
|
|
|
|
else
|
|
|
|
m_collection_data.head = bucket.next;
|
|
|
|
|
|
|
|
if (bucket.next)
|
|
|
|
bucket.next->previous = bucket.previous;
|
|
|
|
else
|
|
|
|
m_collection_data.tail = bucket.previous;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2021-06-13 14:26:08 +00:00
|
|
|
BucketType* m_buckets { nullptr };
|
|
|
|
|
|
|
|
[[no_unique_address]] CollectionDataType m_collection_data;
|
2020-10-15 21:34:07 +00:00
|
|
|
size_t m_size { 0 };
|
|
|
|
size_t m_capacity { 0 };
|
|
|
|
size_t m_deleted_count { 0 };
|
|
|
|
};
|
2018-10-10 09:53:07 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
using AK::HashTable;
|
2021-06-13 14:26:08 +00:00
|
|
|
using AK::OrderedHashTable;
|