2023-08-26 18:50:12 +00:00
|
|
|
/**
|
|
|
|
* @file HashTable.h
|
|
|
|
* @author apio (cloudapio.eu)
|
|
|
|
* @brief Table of values with best-case constant time lookup.
|
|
|
|
*
|
|
|
|
* @copyright Copyright (c) 2023, the Luna authors.
|
|
|
|
*
|
|
|
|
*/
|
|
|
|
|
2023-06-15 13:50:04 +00:00
|
|
|
#pragma once
|
|
|
|
#include <luna/Hash.h>
|
|
|
|
#include <luna/Heap.h>
|
|
|
|
#include <luna/Option.h>
|
|
|
|
|
2024-07-02 18:51:28 +00:00
|
|
|
template <typename K, typename V> class HashMap;
|
|
|
|
|
2023-08-26 18:50:12 +00:00
|
|
|
/**
|
|
|
|
* @brief A table of values with best-case constant time lookup.
|
|
|
|
*
|
|
|
|
* @tparam T The type of values to store.
|
|
|
|
*/
|
2023-06-15 13:50:04 +00:00
|
|
|
template <typename T> class HashTable
|
|
|
|
{
|
|
|
|
static constexpr usize GROW_RATE = 2;
|
2023-08-26 18:50:12 +00:00
|
|
|
static constexpr usize GROW_FACTOR = 2;
|
2023-08-27 18:48:50 +00:00
|
|
|
static constexpr usize INITIAL_CAPACITY = 32;
|
2023-06-15 13:50:04 +00:00
|
|
|
|
|
|
|
public:
|
2023-08-26 18:50:12 +00:00
|
|
|
/**
|
|
|
|
* @brief Try to insert a value into the table.
|
|
|
|
*
|
|
|
|
* @param value The value to insert.
|
|
|
|
* @return Result<bool> An error, true if the insertion succeeded, or false if the value already existed.
|
|
|
|
*/
|
2023-06-15 13:50:04 +00:00
|
|
|
Result<bool> try_set(const T& value)
|
|
|
|
{
|
|
|
|
T copy { value };
|
|
|
|
return try_set(move(copy));
|
|
|
|
}
|
|
|
|
|
2023-08-26 18:50:12 +00:00
|
|
|
/**
|
|
|
|
* @brief Try to insert a value into the table.
|
|
|
|
*
|
|
|
|
* @param value The value to insert.
|
|
|
|
* @return Result<bool> An error, true if the insertion succeeded, or false if the value already existed.
|
|
|
|
*/
|
2023-06-15 13:50:04 +00:00
|
|
|
Result<bool> try_set(T&& value)
|
|
|
|
{
|
2023-08-27 18:48:50 +00:00
|
|
|
if (should_grow()) TRY(rehash(m_capacity ? m_capacity * GROW_FACTOR : INITIAL_CAPACITY));
|
2023-06-15 13:50:04 +00:00
|
|
|
|
|
|
|
u64 index = hash(value, m_salt) % m_capacity;
|
|
|
|
|
2023-07-25 16:19:45 +00:00
|
|
|
check(m_size < m_capacity);
|
|
|
|
|
|
|
|
// NOTE: This should not end in an infinite loop if the table is full, since the table CANNOT be full
|
|
|
|
// (should_grow() returns true before it does). The check above verifies this.
|
2023-06-15 13:50:04 +00:00
|
|
|
while (true)
|
|
|
|
{
|
|
|
|
auto& bucket = m_buckets[index];
|
|
|
|
if (bucket.has_value())
|
|
|
|
{
|
|
|
|
if (*bucket == value) return false;
|
|
|
|
index++;
|
2023-07-25 16:19:45 +00:00
|
|
|
if (index == m_capacity)
|
|
|
|
index = 0; // Wrap around to avoid overflowing, seems like I assumed it would do that
|
|
|
|
// automatically for some reason... (facepalm).
|
2023-06-15 13:50:04 +00:00
|
|
|
continue;
|
|
|
|
}
|
|
|
|
bucket = { move(value) };
|
|
|
|
m_size++;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
2023-08-26 18:50:12 +00:00
|
|
|
/**
|
|
|
|
* @brief Find a value inside the table, returning a pointer to it if found.
|
|
|
|
*
|
|
|
|
* @param value The value to compare against.
|
|
|
|
* @return T* A pointer to the value inside the table if found, or nullptr if it was not found.
|
|
|
|
*/
|
2023-06-15 13:50:04 +00:00
|
|
|
T* try_find(const T& value)
|
|
|
|
{
|
|
|
|
if (!m_size) return nullptr;
|
|
|
|
|
|
|
|
check(m_capacity);
|
|
|
|
|
|
|
|
const u64 index = hash(value, m_salt) % m_capacity;
|
|
|
|
usize i = index;
|
|
|
|
|
|
|
|
do {
|
2023-07-21 19:04:25 +00:00
|
|
|
auto& bucket = m_buckets[i];
|
2023-06-15 13:50:04 +00:00
|
|
|
if (bucket.has_value())
|
|
|
|
{
|
|
|
|
if (*bucket == value) return bucket.value_ptr();
|
|
|
|
i++;
|
2023-07-25 16:19:45 +00:00
|
|
|
if (i == m_capacity) i = 0;
|
2023-06-15 13:50:04 +00:00
|
|
|
}
|
2023-07-21 19:04:25 +00:00
|
|
|
else
|
|
|
|
return nullptr;
|
2023-06-15 13:50:04 +00:00
|
|
|
} while (i != index);
|
|
|
|
|
|
|
|
return nullptr;
|
|
|
|
}
|
|
|
|
|
2023-08-26 18:50:12 +00:00
|
|
|
/**
|
|
|
|
* @brief Remove a value from this table.
|
|
|
|
*
|
|
|
|
* @param value The value to remove.
|
|
|
|
* @return true The value was successfully removed.
|
|
|
|
* @return false The value did not exist.
|
|
|
|
*/
|
2023-06-15 13:50:04 +00:00
|
|
|
bool try_remove(const T& value)
|
|
|
|
{
|
|
|
|
if (!m_size) return false;
|
|
|
|
|
|
|
|
check(m_capacity);
|
|
|
|
|
|
|
|
const u64 index = hash(value, m_salt) % m_capacity;
|
|
|
|
usize i = index;
|
|
|
|
|
|
|
|
do {
|
2023-07-21 19:04:25 +00:00
|
|
|
auto& bucket = m_buckets[i];
|
2023-06-15 13:50:04 +00:00
|
|
|
if (bucket.has_value())
|
|
|
|
{
|
|
|
|
if (*bucket == value)
|
|
|
|
{
|
|
|
|
bucket = {};
|
|
|
|
m_size--;
|
|
|
|
if (i != index) rehash(m_capacity);
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
i++;
|
2023-07-25 16:19:45 +00:00
|
|
|
if (i == m_capacity) i = 0;
|
2023-06-15 13:50:04 +00:00
|
|
|
}
|
2023-07-21 19:04:25 +00:00
|
|
|
else
|
|
|
|
return false;
|
2023-06-15 13:50:04 +00:00
|
|
|
} while (i != index);
|
|
|
|
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
2023-08-26 18:50:12 +00:00
|
|
|
/**
|
|
|
|
* @brief Clear the table.
|
|
|
|
*/
|
2023-06-15 13:50:04 +00:00
|
|
|
void clear()
|
|
|
|
{
|
2023-08-17 18:14:33 +00:00
|
|
|
if (m_capacity)
|
|
|
|
{
|
|
|
|
for (usize i = 0; i < m_capacity; i++) m_buckets[i].~Option();
|
|
|
|
|
|
|
|
free_impl(m_buckets);
|
|
|
|
m_capacity = m_size = 0;
|
|
|
|
}
|
|
|
|
}
|
2023-06-15 13:50:04 +00:00
|
|
|
|
2023-08-26 18:50:12 +00:00
|
|
|
/**
|
|
|
|
* @brief Return the number of values that can currently fit in the table.
|
|
|
|
*
|
|
|
|
* The number of actual entries will always be smaller than this (unless it is 0), since the table grows before
|
|
|
|
* the number of entries reaches the capacity.
|
|
|
|
*
|
|
|
|
* @return usize The current capacity.
|
|
|
|
*/
|
2023-08-17 18:14:33 +00:00
|
|
|
usize capacity() const
|
|
|
|
{
|
|
|
|
return m_capacity;
|
|
|
|
}
|
|
|
|
|
2023-08-26 18:50:12 +00:00
|
|
|
/**
|
|
|
|
* @brief Return the number of values currently contained in the table.
|
|
|
|
*
|
|
|
|
* @return usize The number of values contained.
|
|
|
|
*/
|
2023-08-17 18:14:33 +00:00
|
|
|
usize size() const
|
|
|
|
{
|
|
|
|
return m_size;
|
2023-06-15 13:50:04 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
~HashTable()
|
|
|
|
{
|
|
|
|
clear();
|
|
|
|
}
|
|
|
|
|
2024-07-02 18:51:28 +00:00
|
|
|
struct HashTableIterator
|
|
|
|
{
|
|
|
|
private:
|
|
|
|
HashTableIterator(usize index, HashTable<T>& table) : m_table(table)
|
|
|
|
{
|
|
|
|
if (index != -1)
|
|
|
|
{
|
|
|
|
m_index = index;
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
for (usize i = 0; i < m_table.m_capacity; i++)
|
|
|
|
{
|
|
|
|
auto& opt = m_table.m_buckets[i];
|
|
|
|
if (opt.has_value())
|
|
|
|
{
|
|
|
|
m_index = i;
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
m_index = m_table.m_capacity;
|
|
|
|
}
|
|
|
|
|
|
|
|
mutable usize m_index;
|
|
|
|
HashTable<T>& m_table;
|
|
|
|
|
|
|
|
public:
|
|
|
|
T& operator*()
|
|
|
|
{
|
|
|
|
return *m_table.m_buckets[m_index].value_ptr();
|
|
|
|
}
|
|
|
|
|
|
|
|
const T& operator*() const
|
|
|
|
{
|
|
|
|
return *m_table.m_buckets[m_index].value_ptr();
|
|
|
|
}
|
|
|
|
|
|
|
|
void operator++() const
|
|
|
|
{
|
|
|
|
for (usize i = m_index + 1; i < m_table.m_capacity; i++)
|
|
|
|
{
|
|
|
|
auto& opt = m_table.m_buckets[i];
|
|
|
|
if (opt.has_value())
|
|
|
|
{
|
|
|
|
m_index = i;
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
m_index = m_table.m_capacity;
|
|
|
|
}
|
|
|
|
|
|
|
|
bool operator!=(HashTableIterator& other) const
|
|
|
|
{
|
|
|
|
return m_index != other.m_index || &m_table != &other.m_table;
|
|
|
|
}
|
|
|
|
|
|
|
|
friend class HashTable<T>;
|
|
|
|
};
|
|
|
|
|
|
|
|
const HashTableIterator begin()
|
|
|
|
{
|
|
|
|
return { (usize)-1, *this };
|
|
|
|
}
|
|
|
|
|
|
|
|
const HashTableIterator end()
|
|
|
|
{
|
|
|
|
return { m_capacity, *this };
|
|
|
|
}
|
|
|
|
|
2023-06-15 13:50:04 +00:00
|
|
|
private:
|
|
|
|
bool should_grow()
|
|
|
|
{
|
|
|
|
return (m_capacity == 0) || ((m_size * GROW_RATE) >= m_capacity);
|
|
|
|
}
|
|
|
|
|
|
|
|
Result<void> rehash(usize new_capacity)
|
|
|
|
{
|
|
|
|
HashTable<T> new_table;
|
|
|
|
TRY(new_table.initialize(new_capacity));
|
|
|
|
|
|
|
|
if (m_capacity != 0)
|
|
|
|
{
|
|
|
|
for (usize i = 0; i < m_capacity; i++)
|
|
|
|
{
|
|
|
|
auto& opt = m_buckets[i];
|
|
|
|
if (opt.has_value())
|
|
|
|
{
|
|
|
|
auto value = opt.release_value();
|
|
|
|
TRY(new_table.try_set(move(value)));
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
swap(this, &new_table);
|
|
|
|
|
|
|
|
return {};
|
|
|
|
}
|
|
|
|
|
|
|
|
Result<void> initialize(usize initial_capacity)
|
|
|
|
{
|
|
|
|
check(m_buckets == nullptr);
|
|
|
|
m_capacity = initial_capacity;
|
|
|
|
m_buckets = (Option<T>*)TRY(calloc_impl(initial_capacity, sizeof(Option<T>), false));
|
|
|
|
return {};
|
|
|
|
}
|
|
|
|
|
|
|
|
Option<T>* m_buckets { nullptr };
|
|
|
|
usize m_capacity { 0 };
|
|
|
|
usize m_size { 0 };
|
|
|
|
// FIXME: Randomize this to protect against hash table attacks.
|
|
|
|
u64 m_salt { 0 };
|
2024-07-02 18:51:28 +00:00
|
|
|
|
|
|
|
friend class HashTableIterator;
|
2023-06-15 13:50:04 +00:00
|
|
|
};
|