1#ifndef LIBTEDDY_DETAILS_HASH_TABLES_HPP
2#define LIBTEDDY_DETAILS_HASH_TABLES_HPP
4#include <libteddy/details/config.hpp>
5#include <libteddy/details/debug.hpp>
6#include <libteddy/details/node.hpp>
7#include <libteddy/details/tools.hpp>
21 static auto get_gte_capacity (int64 capacity) -> int64;
24 static constexpr int64 Capacities[] {
25 307, 617, 1'237, 2'477, 4'957,
26 9'923, 19'853, 39'709, 79'423, 158'849,
27 317'701, 635'413, 1'270'849, 2'541'701, 5'083'423,
28 10'166'857, 20'333'759, 40'667'527, 81'335'063, 162'670'129,
29 325'340'273, 650'680'571, 1'301'361'143, 2'602'722'289};
35template<
class Data,
class Degree>
48 auto operator* ()
const ->
node_t*;
51 auto get_bucket ()
const ->
node_t**;
58 auto move_to_next_bucket () ->
node_t*;
69template<
class Data,
class Degree>
74 using son_container =
typename node_t::son_container;
156 [[nodiscard]]
auto get_size () const -> int64;
161 auto
clear () ->
void;
189 auto rehash (int64 newCapacity) ->
void;
194 [[nodiscard]] auto get_load_factor () const ->
double;
217 [[nodiscard]] auto node_hash (son_container const& sons) const
227 [[nodiscard]] auto node_equals (
node_t*
node, son_container const& sons)
233 [[nodiscard]] auto callocate_buckets (int64 count) ->
node_t**;
238 [[nodiscard]] auto mallocate_buckets (int64 count) ->
node_t**;
241 static constexpr
double LOAD_THRESHOLD = 0.75;
253template<class Data, class Degree>
318 [[nodiscard]]
auto get_load_factor () const ->
double;
325 auto rehash (int64 newCapacity) ->
void;
330 [[nodiscard]] static auto callocate_entries (int64 count) -> cache_entry*;
335 cache_entry* entries_;
340inline auto
table_base::get_gte_capacity(int64 const desiredCapacity) -> int64
342 for (int64
const tableCapacity : Capacities)
344 if (tableCapacity > desiredCapacity)
346 return tableCapacity;
349 return Capacities[std::size(Capacities) - 1];
354template<
class Data,
class Degree>
356 node_t**
const firstBucket,
357 node_t**
const lastBucket
359 bucket_(firstBucket),
360 lastBucket_(lastBucket),
361 node_(this->move_to_next_bucket())
365template<
class Data,
class Degree>
366unique_table_iterator<Data, Degree>::unique_table_iterator(
367 node_t**
const bucket,
368 node_t**
const lastBucket,
372 lastBucket_(lastBucket),
377template<
class Data,
class Degree>
378auto unique_table_iterator<Data, Degree>::operator++ ()
379 -> unique_table_iterator&
381 node_ = node_->get_next();
385 node_ = this->move_to_next_bucket();
390template<
class Data,
class Degree>
391auto unique_table_iterator<Data, Degree>::operator++ (
int)
392 -> unique_table_iterator
394 auto const tmp = *
this;
399template<
class Data,
class Degree>
400auto unique_table_iterator<Data, Degree>::operator* () const -> node_t*
405template<
class Data,
class Degree>
406auto unique_table_iterator<Data, Degree>::operator== (
407 unique_table_iterator
const& other
410 return bucket_ == other.bucket_ && node_ == other.node_;
413template<
class Data,
class Degree>
414auto unique_table_iterator<Data, Degree>::operator!= (
415 unique_table_iterator
const& other
418 return not (*
this == other);
421template<
class Data,
class Degree>
422auto unique_table_iterator<Data, Degree>::get_bucket() const -> node_t**
427template<
class Data,
class Degree>
428auto unique_table_iterator<Data, Degree>::move_to_next_bucket() -> node_t*
430 while (bucket_ != lastBucket_ && not *bucket_)
434 return bucket_ != lastBucket_ ? *bucket_ :
nullptr;
439template<
class Data,
class Degree>
441 int64
const capacity,
446 capacity_(
table_base::get_gte_capacity(capacity)),
447 buckets_(callocate_buckets(capacity_))
451template<
class Data,
class Degree>
453 domain_(other.domain_),
455 capacity_(other.capacity_),
456 buckets_(mallocate_buckets(other.capacity_))
461 static_cast<std::size_t
>(capacity_) *
sizeof(
node_t*)
465template<
class Data,
class Degree>
467 domain_(other.domain_),
468 size_(utils::exchange(other.size_, 0)),
469 capacity_(other.capacity_),
470 buckets_(utils::exchange(other.buckets_,
nullptr))
474template<
class Data,
class Degree>
480template<
class Data,
class Degree>
484 std::size_t
const hash = this->node_hash(sons);
486 =
static_cast<int64
>(hash %
static_cast<std::size_t
>(capacity_));
487 node_t* current = buckets_[index];
490 if (this->node_equals(current, sons))
492 return {current, hash};
494 current = current->get_next();
496 return {
nullptr, hash};
499template<
class Data,
class Degree>
502 size_ += other.size_;
503 this->adjust_capacity();
504 auto it = other.begin();
505 auto const end = other.end();
508 node_t*
const otherNode = *it;
510 otherNode->set_next(
nullptr);
511 std::size_t
const hash = this->node_hash(otherNode->get_sons());
512 this->insert_impl(otherNode, hash);
516template<
class Data,
class Degree>
519 std::size_t
const hash
522 this->insert_impl(
node, hash);
526template<
class Data,
class Degree>
529 node_t**
const bucket = nodeIt.get_bucket();
531 return this->erase_impl(bucket,
node);
534template<
class Data,
class Degree>
537 std::size_t
const hash = this->node_hash(
node->get_sons());
539 =
static_cast<int64
>(hash %
static_cast<std::size_t
>(capacity_));
540 return this->erase_impl(buckets_ + index,
node);
543template<
class Data,
class Degree>
546 int64
const aproxCapacity
547 =
static_cast<int64
>(
static_cast<double>(size_) / LOAD_THRESHOLD);
548 int64
const newCapacity = table_base::get_gte_capacity(aproxCapacity);
549 if (newCapacity > capacity_)
551 this->rehash(newCapacity);
555template<
class Data,
class Degree>
561template<
class Data,
class Degree>
568 static_cast<std::size_t
>(capacity_) *
sizeof(
node_t*)
572template<
class Data,
class Degree>
575 return iterator(buckets_, buckets_ + capacity_);
578template<
class Data,
class Degree>
581 return iterator(buckets_ + capacity_, buckets_ + capacity_);
584template<
class Data,
class Degree>
587 return iterator(buckets_, buckets_ + capacity_);
590template<
class Data,
class Degree>
593 return iterator(buckets_ + capacity_, buckets_ + capacity_);
596template<
class Data,
class Degree>
599#ifdef LIBTEDDY_VERBOSE
601 " unique_table::rehash\tload before ",
602 this->get_load_factor(),
610 node_t**
const oldBuckets = buckets_;
611 int64
const oldCapacity = capacity_;
612 buckets_ = callocate_buckets(newCapacity);
613 capacity_ = newCapacity;
614 for (int64 i = 0; i < oldCapacity; ++i)
616 node_t*
node = oldBuckets[i];
619 node_t*
const next =
node->get_next();
620 std::size_t
const hash = this->node_hash(
node->get_sons());
621 node->set_next(
nullptr);
622 this->insert_impl(
node, hash);
627#ifdef LIBTEDDY_VERBOSE
628 debug::out(
", load after ", this->get_load_factor(),
"\n");
632template<
class Data,
class Degree>
633auto unique_table<Data, Degree>::get_load_factor() const ->
double
635 return static_cast<double>(size_) /
static_cast<double>(capacity_);
638template<
class Data,
class Degree>
639auto unique_table<Data, Degree>::insert_impl(
641 std::size_t
const hash
644 std::size_t
const index = hash %
static_cast<std::size_t
>(capacity_);
645 node_t*
const bucket = buckets_[index];
648 node->set_next(bucket);
650 buckets_[index] = node;
654template<
class Data,
class Degree>
655auto unique_table<Data, Degree>::erase_impl(
656 node_t**
const bucket,
660 iterator retIt(bucket, buckets_ + capacity_, node);
666 *bucket = node->get_next();
667 node->set_next(
nullptr);
671 node_t* prev = *bucket;
672 while (prev->get_next() != node)
674 prev = prev->get_next();
676 prev->set_next(node->get_next());
677 node->set_next(
nullptr);
681template<
class Data,
class Degree>
682auto unique_table<Data, Degree>::node_hash(son_container
const& sons)
const
685 std::size_t result = 0;
686 for (int32 k = 0; k < domain_; ++k)
688 utils::add_hash(result, sons[as_uindex(k)]);
693template<
class Data,
class Degree>
694auto unique_table<Data, Degree>::node_equals(
696 son_container
const& sons
699 for (int32 k = 0; k < domain_; ++k)
701 if (node->get_son(k) != sons[as_uindex(k)])
709template<
class Data,
class Degree>
710auto unique_table<Data, Degree>::callocate_buckets(int64
const count)
713 return static_cast<node_t**
>(
714 std::calloc(
static_cast<std::size_t
>(count),
sizeof(node_t*))
718template<
class Data,
class Degree>
719auto unique_table<Data, Degree>::mallocate_buckets(int64
const count)
722 return static_cast<node_t**
>(
723 std::malloc(
static_cast<std::size_t
>(count) *
sizeof(node_t*))
729template<
class Data,
class Degree>
730apply_cache<Data, Degree>::apply_cache(int64
const capacity) :
732 capacity_(table_base::get_gte_capacity(capacity)),
733 entries_(callocate_entries(capacity_))
737template<
class Data,
class Degree>
738apply_cache<Data, Degree>::apply_cache(apply_cache&& other) noexcept :
739 size_(utils::exchange(other.size_, 0)),
740 capacity_(other.capacity_),
741 entries_(utils::exchange(other.entries_,
nullptr))
745template<
class Data,
class Degree>
746apply_cache<Data, Degree>::~apply_cache()
751template<
class Data,
class Degree>
758 std::size_t
const hash = utils::pack_hash(opId, lhs, rhs);
759 std::size_t
const index = hash %
static_cast<std::size_t
>(capacity_);
762 = entry.opId_ == opId && entry.lhs_ == lhs && entry.rhs_ == rhs;
763 return matches ? entry.result_ :
nullptr;
766template<
class Data,
class Degree>
774 std::size_t
const hash = utils::pack_hash(opId, lhs, rhs);
775 std::size_t
const index = hash %
static_cast<std::size_t
>(capacity_);
777 if (not entry.result_)
784 entry.result_ = result;
787template<
class Data,
class Degree>
790 int64
const newCapacity = table_base::get_gte_capacity(aproxCapacity);
791 if (newCapacity > capacity_)
793 this->rehash(newCapacity);
797template<
class Data,
class Degree>
800 for (int64 i = 0; i < capacity_; ++i)
805 bool const isUsed = entry.lhs_->is_used() && entry.rhs_->is_used()
806 && entry.result_->is_used();
816template<
class Data,
class Degree>
823 static_cast<std::size_t
>(capacity_) *
sizeof(
cache_entry)
827template<
class Data,
class Degree>
830 return static_cast<double>(size_) /
static_cast<double>(capacity_);
833template<
class Data,
class Degree>
834auto apply_cache<Data, Degree>::rehash(int64
const newCapacity) ->
void
836#ifdef LIBTEDDY_VERBOSE
838 "apply_cache::rehash\tload is ",
839 this->get_load_factor(),
847 cache_entry*
const oldEntries = entries_;
848 int64
const oldCapacity = capacity_;
849 entries_ = callocate_entries(newCapacity);
850 capacity_ = newCapacity;
852 for (int64 i = 0; i < oldCapacity; ++i)
854 cache_entry
const& entry = oldEntries[i];
857 this->put(entry.opId_, entry.result_, entry.lhs_, entry.rhs_);
861#ifdef LIBTEDDY_VERBOSE
862 debug::out(
" new load is ", this->get_load_factor(),
"\n");
866template<
class Data,
class Degree>
867auto apply_cache<Data, Degree>::callocate_entries(int64
const count)
870 return static_cast<cache_entry*
>(
871 std::calloc(
static_cast<std::size_t
>(count),
sizeof(cache_entry))
Cache for the apply opertaion.
Definition hash_tables.hpp:255
auto find(int32 opId, node_t *lhs, node_t *rhs) -> node_t *
Looks up result of an operation.
Definition hash_tables.hpp:752
auto clear() -> void
Clears all entries.
Definition hash_tables.hpp:817
auto grow_capacity(int64 aproxCapacity) -> void
Increases the capacity so that it is close to aproxCapacity Never lowers the capacity!
Definition hash_tables.hpp:788
auto remove_unused() -> void
Removes entries pointing to unused nodes.
Definition hash_tables.hpp:798
auto put(int32 opId, node_t *result, node_t *lhs, node_t *rhs) -> void
Puts the result into the cache possibly overwriting old value.
Definition hash_tables.hpp:767
Definition hash_tables.hpp:261
Base class for hash tables.
Definition hash_tables.hpp:19
Iterator for the unique table.
Definition hash_tables.hpp:37
Table of unique nodes.
Definition hash_tables.hpp:71
~unique_table()
Destructor.
Definition hash_tables.hpp:475
auto clear() -> void
Clears the table.
Definition hash_tables.hpp:562
auto insert(node_t *node, std::size_t hash) -> void
Inserts node using pre-computed hash.
Definition hash_tables.hpp:517
auto adjust_capacity() -> void
Adjusts capacity of the table (number of buckets)
Definition hash_tables.hpp:544
auto erase(iterator nodeIt) -> iterator
Erases node pointed to by it.
Definition hash_tables.hpp:527
auto merge(unique_table other) -> void
Adds all nodes from other into this table Adjusts capacity if necessary.
Definition hash_tables.hpp:500
auto find(son_container const &sons) const -> result_of_find
Tries to find an internal node.
Definition hash_tables.hpp:481
unique_table(int64 capacity, int32 domain)
Initializes empty table.
Definition hash_tables.hpp:440
auto end() -> iterator
Definition hash_tables.hpp:579
auto get_size() const -> int64
Definition hash_tables.hpp:556
auto begin() -> iterator
Definition hash_tables.hpp:573
Definition hash_tables.hpp:79