2023-05-10 05:57:33 +10:00
|
|
|
use core::{alloc::Allocator, borrow::Borrow, mem};
|
|
|
|
|
|
|
|
use alloc::{alloc::Global, vec::Vec};
|
|
|
|
|
|
|
|
use crate::{node::Node, number_before_resize, ClonableAllocator, HashType};
|
|
|
|
|
2023-05-10 06:05:00 +10:00
|
|
|
#[derive(Clone)]
|
2023-05-10 05:57:33 +10:00
|
|
|
pub(crate) struct NodeStorage<K, V, ALLOCATOR: Allocator = Global> {
|
|
|
|
nodes: Vec<Node<K, V>, ALLOCATOR>,
|
|
|
|
max_distance_to_initial_bucket: i32,
|
|
|
|
|
|
|
|
number_of_items: usize,
|
|
|
|
max_number_before_resize: usize,
|
|
|
|
}
|
|
|
|
|
|
|
|
impl<K, V, ALLOCATOR: ClonableAllocator> NodeStorage<K, V, ALLOCATOR> {
|
|
|
|
pub(crate) fn with_size_in(capacity: usize, alloc: ALLOCATOR) -> Self {
|
|
|
|
assert!(capacity.is_power_of_two(), "Capacity must be a power of 2");
|
|
|
|
|
|
|
|
let mut nodes = Vec::with_capacity_in(capacity, alloc);
|
|
|
|
for _ in 0..capacity {
|
2023-05-10 07:10:53 +10:00
|
|
|
nodes.push(Node::default());
|
2023-05-10 05:57:33 +10:00
|
|
|
}
|
|
|
|
|
|
|
|
Self {
|
|
|
|
nodes,
|
|
|
|
max_distance_to_initial_bucket: 0,
|
|
|
|
number_of_items: 0,
|
|
|
|
max_number_before_resize: number_before_resize(capacity),
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
pub(crate) fn allocator(&self) -> &ALLOCATOR {
|
|
|
|
self.nodes.allocator()
|
|
|
|
}
|
|
|
|
|
|
|
|
pub(crate) fn capacity(&self) -> usize {
|
|
|
|
self.max_number_before_resize
|
|
|
|
}
|
|
|
|
|
|
|
|
pub(crate) fn backing_vec_size(&self) -> usize {
|
|
|
|
self.nodes.len()
|
|
|
|
}
|
|
|
|
|
|
|
|
pub(crate) fn len(&self) -> usize {
|
|
|
|
self.number_of_items
|
|
|
|
}
|
|
|
|
|
|
|
|
pub(crate) fn insert_new(&mut self, key: K, value: V, hash: HashType) -> usize {
|
|
|
|
debug_assert!(
|
|
|
|
self.capacity() > self.len(),
|
|
|
|
"Do not have space to insert into len {} with {}",
|
|
|
|
self.backing_vec_size(),
|
|
|
|
self.len()
|
|
|
|
);
|
|
|
|
|
|
|
|
let mut new_node = Node::new_with(key, value, hash);
|
|
|
|
let mut inserted_location = usize::MAX;
|
|
|
|
|
|
|
|
loop {
|
2023-05-10 07:38:04 +10:00
|
|
|
let location =
|
|
|
|
(new_node.hash() + new_node.distance()).fast_mod(self.backing_vec_size());
|
|
|
|
|
2023-05-10 05:57:33 +10:00
|
|
|
let current_node = &mut self.nodes[location];
|
|
|
|
|
|
|
|
if current_node.has_value() {
|
|
|
|
if current_node.distance() <= new_node.distance() {
|
|
|
|
mem::swap(&mut new_node, current_node);
|
|
|
|
|
|
|
|
if inserted_location == usize::MAX {
|
|
|
|
inserted_location = location;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
} else {
|
|
|
|
self.nodes[location] = new_node;
|
|
|
|
if inserted_location == usize::MAX {
|
|
|
|
inserted_location = location;
|
|
|
|
}
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
|
|
|
new_node.increment_distance();
|
|
|
|
self.max_distance_to_initial_bucket =
|
|
|
|
new_node.distance().max(self.max_distance_to_initial_bucket);
|
|
|
|
}
|
|
|
|
|
|
|
|
self.number_of_items += 1;
|
|
|
|
inserted_location
|
|
|
|
}
|
|
|
|
|
|
|
|
pub(crate) fn retain<F>(&mut self, mut f: F)
|
|
|
|
where
|
|
|
|
F: FnMut(&K, &mut V) -> bool,
|
|
|
|
{
|
|
|
|
let num_nodes = self.nodes.len();
|
|
|
|
let mut i = 0;
|
|
|
|
|
|
|
|
while i < num_nodes {
|
|
|
|
let node = &mut self.nodes[i];
|
|
|
|
|
|
|
|
if let Some((k, v)) = node.key_value_mut() {
|
|
|
|
if !f(k, v) {
|
|
|
|
self.remove_from_location(i);
|
|
|
|
|
|
|
|
// Need to continue before adding 1 to i because remove from location could
|
|
|
|
// put the element which was next into the ith location in the nodes array,
|
|
|
|
// so we need to check if that one needs removing too.
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
i += 1;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
pub(crate) fn remove_from_location(&mut self, location: usize) -> V {
|
|
|
|
let mut current_location = location;
|
|
|
|
self.number_of_items -= 1;
|
|
|
|
|
|
|
|
loop {
|
|
|
|
let next_location =
|
2023-05-10 07:38:04 +10:00
|
|
|
HashType::from(current_location + 1).fast_mod(self.backing_vec_size());
|
2023-05-10 05:57:33 +10:00
|
|
|
|
|
|
|
// if the next node is empty, or the next location has 0 distance to initial bucket then
|
|
|
|
// we can clear the current node
|
|
|
|
if !self.nodes[next_location].has_value() || self.nodes[next_location].distance() == 0 {
|
|
|
|
return self.nodes[current_location].take_key_value().unwrap().1;
|
|
|
|
}
|
|
|
|
|
|
|
|
self.nodes.swap(current_location, next_location);
|
|
|
|
self.nodes[current_location].decrement_distance();
|
|
|
|
current_location = next_location;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
pub(crate) fn location<Q>(&self, key: &Q, hash: HashType) -> Option<usize>
|
|
|
|
where
|
|
|
|
K: Borrow<Q>,
|
|
|
|
Q: Eq + ?Sized,
|
|
|
|
{
|
|
|
|
for distance_to_initial_bucket in 0..(self.max_distance_to_initial_bucket + 1) {
|
2023-05-11 01:01:24 +10:00
|
|
|
let location = (hash + distance_to_initial_bucket).fast_mod(self.backing_vec_size());
|
2023-05-10 05:57:33 +10:00
|
|
|
|
|
|
|
let node = &self.nodes[location];
|
2023-05-10 06:39:35 +10:00
|
|
|
let node_key_ref = node.key_ref()?;
|
|
|
|
|
|
|
|
if node_key_ref.borrow() == key {
|
|
|
|
return Some(location);
|
2023-05-10 05:57:33 +10:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
None
|
|
|
|
}
|
|
|
|
|
|
|
|
pub(crate) fn resized_to(&mut self, new_size: usize) -> Self {
|
|
|
|
let mut new_node_storage = Self::with_size_in(new_size, self.allocator().clone());
|
|
|
|
|
|
|
|
for mut node in self.nodes.drain(..) {
|
|
|
|
if let Some((key, value, hash)) = node.take_key_value() {
|
|
|
|
new_node_storage.insert_new(key, value, hash);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
new_node_storage
|
|
|
|
}
|
|
|
|
|
2023-05-10 07:43:06 +10:00
|
|
|
pub(crate) unsafe fn replace_at_location_unchecked(
|
|
|
|
&mut self,
|
|
|
|
location: usize,
|
|
|
|
key: K,
|
|
|
|
value: V,
|
|
|
|
) -> V {
|
|
|
|
self.node_at_unchecked_mut(location)
|
|
|
|
.replace_unchecked(key, value)
|
|
|
|
.1
|
2023-05-10 05:57:33 +10:00
|
|
|
}
|
|
|
|
|
|
|
|
pub(crate) fn iter_mut(&mut self) -> impl Iterator<Item = &mut Node<K, V>> {
|
|
|
|
self.nodes.iter_mut()
|
|
|
|
}
|
|
|
|
|
|
|
|
pub(crate) fn node_at(&self, at: usize) -> &Node<K, V> {
|
|
|
|
&self.nodes[at]
|
|
|
|
}
|
|
|
|
|
|
|
|
pub(crate) fn node_at_mut(&mut self, at: usize) -> &mut Node<K, V> {
|
|
|
|
&mut self.nodes[at]
|
|
|
|
}
|
2023-05-10 06:33:20 +10:00
|
|
|
|
|
|
|
pub(crate) unsafe fn node_at_unchecked(&self, at: usize) -> &Node<K, V> {
|
|
|
|
self.nodes.get_unchecked(at)
|
|
|
|
}
|
|
|
|
|
|
|
|
pub(crate) unsafe fn node_at_unchecked_mut(&mut self, at: usize) -> &mut Node<K, V> {
|
|
|
|
self.nodes.get_unchecked_mut(at)
|
|
|
|
}
|
2023-05-11 02:49:48 +10:00
|
|
|
|
|
|
|
pub(crate) fn distance_histogram(&self) -> (Vec<usize>, usize) {
|
|
|
|
let mut ret = Vec::new();
|
|
|
|
|
|
|
|
for node in self.nodes.iter() {
|
|
|
|
let distance = node.distance();
|
|
|
|
|
|
|
|
if distance >= 0 {
|
|
|
|
let distance = distance as usize;
|
|
|
|
ret.resize(ret.len().max(distance + 1), 0);
|
|
|
|
ret[distance] += 1;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
(ret, self.max_distance_to_initial_bucket as usize)
|
|
|
|
}
|
2023-05-10 05:57:33 +10:00
|
|
|
}
|