//! A lot of the documentation for this module was copied straight out of the rust //! standard library. The implementation however is not. #![no_std] #![feature(allocator_api)] #![deny(clippy::all)] #![deny(clippy::must_use_candidate)] #![deny(missing_docs)] #![deny(clippy::trivially_copy_pass_by_ref)] #![deny(clippy::semicolon_if_nothing_returned)] #![deny(clippy::map_unwrap_or)] #![deny(clippy::needless_pass_by_value)] #![deny(clippy::redundant_closure_for_method_calls)] #![deny(clippy::cloned_instead_of_copied)] #![deny(rustdoc::broken_intra_doc_links)] #![deny(rustdoc::private_intra_doc_links)] #![deny(rustdoc::invalid_html_tags)] #![deny(unreachable_pub)] #![deny(clippy::missing_safety_doc)] #![deny(clippy::undocumented_unsafe_blocks)] #![deny(clippy::manual_assert)] #![deny(clippy::default_trait_access)] #![deny(clippy::missing_panics_doc)] #![deny(clippy::doc_markdown)] #![deny(clippy::return_self_not_must_use)] #![deny(clippy::cast_possible_truncation)] extern crate alloc; use alloc::{alloc::Global, vec::Vec}; use core::{ alloc::Allocator, borrow::Borrow, fmt::Debug, hash::{BuildHasher, BuildHasherDefault, Hash}, iter::FromIterator, num::Wrapping, ops::Index, }; use rustc_hash::FxHasher; mod node; mod node_storage; use node::Node; use node_storage::NodeStorage; // # Robin Hood Hash Tables // // The problem with regular hash tables where failing to find a slot for a specific // key will result in a linear search for the first free slot is that often these // slots can end up being quite far away from the original chosen location in fuller // hash tables. In Java, the hash table will resize when it is more than 2 thirds full // which is quite wasteful in terms of space. Robin Hood hash tables can be much // fuller before needing to resize and also keeps search times lower. // // The key concept is to keep the distance from the initial bucket chosen for a given // key to a minimum. We shall call this distance the "distance to the initial bucket" // or DIB for short. With each key - value pair, we store its DIB. When inserting // a value into the hash table, we check to see if there is an element in the initial // bucket. If there is, we move onto the next value. Then, we check to see if there // is already a value there and if there is, we check its DIB. If our DIB is greater // than or equal to the DIB of the value that is already there, we swap the working // value and the current entry. This continues until an empty slot is found. // // Using this technique, the average DIB is kept fairly low which decreases search // times. As a simple search time optimisation, the maximum DIB is kept track of // and so we will only need to search as far as that in order to know whether or // not a given element is in the hash table. // // # Deletion // // Special mention is given to deletion. Unfortunately, the maximum DIB is not // kept track of after deletion, since we would not only need to keep track of // the maximum DIB but also the number of elements which have that maximum DIB. // // In order to delete an element, we search to see if it exists. If it does, // we remove that element and then iterate through the array from that point // and move each element back one space (updating its DIB). If the DIB of the // element we are trying to remove is 0, then we stop this algorithm. // // This means that deletion will lower the average DIB of the elements and // keep searching and insertion fast. // // # Rehashing // // Currently, no incremental rehashing takes place. Once the HashMap becomes // more than 85% full (this value may change when I do some benchmarking), // a new list is allocated with double the capacity and the entire node list // is migrated. /// A hash map implemented very simply using robin hood hashing. /// /// `HashMap` uses `FxHasher` internally, which is a very fast hashing algorithm used /// by rustc and firefox in non-adversarial places. It is incredibly fast, and good /// enough for most cases. /// /// It is required that the keys implement the [`Eq`] and [`Hash`] traits, although this /// can be frequently achieved by using `#[derive(PartialEq, Eq, Hash)]`. If you /// implement these yourself, it is important that the following property holds: /// /// `k1 == k2 => hash(k1) == hash(k2)` /// /// It is a logic error for the key to be modified in such a way that the key's hash, as /// determined by the [`Hash`] trait, or its equality as determined by the [`Eq`] trait, /// changes while it is in the map. The behaviour for such a logic error is not specified, /// but will not result in undefined behaviour. This could include panics, incorrect results, /// aborts, memory leaks and non-termination. /// /// The API surface provided is incredibly similar to the /// [`std::collections::HashMap`](https://doc.rust-lang.org/std/collections/struct.HashMap.html) /// implementation with fewer guarantees, and better optimised for the `GameBoy Advance`. /// /// [`Eq`]: https://doc.rust-lang.org/core/cmp/trait.Eq.html /// [`Hash`]: https://doc.rust-lang.org/core/hash/trait.Hash.html /// /// # Example /// ``` /// use agb_hashmap::HashMap; /// /// // Type inference lets you omit the type signature (which would be HashMap in this example) /// let mut game_reviews = HashMap::new(); /// /// // Review some games /// game_reviews.insert( /// "Pokemon Emerald".to_string(), /// "Best post-game battle experience of any generation.".to_string(), /// ); /// game_reviews.insert( /// "Golden Sun".to_string(), /// "Some of the best music on the console".to_string(), /// ); /// game_reviews.insert( /// "Super Dodge Ball Advance".to_string(), /// "Really great launch title".to_string(), /// ); /// /// // Check for a specific entry /// if !game_reviews.contains_key("Legend of Zelda: The Minish Cap") { /// println!("We've got {} reviews, but The Minish Cap ain't one", game_reviews.len()); /// } /// /// // Iterate over everything /// for (game, review) in &game_reviews { /// println!("{game}: \"{review}\""); /// } /// ``` #[derive(Clone)] pub struct HashMap { nodes: NodeStorage, hasher: BuildHasherDefault, } /// Trait for allocators that are clonable, blanket implementation for all types that implement Allocator and Clone pub trait ClonableAllocator: Allocator + Clone {} impl ClonableAllocator for T {} impl HashMap { /// Creates a `HashMap` #[must_use] pub fn new() -> Self { Self::new_in(Global) } /// Creates an empty `HashMap` with specified internal size. The size must be a power of 2 #[must_use] pub fn with_size(size: usize) -> Self { Self::with_size_in(size, Global) } /// Creates an empty `HashMap` which can hold at least `capacity` elements before resizing. The actual /// internal size may be larger as it must be a power of 2 #[must_use] pub fn with_capacity(capacity: usize) -> Self { Self::with_capacity_in(capacity, Global) } #[doc(hidden)] #[must_use] pub fn distance_histogram(&self) -> (Vec, usize) { self.nodes.distance_histogram() } } impl HashMap { #[must_use] /// Creates an empty `HashMap` with specified internal size using the /// specified allocator. The size must be a power of 2 pub fn with_size_in(size: usize, alloc: ALLOCATOR) -> Self { Self { nodes: NodeStorage::with_size_in(size, alloc), hasher: BuildHasherDefault::default(), } } #[must_use] /// Creates a `HashMap` with a specified allocator pub fn new_in(alloc: ALLOCATOR) -> Self { Self::with_size_in(16, alloc) } /// Returns a reference to the underlying allocator pub fn allocator(&self) -> &ALLOCATOR { self.nodes.allocator() } /// Creates an empty `HashMap` which can hold at least `capacity` elements before resizing. The actual /// internal size may be larger as it must be a power of 2 /// /// # Panics /// /// Panics if capacity is larger than 2^32 * .85 #[must_use] pub fn with_capacity_in(capacity: usize, alloc: ALLOCATOR) -> Self { for i in 0..32 { let attempted_size = 1usize << i; if number_before_resize(attempted_size) > capacity { return Self::with_size_in(attempted_size, alloc); } } panic!( "Failed to come up with a size which satisfies capacity {}", capacity ); } /// Returns the number of elements in the map #[must_use] pub fn len(&self) -> usize { self.nodes.len() } /// Returns the number of elements the map can hold #[must_use] pub fn capacity(&self) -> usize { self.nodes.capacity() } /// An iterator visiting all keys in an arbitrary order pub fn keys(&self) -> impl Iterator { self.iter().map(|(k, _)| k) } /// An iterator visiting all values in an arbitrary order pub fn values(&self) -> impl Iterator { self.iter().map(|(_, v)| v) } /// An iterator visiting all values in an arbitrary order allowing for mutation pub fn values_mut(&mut self) -> impl Iterator { self.iter_mut().map(|(_, v)| v) } /// Removes all elements from the map pub fn clear(&mut self) { self.nodes.clear(); } /// An iterator visiting all key-value pairs in an arbitrary order pub fn iter(&self) -> impl Iterator { Iter { map: self, at: 0, num_found: 0, } } /// An iterator visiting all key-value pairs in an arbitrary order, with mutable references to the values pub fn iter_mut(&mut self) -> impl Iterator { self.nodes.iter_mut().filter_map(Node::key_value_mut) } /// Retains only the elements specified by the predicate `f`. pub fn retain(&mut self, f: F) where F: FnMut(&K, &mut V) -> bool, { self.nodes.retain(f); } /// Returns `true` if the map contains no elements #[must_use] pub fn is_empty(&self) -> bool { self.len() == 0 } fn resize(&mut self, new_size: usize) { assert!( new_size >= self.nodes.backing_vec_size(), "Can only increase the size of a hash map" ); if new_size == self.nodes.backing_vec_size() { return; } self.nodes = self.nodes.resized_to(new_size); } } impl Default for HashMap { fn default() -> Self { Self::new() } } impl HashMap where K: Eq + Hash, { /// Inserts a key-value pair into the map. /// /// If the map did not have this key present, [`None`] is returned. /// /// If the map did have this key present, the value is updated and the old value /// is returned. The key is not updated, which matters for types that can be `==` /// without being identical. pub fn insert(&mut self, key: K, value: V) -> Option { let hash = self.hash(&key); if let Some(location) = self.nodes.location(&key, hash) { Some( // SAFETY: location is valid due to the above unsafe { self.nodes .replace_at_location_unchecked(location, key, value) }, ) } else { if self.nodes.capacity() <= self.len() { self.resize(self.nodes.backing_vec_size() * 2); } self.nodes.insert_new(key, value, hash); None } } unsafe fn insert_new_and_get(&mut self, key: K, value: V, hash: HashType) -> &'_ mut V { if self.nodes.capacity() <= self.len() { self.resize(self.nodes.backing_vec_size() * 2); } let location = self.nodes.insert_new(key, value, hash); // SAFETY: location is always valid unsafe { self.nodes .node_at_unchecked_mut(location) .value_mut_unchecked() } } /// Returns `true` if the map contains a value for the specified key. pub fn contains_key(&self, k: &Q) -> bool where K: Borrow, Q: Hash + Eq + ?Sized, { let hash = self.hash(k); self.nodes.location(k, hash).is_some() } /// Returns the key-value pair corresponding to the supplied key pub fn get_key_value(&self, key: &Q) -> Option<(&K, &V)> where K: Borrow, Q: Hash + Eq + ?Sized, { let hash = self.hash(key); let location = self.nodes.location(key, hash)?; Some( // SAFETY: we know that a node exists and has a value from the location call above unsafe { self.nodes .node_at_unchecked(location) .key_value_ref_unchecked() }, ) } /// Returns a reference to the value corresponding to the key. Returns [`None`] if there is /// no element in the map with the given key. /// /// # Example /// ``` /// use agb_hashmap::HashMap; /// /// let mut map = HashMap::new(); /// map.insert("a".to_string(), "A"); /// assert_eq!(map.get("a"), Some(&"A")); /// assert_eq!(map.get("b"), None); /// ``` pub fn get(&self, key: &Q) -> Option<&V> where K: Borrow, Q: Hash + Eq + ?Sized, { self.get_key_value(key).map(|(_, v)| v) } /// Returns a mutable reference to the value corresponding to the key. Return [`None`] if /// there is no element in the map with the given key. /// /// # Example /// ``` /// use agb_hashmap::HashMap; /// /// let mut map = HashMap::new(); /// map.insert("a".to_string(), "A"); /// /// if let Some(x) = map.get_mut("a") { /// *x = "b"; /// } /// /// assert_eq!(map["a"], "b"); /// ``` pub fn get_mut(&mut self, key: &Q) -> Option<&mut V> where K: Borrow, Q: Hash + Eq + ?Sized, { let hash = self.hash(key); let location = self.nodes.location(key, hash)?; Some( // SAFETY: we know that a node exists and has a value from the location call above unsafe { self.nodes .node_at_unchecked_mut(location) .value_mut_unchecked() }, ) } /// Removes the given key from the map. Returns the current value if it existed, or [`None`] /// if it did not. /// /// # Example /// ``` /// use agb_hashmap::HashMap; /// /// let mut map = HashMap::new(); /// map.insert(1, "a"); /// assert_eq!(map.remove(&1), Some("a")); /// assert_eq!(map.remove(&1), None); /// ``` pub fn remove(&mut self, key: &Q) -> Option where K: Borrow, Q: Hash + Eq + ?Sized, { let hash = self.hash(key); self.nodes .location(key, hash) .map(|location| self.nodes.remove_from_location(location)) } } impl HashMap where K: Hash, { fn hash(&self, key: &Q) -> HashType where K: Borrow, Q: Hash + ?Sized, { let result = self.hasher.hash_one(key); // we want to allow truncation here since we're reducing 64 bits to 32 #[allow(clippy::cast_possible_truncation)] let reduced = (result as u32) ^ ((result >> 32) as u32); HashType::bit_mix(reduced) } } /// An iterator over entries of a [`HashMap`] /// /// This struct is created using the `into_iter()` method on [`HashMap`]. See its /// documentation for more. pub struct Iter<'a, K: 'a, V: 'a, ALLOCATOR: ClonableAllocator> { map: &'a HashMap, at: usize, num_found: usize, } impl<'a, K, V, ALLOCATOR: ClonableAllocator> Iterator for Iter<'a, K, V, ALLOCATOR> { type Item = (&'a K, &'a V); fn next(&mut self) -> Option { loop { if self.at >= self.map.nodes.backing_vec_size() { return None; } let node = &self.map.nodes.node_at(self.at); self.at += 1; if let Some(key_value) = node.key_value_ref() { self.num_found += 1; return Some(key_value); } } } fn size_hint(&self) -> (usize, Option) { ( self.map.len() - self.num_found, Some(self.map.len() - self.num_found), ) } } impl<'a, K, V, ALLOCATOR: ClonableAllocator> IntoIterator for &'a HashMap { type Item = (&'a K, &'a V); type IntoIter = Iter<'a, K, V, ALLOCATOR>; fn into_iter(self) -> Self::IntoIter { Iter { map: self, at: 0, num_found: 0, } } } /// An iterator over entries of a [`HashMap`] /// /// This struct is created using the `into_iter()` method on [`HashMap`] as part of its implementation /// of the `IntoIterator` trait. pub struct IterOwned { map: HashMap, at: usize, num_found: usize, } impl Iterator for IterOwned { type Item = (K, V); fn next(&mut self) -> Option { loop { if self.at >= self.map.nodes.backing_vec_size() { return None; } let maybe_kv = self.map.nodes.node_at_mut(self.at).take_key_value(); self.at += 1; if let Some((k, v, _)) = maybe_kv { self.num_found += 1; return Some((k, v)); } } } fn size_hint(&self) -> (usize, Option) { ( self.map.len() - self.num_found, Some(self.map.len() - self.num_found), ) } } /// An iterator over entries of a [`HashMap`] /// /// This struct is created using the `into_iter()` method on [`HashMap`] as part of its implementation /// of the `IntoIterator` trait. impl IntoIterator for HashMap { type Item = (K, V); type IntoIter = IterOwned; fn into_iter(self) -> Self::IntoIter { IterOwned { map: self, at: 0, num_found: 0, } } } mod entries { use core::{alloc::Allocator, hash::Hash}; use super::{ClonableAllocator, HashMap, HashType}; /// A view into an occupied entry in a `HashMap`. This is part of the [`crate::Entry`] enum. pub struct OccupiedEntry<'a, K: 'a, V: 'a, ALLOCATOR: Allocator> { key: K, map: &'a mut HashMap, location: usize, } impl<'a, K: 'a, V: 'a, ALLOCATOR: ClonableAllocator> OccupiedEntry<'a, K, V, ALLOCATOR> { /// # Safety /// /// You must call this with a valid location (one where the entry is defined) pub(crate) unsafe fn new( key: K, map: &'a mut HashMap, location: usize, ) -> Self { Self { key, map, location } } /// Gets a reference to the key in the entry. pub fn key(&self) -> &K { &self.key } /// Take the ownership of the key and value from the map. pub fn remove_entry(self) -> (K, V) { let old_value = self.map.nodes.remove_from_location(self.location); (self.key, old_value) } /// Gets a reference to the value in the entry. pub fn get(&self) -> &V { // SAFETY: This can only be constructed with valid locations unsafe { self.map .nodes .node_at_unchecked(self.location) .value_ref_unchecked() } } /// Gets a mutable reference to the value in the entry. /// /// If you need a reference to the `OccupiedEntry` which may outlive the destruction /// of the `Entry` value, see [`into_mut`]. /// /// [`into_mut`]: Self::into_mut pub fn get_mut(&mut self) -> &mut V { // SAFETY: This can only be constructed with valid locations unsafe { self.map .nodes .node_at_unchecked_mut(self.location) .value_mut_unchecked() } } /// Converts the `OccupiedEntry` into a mutable reference to the value in the entry with /// a lifetime bound to the map itself. /// /// If you need multiple references to the `OccupiedEntry`, see [`get_mut`]. /// /// [`get_mut`]: Self::get_mut pub fn into_mut(self) -> &'a mut V { // SAFETY: This can only be constructed with valid locations unsafe { self.map .nodes .node_at_unchecked_mut(self.location) .value_mut_unchecked() } } /// Sets the value of the entry and returns the entry's old value. pub fn insert(&mut self, value: V) -> V { // SAFETY: This can only be constructed with valid locations unsafe { self.map .nodes .node_at_unchecked_mut(self.location) .replace_value_unchecked(value) } } /// Takes the value out of the entry and returns it. pub fn remove(self) -> V { self.map.nodes.remove_from_location(self.location) } } /// A view into a vacant entry in a `HashMap`. It is part of the [`crate::Entry`] enum. pub struct VacantEntry<'a, K: 'a, V: 'a, ALLOCATOR: Allocator> { key: K, map: &'a mut HashMap, hash: HashType, } impl<'a, K: 'a, V: 'a, ALLOCATOR: ClonableAllocator> VacantEntry<'a, K, V, ALLOCATOR> { pub(crate) unsafe fn new( key: K, hash: HashType, map: &'a mut HashMap, ) -> Self { Self { key, map, hash } } /// Gets a reference to the key that would be used when inserting a value through `VacantEntry` pub fn key(&self) -> &K { &self.key } /// Take ownership of the key pub fn into_key(self) -> K { self.key } /// Sets the value of the entry with the `VacantEntry`'s key and returns a mutable reference to it. pub fn insert(self, value: V) -> &'a mut V where K: Hash + Eq, { // SAFETY: by construction, this doesn't already exist in the hashmap and we were given the hash and key unsafe { self.map.insert_new_and_get(self.key, value, self.hash) } } } } pub use entries::{OccupiedEntry, VacantEntry}; /// A view into a single entry in a map, which may be vacant or occupied. /// /// This is constructed using the [`entry`] method on [`HashMap`] /// /// [`entry`]: HashMap::entry() pub enum Entry<'a, K: 'a, V: 'a, ALLOCATOR: Allocator = Global> { /// An occupied entry Occupied(OccupiedEntry<'a, K, V, ALLOCATOR>), /// A vacant entry Vacant(VacantEntry<'a, K, V, ALLOCATOR>), } impl<'a, K, V, ALLOCATOR: ClonableAllocator> Entry<'a, K, V, ALLOCATOR> where K: Hash + Eq, { /// Ensures a value is in the entry by inserting the given value, and returns a mutable /// reference to the value in the entry. pub fn or_insert(self, value: V) -> &'a mut V { match self { Entry::Occupied(e) => e.into_mut(), Entry::Vacant(e) => e.insert(value), } } /// Ensures a value is in the entry by inserting the result of the function if empty, and /// returns a mutable reference to the value in the entry. pub fn or_insert_with(self, f: F) -> &'a mut V where F: FnOnce() -> V, { match self { Entry::Occupied(e) => e.into_mut(), Entry::Vacant(e) => e.insert(f()), } } /// Ensures a value is in the entry by inserting the result of the function if empty, and /// returns a mutable reference to the value in the entry. This method allows for key-derived /// values for insertion by providing the function with a reference to the key. /// /// The reference to the moved key is provided so that cloning or copying the key is unnecessary, /// unlike with `.or_insert_with(|| ...)`. pub fn or_insert_with_key(self, f: F) -> &'a mut V where F: FnOnce(&K) -> V, { match self { Entry::Occupied(e) => e.into_mut(), Entry::Vacant(e) => { let value = f(e.key()); e.insert(value) } } } /// Provides in-place mutable access to an occupied entry before any potential inserts /// into the map. #[must_use] pub fn and_modify(self, f: F) -> Self where F: FnOnce(&mut V), { match self { Entry::Occupied(mut e) => { f(e.get_mut()); Entry::Occupied(e) } Entry::Vacant(e) => Entry::Vacant(e), } } /// Ensures a value is in th entry by inserting the default value if empty. Returns a /// mutable reference to the value in the entry. pub fn or_default(self) -> &'a mut V where V: Default, { match self { Entry::Occupied(e) => e.into_mut(), Entry::Vacant(e) => e.insert(Default::default()), } } /// Returns a reference to this entry's key. pub fn key(&self) -> &K { match self { Entry::Occupied(e) => e.key(), Entry::Vacant(e) => e.key(), } } } impl HashMap where K: Hash + Eq, { /// Gets the given key's corresponding entry in the map for in-place manipulation. pub fn entry(&mut self, key: K) -> Entry<'_, K, V, ALLOCATOR> { let hash = self.hash(&key); let location = self.nodes.location(&key, hash); if let Some(location) = location { Entry::Occupied( // SAFETY: location is valid by the call to location above unsafe { OccupiedEntry::new(key, self, location) }, ) } else { Entry::Vacant( // SAFETY: item doesn't exist yet and the hash is correct here unsafe { VacantEntry::new(key, hash, self) }, ) } } } impl FromIterator<(K, V)> for HashMap where K: Eq + Hash, { fn from_iter>(iter: T) -> Self { let mut map = HashMap::new(); map.extend(iter); map } } impl Extend<(K, V)> for HashMap where K: Eq + Hash, { fn extend>(&mut self, iter: T) { for (k, v) in iter { self.insert(k, v); } } } impl Index<&Q> for HashMap where K: Eq + Hash + Borrow, Q: Eq + Hash + ?Sized, { type Output = V; fn index(&self, key: &Q) -> &V { self.get(key).expect("no entry found for key") } } impl PartialEq for HashMap where K: Eq + Hash, V: PartialEq, { fn eq(&self, other: &HashMap) -> bool { if self.len() != other.len() { return false; } self.iter() .all(|(key, value)| other.get(key).map_or(false, |v| *value == *v)) } } impl Eq for HashMap where K: Eq + Hash, V: PartialEq, { } impl Debug for HashMap where K: Debug, V: Debug, { fn fmt(&self, f: &mut core::fmt::Formatter<'_>) -> core::fmt::Result { f.debug_map().entries(self.iter()).finish() } } const fn number_before_resize(capacity: usize) -> usize { capacity * 60 / 100 } #[derive(Clone, Copy, PartialEq, Eq)] pub(crate) struct HashType(u32); impl From for HashType { fn from(value: usize) -> Self { // we explicitly want to allow truncation #[allow(clippy::cast_possible_truncation)] Self(value as u32) } } impl HashType { pub(crate) const fn new() -> Self { Self(0) } // 32 bit mix function from here: https://github.com/skeeto/hash-prospector fn bit_mix(key: u32) -> Self { let mut key = Wrapping(key); key ^= key >> 16; key *= 0x7feb352d; key ^= key >> 15; key *= 0x846ca68b; key ^= key >> 16; Self(key.0) } pub(crate) fn fast_mod(self, len: usize) -> usize { debug_assert!(len.is_power_of_two(), "Length must be a power of 2"); (self.0 as usize) & (len - 1) } } impl core::ops::Add for HashType { type Output = HashType; fn add(self, rhs: i32) -> Self::Output { Self(self.0.wrapping_add_signed(rhs)) } } #[cfg(test)] mod test { use core::{cell::RefCell, hash::Hasher}; use alloc::vec::Vec; use super::*; #[test] fn can_store_and_retrieve_8_elements() { let mut map = HashMap::new(); for i in 0..8 { map.insert(i, i % 4); } for i in 0..8 { assert_eq!(map.get(&i), Some(&(i % 4))); } } #[test] fn can_get_the_length() { let mut map = HashMap::new(); for i in 0..8 { map.insert(i / 2, true); } assert_eq!(map.len(), 4); } #[test] fn returns_none_if_element_does_not_exist() { let mut map = HashMap::new(); for i in 0..8 { map.insert(i, i % 3); } assert_eq!(map.get(&12), None); } #[test] fn can_delete_entries() { let mut map = HashMap::new(); for i in 0..8 { map.insert(i, i % 3); } for i in 0..4 { map.remove(&i); } assert_eq!(map.len(), 4); assert_eq!(map.get(&3), None); assert_eq!(map.get(&7), Some(&1)); } #[test] fn can_iterate_through_all_entries() { let mut map = HashMap::new(); for i in 0..8 { map.insert(i, i); } let mut max_found = -1; let mut num_found = 0; for (_, value) in map { max_found = max_found.max(value); num_found += 1; } assert_eq!(num_found, 8); assert_eq!(max_found, 7); } #[test] fn can_insert_more_than_initial_capacity() { let mut map = HashMap::new(); for i in 0..65 { map.insert(i, i % 4); } for i in 0..65 { assert_eq!(map.get(&i), Some(&(i % 4))); } } struct NoisyDrop { i: i32, dropped: bool, } impl NoisyDrop { #[cfg(not(miri))] fn new(i: i32) -> Self { Self { i, dropped: false } } } impl PartialEq for NoisyDrop { fn eq(&self, other: &Self) -> bool { self.i == other.i } } impl Eq for NoisyDrop {} impl Hash for NoisyDrop { fn hash(&self, hasher: &mut H) { hasher.write_i32(self.i); } } impl Drop for NoisyDrop { fn drop(&mut self) { assert!(!self.dropped, "NoisyDropped dropped twice"); self.dropped = true; } } trait RngNextI32 { fn next_i32(&mut self) -> i32; } impl RngNextI32 for T where T: rand::RngCore, { fn next_i32(&mut self) -> i32 { self.next_u32() as i32 } } #[cfg(not(miri))] // takes way too long to run under miri #[test] fn extreme_case() { use rand::SeedableRng; let mut map = HashMap::new(); let mut rng = rand::rngs::SmallRng::seed_from_u64(20); let mut answers: [Option; 512] = [None; 512]; for _ in 0..15_000 { let command = rng.next_i32().rem_euclid(2); let key = rng.next_i32().rem_euclid(answers.len().try_into().unwrap()); let value = rng.next_i32(); match command { 0 => { // insert answers[key as usize] = Some(value); map.insert(NoisyDrop::new(key), NoisyDrop::new(value)); } 1 => { // remove answers[key as usize] = None; map.remove(&NoisyDrop::new(key)); } _ => {} } for (i, answer) in answers.iter().enumerate() { assert_eq!( map.get(&NoisyDrop::new(i.try_into().unwrap())) .map(|nd| &nd.i), answer.as_ref() ); } } } #[derive(Clone)] struct Droppable<'a> { id: usize, drop_registry: &'a DropRegistry, } impl Hash for Droppable<'_> { fn hash(&self, hasher: &mut H) { hasher.write_usize(self.id); } } impl PartialEq for Droppable<'_> { fn eq(&self, other: &Self) -> bool { self.id == other.id } } impl Eq for Droppable<'_> {} impl Drop for Droppable<'_> { fn drop(&mut self) { self.drop_registry.dropped(self.id); } } struct DropRegistry { are_dropped: RefCell>, } impl DropRegistry { fn new() -> Self { Self { are_dropped: RefCell::default(), } } fn new_droppable(&self) -> Droppable<'_> { self.are_dropped.borrow_mut().push(0); Droppable { id: self.are_dropped.borrow().len() - 1, drop_registry: self, } } fn dropped(&self, id: usize) { self.are_dropped.borrow_mut()[id] += 1; } fn assert_dropped_once(&self, id: usize) { assert_eq!(self.are_dropped.borrow()[id], 1); } fn assert_not_dropped(&self, id: usize) { assert_eq!(self.are_dropped.borrow()[id], 0); } fn assert_dropped_n_times(&self, id: usize, num_drops: i32) { assert_eq!(self.are_dropped.borrow()[id], num_drops); } } #[test] fn correctly_drops_on_remove_and_overall_drop() { let drop_registry = DropRegistry::new(); let droppable1 = drop_registry.new_droppable(); let droppable2 = drop_registry.new_droppable(); let id1 = droppable1.id; let id2 = droppable2.id; { let mut map = HashMap::new(); map.insert(1, droppable1); map.insert(2, droppable2); drop_registry.assert_not_dropped(id1); drop_registry.assert_not_dropped(id2); map.remove(&1); drop_registry.assert_dropped_once(id1); drop_registry.assert_not_dropped(id2); } drop_registry.assert_dropped_once(id2); } #[test] fn correctly_drop_on_override() { let drop_registry = DropRegistry::new(); let droppable1 = drop_registry.new_droppable(); let droppable2 = drop_registry.new_droppable(); let id1 = droppable1.id; let id2 = droppable2.id; { let mut map = HashMap::new(); map.insert(1, droppable1); drop_registry.assert_not_dropped(id1); map.insert(1, droppable2); drop_registry.assert_dropped_once(id1); drop_registry.assert_not_dropped(id2); } drop_registry.assert_dropped_once(id2); } #[test] fn correctly_drops_key_on_override() { let drop_registry = DropRegistry::new(); let droppable1 = drop_registry.new_droppable(); let droppable1a = droppable1.clone(); let id1 = droppable1.id; { let mut map = HashMap::new(); map.insert(droppable1, 1); drop_registry.assert_not_dropped(id1); map.insert(droppable1a, 2); drop_registry.assert_dropped_once(id1); } drop_registry.assert_dropped_n_times(id1, 2); } #[test] fn test_retain() { let mut map = HashMap::new(); for i in 0..100 { map.insert(i, i); } map.retain(|k, _| k % 2 == 0); assert_eq!(map[&2], 2); assert_eq!(map.get(&3), None); assert_eq!(map.iter().count(), 50); // force full iteration } #[test] fn test_size_hint_iter() { let mut map = HashMap::new(); for i in 0..100 { map.insert(i, i); } let mut iter = map.iter(); assert_eq!(iter.size_hint(), (100, Some(100))); iter.next(); assert_eq!(iter.size_hint(), (99, Some(99))); } #[test] fn test_size_hint_into_iter() { let mut map = HashMap::new(); for i in 0..100 { map.insert(i, i); } let mut iter = map.into_iter(); assert_eq!(iter.size_hint(), (100, Some(100))); iter.next(); assert_eq!(iter.size_hint(), (99, Some(99))); } // Following test cases copied from the rust source // https://github.com/rust-lang/rust/blob/master/library/std/src/collections/hash/map/tests.rs mod rust_std_tests { use alloc::format; use crate::{Entry::*, HashMap}; #[test] fn test_entry() { let xs = [(1, 10), (2, 20), (3, 30), (4, 40), (5, 50), (6, 60)]; let mut map: HashMap<_, _> = xs.iter().copied().collect(); // Existing key (insert) match map.entry(1) { Vacant(_) => unreachable!(), Occupied(mut view) => { assert_eq!(view.get(), &10); assert_eq!(view.insert(100), 10); } } assert_eq!(map.get(&1).unwrap(), &100); assert_eq!(map.len(), 6); // Existing key (update) match map.entry(2) { Vacant(_) => unreachable!(), Occupied(mut view) => { let v = view.get_mut(); let new_v = (*v) * 10; *v = new_v; } } assert_eq!(map.get(&2).unwrap(), &200); assert_eq!(map.len(), 6); // Existing key (take) match map.entry(3) { Vacant(_) => unreachable!(), Occupied(view) => { assert_eq!(view.remove(), 30); } } assert_eq!(map.get(&3), None); assert_eq!(map.len(), 5); // Inexistent key (insert) match map.entry(10) { Occupied(_) => unreachable!(), Vacant(view) => { assert_eq!(*view.insert(1000), 1000); } } assert_eq!(map.get(&10).unwrap(), &1000); assert_eq!(map.len(), 6); } #[test] fn test_occupied_entry_key() { let mut a = HashMap::new(); let key = "hello there"; let value = "value goes here"; assert!(a.is_empty()); a.insert(key, value); assert_eq!(a.len(), 1); assert_eq!(a[key], value); match a.entry(key) { Vacant(_) => panic!(), Occupied(e) => assert_eq!(key, *e.key()), } assert_eq!(a.len(), 1); assert_eq!(a[key], value); } #[test] fn test_vacant_entry_key() { let mut a = HashMap::new(); let key = "hello there"; let value = "value goes here"; assert!(a.is_empty()); match a.entry(key) { Occupied(_) => panic!(), Vacant(e) => { assert_eq!(key, *e.key()); e.insert(value); } } assert_eq!(a.len(), 1); assert_eq!(a[key], value); } #[test] fn test_index() { let mut map = HashMap::new(); map.insert(1, 2); map.insert(2, 1); map.insert(3, 4); assert_eq!(map[&2], 1); } #[test] fn test_eq() { let mut m1 = HashMap::new(); m1.insert(1, 2); m1.insert(2, 3); m1.insert(3, 4); let mut m2 = HashMap::new(); m2.insert(1, 2); m2.insert(2, 3); assert!(m1 != m2); m2.insert(3, 4); assert_eq!(m1, m2); } #[test] fn test_show() { let mut map = HashMap::new(); let empty: HashMap = HashMap::new(); map.insert(1, 2); map.insert(3, 4); let map_str = format!("{map:?}"); assert!(map_str == "{1: 2, 3: 4}" || map_str == "{3: 4, 1: 2}"); assert_eq!(format!("{empty:?}"), "{}"); } } }