-
Notifications
You must be signed in to change notification settings - Fork 32
New issue
Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.
By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.
Already on GitHub? Sign in to your account
Capped Hashmap #25
Merged
Merged
Capped Hashmap #25
Changes from all commits
Commits
Show all changes
16 commits
Select commit
Hold shift + click to select a range
1751c86
feat: implement a capped hashmap colelction
ppoliani d44929c
feat: implemebt CappedHashMap::remove
ppoliani 8929636
chore: use 4 space tabs
ppoliani bab9e7a
chore: fi typo
ppoliani fe21a47
chore: run cargo fmt
ppoliani 6f8294a
feat: add get fns to capped hashmap
ppoliani f061aad
test: add test_insert_should_return_removed_key
ppoliani 3329660
test: add test_remove
ppoliani c636aae
test: test insert duplicate
ppoliani c60603d
fix: PR comments
ppoliani 3eda4cf
feat: check if key exists before adding a new one
ppoliani 181a3ad
feat: allow user replace the code
ppoliani 81f616c
refactor: rename insert to add_entry
ppoliani 6f39a59
feat: use max_size field
ppoliani a0adf49
feat: add helper log function
ppoliani 8b7ab84
chore: code format
ppoliani File filter
Filter by extension
Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,26 @@ | ||
{ | ||
// Use IntelliSense to learn about possible attributes. | ||
// Hover to view descriptions of existing attributes. | ||
// For more information, visit: https://go.microsoft.com/fwlink/?linkid=830387 | ||
"version": "0.2.0", | ||
"configurations": [ | ||
{ | ||
"type": "lldb", | ||
"request": "launch", | ||
"name": "Debug zkbtc", | ||
"cargo": { | ||
"args": [ | ||
"build", | ||
"--bin=zkbtc", | ||
"--package=zkbitcoin" | ||
], | ||
"filter": { | ||
"name": "zkbtc", | ||
"kind": "bin" | ||
} | ||
}, | ||
"args": [], | ||
"cwd": "${workspaceFolder}" | ||
}, | ||
] | ||
} | ||
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,188 @@ | ||
use std::{ | ||
cmp::Eq, | ||
collections::{HashMap, VecDeque}, | ||
hash::Hash, | ||
}; | ||
|
||
use log::info; | ||
|
||
pub struct CappedHashMap<K, V> | ||
where | ||
K: Hash + Eq + Copy + Clone, | ||
{ | ||
max_size: usize, | ||
inner: HashMap<K, V>, | ||
last_items: VecDeque<K>, | ||
} | ||
|
||
impl<K, V> CappedHashMap<K, V> | ||
where | ||
K: Hash + Eq + Copy + Clone, | ||
{ | ||
pub fn new(max_size: usize) -> Self { | ||
Self { | ||
max_size, | ||
inner: HashMap::with_capacity(max_size), | ||
last_items: VecDeque::with_capacity(max_size), | ||
} | ||
} | ||
|
||
fn log(&self) { | ||
let count = self.last_items.len(); | ||
|
||
if count >= self.max_size * 90 / 100 { | ||
info!("Over 90% full"); | ||
} else if count >= self.max_size / 2 { | ||
info!("Over 50% full"); | ||
} else if count >= self.max_size / 4 { | ||
info!("Over 25% full"); | ||
} | ||
} | ||
|
||
/// Inserts an new key-value pair to the collection. Return Some(key) where key is the | ||
/// key that was removed when we reach the max capacity. Otherwise returns None. | ||
pub fn add_entry(&mut self, k: K, v: V) -> Option<K> { | ||
let mut ret = None; | ||
let new_key = !self.inner.contains_key(&k); | ||
|
||
if new_key && self.last_items.len() >= self.max_size { | ||
// remove the oldest item. We an safely unwrap because we know the last_items is not empty at this point | ||
let key = self.last_items.pop_back().unwrap(); | ||
assert!(self.remove(&key).is_some()); | ||
|
||
ret = Some(key); | ||
} | ||
|
||
// replacing a value should not push any new items to last_items | ||
if self.inner.insert(k, v).is_none() { | ||
self.last_items.push_front(k); | ||
} | ||
|
||
self.log(); | ||
ret | ||
} | ||
|
||
/// Removes a key from the map, returning the value at the key if the key was previously in the map. | ||
pub fn remove(&mut self, k: &K) -> Option<V> { | ||
let Some(v) = self.inner.remove(k) else { | ||
return None; | ||
}; | ||
|
||
self.last_items | ||
.iter() | ||
.position(|key| key == k) | ||
.and_then(|pos| self.last_items.remove(pos)); | ||
|
||
Some(v) | ||
} | ||
|
||
/// Returns a reference to the value corresponding to the key. | ||
pub fn get(&self, k: &K) -> Option<&V> { | ||
self.inner.get(k) | ||
} | ||
|
||
/// Returns a mutable reference to the value corresponding to the key. | ||
pub fn get_mut(&mut self, k: &K) -> Option<&mut V> { | ||
self.inner.get_mut(k) | ||
} | ||
|
||
/// Returns the number of elements in the collection | ||
pub fn size(&self) -> usize { | ||
self.inner.len() | ||
} | ||
} | ||
|
||
#[cfg(test)] | ||
mod tests { | ||
use super::*; | ||
|
||
#[test] | ||
fn test_insert_into_non_full_collection() { | ||
let mut col: CappedHashMap<u8, u8> = CappedHashMap::new(10); | ||
col.add_entry(1, 1); | ||
col.add_entry(2, 2); | ||
col.add_entry(3, 3); | ||
|
||
assert_eq!(*col.get(&1).unwrap(), 1); | ||
assert_eq!(*col.get(&2).unwrap(), 2); | ||
assert_eq!(*col.get(&3).unwrap(), 3); | ||
} | ||
|
||
#[test] | ||
fn test_insert_should_return_removed_key() { | ||
// The real capacity will be 14. Read here for how this is calculated https://stackoverflow.com/a/76114888/512783 | ||
let mut col: CappedHashMap<u8, u8> = CappedHashMap::new(10); | ||
|
||
for i in 0..10 { | ||
col.add_entry(i, i); | ||
} | ||
|
||
for i in 10..30 { | ||
// the nth oldest key will be removed | ||
let key_removed = col.add_entry(i, i); | ||
// our hashmap and vecqueue should never grow i.e. capacity doesn't change | ||
assert_eq!(col.last_items.capacity(), 10); | ||
|
||
assert!(key_removed.is_some()); | ||
assert_eq!(key_removed.unwrap(), i - 10); | ||
assert_eq!(col.size(), 10); | ||
} | ||
|
||
// Not that we should have the last 10 keys in the collection i.e. 20-30. All the previous | ||
// were replaced by these new ones | ||
for i in 0..20 { | ||
assert!(col.get(&i).is_none()); | ||
} | ||
|
||
// after cyclic inserts we still have a full capacity collection. We can remove one item... | ||
assert!(col.remove(&20).is_some()); | ||
assert_eq!(col.size(), 9); | ||
|
||
// ... and now inserting a new item will not replace any existing one | ||
assert!(col.add_entry(31, 31).is_none()); | ||
} | ||
|
||
#[test] | ||
fn test_insert_duplicate() { | ||
let mut col: CappedHashMap<u8, u8> = CappedHashMap::new(10); | ||
|
||
for i in 0..10 { | ||
col.add_entry(i, i); | ||
} | ||
|
||
assert_eq!(*col.get(&0).unwrap(), 0); | ||
assert_eq!(col.size(), 10); | ||
|
||
// replacing should simply replace the value and not affect the size. | ||
// so altough our col is full capacity, replacing an existing should not remove the oldest item | ||
assert!(col.add_entry(0, 2).is_none()); | ||
assert_eq!(*col.get(&0).unwrap(), 2); | ||
assert_eq!(col.size(), 10); | ||
|
||
// but inserting a new one should | ||
let key_removed = col.add_entry(10, 10); | ||
assert!(key_removed.is_some()); | ||
assert_eq!(key_removed.unwrap(), 0); | ||
assert_eq!(col.size(), 10); | ||
} | ||
|
||
#[test] | ||
fn test_remove() { | ||
let mut col: CappedHashMap<u8, u8> = CappedHashMap::new(10); | ||
|
||
for i in 0..10 { | ||
col.add_entry(i, i); | ||
} | ||
|
||
for i in 0..10 { | ||
let v = col.remove(&i); | ||
assert!(v.is_some()); | ||
assert_eq!(v.unwrap(), i); | ||
assert_eq!(col.size() as u8, 10 - i - 1); | ||
} | ||
|
||
// the collection is empty so the next remove should return None | ||
let v = col.remove(&0); | ||
assert!(v.is_none()); | ||
} | ||
} |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Oops, something went wrong.
Add this suggestion to a batch that can be applied as a single commit.
This suggestion is invalid because no changes were made to the code.
Suggestions cannot be applied while the pull request is closed.
Suggestions cannot be applied while viewing a subset of changes.
Only one suggestion per line can be applied in a batch.
Add this suggestion to a batch that can be applied as a single commit.
Applying suggestions on deleted lines is not supported.
You must change the existing code in this line in order to create a valid suggestion.
Outdated suggestions cannot be applied.
This suggestion has been applied or marked resolved.
Suggestions cannot be applied from pending reviews.
Suggestions cannot be applied on multi-line comments.
Suggestions cannot be applied while the pull request is queued to merge.
Suggestion cannot be applied right now. Please check back later.
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
you probably didn't mean to push this file :o