vector/expiring_hash_map.rs
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268 269 270 271 272 273 274 275 276 277 278 279 280 281 282 283 284 285 286 287 288 289 290 291 292 293 294 295 296 297 298 299
//! Expiring Hash Map and related types. See [`ExpiringHashMap`].
#![warn(missing_docs)]
use std::{
borrow::Borrow,
collections::HashMap,
fmt,
hash::Hash,
time::{Duration, Instant},
};
use futures::StreamExt;
use tokio_util::time::{delay_queue, DelayQueue};
/// An expired item, holding the value and the key with an expiration information.
pub type ExpiredItem<K, V> = (V, delay_queue::Expired<K>);
/// A [`HashMap`] that maintains deadlines for the keys via a [`DelayQueue`].
pub struct ExpiringHashMap<K, V> {
map: HashMap<K, (V, delay_queue::Key)>,
expiration_queue: DelayQueue<K>,
}
impl<K, V> Unpin for ExpiringHashMap<K, V> {}
impl<K, V> ExpiringHashMap<K, V>
where
K: Eq + Hash + Clone,
{
/// Insert a new key with a TTL.
pub fn insert(&mut self, key: K, value: V, ttl: Duration) {
let delay_queue_key = self.expiration_queue.insert(key.clone(), ttl);
self.map.insert(key, (value, delay_queue_key));
}
/// Insert a new value with a deadline.
pub fn insert_at(&mut self, key: K, value: V, deadline: Instant) {
let delay_queue_key = self
.expiration_queue
.insert_at(key.clone(), deadline.into());
self.map.insert(key, (value, delay_queue_key));
}
/// Get a reference to the value by key.
pub fn get<Q>(&self, k: &Q) -> Option<&V>
where
K: Borrow<Q>,
Q: ?Sized + Hash + Eq,
{
self.map.get(k).map(|(v, _)| v)
}
/// Get a mut reference to the value by key.
pub fn get_mut<Q>(&mut self, k: &Q) -> Option<&mut V>
where
K: Borrow<Q>,
Q: ?Sized + Hash + Eq,
{
self.map.get_mut(k).map(|&mut (ref mut v, _)| v)
}
/// Reset the deadline for a key, and return a mut ref to the value.
pub fn reset_at<Q>(&mut self, k: &Q, when: Instant) -> Option<&mut V>
where
K: Borrow<Q>,
Q: ?Sized + Hash + Eq,
{
let (value, delay_queue_key) = self.map.get_mut(k)?;
self.expiration_queue.reset_at(delay_queue_key, when.into());
Some(value)
}
/// Reset the key if it exists, returning the value and the expiration
/// information.
pub fn remove<Q>(&mut self, k: &Q) -> Option<ExpiredItem<K, V>>
where
K: Borrow<Q>,
Q: ?Sized + Hash + Eq,
{
let (value, expiration_queue_key) = self.map.remove(k)?;
let expired = self.expiration_queue.remove(&expiration_queue_key);
Some((value, expired))
}
/// Return an iterator over keys and values of ExpiringHashMap. Useful for
/// processing all values in ExpiringHashMap irrespective of expiration. This
/// may be required for processing shutdown or other operations.
pub fn iter_mut(&mut self) -> impl Iterator<Item = (&K, &mut V)> {
self.map.iter_mut().map(|(k, (v, _delayed_key))| (k, v))
}
/// Check whether the [`ExpiringHashMap`] is empty.
/// If it's empty, the `next_expired` function immediately resolves to
/// [`None`]. Be aware that this may cause a spinlock behaviour if the
/// `next_expired` is polled in a loop while [`ExpiringHashMap`] is empty.
/// See [`ExpiringHashMap::next_expired`] for more info.
pub fn is_empty(&self) -> bool {
self.expiration_queue.is_empty()
}
/// Returns the number of elements in the map.
pub fn len(&self) -> usize {
self.map.len()
}
/// If the [`ExpiringHashMap`] is empty, immediately returns `None`.
/// Otherwise, waits for the closest deadline, removes expired item and
/// returns it.
///
/// Be aware that misuse of this function may cause a spinlock! If you want
/// to `select` on this future in a loop, be sure to check
/// [`ExpiringHashMap::is_empty`] and skip polling on
/// [`ExpiringHashMap::next_expired`] if the [`ExpiringHashMap`] is empty.
/// Otherwise, when the [`ExpiringHashMap`] is empty you'll effectively get
/// a spinlock on the first value insertion.
///
/// We currently don't offer an API that would allow simply waiting for
/// expired items regardless of what state the [`ExpiringHashMap`] is.
/// This is a deliberate design decision, we went with it for the following
/// reasons:
/// 1. Use of `async fn`. One of the benefits of this API is that it relies
/// only on `async fn`s, and doesn't require manual `Future`
/// implementation. While this is not a problem in general, but there is
/// some value with doing it this way. With a switch to `async` across
/// our code base, the idea is that we should completely eliminate manual
/// `Future` implementations and poll fns. This is controversial, but we
/// decided to give it a try.
/// 2. We don't know all the use cases, and exposing this kind of API might
/// make more sense, since it allows more flexibility.
/// We were choosing between, effectively, the current "drain"-like API,
/// and the "queue" like API.
/// Current ("drain"-like) API waits on the deadline or returns `None`
/// when there are no more items. Very similar how we [`Vec::drain`] iter
/// works.
/// The "queue"-like API would, pretty much, be simply waiting expired
/// items to appear. In the case of empty [`ExpiringHashMap`], we would
/// wait indefinitely - or until an item is inserted. This would be
/// possible to carry on, for instance, from a sibling branch of a
/// `select` statement, so the borrowing rules won't be a problem here.
/// 3. We went over the following alternative signature:
/// ```ignore
/// pub fn next_expired(&mut self) -> Option<impl Future<Outcome = Result<ExpiredItem<K, V>, Error>>> {...}
/// ```
/// This captures the API restrictions a bit better, and should provide
/// less possibilities to misuse the API.
/// We didn't pick this one because it's not an `async fn` and we wanted
/// this, see (1) of this list. Furthermore, instead of doing a
/// `select { _ = map.next_expired(), if !map.is_empty() => { ... } }`
/// users would have to do
/// `let exp = map.next_expired(); select { _ = exp.unwrap(), if exp.is_some() => { ... } }`,
/// which is less readable and a bit harder to understand. Although it
/// has a possibility of a nicer generalization if `select` macro
/// supported a `Some(future)` kind of pattern matching, we decided to go
/// with other solution for now.
///
/// # Examples
///
/// ```rust
/// # let rt = tokio::runtime::Runtime::new().unwrap();
/// # rt.block_on(async {
/// use vector::expiring_hash_map::ExpiringHashMap;
/// use std::time::Duration;
///
/// let mut map: ExpiringHashMap<String, String> = ExpiringHashMap::default();
///
/// loop {
/// tokio::select! {
/// // You need to ensure that this branch is disabled if the map
/// // is empty! Not doing this will result in a spinlock.
/// val = map.next_expired(), if !map.is_empty() => match val {
/// None => unreachable!(), // we never poll the empty map in the first place!
/// Some((val, _)) => {
/// println!("Expired: {}", val);
/// break;
/// }
/// },
/// _ = tokio::time::sleep(Duration::from_millis(100)) => map.insert(
/// "key".to_owned(),
/// "val".to_owned(),
/// Duration::from_millis(30),
/// ),
/// }
/// }
/// # });
/// ```
pub async fn next_expired(&mut self) -> Option<ExpiredItem<K, V>> {
self.expiration_queue.next().await.map(|key| {
let (value, _) = self.map.remove(key.get_ref()).unwrap();
(value, key)
})
}
}
impl<K, V> Default for ExpiringHashMap<K, V>
where
K: Eq + Hash + Clone,
{
fn default() -> Self {
Self {
map: HashMap::new(),
expiration_queue: DelayQueue::new(),
}
}
}
impl<K, V> fmt::Debug for ExpiringHashMap<K, V>
where
K: Eq + Hash + Clone,
{
fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
f.debug_struct("ExpiringHashMap").finish()
}
}
#[cfg(test)]
mod tests {
use std::task::Poll;
use tokio_test::{assert_pending, assert_ready, task};
use super::*;
fn unwrap_ready<T>(poll: Poll<T>) -> T {
assert_ready!(&poll);
match poll {
Poll::Ready(val) => val,
_ => unreachable!(),
}
}
#[test]
fn next_expired_is_pending_with_empty_map() {
let mut map = ExpiringHashMap::<String, String>::default();
let mut fut = task::spawn(map.next_expired());
assert!(unwrap_ready(fut.poll()).is_none());
}
#[tokio::test]
async fn next_expired_is_pending_with_a_non_empty_map() {
let mut map = ExpiringHashMap::<String, String>::default();
map.insert("key".to_owned(), "val".to_owned(), Duration::from_secs(1));
let mut fut = task::spawn(map.next_expired());
assert_pending!(fut.poll());
}
#[tokio::test]
async fn next_expired_does_not_wake_when_the_value_is_available_upfront() {
let mut map = ExpiringHashMap::<String, String>::default();
let a_minute_ago = Instant::now() - Duration::from_secs(60);
map.insert_at("key".to_owned(), "val".to_owned(), a_minute_ago);
let mut fut = task::spawn(map.next_expired());
assert_eq!(unwrap_ready(fut.poll()).unwrap().0, "val");
assert!(!fut.is_woken());
}
#[tokio::test(start_paused = true)]
async fn next_expired_wakes_and_becomes_ready_when_value_ttl_expires() {
let mut map = ExpiringHashMap::<String, String>::default();
let ttl = Duration::from_secs(1);
map.insert("key".to_owned(), "val".to_owned(), ttl);
let mut fut = task::spawn(map.next_expired());
// At first, has to be pending.
assert_pending!(fut.poll());
assert!(!fut.is_woken());
// Then, after deadline, has to be ready.
tokio::time::advance(Duration::from_secs(1)).await;
assert!(fut.is_woken());
let value = assert_ready!(fut.poll());
let (key, value) = value
.map(|(value, key)| (key.into_inner(), value))
.expect("map definitively had entry that should be expired");
assert_eq!(key, "key".to_owned());
assert_eq!(value, "val".to_owned());
}
#[tokio::test]
async fn next_expired_api_allows_inserting_items() {
let mut map = ExpiringHashMap::<String, String>::default();
// At first, has to be pending.
let mut fut = task::spawn(map.next_expired());
assert!(unwrap_ready(fut.poll()).is_none());
drop(fut);
// Insert an item.
let ttl = Duration::from_secs(1000);
map.insert("key".to_owned(), "val".to_owned(), ttl);
// Then, after value is inserted, has to be still pending.
let mut fut = task::spawn(map.next_expired());
assert_pending!(fut.poll());
}
}