use std::ops::Bound; use std::path::Path; use std::sync::atomic::AtomicUsize; use std::sync::Arc; use anyhow::Result; use bytes::Bytes; use crossbeam_skiplist::map::Entry; use crossbeam_skiplist::SkipMap; use ouroboros::self_referencing; use crate::iterators::StorageIterator; use crate::key::KeySlice; use crate::table::SsTableBuilder; use crate::wal::Wal; /// A basic mem-table based on crossbeam-skiplist. /// /// An initial implementation of memtable is part of week 1, day 1. It will be incrementally implemented in other /// chapters of week 1 and week 2. pub struct MemTable { map: Arc>, wal: Option, id: usize, approximate_size: Arc, } /// Create a bound of `Bytes` from a bound of `&[u8]`. pub(crate) fn map_bound(bound: Bound<&[u8]>) -> Bound { match bound { Bound::Included(x) => Bound::Included(Bytes::copy_from_slice(x)), Bound::Excluded(x) => Bound::Excluded(Bytes::copy_from_slice(x)), Bound::Unbounded => Bound::Unbounded, } } impl MemTable { /// Create a new mem-table. pub fn create(id: usize) -> Self { Self { id, map: Arc::new(SkipMap::new()), wal: None, approximate_size: Arc::new(AtomicUsize::new(0)), } } /// Create a new mem-table with WAL pub fn create_with_wal(id: usize, path: impl AsRef) -> Result { Ok(Self { id, map: Arc::new(SkipMap::new()), wal: Some(Wal::create(path.as_ref())?), approximate_size: Arc::new(AtomicUsize::new(0)), }) } /// Create a memtable from WAL pub fn recover_from_wal(id: usize, path: impl AsRef) -> Result { let map = Arc::new(SkipMap::new()); Ok(Self { id, wal: Some(Wal::recover(path.as_ref(), &map)?), map, approximate_size: Arc::new(AtomicUsize::new(0)), }) } pub fn for_testing_put_slice(&self, key: &[u8], value: &[u8]) -> Result<()> { self.put(key, value) } pub fn for_testing_get_slice(&self, key: &[u8]) -> Option { self.get(key) } pub fn for_testing_scan_slice( &self, lower: Bound<&[u8]>, upper: Bound<&[u8]>, ) -> MemTableIterator { self.scan(lower, upper) } /// Get a value by key. pub fn get(&self, key: &[u8]) -> Option { self.map.get(key).map(|e| e.value().clone()) } /// Put a key-value pair into the mem-table. /// /// In week 1, day 1, simply put the key-value pair into the skipmap. /// In week 2, day 6, also flush the data to WAL. pub fn put(&self, key: &[u8], value: &[u8]) -> Result<()> { let estimated_size = key.len() + value.len(); self.map .insert(Bytes::copy_from_slice(key), Bytes::copy_from_slice(value)); self.approximate_size .fetch_add(estimated_size, std::sync::atomic::Ordering::Relaxed); if let Some(ref wal) = self.wal { wal.put(key, value)?; } Ok(()) } pub fn sync_wal(&self) -> Result<()> { if let Some(ref wal) = self.wal { wal.sync()?; } Ok(()) } /// Get an iterator over a range of keys. pub fn scan(&self, lower: Bound<&[u8]>, upper: Bound<&[u8]>) -> MemTableIterator { let (lower, upper) = (map_bound(lower), map_bound(upper)); let mut iter = MemTableIteratorBuilder { map: self.map.clone(), iter_builder: |map| map.range((lower, upper)), item: (Bytes::new(), Bytes::new()), } .build(); iter.next().unwrap(); iter } /// Flush the mem-table to SSTable. Implement in week 1 day 6. pub fn flush(&self, builder: &mut SsTableBuilder) -> Result<()> { for entry in self.map.iter() { builder.add(KeySlice::from_slice(&entry.key()[..]), &entry.value()[..]); } Ok(()) } pub fn id(&self) -> usize { self.id } pub fn approximate_size(&self) -> usize { self.approximate_size .load(std::sync::atomic::Ordering::Relaxed) } /// Only use this function when closing the database pub fn is_empty(&self) -> bool { self.map.is_empty() } } type SkipMapRangeIter<'a> = crossbeam_skiplist::map::Range<'a, Bytes, (Bound, Bound), Bytes, Bytes>; /// An iterator over a range of `SkipMap`. This is a self-referential structure and please refer to week 1, day 2 /// chapter for more information. /// /// This is part of week 1, day 2. #[self_referencing] pub struct MemTableIterator { /// Stores a reference to the skipmap. map: Arc>, /// Stores a skipmap iterator that refers to the lifetime of `MemTableIterator` itself. #[borrows(map)] #[not_covariant] iter: SkipMapRangeIter<'this>, /// Stores the current key-value pair. item: (Bytes, Bytes), } impl MemTableIterator { fn entry_to_item(entry: Option>) -> (Bytes, Bytes) { entry .map(|x| (x.key().clone(), x.value().clone())) .unwrap_or_else(|| (Bytes::from_static(&[]), Bytes::from_static(&[]))) } } impl StorageIterator for MemTableIterator { type KeyType<'a> = KeySlice<'a>; fn value(&self) -> &[u8] { &self.borrow_item().1[..] } fn key(&self) -> KeySlice { KeySlice::from_slice(&self.borrow_item().0[..]) } fn is_valid(&self) -> bool { !self.borrow_item().0.is_empty() } fn next(&mut self) -> Result<()> { let entry = self.with_iter_mut(|iter| MemTableIterator::entry_to_item(iter.next())); self.with_mut(|x| *x.item = entry); Ok(()) } }