checkin initial MVCC codebase
Signed-off-by: Alex Chi <iskyzh@gmail.com>
This commit is contained in:
		
							
								
								
									
										184
									
								
								mini-lsm-mvcc/src/mem_table.rs
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										184
									
								
								mini-lsm-mvcc/src/mem_table.rs
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1,184 @@ | ||||
| use std::ops::Bound; | ||||
| use std::path::Path; | ||||
| use std::sync::atomic::AtomicUsize; | ||||
| use std::sync::Arc; | ||||
|  | ||||
| use anyhow::Result; | ||||
| use bytes::Bytes; | ||||
| use crossbeam_skiplist::map::Entry; | ||||
| use crossbeam_skiplist::SkipMap; | ||||
| use ouroboros::self_referencing; | ||||
|  | ||||
| use crate::iterators::StorageIterator; | ||||
| use crate::key::{self, KeySlice}; | ||||
| use crate::table::SsTableBuilder; | ||||
| use crate::wal::Wal; | ||||
|  | ||||
| /// A basic mem-table based on crossbeam-skiplist. | ||||
| /// | ||||
| /// An initial implementation of memtable is part of week 1, day 1. It will be incrementally implemented in other | ||||
| /// chapters of week 1 and week 2. | ||||
| pub struct MemTable { | ||||
|     map: Arc<SkipMap<Bytes, Bytes>>, | ||||
|     wal: Option<Wal>, | ||||
|     id: usize, | ||||
|     approximate_size: Arc<AtomicUsize>, | ||||
| } | ||||
|  | ||||
| /// Create a bound of `Bytes` from a bound of `&[u8]`. | ||||
| pub(crate) fn map_bound(bound: Bound<&[u8]>) -> Bound<Bytes> { | ||||
|     match bound { | ||||
|         Bound::Included(x) => Bound::Included(Bytes::copy_from_slice(x)), | ||||
|         Bound::Excluded(x) => Bound::Excluded(Bytes::copy_from_slice(x)), | ||||
|         Bound::Unbounded => Bound::Unbounded, | ||||
|     } | ||||
| } | ||||
|  | ||||
| impl MemTable { | ||||
|     /// Create a new mem-table. | ||||
|     pub fn create(id: usize) -> Self { | ||||
|         Self { | ||||
|             id, | ||||
|             map: Arc::new(SkipMap::new()), | ||||
|             wal: None, | ||||
|             approximate_size: Arc::new(AtomicUsize::new(0)), | ||||
|         } | ||||
|     } | ||||
|  | ||||
|     /// Create a new mem-table with WAL | ||||
|     pub fn create_with_wal(id: usize, path: impl AsRef<Path>) -> Result<Self> { | ||||
|         Ok(Self { | ||||
|             id, | ||||
|             map: Arc::new(SkipMap::new()), | ||||
|             wal: Some(Wal::create(path.as_ref())?), | ||||
|             approximate_size: Arc::new(AtomicUsize::new(0)), | ||||
|         }) | ||||
|     } | ||||
|  | ||||
|     /// Create a memtable from WAL | ||||
|     pub fn recover_from_wal(id: usize, path: impl AsRef<Path>) -> Result<Self> { | ||||
|         let map = Arc::new(SkipMap::new()); | ||||
|         Ok(Self { | ||||
|             id, | ||||
|             wal: Some(Wal::recover(path.as_ref(), &map)?), | ||||
|             map, | ||||
|             approximate_size: Arc::new(AtomicUsize::new(0)), | ||||
|         }) | ||||
|     } | ||||
|  | ||||
|     /// Get a value by key. | ||||
|     pub fn get(&self, key: &[u8]) -> Option<Bytes> { | ||||
|         self.map.get(key).map(|e| e.value().clone()) | ||||
|     } | ||||
|  | ||||
|     /// Put a key-value pair into the mem-table. | ||||
|     /// | ||||
|     /// In week 1, day 1, simply put the key-value pair into the skipmap. | ||||
|     /// In week 2, day 6, also flush the data to WAL. | ||||
|     pub fn put(&self, key: &[u8], value: &[u8]) -> Result<()> { | ||||
|         let estimated_size = key.len() + value.len(); | ||||
|         self.map | ||||
|             .insert(Bytes::copy_from_slice(key), Bytes::copy_from_slice(value)); | ||||
|         self.approximate_size | ||||
|             .fetch_add(estimated_size, std::sync::atomic::Ordering::Relaxed); | ||||
|         if let Some(ref wal) = self.wal { | ||||
|             wal.put(key, value)?; | ||||
|         } | ||||
|         Ok(()) | ||||
|     } | ||||
|  | ||||
|     pub fn sync_wal(&self) -> Result<()> { | ||||
|         if let Some(ref wal) = self.wal { | ||||
|             wal.sync()?; | ||||
|         } | ||||
|         Ok(()) | ||||
|     } | ||||
|  | ||||
|     /// Get an iterator over a range of keys. | ||||
|     pub fn scan(&self, lower: Bound<&[u8]>, upper: Bound<&[u8]>) -> MemTableIterator { | ||||
|         let (lower, upper) = (map_bound(lower), map_bound(upper)); | ||||
|         let mut iter = MemTableIteratorBuilder { | ||||
|             map: self.map.clone(), | ||||
|             iter_builder: |map| map.range((lower, upper)), | ||||
|             item: (Bytes::new(), Bytes::new()), | ||||
|         } | ||||
|         .build(); | ||||
|         let entry = iter.with_iter_mut(|iter| MemTableIterator::entry_to_item(iter.next())); | ||||
|         iter.with_mut(|x| *x.item = entry); | ||||
|         iter | ||||
|     } | ||||
|  | ||||
|     /// Flush the mem-table to SSTable. Implement in week 1 day 6. | ||||
|     pub fn flush(&self, builder: &mut SsTableBuilder) -> Result<()> { | ||||
|         for entry in self.map.iter() { | ||||
|             builder.add( | ||||
|                 KeySlice::from_slice(&entry.key()[..], key::TS_DEFAULT), | ||||
|                 &entry.value()[..], | ||||
|             ); | ||||
|         } | ||||
|         Ok(()) | ||||
|     } | ||||
|  | ||||
|     pub fn id(&self) -> usize { | ||||
|         self.id | ||||
|     } | ||||
|  | ||||
|     pub fn approximate_size(&self) -> usize { | ||||
|         self.approximate_size | ||||
|             .load(std::sync::atomic::Ordering::Relaxed) | ||||
|     } | ||||
|  | ||||
|     /// Only use this function when closing the database | ||||
|     pub fn is_empty(&self) -> bool { | ||||
|         self.map.is_empty() | ||||
|     } | ||||
| } | ||||
|  | ||||
| type SkipMapRangeIter<'a> = | ||||
|     crossbeam_skiplist::map::Range<'a, Bytes, (Bound<Bytes>, Bound<Bytes>), Bytes, Bytes>; | ||||
|  | ||||
| /// An iterator over a range of `SkipMap`. This is a self-referential structure and please refer to week 1, day 2 | ||||
| /// chapter for more information. | ||||
| /// | ||||
| /// This is part of week 1, day 2. | ||||
| #[self_referencing] | ||||
| pub struct MemTableIterator { | ||||
|     /// Stores a reference to the skipmap. | ||||
|     map: Arc<SkipMap<Bytes, Bytes>>, | ||||
|     /// Stores a skipmap iterator that refers to the lifetime of `MemTableIterator` itself. | ||||
|     #[borrows(map)] | ||||
|     #[not_covariant] | ||||
|     iter: SkipMapRangeIter<'this>, | ||||
|     /// Stores the current key-value pair. | ||||
|     item: (Bytes, Bytes), | ||||
| } | ||||
|  | ||||
| impl MemTableIterator { | ||||
|     fn entry_to_item(entry: Option<Entry<'_, Bytes, Bytes>>) -> (Bytes, Bytes) { | ||||
|         entry | ||||
|             .map(|x| (x.key().clone(), x.value().clone())) | ||||
|             .unwrap_or_else(|| (Bytes::from_static(&[]), Bytes::from_static(&[]))) | ||||
|     } | ||||
| } | ||||
|  | ||||
| impl StorageIterator for MemTableIterator { | ||||
|     type KeyType<'a> = KeySlice<'a>; | ||||
|  | ||||
|     fn value(&self) -> &[u8] { | ||||
|         &self.borrow_item().1[..] | ||||
|     } | ||||
|  | ||||
|     fn key(&self) -> KeySlice { | ||||
|         KeySlice::from_slice(&self.borrow_item().0[..], key::TS_DEFAULT) | ||||
|     } | ||||
|  | ||||
|     fn is_valid(&self) -> bool { | ||||
|         !self.borrow_item().0.is_empty() | ||||
|     } | ||||
|  | ||||
|     fn next(&mut self) -> Result<()> { | ||||
|         let entry = self.with_iter_mut(|iter| MemTableIterator::entry_to_item(iter.next())); | ||||
|         self.with_mut(|x| *x.item = entry); | ||||
|         Ok(()) | ||||
|     } | ||||
| } | ||||
		Reference in New Issue
	
	Block a user
	 Alex Chi
					Alex Chi