| 
									
										
										
										
											2022-12-24 14:48:57 -05:00
										 |  |  | use std::ops::Bound;
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2024-01-24 14:32:13 +08:00
										 |  |  | use anyhow::{bail, Result};
 | 
					
						
							| 
									
										
										
										
											2022-12-24 14:48:57 -05:00
										 |  |  | use bytes::Bytes;
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2024-01-24 14:32:13 +08:00
										 |  |  | use crate::iterators::concat_iterator::SstConcatIterator;
 | 
					
						
							| 
									
										
										
										
											2022-12-24 14:48:57 -05:00
										 |  |  | use crate::iterators::merge_iterator::MergeIterator;
 | 
					
						
							|  |  |  | use crate::iterators::two_merge_iterator::TwoMergeIterator;
 | 
					
						
							| 
									
										
										
										
											2022-12-24 18:25:41 -05:00
										 |  |  | use crate::iterators::StorageIterator;
 | 
					
						
							| 
									
										
										
										
											2022-12-24 14:48:57 -05:00
										 |  |  | use crate::mem_table::MemTableIterator;
 | 
					
						
							|  |  |  | use crate::table::SsTableIterator;
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2024-01-24 14:32:13 +08:00
										 |  |  | /// Represents the internal type for an LSM iterator. This type will be changed across the tutorial for multiple times.
 | 
					
						
							|  |  |  | type LsmIteratorInner = TwoMergeIterator<
 | 
					
						
							|  |  |  |     TwoMergeIterator<MergeIterator<MemTableIterator>, MergeIterator<SsTableIterator>>,
 | 
					
						
							|  |  |  |     MergeIterator<SstConcatIterator>,
 | 
					
						
							|  |  |  | >;
 | 
					
						
							| 
									
										
										
										
											2022-12-24 14:48:57 -05:00
										 |  |  | 
 | 
					
						
							|  |  |  | pub struct LsmIterator {
 | 
					
						
							| 
									
										
										
										
											2024-01-24 14:32:13 +08:00
										 |  |  |     inner: LsmIteratorInner,
 | 
					
						
							| 
									
										
										
										
											2022-12-24 14:48:57 -05:00
										 |  |  |     end_bound: Bound<Bytes>,
 | 
					
						
							|  |  |  |     is_valid: bool,
 | 
					
						
							|  |  |  | }
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | impl LsmIterator {
 | 
					
						
							|  |  |  |     pub(crate) fn new(iter: LsmIteratorInner, end_bound: Bound<Bytes>) -> Result<Self> {
 | 
					
						
							|  |  |  |         let mut iter = Self {
 | 
					
						
							|  |  |  |             is_valid: iter.is_valid(),
 | 
					
						
							| 
									
										
										
										
											2024-01-24 14:32:13 +08:00
										 |  |  |             inner: iter,
 | 
					
						
							| 
									
										
										
										
											2022-12-24 14:48:57 -05:00
										 |  |  |             end_bound,
 | 
					
						
							|  |  |  |         };
 | 
					
						
							|  |  |  |         iter.move_to_non_delete()?;
 | 
					
						
							|  |  |  |         Ok(iter)
 | 
					
						
							|  |  |  |     }
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     fn next_inner(&mut self) -> Result<()> {
 | 
					
						
							| 
									
										
										
										
											2024-01-24 14:32:13 +08:00
										 |  |  |         self.inner.next()?;
 | 
					
						
							|  |  |  |         if !self.inner.is_valid() {
 | 
					
						
							| 
									
										
										
										
											2022-12-24 14:48:57 -05:00
										 |  |  |             self.is_valid = false;
 | 
					
						
							|  |  |  |             return Ok(());
 | 
					
						
							|  |  |  |         }
 | 
					
						
							|  |  |  |         match self.end_bound.as_ref() {
 | 
					
						
							|  |  |  |             Bound::Unbounded => {}
 | 
					
						
							| 
									
										
										
										
											2024-01-25 10:59:08 +08:00
										 |  |  |             Bound::Included(key) => self.is_valid = self.inner.key().raw_ref() <= key.as_ref(),
 | 
					
						
							|  |  |  |             Bound::Excluded(key) => self.is_valid = self.inner.key().raw_ref() < key.as_ref(),
 | 
					
						
							| 
									
										
										
										
											2022-12-24 14:48:57 -05:00
										 |  |  |         }
 | 
					
						
							|  |  |  |         Ok(())
 | 
					
						
							|  |  |  |     }
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     fn move_to_non_delete(&mut self) -> Result<()> {
 | 
					
						
							| 
									
										
										
										
											2024-01-24 14:32:13 +08:00
										 |  |  |         while self.is_valid() && self.inner.value().is_empty() {
 | 
					
						
							| 
									
										
										
										
											2022-12-24 14:48:57 -05:00
										 |  |  |             self.next_inner()?;
 | 
					
						
							|  |  |  |         }
 | 
					
						
							|  |  |  |         Ok(())
 | 
					
						
							|  |  |  |     }
 | 
					
						
							|  |  |  | }
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | impl StorageIterator for LsmIterator {
 | 
					
						
							| 
									
										
										
										
											2024-01-25 10:59:08 +08:00
										 |  |  |     type KeyType<'a> = &'a [u8];
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2022-12-24 14:48:57 -05:00
										 |  |  |     fn is_valid(&self) -> bool {
 | 
					
						
							|  |  |  |         self.is_valid
 | 
					
						
							|  |  |  |     }
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     fn key(&self) -> &[u8] {
 | 
					
						
							| 
									
										
										
										
											2024-01-25 10:59:08 +08:00
										 |  |  |         self.inner.key().raw_ref()
 | 
					
						
							| 
									
										
										
										
											2022-12-24 14:48:57 -05:00
										 |  |  |     }
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     fn value(&self) -> &[u8] {
 | 
					
						
							| 
									
										
										
										
											2024-01-24 14:32:13 +08:00
										 |  |  |         self.inner.value()
 | 
					
						
							| 
									
										
										
										
											2022-12-24 14:48:57 -05:00
										 |  |  |     }
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     fn next(&mut self) -> Result<()> {
 | 
					
						
							|  |  |  |         self.next_inner()?;
 | 
					
						
							|  |  |  |         self.move_to_non_delete()?;
 | 
					
						
							|  |  |  |         Ok(())
 | 
					
						
							|  |  |  |     }
 | 
					
						
							| 
									
										
										
										
											2024-01-24 14:32:13 +08:00
										 |  |  | 
 | 
					
						
							|  |  |  |     fn num_active_iterators(&self) -> usize {
 | 
					
						
							|  |  |  |         self.inner.num_active_iterators()
 | 
					
						
							|  |  |  |     }
 | 
					
						
							| 
									
										
										
										
											2022-12-24 14:48:57 -05:00
										 |  |  | }
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2022-12-24 15:34:34 -05:00
										 |  |  | /// A wrapper around existing iterator, will prevent users from calling `next` when the iterator is
 | 
					
						
							| 
									
										
										
										
											2024-01-24 14:32:13 +08:00
										 |  |  | /// invalid. If an iterator is already invalid, `next` does not do anything. If `next` returns an error,
 | 
					
						
							|  |  |  | /// `is_valid` should return false, and `next` should always return an error.
 | 
					
						
							| 
									
										
										
										
											2022-12-24 14:48:57 -05:00
										 |  |  | pub struct FusedIterator<I: StorageIterator> {
 | 
					
						
							|  |  |  |     iter: I,
 | 
					
						
							| 
									
										
										
										
											2024-01-24 14:32:13 +08:00
										 |  |  |     has_errored: bool,
 | 
					
						
							| 
									
										
										
										
											2022-12-24 14:48:57 -05:00
										 |  |  | }
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | impl<I: StorageIterator> FusedIterator<I> {
 | 
					
						
							|  |  |  |     pub fn new(iter: I) -> Self {
 | 
					
						
							| 
									
										
										
										
											2024-01-24 14:32:13 +08:00
										 |  |  |         Self {
 | 
					
						
							|  |  |  |             iter,
 | 
					
						
							|  |  |  |             has_errored: false,
 | 
					
						
							|  |  |  |         }
 | 
					
						
							| 
									
										
										
										
											2022-12-24 14:48:57 -05:00
										 |  |  |     }
 | 
					
						
							|  |  |  | }
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | impl<I: StorageIterator> StorageIterator for FusedIterator<I> {
 | 
					
						
							| 
									
										
										
										
											2024-01-25 10:59:08 +08:00
										 |  |  |     type KeyType<'a> = I::KeyType<'a> where Self: 'a;
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2022-12-24 14:48:57 -05:00
										 |  |  |     fn is_valid(&self) -> bool {
 | 
					
						
							| 
									
										
										
										
											2024-01-24 14:32:13 +08:00
										 |  |  |         !self.has_errored && self.iter.is_valid()
 | 
					
						
							| 
									
										
										
										
											2022-12-24 14:48:57 -05:00
										 |  |  |     }
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2024-01-25 10:59:08 +08:00
										 |  |  |     fn key(&self) -> Self::KeyType<'_> {
 | 
					
						
							| 
									
										
										
										
											2024-01-24 14:32:13 +08:00
										 |  |  |         if self.has_errored || !self.iter.is_valid() {
 | 
					
						
							|  |  |  |             panic!("invalid access to the underlying iterator");
 | 
					
						
							|  |  |  |         }
 | 
					
						
							| 
									
										
										
										
											2022-12-24 14:48:57 -05:00
										 |  |  |         self.iter.key()
 | 
					
						
							|  |  |  |     }
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     fn value(&self) -> &[u8] {
 | 
					
						
							| 
									
										
										
										
											2024-01-24 14:32:13 +08:00
										 |  |  |         if self.has_errored || !self.iter.is_valid() {
 | 
					
						
							|  |  |  |             panic!("invalid access to the underlying iterator");
 | 
					
						
							|  |  |  |         }
 | 
					
						
							| 
									
										
										
										
											2022-12-24 14:48:57 -05:00
										 |  |  |         self.iter.value()
 | 
					
						
							|  |  |  |     }
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     fn next(&mut self) -> Result<()> {
 | 
					
						
							| 
									
										
										
										
											2024-01-24 14:32:13 +08:00
										 |  |  |         // only move when the iterator is valid and not errored
 | 
					
						
							|  |  |  |         if self.has_errored {
 | 
					
						
							|  |  |  |             bail!("the iterator is tainted");
 | 
					
						
							|  |  |  |         }
 | 
					
						
							| 
									
										
										
										
											2022-12-24 14:48:57 -05:00
										 |  |  |         if self.iter.is_valid() {
 | 
					
						
							| 
									
										
										
										
											2024-01-24 14:32:13 +08:00
										 |  |  |             if let Err(e) = self.iter.next() {
 | 
					
						
							|  |  |  |                 self.has_errored = true;
 | 
					
						
							|  |  |  |                 return Err(e);
 | 
					
						
							|  |  |  |             }
 | 
					
						
							| 
									
										
										
										
											2022-12-24 14:48:57 -05:00
										 |  |  |         }
 | 
					
						
							|  |  |  |         Ok(())
 | 
					
						
							|  |  |  |     }
 | 
					
						
							| 
									
										
										
										
											2024-01-24 14:32:13 +08:00
										 |  |  | 
 | 
					
						
							|  |  |  |     fn num_active_iterators(&self) -> usize {
 | 
					
						
							|  |  |  |         self.iter.num_active_iterators()
 | 
					
						
							|  |  |  |     }
 | 
					
						
							| 
									
										
										
										
											2022-12-24 14:48:57 -05:00
										 |  |  | }
 |