mini_lsm/mini-lsm-starter/src/lsm_iterator.rs

// Copyright (c) 2022-2025 Alex Chi Z
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

#![allow(unused_variables)] // TODO(you): remove this lint after implementing this mod
#![allow(dead_code)] // TODO(you): remove this lint after implementing this mod

use anyhow::Result;

use crate::{
    iterators::{StorageIterator, merge_iterator::MergeIterator},
    mem_table::MemTableIterator,
};

/// The concrete iterator type wrapped by `LsmIterator`: currently a `MergeIterator` over
/// `MemTableIterator`s. This alias is expected to change several times over the course.
type LsmIteratorInner = MergeIterator<MemTableIterator>;

/// Iterator adapter over an `LsmIteratorInner`.
///
/// Its `StorageIterator` implementation exposes keys as raw `&[u8]` slices and, when advanced
/// with `next`, steps over entries whose value is empty (those mark deleted keys).
pub struct LsmIterator {
    /// The wrapped iterator that all calls are forwarded to.
    inner: LsmIteratorInner,
}

impl LsmIterator {
    /// Wraps `iter` and positions the new iterator on its first live entry.
    ///
    /// An entry with an empty value marks a deleted key. `next` already steps over such
    /// entries, so the constructor must do the same for the entries at the very front;
    /// otherwise a freshly created iterator would report itself valid while pointing at a
    /// deleted key.
    ///
    /// # Errors
    ///
    /// Returns any error raised by the inner iterator while advancing past leading
    /// deletion markers.
    pub(crate) fn new(iter: LsmIteratorInner) -> Result<Self> {
        let mut inner = iter;
        // Skip leading deletion markers so the first visible entry is a live key.
        while inner.is_valid() && inner.value().is_empty() {
            inner.next()?;
        }
        Ok(Self { inner })
    }
}

impl StorageIterator for LsmIterator {
    type KeyType<'a> = &'a [u8];

    /// Reports whether the wrapped iterator currently points at an entry.
    fn is_valid(&self) -> bool {
        let inner = &self.inner;
        inner.is_valid()
    }

    /// Returns the current key as a raw byte slice, unwrapped from the inner key type.
    fn key(&self) -> &[u8] {
        let current = self.inner.key();
        current.into_inner()
    }

    /// Returns the current value exactly as the wrapped iterator reports it.
    fn value(&self) -> &[u8] {
        let inner = &self.inner;
        inner.value()
    }

    /// Advances to the next entry whose value is non-empty, or to the end.
    ///
    /// The wrapped iterator is always advanced at least once. Entries with an empty value
    /// (deleted keys) are then stepped over. Any error from the wrapped iterator is
    /// propagated to the caller immediately via `?`.
    fn next(&mut self) -> Result<()> {
        loop {
            self.inner.next()?;
            // Stop at the end of the data or at the first entry that is not a deletion marker.
            if !self.inner.is_valid() || !self.inner.value().is_empty() {
                return Ok(());
            }
        }
    }
}

/// A wrapper around an existing iterator that makes calling `next` on an invalid iterator safe.
///
/// If the wrapped iterator is already invalid, `next` does nothing and returns `Ok(())`. Once a
/// call to `next` has returned an error, `is_valid` returns `false` and every subsequent call to
/// `next` returns an error.
pub struct FusedIterator<I: StorageIterator> {
    /// The wrapped iterator.
    iter: I,
    /// Set to `true` the first time `next` on the wrapped iterator fails; never reset.
    has_errored: bool,
}

impl<I: StorageIterator> FusedIterator<I> {
    /// Wraps `iter` in a `FusedIterator` that has not yet observed any error.
    pub fn new(iter: I) -> Self {
        let has_errored = false;
        Self { iter, has_errored }
    }
}

impl<I: StorageIterator> StorageIterator for FusedIterator<I> {
    type KeyType<'a>
        = I::KeyType<'a>
    where
        Self: 'a;

    /// Returns `false` once an error has been recorded; otherwise defers to the wrapped iterator.
    fn is_valid(&self) -> bool {
        // Short-circuits: the wrapped iterator is not consulted after an error.
        !self.has_errored && self.iter.is_valid()
    }

    /// Returns the wrapped iterator's current key.
    fn key(&self) -> Self::KeyType<'_> {
        let wrapped = &self.iter;
        wrapped.key()
    }

    /// Returns the wrapped iterator's current value.
    fn value(&self) -> &[u8] {
        let wrapped = &self.iter;
        wrapped.value()
    }

    /// Advances the wrapped iterator, guarding against misuse.
    ///
    /// - After an earlier failure, every call returns an error without touching the wrapped
    ///   iterator.
    /// - If the wrapped iterator is already invalid, the call is a no-op that returns `Ok(())`.
    /// - Otherwise the wrapped iterator is advanced; a failure is recorded and then returned.
    fn next(&mut self) -> Result<()> {
        // A previously failed iterator stays failed.
        if self.has_errored {
            return Err(anyhow::anyhow!("iterator has errored previously"));
        }

        // Running off the end is not an error; there is simply nothing left to do.
        if !self.iter.is_valid() {
            return Ok(());
        }

        let outcome = self.iter.next();
        if outcome.is_err() {
            // Remember the failure so later calls keep reporting an error.
            self.has_errored = true;
        }
        outcome
    }
}
-												relicense mini-lsm-book to CC BY-NC-SA 4.0 (#118)

* relicense mini-lsm-book to CC BY-NC-SA 4.0

Signed-off-by: Alex Chi Z <iskyzh@gmail.com>

* clearify license

Signed-off-by: Alex Chi Z <iskyzh@gmail.com>

* fix fmt

Signed-off-by: Alex Chi Z <iskyzh@gmail.com>

* fix fmt

Signed-off-by: Alex Chi Z <iskyzh@gmail.com>

---------

Signed-off-by: Alex Chi Z <iskyzh@gmail.com>
											
										
										
											2025-01-19 19:24:12 -05:00
+								// Copyright (c) 2022-2025 Alex Chi Z
 								//
 								// Licensed under the Apache License, Version 2.0 (the "License");
 								// you may not use this file except in compliance with the License.
 								// You may obtain a copy of the License at
 								//
 								//     http://www.apache.org/licenses/LICENSE-2.0
 								//
 								// Unless required by applicable law or agreed to in writing, software
 								// distributed under the License is distributed on an "AS IS" BASIS,
 								// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 								// See the License for the specific language governing permissions and
 								// limitations under the License.
-												feat(code): finish part 3

Signed-off-by: Alex Chi <iskyzh@gmail.com>

											
										
										
											2022-12-24 14:48:57 -05:00
+								#![allow(unused_variables)] // TODO(you): remove this lint after implementing this mod
 								#![allow(dead_code)] // TODO(you): remove this lint after implementing this mod
 								use anyhow::Result;
-												add week 1 day 2 tutorial

Signed-off-by: Alex Chi <iskyzh@gmail.com>

											
										
										
											2024-01-21 11:56:09 +08:00
+								use crate::{
-												feat: bump to Rust edition 2024 (#132)

* feat: bump to Rust edition 2024

Signed-off-by: Alex Chi <iskyzh@gmail.com>

* allow deadcode

Signed-off-by: Alex Chi <iskyzh@gmail.com>

* fix deploy to pages

Signed-off-by: Alex Chi <iskyzh@gmail.com>

* fix fmt

Signed-off-by: Alex Chi <iskyzh@gmail.com>

* update actions

Signed-off-by: Alex Chi <iskyzh@gmail.com>

---------

Signed-off-by: Alex Chi <iskyzh@gmail.com>
											
										
										
											2025-03-09 16:11:52 -04:00
+								    iterators::{StorageIterator, merge_iterator::MergeIterator},
-												add week 1 day 2 tutorial

Signed-off-by: Alex Chi <iskyzh@gmail.com>

											
										
										
											2024-01-21 11:56:09 +08:00
+								    mem_table::MemTableIterator,
 								};
-												feat(docs): finish part 2

Signed-off-by: Alex Chi <iskyzh@gmail.com>

											
										
										
											2022-12-24 15:34:34 -05:00
-												docs: s/tutorial/course

Signed-off-by: Alex Chi Z <iskyzh@gmail.com>

											
										
										
											2025-01-19 19:28:04 -05:00
+								/// Represents the internal type for an LSM iterator. This type will be changed across the course for multiple times.
-												add week 1 day 2 tutorial

Signed-off-by: Alex Chi <iskyzh@gmail.com>

											
										
										
											2024-01-21 11:56:09 +08:00
+								type LsmIteratorInner = MergeIterator<MemTableIterator>;
 								pub struct LsmIterator {
 								    inner: LsmIteratorInner,
 								}
 								impl LsmIterator {
 								    pub(crate) fn new(iter: LsmIteratorInner) -> Result<Self> {
 								        Ok(Self { inner: iter })
 								    }
 								}
-												feat(code): finish part 3

Signed-off-by: Alex Chi <iskyzh@gmail.com>

											
										
										
											2022-12-24 14:48:57 -05:00
 								impl StorageIterator for LsmIterator {
-												add key abstraction and prepare for MVCC (#28)

* add key abstraction and prepare for MVCC

Signed-off-by: Alex Chi <iskyzh@gmail.com>

* a little bit type exercise

Signed-off-by: Alex Chi <iskyzh@gmail.com>

* refactor tests

Signed-off-by: Alex Chi <iskyzh@gmail.com>

* fix clippy warnings

Signed-off-by: Alex Chi <iskyzh@gmail.com>

* refactor starter code

Signed-off-by: Alex Chi <iskyzh@gmail.com>

* final touch docs

Signed-off-by: Alex Chi <iskyzh@gmail.com>

---------

Signed-off-by: Alex Chi <iskyzh@gmail.com>
											
										
										
											2024-01-25 10:59:08 +08:00
+								    type KeyType<'a> = &'a [u8];
-												feat(code): finish part 3

Signed-off-by: Alex Chi <iskyzh@gmail.com>

											
										
										
											2022-12-24 14:48:57 -05:00
+								    fn is_valid(&self) -> bool {
-												First Commit

											
										
										
											2025-10-20 20:12:40 +08:00
+								        self.inner.is_valid()
-												feat(code): finish part 3

Signed-off-by: Alex Chi <iskyzh@gmail.com>

											
										
										
											2022-12-24 14:48:57 -05:00
+								    }
 								    fn key(&self) -> &[u8] {
-												First Commit

											
										
										
											2025-10-20 20:12:40 +08:00
+								        self.inner.key().into_inner()
-												feat(code): finish part 3

Signed-off-by: Alex Chi <iskyzh@gmail.com>

											
										
										
											2022-12-24 14:48:57 -05:00
+								    }
 								    fn value(&self) -> &[u8] {
-												First Commit

											
										
										
											2025-10-20 20:12:40 +08:00
+								        self.inner.value()
-												feat(code): finish part 3

Signed-off-by: Alex Chi <iskyzh@gmail.com>

											
										
										
											2022-12-24 14:48:57 -05:00
+								    }
 								    fn next(&mut self) -> Result<()> {
-												First Commit

											
										
										
											2025-10-20 20:12:40 +08:00
+								        // TODO: I dont know if I need use ? to return the Error or not
 								        self.inner.next()?;
 								        // 跳过已经删除的key
 								        while self.inner.is_valid() && self.inner.value().is_empty() {
 								            self.inner.next()?;
 								        }
 								        Ok(())
-												feat(code): finish part 3

Signed-off-by: Alex Chi <iskyzh@gmail.com>

											
										
										
											2022-12-24 14:48:57 -05:00
+								    }
 								}
-												feat(docs): finish part 2

Signed-off-by: Alex Chi <iskyzh@gmail.com>

											
										
										
											2022-12-24 15:34:34 -05:00
+								/// A wrapper around existing iterator, will prevent users from calling `next` when the iterator is
-												add week 1 day 2 tutorial

Signed-off-by: Alex Chi <iskyzh@gmail.com>

											
										
										
											2024-01-21 11:56:09 +08:00
+								/// invalid. If an iterator is already invalid, `next` does not do anything. If `next` returns an error,
 								/// `is_valid` should return false, and `next` should always return an error.
-												feat(code): finish part 3

Signed-off-by: Alex Chi <iskyzh@gmail.com>

											
										
										
											2022-12-24 14:48:57 -05:00
+								pub struct FusedIterator<I: StorageIterator> {
 								    iter: I,
-												refactor: error handling (#41)


											
										
										
											2024-02-06 11:37:59 +08:00
+								    has_errored: bool,
-												feat(code): finish part 3

Signed-off-by: Alex Chi <iskyzh@gmail.com>

											
										
										
											2022-12-24 14:48:57 -05:00
+								}
 								impl<I: StorageIterator> FusedIterator<I> {
 								    pub fn new(iter: I) -> Self {
-												refactor: error handling (#41)


											
										
										
											2024-02-06 11:37:59 +08:00
+								        Self {
 								            iter,
 								            has_errored: false,
 								        }
-												feat(code): finish part 3

Signed-off-by: Alex Chi <iskyzh@gmail.com>

											
										
										
											2022-12-24 14:48:57 -05:00
+								    }
 								}
 								impl<I: StorageIterator> StorageIterator for FusedIterator<I> {
-												chore: bump compiler version and clippy fixes (#105)

Signed-off-by: Alex Chi Z <iskyzh@gmail.com>
											
										
										
											2024-12-09 00:23:03 -05:00
+								    type KeyType<'a>
 								        = I::KeyType<'a>
 								    where
 								        Self: 'a;
-												add key abstraction and prepare for MVCC (#28)

* add key abstraction and prepare for MVCC

Signed-off-by: Alex Chi <iskyzh@gmail.com>

* a little bit type exercise

Signed-off-by: Alex Chi <iskyzh@gmail.com>

* refactor tests

Signed-off-by: Alex Chi <iskyzh@gmail.com>

* fix clippy warnings

Signed-off-by: Alex Chi <iskyzh@gmail.com>

* refactor starter code

Signed-off-by: Alex Chi <iskyzh@gmail.com>

* final touch docs

Signed-off-by: Alex Chi <iskyzh@gmail.com>

---------

Signed-off-by: Alex Chi <iskyzh@gmail.com>
											
										
										
											2024-01-25 10:59:08 +08:00
-												feat(code): finish part 3

Signed-off-by: Alex Chi <iskyzh@gmail.com>

											
										
										
											2022-12-24 14:48:57 -05:00
+								    fn is_valid(&self) -> bool {
-												First Commit

											
										
										
											2025-10-20 20:12:40 +08:00
+								        // self.iter.is_valid() && !self.has_errored
 								        if self.has_errored {
 								            false
 								        } else {
 								            self.iter.is_valid()
 								        }
-												feat(code): finish part 3

Signed-off-by: Alex Chi <iskyzh@gmail.com>

											
										
										
											2022-12-24 14:48:57 -05:00
+								    }
-												add key abstraction and prepare for MVCC (#28)

* add key abstraction and prepare for MVCC

Signed-off-by: Alex Chi <iskyzh@gmail.com>

* a little bit type exercise

Signed-off-by: Alex Chi <iskyzh@gmail.com>

* refactor tests

Signed-off-by: Alex Chi <iskyzh@gmail.com>

* fix clippy warnings

Signed-off-by: Alex Chi <iskyzh@gmail.com>

* refactor starter code

Signed-off-by: Alex Chi <iskyzh@gmail.com>

* final touch docs

Signed-off-by: Alex Chi <iskyzh@gmail.com>

---------

Signed-off-by: Alex Chi <iskyzh@gmail.com>
											
										
										
											2024-01-25 10:59:08 +08:00
+								    fn key(&self) -> Self::KeyType<'_> {
-												First Commit

											
										
										
											2025-10-20 20:12:40 +08:00
+								        self.iter.key()
-												feat(code): finish part 3

Signed-off-by: Alex Chi <iskyzh@gmail.com>

											
										
										
											2022-12-24 14:48:57 -05:00
+								    }
 								    fn value(&self) -> &[u8] {
-												First Commit

											
										
										
											2025-10-20 20:12:40 +08:00
+								        self.iter.value()
-												feat(code): finish part 3

Signed-off-by: Alex Chi <iskyzh@gmail.com>

											
										
										
											2022-12-24 14:48:57 -05:00
+								    }
 								    fn next(&mut self) -> Result<()> {
-												First Commit

											
										
										
											2025-10-20 20:12:40 +08:00
+								        // 按照测试用例，出现错误就要返回err
 								        if self.has_errored {
 								            return Err(anyhow::anyhow!("iterator has errored previously"));
 								        }
 								        // 但是对于迭代器已经失效，不应该报错
 								        if !self.iter.is_valid() {
 								            return Ok(());
 								        }
 								        //
 								        match self.iter.next() {
 								            Ok(()) => Ok(()),
 								            Err(e) => {
 								                self.has_errored = true;
 								                Err(e)
 								            }
 								        }
-												feat(code): finish part 3

Signed-off-by: Alex Chi <iskyzh@gmail.com>

											
										
										
											2022-12-24 14:48:57 -05:00
+								    }
 								}