mini_lsm/mini-lsm/src/tests/harness.rs

// Copyright (c) 2022-2025 Alex Chi Z
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::{
    collections::BTreeMap, ops::Bound, os::unix::fs::MetadataExt, path::Path, sync::Arc,
    time::Duration,
};

use anyhow::{bail, Result};
use bytes::Bytes;

use crate::{
    compact::{
        CompactionOptions, LeveledCompactionOptions, SimpleLeveledCompactionOptions,
        TieredCompactionOptions,
    },
    iterators::{merge_iterator::MergeIterator, StorageIterator},
    key::{KeySlice, TS_ENABLED},
    lsm_storage::{BlockCache, LsmStorageInner, LsmStorageState, MiniLsm},
    table::{SsTable, SsTableBuilder, SsTableIterator},
};

/// An in-memory iterator over a fixed list of key-value pairs that can
/// optionally be configured to fail once its cursor reaches a given position.
#[derive(Clone)]
pub struct MockIterator {
    /// The key-value pairs exposed by the iterator, in iteration order.
    pub data: Vec<(Bytes, Bytes)>,
    /// When set, `next` returns an error once `index` becomes equal to this
    /// value, and `key`/`value`/`is_valid` panic while `index` is at or past it.
    pub error_when: Option<usize>,
    /// Position of the current entry within `data`.
    pub index: usize,
}

impl MockIterator {
    /// Creates an iterator over `data`, positioned at the first entry, that
    /// never injects an error.
    pub fn new(data: Vec<(Bytes, Bytes)>) -> Self {
        Self {
            data,
            error_when: None,
            index: 0,
        }
    }

    /// Creates an iterator over `data`, positioned at the first entry, whose
    /// `next` fails once the cursor reaches position `error_when`.
    pub fn new_with_error(data: Vec<(Bytes, Bytes)>, error_when: usize) -> Self {
        Self {
            error_when: Some(error_when),
            ..Self::new(data)
        }
    }
}

impl StorageIterator for MockIterator {
    type KeyType<'a> = KeySlice<'a>;

    /// Moves the cursor forward by one entry (it never moves past the end of
    /// `data`) and returns an error if the cursor now sits exactly at the
    /// configured `error_when` position.
    fn next(&mut self) -> Result<()> {
        if self.index < self.data.len() {
            self.index += 1;
        }
        // `None` never compares equal to `Some(_)`, so iterators without an
        // injected error always fall through to `Ok`.
        if self.error_when == Some(self.index) {
            bail!("fake error!");
        }
        Ok(())
    }

    /// Returns the key of the current entry (without a timestamp).
    ///
    /// Panics if the cursor is at or past `error_when`, or past the end of `data`.
    fn key(&self) -> KeySlice {
        if matches!(self.error_when, Some(limit) if self.index >= limit) {
            panic!("invalid access after next returns an error!");
        }
        let (key, _) = &self.data[self.index];
        KeySlice::for_testing_from_slice_no_ts(key.as_ref())
    }

    /// Returns the value of the current entry.
    ///
    /// Panics if the cursor is at or past `error_when`, or past the end of `data`.
    fn value(&self) -> &[u8] {
        if matches!(self.error_when, Some(limit) if self.index >= limit) {
            panic!("invalid access after next returns an error!");
        }
        let (_, value) = &self.data[self.index];
        value.as_ref()
    }

    /// Reports whether the cursor still points at an entry of `data`.
    ///
    /// Panics if the cursor is at or past `error_when`.
    fn is_valid(&self) -> bool {
        if matches!(self.error_when, Some(limit) if self.index >= limit) {
            panic!("invalid access after next returns an error!");
        }
        self.index < self.data.len()
    }
}

/// Copies `x` into a freshly allocated, owned [`Bytes`] buffer.
pub fn as_bytes(x: &[u8]) -> Bytes {
    Bytes::from(x.to_vec())
}

/// Walks `iter` in lockstep with `expected`, asserting that each entry's key
/// (ignoring any timestamp) and value match, and finally that the iterator
/// has no entries left.
///
/// # Panics
///
/// Panics on the first mismatch, if the iterator ends early, if `next`
/// returns an error, or if the iterator yields more entries than expected.
pub fn check_iter_result_by_key<I>(iter: &mut I, expected: Vec<(Bytes, Bytes)>)
where
    I: for<'a> StorageIterator<KeyType<'a> = KeySlice<'a>>,
{
    for (expected_key, expected_value) in expected {
        assert!(iter.is_valid());

        let current_key = iter.key();
        let actual_key = current_key.for_testing_key_ref();
        assert_eq!(
            expected_key,
            actual_key,
            "expected key: {:?}, actual key: {:?}",
            expected_key,
            as_bytes(actual_key),
        );

        // The value is fetched only after the key has been verified.
        let actual_value = iter.value();
        assert_eq!(
            expected_value,
            actual_value,
            "expected value: {:?}, actual value: {:?}",
            expected_value,
            as_bytes(actual_value),
        );

        iter.next().unwrap();
    }
    assert!(!iter.is_valid());
}

/// Walks `iter` in lockstep with `expected`, asserting that each entry's key,
/// timestamp and value match, and finally that the iterator has no entries
/// left.
///
/// # Panics
///
/// Panics on the first mismatch, if the iterator ends early, if `next`
/// returns an error, or if the iterator yields more entries than expected.
#[allow(dead_code)]
pub fn check_iter_result_by_key_and_ts<I>(iter: &mut I, expected: Vec<((Bytes, u64), Bytes)>)
where
    I: for<'a> StorageIterator<KeyType<'a> = KeySlice<'a>>,
{
    for ((expected_key, expected_ts), expected_value) in expected {
        assert!(iter.is_valid());

        let current_key = iter.key();
        let actual_key = current_key.for_testing_key_ref();
        let actual_ts = iter.key().for_testing_ts();
        assert_eq!(
            (&expected_key[..], expected_ts),
            (actual_key, actual_ts),
            "expected key: {:?}@{}, actual key: {:?}@{}",
            expected_key,
            expected_ts,
            as_bytes(actual_key),
            actual_ts,
        );

        // The value is fetched only after the key and timestamp have been verified.
        let actual_value = iter.value();
        assert_eq!(
            expected_value,
            actual_value,
            "expected value: {:?}, actual value: {:?}",
            expected_value,
            as_bytes(actual_value),
        );

        iter.next().unwrap();
    }
    assert!(!iter.is_valid());
}

/// Walks an iterator whose keys are plain byte slices in lockstep with
/// `expected`, asserting that each entry's key and value match, and finally
/// that the iterator has no entries left.
///
/// # Panics
///
/// Panics on the first mismatch, if the iterator ends early, if `next`
/// returns an error, or if the iterator yields more entries than expected.
pub fn check_lsm_iter_result_by_key<I>(iter: &mut I, expected: Vec<(Bytes, Bytes)>)
where
    I: for<'a> StorageIterator<KeyType<'a> = &'a [u8]>,
{
    for (expected_key, expected_value) in expected {
        assert!(iter.is_valid());

        let actual_key = iter.key();
        assert_eq!(
            expected_key,
            actual_key,
            "expected key: {:?}, actual key: {:?}",
            expected_key,
            as_bytes(actual_key),
        );

        // The value is fetched only after the key has been verified.
        let actual_value = iter.value();
        assert_eq!(
            expected_value,
            actual_value,
            "expected value: {:?}, actual value: {:?}",
            expected_value,
            as_bytes(actual_value),
        );

        iter.next().unwrap();
    }
    assert!(!iter.is_valid());
}

/// Advances `iter` until `next` returns an error.
///
/// # Panics
///
/// Panics with "expect an error" if a successful `next` leaves the iterator
/// invalid, i.e. the iterator ran out of entries without ever failing.
pub fn expect_iter_error(mut iter: impl StorageIterator) {
    // The loop ends as soon as `next` reports the awaited error.
    while iter.next().is_ok() {
        if !iter.is_valid() {
            panic!("expect an error");
        }
    }
}

/// Builds an SST with id `id` at `path` from `data`, adding the entries in the
/// given order with keys that carry no timestamp.
///
/// The builder is created with a block size argument of 128.
///
/// # Panics
///
/// Panics if building the SST fails.
pub fn generate_sst(
    id: usize,
    path: impl AsRef<Path>,
    data: Vec<(Bytes, Bytes)>,
    block_cache: Option<Arc<BlockCache>>,
) -> SsTable {
    let mut builder = SsTableBuilder::new(128);
    data.into_iter().for_each(|(key, value)| {
        builder.add(KeySlice::for_testing_from_slice_no_ts(&key[..]), &value[..]);
    });
    let target = path.as_ref();
    builder.build(id, block_cache, target).unwrap()
}

/// Builds an SST with id `id` at `path` from `data`, adding the entries in the
/// given order with each key tagged by its accompanying timestamp.
///
/// The builder is created with a block size argument of 128.
///
/// # Panics
///
/// Panics if building the SST fails.
#[allow(dead_code)]
pub fn generate_sst_with_ts(
    id: usize,
    path: impl AsRef<Path>,
    data: Vec<((Bytes, u64), Bytes)>,
    block_cache: Option<Arc<BlockCache>>,
) -> SsTable {
    let mut builder = SsTableBuilder::new(128);
    data.into_iter().for_each(|((key, ts), value)| {
        let key_with_ts = KeySlice::for_testing_from_slice_with_ts(&key[..], ts);
        builder.add(key_with_ts, &value[..]);
    });
    let target = path.as_ref();
    builder.build(id, block_cache, target).unwrap()
}

/// Calls `force_freeze_memtable` on `storage` while holding its state lock,
/// then calls `force_flush_next_imm_memtable`.
///
/// # Panics
///
/// Panics if either step returns an error.
pub fn sync(storage: &LsmStorageInner) {
    {
        // The guard is confined to this scope so that the state lock is
        // released again before the flush starts.
        let state_lock_guard = storage.state_lock.lock();
        storage.force_freeze_memtable(&state_lock_guard).unwrap();
    }
    storage.force_flush_next_imm_memtable().unwrap();
}

/// Writes ten overlapping rounds of versioned key-value pairs into `storage`,
/// waits for flushes and compaction to settle, and then verifies every key
/// through both point lookups and a full scan.
///
/// # Panics
///
/// Panics if any storage operation fails or if the data read back differs
/// from what was written.
pub fn compaction_bench(storage: Arc<MiniLsm>) {
    // Maps each key index to the number of times it has been written; the
    // latest count is also the payload of the value that must be read back.
    let mut versions = BTreeMap::<usize, usize>::new();
    let gen_key = |i: usize| format!("{:010}", i); // 10B
    let gen_value = |i: usize| format!("{:0110}", i); // 110B
    let overlaps: usize = if TS_ENABLED { 10000 } else { 20000 };
    let mut max_key: usize = 0;
    for round in 0..10 {
        // Rounds start 5000 keys apart, so consecutive rounds overwrite part
        // of each other's key range.
        let range_begin = round * 5000;
        for i in range_begin..(range_begin + overlaps) {
            // Each entry is a 10-byte key plus a 110-byte value.
            let version = *versions.entry(i).and_modify(|v| *v += 1).or_insert(1);
            let key: String = gen_key(i);
            let value = gen_value(version);
            storage.put(key.as_bytes(), value.as_bytes()).unwrap();
            max_key = max_key.max(i);
        }
    }

    std::thread::sleep(Duration::from_secs(1)); // wait until all memtables flush
    loop {
        // The read guard is released at the end of this statement, before
        // the flush below runs.
        let has_pending_imm = !storage.inner.state.read().imm_memtables.is_empty();
        if !has_pending_imm {
            break;
        }
        storage.inner.force_flush_next_imm_memtable().unwrap();
    }

    // Poll once per second until two consecutive snapshots show the same L0
    // and level layout.
    let mut prev_snapshot = storage.inner.state.read().clone();
    loop {
        std::thread::sleep(Duration::from_secs(1));
        let snapshot = storage.inner.state.read().clone();
        let changed = prev_snapshot.levels != snapshot.levels
            || prev_snapshot.l0_sstables != snapshot.l0_sstables;
        prev_snapshot = snapshot;
        if !changed {
            break;
        }
        println!("waiting for compaction to converge");
    }

    // Point lookups: written keys must return their latest version, and the
    // probed keys beyond the written range must be absent.
    let mut expected_key_value_pairs = Vec::new();
    for i in 0..(max_key + 40000) {
        let key = gen_key(i);
        let value = storage.get(key.as_bytes()).unwrap();
        match versions.get(&i) {
            Some(version) => {
                let expected_value = gen_value(*version);
                assert_eq!(value, Some(Bytes::from(expected_value.clone())));
                expected_key_value_pairs.push((Bytes::from(key), Bytes::from(expected_value)));
            }
            None => assert!(value.is_none()),
        }
    }

    {
        // The scan iterator is dropped at the end of this scope, before the
        // structure dump.
        let mut full_scan = storage.scan(Bound::Unbounded, Bound::Unbounded).unwrap();
        check_lsm_iter_result_by_key(&mut full_scan, expected_key_value_pairs);
    }

    storage.dump_structure();

    println!("This test case does not guarantee your compaction algorithm produces a LSM state as expected. It only does minimal checks on the size of the levels. Please use the compaction simulator to check if the compaction is correctly going on.");
}

/// Asserts that the current LSM structure of `storage` satisfies the
/// invariants of its configured compaction strategy, and that a full scan
/// does not create more iterators than the structure should require.
///
/// The "size" of a level is the summed `table_size()` of its SSTs for leveled
/// compaction, and the number of SST files for simple-leveled and tiered
/// compaction.
///
/// # Panics
///
/// Panics when an invariant is violated, when the storage is configured with
/// `CompactionOptions::NoCompaction`, and (for leveled and tiered compaction)
/// when the snapshot contains no levels at all.
pub fn check_compaction_ratio(storage: Arc<MiniLsm>) {
    let state = storage.inner.state.read().clone();
    let compaction_options = storage.inner.options.compaction_options.clone();
    let l0_sst_num = state.l0_sstables.len();

    // One size entry per level, in the order the levels are stored.
    let mut level_size = Vec::new();
    for (_, files) in &state.levels {
        let size = match &compaction_options {
            CompactionOptions::Leveled(_) => files
                .iter()
                .map(|x| state.sstables.get(x).unwrap().table_size())
                .sum::<u64>(),
            CompactionOptions::Simple(_) | CompactionOptions::Tiered(_) => files.len() as u64,
            CompactionOptions::NoCompaction => unreachable!(),
        };
        level_size.push(size);
    }

    let extra_iterators = if TS_ENABLED {
        1 /* txn local iterator for OCC */
    } else {
        0
    };
    let num_iters = storage
        .scan(Bound::Unbounded, Bound::Unbounded)
        .unwrap()
        .num_active_iterators();
    // Immutable memtables plus the one mutable memtable.
    let num_memtables = storage.inner.state.read().imm_memtables.len() + 1;

    match compaction_options {
        CompactionOptions::NoCompaction => unreachable!(),
        CompactionOptions::Simple(SimpleLeveledCompactionOptions {
            size_ratio_percent,
            level0_file_num_compaction_trigger,
            max_levels,
        }) => {
            assert!(l0_sst_num < level0_file_num_compaction_trigger);
            assert!(level_size.len() <= max_levels);
            // Every level must be at least `size_ratio_percent` percent of the
            // size of the level stored before it.
            for idx in 1..level_size.len() {
                let prev_size = level_size[idx - 1];
                let this_size = level_size[idx];
                if prev_size == 0 && this_size == 0 {
                    continue;
                }
                assert!(
                    this_size as f64 / prev_size as f64 >= size_ratio_percent as f64 / 100.0,
                    // The labels are listed in the same order as the sizes
                    // (this level over the previous level).
                    "L{}/L{}, {}/{}<{}%",
                    state.levels[idx].0,
                    state.levels[idx - 1].0,
                    this_size,
                    prev_size,
                    size_ratio_percent
                );
            }
            assert!(
                num_iters <= l0_sst_num + num_memtables + max_levels + extra_iterators,
                "we found {num_iters} iterators in your implementation, (l0_sst_num={l0_sst_num}, num_memtables={num_memtables}, max_levels={max_levels}) did you use concat iterators?"
            );
        }
        CompactionOptions::Leveled(LeveledCompactionOptions {
            level_size_multiplier,
            level0_file_num_compaction_trigger,
            max_levels,
            ..
        }) => {
            assert!(l0_sst_num < level0_file_num_compaction_trigger);
            assert!(level_size.len() <= max_levels);
            let last_level_size = *level_size.last().unwrap();
            // Walk upwards from the level just above the last one; each step
            // away from the last level multiplies the allowed shrink factor by
            // `level_size_multiplier`.
            let mut multiplier = 1.0;
            for idx in (1..level_size.len()).rev() {
                multiplier *= level_size_multiplier as f64;
                let this_size = level_size[idx - 1];
                assert!(
                    // do not add hard requirement on level size multiplier considering bloom filters...
                    this_size as f64 / last_level_size as f64 <= 1.0 / multiplier + 0.5,
                    "L{}/L_max, {}/{}>>1.0/{}",
                    state.levels[idx - 1].0,
                    this_size,
                    last_level_size,
                    multiplier
                );
            }
            assert!(
                num_iters <= l0_sst_num + num_memtables + max_levels + extra_iterators,
                "we found {num_iters} iterators in your implementation, (l0_sst_num={l0_sst_num}, num_memtables={num_memtables}, max_levels={max_levels}) did you use concat iterators?"
            );
        }
        CompactionOptions::Tiered(TieredCompactionOptions {
            num_tiers,
            max_size_amplification_percent,
            size_ratio,
            min_merge_width,
            ..
        }) => {
            let size_ratio_trigger = (100.0 + size_ratio as f64) / 100.0;
            assert_eq!(l0_sst_num, 0);
            assert!(level_size.len() <= num_tiers);
            // Running total of the sizes of all tiers stored before `idx`.
            let mut sum_size = level_size[0];
            for idx in 1..level_size.len() {
                let this_size = level_size[idx];
                // The size-ratio check only applies when there are more tiers
                // than `min_merge_width`.
                if level_size.len() > min_merge_width {
                    assert!(
                        sum_size as f64 / this_size as f64 <= size_ratio_trigger,
                        "violation of size ratio: sum(⬆️L{})/L{}, {}/{}>{}",
                        state.levels[idx - 1].0,
                        state.levels[idx].0,
                        sum_size,
                        this_size,
                        size_ratio_trigger
                    );
                }
                // The space-amplification check compares all earlier tiers
                // against the last tier only.
                if idx + 1 == level_size.len() {
                    assert!(
                        sum_size as f64 / this_size as f64
                            <= max_size_amplification_percent as f64 / 100.0,
                        "violation of space amp: sum(⬆️L{})/L{}, {}/{}>{}%",
                        state.levels[idx - 1].0,
                        state.levels[idx].0,
                        sum_size,
                        this_size,
                        max_size_amplification_percent
                    );
                }
                sum_size += this_size;
            }
            assert!(
                num_iters <= num_memtables + num_tiers + extra_iterators,
                "we found {num_iters} iterators in your implementation, (num_memtables={num_memtables}, num_tiers={num_tiers}) did you use concat iterators?"
            );
        }
    }
}

/// Prints a header line followed by one line per entry of the directory at
/// `path`, showing the entry's path and its size divided by 1024 (labelled
/// `KB`) with three decimal places.
///
/// # Panics
///
/// Panics if the directory cannot be read, or if an entry or its metadata
/// cannot be accessed.
pub fn dump_files_in_dir(path: impl AsRef<Path>) {
    println!("--- DIR DUMP ---");
    let entries = path.as_ref().read_dir().unwrap();
    for entry in entries.map(Result::unwrap) {
        // The path is printed before the metadata lookup, which may panic.
        print!("{}", entry.path().display());
        let size_in_kb = entry.metadata().unwrap().size() as f64 / 1024.0;
        println!(", size={:.3}KB", size_in_kb);
    }
}

/// Builds a merge iterator over every SST referenced by `state`: first the
/// L0 SSTs in their stored order, then the SSTs of each level in level order.
/// Every SST iterator is positioned at its first entry.
///
/// # Panics
///
/// Panics if a referenced SST id is missing from `state.sstables` or if an
/// SST iterator cannot be created.
pub fn construct_merge_iterator_over_storage(
    state: &LsmStorageState,
) -> MergeIterator<SsTableIterator> {
    let level_sst_ids = state.levels.iter().flat_map(|(_, files)| files.iter());
    let iters: Vec<Box<SsTableIterator>> = state
        .l0_sstables
        .iter()
        .chain(level_sst_ids)
        .map(|sst_id| {
            let table = state.sstables.get(sst_id).cloned().unwrap();
            Box::new(SsTableIterator::create_and_seek_to_first(table).unwrap())
        })
        .collect();
    MergeIterator::create(iters)
}
-												relicense mini-lsm-book to CC BY-NC-SA 4.0 (#118)

* relicense mini-lsm-book to CC BY-NC-SA 4.0

Signed-off-by: Alex Chi Z <iskyzh@gmail.com>

* clearify license

Signed-off-by: Alex Chi Z <iskyzh@gmail.com>

* fix fmt

Signed-off-by: Alex Chi Z <iskyzh@gmail.com>

* fix fmt

Signed-off-by: Alex Chi Z <iskyzh@gmail.com>

---------

Signed-off-by: Alex Chi Z <iskyzh@gmail.com>
											
										
										
											2025-01-19 19:24:12 -05:00
+								// Copyright (c) 2022-2025 Alex Chi Z
 								//
 								// Licensed under the Apache License, Version 2.0 (the "License");
 								// you may not use this file except in compliance with the License.
 								// You may obtain a copy of the License at
 								//
 								//     http://www.apache.org/licenses/LICENSE-2.0
 								//
 								// Unless required by applicable law or agreed to in writing, software
 								// distributed under the License is distributed on an "AS IS" BASIS,
 								// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 								// See the License for the specific language governing permissions and
 								// limitations under the License.
-												fix compaction split bug and add 3.1 test

Signed-off-by: Alex Chi <iskyzh@gmail.com>

											
										
										
											2024-01-28 16:01:40 +08:00
+								use std::{
 								    collections::BTreeMap, ops::Bound, os::unix::fs::MetadataExt, path::Path, sync::Arc,
 								    time::Duration,
 								};
-												finish week 1 day 5 read path

Signed-off-by: Alex Chi Z <iskyzh@gmail.com>

											
										
										
											2024-01-21 15:26:22 +08:00
-												add week 1 day 2 tutorial

Signed-off-by: Alex Chi <iskyzh@gmail.com>

											
										
										
											2024-01-21 11:56:09 +08:00
+								use anyhow::{bail, Result};
 								use bytes::Bytes;
-												finish week 1 day 5 read path

Signed-off-by: Alex Chi Z <iskyzh@gmail.com>

											
										
										
											2024-01-21 15:26:22 +08:00
+								use crate::{
-												add compaction tests and fix bugs in compaction

Signed-off-by: Alex Chi <iskyzh@gmail.com>

											
										
										
											2024-01-25 15:25:23 +08:00
+								    compact::{
 								        CompactionOptions, LeveledCompactionOptions, SimpleLeveledCompactionOptions,
 								        TieredCompactionOptions,
 								    },
-												add 3.4 tests

Signed-off-by: Alex Chi <iskyzh@gmail.com>

											
										
										
											2024-01-30 12:14:32 +08:00
+								    iterators::{merge_iterator::MergeIterator, StorageIterator},
-												add week 2 day 5 + 6 tests

Signed-off-by: Alex Chi <iskyzh@gmail.com>

											
										
										
											2024-01-26 15:19:56 +08:00
+								    key::{KeySlice, TS_ENABLED},
-												add 3.4 tests

Signed-off-by: Alex Chi <iskyzh@gmail.com>

											
										
										
											2024-01-30 12:14:32 +08:00
+								    lsm_storage::{BlockCache, LsmStorageInner, LsmStorageState, MiniLsm},
 								    table::{SsTable, SsTableBuilder, SsTableIterator},
-												finish week 1 day 5 read path

Signed-off-by: Alex Chi Z <iskyzh@gmail.com>

											
										
										
											2024-01-21 15:26:22 +08:00
+								};
-												add week 1 day 2 tutorial

Signed-off-by: Alex Chi <iskyzh@gmail.com>

											
										
										
											2024-01-21 11:56:09 +08:00
 								#[derive(Clone)]
 								pub struct MockIterator {
 								    pub data: Vec<(Bytes, Bytes)>,
 								    pub error_when: Option<usize>,
 								    pub index: usize,
 								}
 								impl MockIterator {
 								    pub fn new(data: Vec<(Bytes, Bytes)>) -> Self {
 								        Self {
 								            data,
 								            index: 0,
 								            error_when: None,
 								        }
 								    }
 								    pub fn new_with_error(data: Vec<(Bytes, Bytes)>, error_when: usize) -> Self {
 								        Self {
 								            data,
 								            index: 0,
 								            error_when: Some(error_when),
 								        }
 								    }
 								}
 								impl StorageIterator for MockIterator {
-												add key abstraction and prepare for MVCC (#28)

* add key abstraction and prepare for MVCC

Signed-off-by: Alex Chi <iskyzh@gmail.com>

* a little bit type exercise

Signed-off-by: Alex Chi <iskyzh@gmail.com>

* refactor tests

Signed-off-by: Alex Chi <iskyzh@gmail.com>

* fix clippy warnings

Signed-off-by: Alex Chi <iskyzh@gmail.com>

* refactor starter code

Signed-off-by: Alex Chi <iskyzh@gmail.com>

* final touch docs

Signed-off-by: Alex Chi <iskyzh@gmail.com>

---------

Signed-off-by: Alex Chi <iskyzh@gmail.com>
											
										
										
											2024-01-25 10:59:08 +08:00
+								    type KeyType<'a> = KeySlice<'a>;
-												add week 1 day 2 tutorial

Signed-off-by: Alex Chi <iskyzh@gmail.com>

											
										
										
											2024-01-21 11:56:09 +08:00
+								    fn next(&mut self) -> Result<()> {
 								        if self.index < self.data.len() {
 								            self.index += 1;
 								        }
 								        if let Some(error_when) = self.error_when {
 								            if self.index == error_when {
 								                bail!("fake error!");
 								            }
 								        }
 								        Ok(())
 								    }
-												add key abstraction and prepare for MVCC (#28)

* add key abstraction and prepare for MVCC

Signed-off-by: Alex Chi <iskyzh@gmail.com>

* a little bit type exercise

Signed-off-by: Alex Chi <iskyzh@gmail.com>

* refactor tests

Signed-off-by: Alex Chi <iskyzh@gmail.com>

* fix clippy warnings

Signed-off-by: Alex Chi <iskyzh@gmail.com>

* refactor starter code

Signed-off-by: Alex Chi <iskyzh@gmail.com>

* final touch docs

Signed-off-by: Alex Chi <iskyzh@gmail.com>

---------

Signed-off-by: Alex Chi <iskyzh@gmail.com>
											
										
										
											2024-01-25 10:59:08 +08:00
+								    fn key(&self) -> KeySlice {
-												add week 1 day 2 tutorial

Signed-off-by: Alex Chi <iskyzh@gmail.com>

											
										
										
											2024-01-21 11:56:09 +08:00
+								        if let Some(error_when) = self.error_when {
 								            if self.index >= error_when {
 								                panic!("invalid access after next returns an error!");
 								            }
 								        }
-												add key abstraction and prepare for MVCC (#28)

* add key abstraction and prepare for MVCC

Signed-off-by: Alex Chi <iskyzh@gmail.com>

* a little bit type exercise

Signed-off-by: Alex Chi <iskyzh@gmail.com>

* refactor tests

Signed-off-by: Alex Chi <iskyzh@gmail.com>

* fix clippy warnings

Signed-off-by: Alex Chi <iskyzh@gmail.com>

* refactor starter code

Signed-off-by: Alex Chi <iskyzh@gmail.com>

* final touch docs

Signed-off-by: Alex Chi <iskyzh@gmail.com>

---------

Signed-off-by: Alex Chi <iskyzh@gmail.com>
											
										
										
											2024-01-25 10:59:08 +08:00
+								        KeySlice::for_testing_from_slice_no_ts(self.data[self.index].0.as_ref())
-												add week 1 day 2 tutorial

Signed-off-by: Alex Chi <iskyzh@gmail.com>

											
										
										
											2024-01-21 11:56:09 +08:00
+								    }
 								    fn value(&self) -> &[u8] {
 								        if let Some(error_when) = self.error_when {
 								            if self.index >= error_when {
 								                panic!("invalid access after next returns an error!");
 								            }
 								        }
 								        self.data[self.index].1.as_ref()
 								    }
 								    fn is_valid(&self) -> bool {
 								        if let Some(error_when) = self.error_when {
 								            if self.index >= error_when {
 								                panic!("invalid access after next returns an error!");
 								            }
 								        }
 								        self.index < self.data.len()
 								    }
 								}
-												finish week 1 day 5 read path

Signed-off-by: Alex Chi Z <iskyzh@gmail.com>

											
										
										
											2024-01-21 15:26:22 +08:00
 								pub fn as_bytes(x: &[u8]) -> Bytes {
 								    Bytes::copy_from_slice(x)
 								}
-												add key abstraction and prepare for MVCC (#28)

* add key abstraction and prepare for MVCC

Signed-off-by: Alex Chi <iskyzh@gmail.com>

* a little bit type exercise

Signed-off-by: Alex Chi <iskyzh@gmail.com>

* refactor tests

Signed-off-by: Alex Chi <iskyzh@gmail.com>

* fix clippy warnings

Signed-off-by: Alex Chi <iskyzh@gmail.com>

* refactor starter code

Signed-off-by: Alex Chi <iskyzh@gmail.com>

* final touch docs

Signed-off-by: Alex Chi <iskyzh@gmail.com>

---------

Signed-off-by: Alex Chi <iskyzh@gmail.com>
											
										
										
											2024-01-25 10:59:08 +08:00
+								pub fn check_iter_result_by_key<I>(iter: &mut I, expected: Vec<(Bytes, Bytes)>)
 								where
 								    I: for<'a> StorageIterator<KeyType<'a> = KeySlice<'a>>,
 								{
 								    for (k, v) in expected {
 								        assert!(iter.is_valid());
 								        assert_eq!(
 								            k,
 								            iter.key().for_testing_key_ref(),
 								            "expected key: {:?}, actual key: {:?}",
 								            k,
 								            as_bytes(iter.key().for_testing_key_ref()),
 								        );
 								        assert_eq!(
 								            v,
 								            iter.value(),
 								            "expected value: {:?}, actual value: {:?}",
 								            v,
 								            as_bytes(iter.value()),
 								        );
 								        iter.next().unwrap();
 								    }
 								    assert!(!iter.is_valid());
 								}
-												add 3.5 tests

Signed-off-by: Alex Chi Z <iskyzh@gmail.com>

											
										
										
											2024-01-30 13:39:58 +08:00
+								#[allow(dead_code)]
-												fix compaction split bug and add 3.1 test

Signed-off-by: Alex Chi <iskyzh@gmail.com>

											
										
										
											2024-01-28 16:01:40 +08:00
+								pub fn check_iter_result_by_key_and_ts<I>(iter: &mut I, expected: Vec<((Bytes, u64), Bytes)>)
 								where
 								    I: for<'a> StorageIterator<KeyType<'a> = KeySlice<'a>>,
 								{
 								    for ((k, ts), v) in expected {
 								        assert!(iter.is_valid());
 								        assert_eq!(
 								            (&k[..], ts),
 								            (
 								                iter.key().for_testing_key_ref(),
 								                iter.key().for_testing_ts()
 								            ),
 								            "expected key: {:?}@{}, actual key: {:?}@{}",
 								            k,
 								            ts,
 								            as_bytes(iter.key().for_testing_key_ref()),
 								            iter.key().for_testing_ts(),
 								        );
 								        assert_eq!(
 								            v,
 								            iter.value(),
 								            "expected value: {:?}, actual value: {:?}",
 								            v,
 								            as_bytes(iter.value()),
 								        );
 								        iter.next().unwrap();
 								    }
 								    assert!(!iter.is_valid());
 								}
-												add key abstraction and prepare for MVCC (#28)

* add key abstraction and prepare for MVCC

Signed-off-by: Alex Chi <iskyzh@gmail.com>

* a little bit type exercise

Signed-off-by: Alex Chi <iskyzh@gmail.com>

* refactor tests

Signed-off-by: Alex Chi <iskyzh@gmail.com>

* fix clippy warnings

Signed-off-by: Alex Chi <iskyzh@gmail.com>

* refactor starter code

Signed-off-by: Alex Chi <iskyzh@gmail.com>

* final touch docs

Signed-off-by: Alex Chi <iskyzh@gmail.com>

---------

Signed-off-by: Alex Chi <iskyzh@gmail.com>
											
										
										
											2024-01-25 10:59:08 +08:00
+								pub fn check_lsm_iter_result_by_key<I>(iter: &mut I, expected: Vec<(Bytes, Bytes)>)
 								where
 								    I: for<'a> StorageIterator<KeyType<'a> = &'a [u8]>,
 								{
-												finish week 1 day 5 read path

Signed-off-by: Alex Chi Z <iskyzh@gmail.com>

											
										
										
											2024-01-21 15:26:22 +08:00
+								    for (k, v) in expected {
 								        assert!(iter.is_valid());
 								        assert_eq!(
 								            k,
 								            iter.key(),
 								            "expected key: {:?}, actual key: {:?}",
 								            k,
 								            as_bytes(iter.key()),
 								        );
 								        assert_eq!(
 								            v,
 								            iter.value(),
 								            "expected value: {:?}, actual value: {:?}",
 								            v,
 								            as_bytes(iter.value()),
 								        );
 								        iter.next().unwrap();
 								    }
 								    assert!(!iter.is_valid());
 								}
 								pub fn expect_iter_error(mut iter: impl StorageIterator) {
 								    loop {
 								        match iter.next() {
 								            Ok(_) if iter.is_valid() => continue,
 								            Ok(_) => panic!("expect an error"),
 								            Err(_) => break,
 								        }
 								    }
 								}
 								pub fn generate_sst(
 								    id: usize,
 								    path: impl AsRef<Path>,
 								    data: Vec<(Bytes, Bytes)>,
 								    block_cache: Option<Arc<BlockCache>>,
 								) -> SsTable {
 								    let mut builder = SsTableBuilder::new(128);
 								    for (key, value) in data {
-												add key abstraction and prepare for MVCC (#28)

* add key abstraction and prepare for MVCC

Signed-off-by: Alex Chi <iskyzh@gmail.com>

* a little bit type exercise

Signed-off-by: Alex Chi <iskyzh@gmail.com>

* refactor tests

Signed-off-by: Alex Chi <iskyzh@gmail.com>

* fix clippy warnings

Signed-off-by: Alex Chi <iskyzh@gmail.com>

* refactor starter code

Signed-off-by: Alex Chi <iskyzh@gmail.com>

* final touch docs

Signed-off-by: Alex Chi <iskyzh@gmail.com>

---------

Signed-off-by: Alex Chi <iskyzh@gmail.com>
											
										
										
											2024-01-25 10:59:08 +08:00
+								        builder.add(KeySlice::for_testing_from_slice_no_ts(&key[..]), &value[..]);
-												finish week 1 day 5 read path

Signed-off-by: Alex Chi Z <iskyzh@gmail.com>

											
										
										
											2024-01-21 15:26:22 +08:00
+								    }
 								    builder.build(id, block_cache, path.as_ref()).unwrap()
 								}
-												finish 2.1 and tests

Signed-off-by: Alex Chi Z <iskyzh@gmail.com>

											
										
										
											2024-01-23 13:44:48 +08:00
-												add 3.5 tests

Signed-off-by: Alex Chi Z <iskyzh@gmail.com>

											
										
										
											2024-01-30 13:39:58 +08:00
+								#[allow(dead_code)]
-												fix compaction split bug and add 3.1 test

Signed-off-by: Alex Chi <iskyzh@gmail.com>

											
										
										
											2024-01-28 16:01:40 +08:00
+								pub fn generate_sst_with_ts(
 								    id: usize,
 								    path: impl AsRef<Path>,
 								    data: Vec<((Bytes, u64), Bytes)>,
 								    block_cache: Option<Arc<BlockCache>>,
 								) -> SsTable {
 								    let mut builder = SsTableBuilder::new(128);
 								    for ((key, ts), value) in data {
 								        builder.add(
 								            KeySlice::for_testing_from_slice_with_ts(&key[..], ts),
 								            &value[..],
 								        );
 								    }
 								    builder.build(id, block_cache, path.as_ref()).unwrap()
 								}
-												finish 2.1 and tests

Signed-off-by: Alex Chi Z <iskyzh@gmail.com>

											
										
										
											2024-01-23 13:44:48 +08:00
+								pub fn sync(storage: &LsmStorageInner) {
 								    storage
 								        .force_freeze_memtable(&storage.state_lock.lock())
 								        .unwrap();
 								    storage.force_flush_next_imm_memtable().unwrap();
-												checkin part 2 solution

Signed-off-by: Alex Chi <iskyzh@gmail.com>

											
										
										
											2024-01-24 14:32:13 +08:00
+								}
-												add compaction tests and fix bugs in compaction

Signed-off-by: Alex Chi <iskyzh@gmail.com>

											
										
										
											2024-01-25 15:25:23 +08:00
 								pub fn compaction_bench(storage: Arc<MiniLsm>) {
 								    let mut key_map = BTreeMap::<usize, usize>::new();
 								    let gen_key = |i| format!("{:010}", i); // 10B
 								    let gen_value = |i| format!("{:0110}", i); // 110B
 								    let mut max_key = 0;
-												add week 2 day 5 + 6 tests

Signed-off-by: Alex Chi <iskyzh@gmail.com>

											
										
										
											2024-01-26 15:19:56 +08:00
+								    let overlaps = if TS_ENABLED { 10000 } else { 20000 };
-												add compaction tests and fix bugs in compaction

Signed-off-by: Alex Chi <iskyzh@gmail.com>

											
										
										
											2024-01-25 15:25:23 +08:00
+								    for iter in 0..10 {
 								        let range_begin = iter * 5000;
-												add week 2 day 5 + 6 tests

Signed-off-by: Alex Chi <iskyzh@gmail.com>

											
										
										
											2024-01-26 15:19:56 +08:00
+								        for i in range_begin..(range_begin + overlaps) {
-												add compaction tests and fix bugs in compaction

Signed-off-by: Alex Chi <iskyzh@gmail.com>

											
										
										
											2024-01-25 15:25:23 +08:00
+								            // 120B per key, 4MB data populated
-												add week 2 day 5 + 6 tests

Signed-off-by: Alex Chi <iskyzh@gmail.com>

											
										
										
											2024-01-26 15:19:56 +08:00
+								            let key: String = gen_key(i);
-												add compaction tests and fix bugs in compaction

Signed-off-by: Alex Chi <iskyzh@gmail.com>

											
										
										
											2024-01-25 15:25:23 +08:00
+								            let version = key_map.get(&i).copied().unwrap_or_default() + 1;
 								            let value = gen_value(version);
 								            key_map.insert(i, version);
 								            storage.put(key.as_bytes(), value.as_bytes()).unwrap();
 								            max_key = max_key.max(i);
 								        }
 								    }
-												fix compaction split bug and add 3.1 test

Signed-off-by: Alex Chi <iskyzh@gmail.com>

											
										
										
											2024-01-28 16:01:40 +08:00
-												implement mvcc compaction + snapshot

Signed-off-by: Alex Chi <iskyzh@gmail.com>

											
										
										
											2024-01-26 16:52:37 +08:00
+								    std::thread::sleep(Duration::from_secs(1)); // wait until all memtables flush
-												add compaction tests and fix bugs in compaction

Signed-off-by: Alex Chi <iskyzh@gmail.com>

											
										
										
											2024-01-25 15:25:23 +08:00
+								    while {
 								        let snapshot = storage.inner.state.read();
 								        !snapshot.imm_memtables.is_empty()
 								    } {
 								        storage.inner.force_flush_next_imm_memtable().unwrap();
 								    }
 								    let mut prev_snapshot = storage.inner.state.read().clone();
 								    while {
 								        std::thread::sleep(Duration::from_secs(1));
 								        let snapshot = storage.inner.state.read().clone();
 								        let to_cont = prev_snapshot.levels != snapshot.levels
 								            || prev_snapshot.l0_sstables != snapshot.l0_sstables;
 								        prev_snapshot = snapshot;
 								        to_cont
 								    } {
 								        println!("waiting for compaction to converge");
 								    }
-												implement mvcc compaction + snapshot

Signed-off-by: Alex Chi <iskyzh@gmail.com>

											
										
										
											2024-01-26 16:52:37 +08:00
+								    let mut expected_key_value_pairs = Vec::new();
 								    for i in 0..(max_key + 40000) {
 								        let key = gen_key(i);
 								        let value = storage.get(key.as_bytes()).unwrap();
 								        if let Some(val) = key_map.get(&i) {
 								            let expected_value = gen_value(*val);
 								            assert_eq!(value, Some(Bytes::from(expected_value.clone())));
 								            expected_key_value_pairs.push((Bytes::from(key), Bytes::from(expected_value)));
 								        } else {
 								            assert!(value.is_none());
 								        }
 								    }
 								    check_lsm_iter_result_by_key(
 								        &mut storage.scan(Bound::Unbounded, Bound::Unbounded).unwrap(),
 								        expected_key_value_pairs,
 								    );
-												add compaction tests and fix bugs in compaction

Signed-off-by: Alex Chi <iskyzh@gmail.com>

											
										
										
											2024-01-25 15:25:23 +08:00
+								    storage.dump_structure();
 								    println!("This test case does not guarantee your compaction algorithm produces a LSM state as expected. It only does minimal checks on the size of the levels. Please use the compaction simulator to check if the compaction is correctly going on.");
 								}
 								pub fn check_compaction_ratio(storage: Arc<MiniLsm>) {
 								    let state = storage.inner.state.read().clone();
 								    let compaction_options = storage.inner.options.compaction_options.clone();
 								    let mut level_size = Vec::new();
 								    let l0_sst_num = state.l0_sstables.len();
 								    for (_, files) in &state.levels {
 								        let size = match &compaction_options {
 								            CompactionOptions::Leveled(_) => files
 								                .iter()
 								                .map(|x| state.sstables.get(x).as_ref().unwrap().table_size())
 								                .sum::<u64>(),
 								            CompactionOptions::Simple(_) | CompactionOptions::Tiered(_) => files.len() as u64,
 								            _ => unreachable!(),
 								        };
 								        level_size.push(size);
 								    }
-												consider mvcc iterator in compaction test

Signed-off-by: Alex Chi <iskyzh@gmail.com>

											
										
										
											2024-01-30 18:21:27 +08:00
+								    let extra_iterators = if TS_ENABLED {
 /* txn local iterator for OCC */
 								    } else {
 
 								    };
-												implement mvcc compaction + snapshot

Signed-off-by: Alex Chi <iskyzh@gmail.com>

											
										
										
											2024-01-26 16:52:37 +08:00
+								    let num_iters = storage
 								        .scan(Bound::Unbounded, Bound::Unbounded)
 								        .unwrap()
 								        .num_active_iterators();
 								    let num_memtables = storage.inner.state.read().imm_memtables.len() + 1;
-												add compaction tests and fix bugs in compaction

Signed-off-by: Alex Chi <iskyzh@gmail.com>

											
										
										
											2024-01-25 15:25:23 +08:00
+								    match compaction_options {
 								        CompactionOptions::NoCompaction => unreachable!(),
 								        CompactionOptions::Simple(SimpleLeveledCompactionOptions {
 								            size_ratio_percent,
 								            level0_file_num_compaction_trigger,
 								            max_levels,
 								        }) => {
 								            assert!(l0_sst_num < level0_file_num_compaction_trigger);
 								            assert!(level_size.len() <= max_levels);
 								            for idx in 1..level_size.len() {
 								                let prev_size = level_size[idx - 1];
 								                let this_size = level_size[idx];
 								                if prev_size == 0 && this_size == 0 {
 								                    continue;
 								                }
 								                assert!(
 								                    this_size as f64 / prev_size as f64 >= size_ratio_percent as f64 / 100.0,
 								                    "L{}/L{}, {}/{}<{}%",
 								                    state.levels[idx - 1].0,
 								                    state.levels[idx].0,
 								                    this_size,
 								                    prev_size,
 								                    size_ratio_percent
 								                );
 								            }
-												implement mvcc compaction + snapshot

Signed-off-by: Alex Chi <iskyzh@gmail.com>

											
										
										
											2024-01-26 16:52:37 +08:00
+								            assert!(
-												consider mvcc iterator in compaction test

Signed-off-by: Alex Chi <iskyzh@gmail.com>

											
										
										
											2024-01-30 18:21:27 +08:00
+								                num_iters <= l0_sst_num + num_memtables + max_levels + extra_iterators,
-												improve compaction concat iterator tests

Signed-off-by: Alex Chi <iskyzh@gmail.com>

											
										
										
											2024-01-30 18:18:55 +08:00
+								                "we found {num_iters} iterators in your implementation, (l0_sst_num={l0_sst_num}, num_memtables={num_memtables}, max_levels={max_levels}) did you use concat iterators?"
-												implement mvcc compaction + snapshot

Signed-off-by: Alex Chi <iskyzh@gmail.com>

											
										
										
											2024-01-26 16:52:37 +08:00
+								            );
-												add compaction tests and fix bugs in compaction

Signed-off-by: Alex Chi <iskyzh@gmail.com>

											
										
										
											2024-01-25 15:25:23 +08:00
+								        }
 								        CompactionOptions::Leveled(LeveledCompactionOptions {
 								            level_size_multiplier,
 								            level0_file_num_compaction_trigger,
 								            max_levels,
 								            ..
 								        }) => {
 								            assert!(l0_sst_num < level0_file_num_compaction_trigger);
 								            assert!(level_size.len() <= max_levels);
-												fix leveled compaction tests

Signed-off-by: Alex Chi Z <iskyzh@gmail.com>

											
										
										
											2024-01-30 17:14:45 +08:00
+								            let last_level_size = *level_size.last().unwrap();
 								            let mut multiplier = 1.0;
 								            for idx in (1..level_size.len()).rev() {
 								                multiplier *= level_size_multiplier as f64;
 								                let this_size = level_size[idx - 1];
-												add compaction tests and fix bugs in compaction

Signed-off-by: Alex Chi <iskyzh@gmail.com>

											
										
										
											2024-01-25 15:25:23 +08:00
+								                assert!(
 								                    // do not add hard requirement on level size multiplier considering bloom filters...
-												fix leveled compaction tests

Signed-off-by: Alex Chi Z <iskyzh@gmail.com>

											
										
										
											2024-01-30 17:14:45 +08:00
+								                    this_size as f64 / last_level_size as f64 <= 1.0 / multiplier + 0.5,
 								                    "L{}/L_max, {}/{}>>1.0/{}",
-												add compaction tests and fix bugs in compaction

Signed-off-by: Alex Chi <iskyzh@gmail.com>

											
										
										
											2024-01-25 15:25:23 +08:00
+								                    state.levels[idx - 1].0,
 								                    this_size,
-												fix leveled compaction tests

Signed-off-by: Alex Chi Z <iskyzh@gmail.com>

											
										
										
											2024-01-30 17:14:45 +08:00
+								                    last_level_size,
 								                    multiplier
-												add compaction tests and fix bugs in compaction

Signed-off-by: Alex Chi <iskyzh@gmail.com>

											
										
										
											2024-01-25 15:25:23 +08:00
+								                );
 								            }
-												implement mvcc compaction + snapshot

Signed-off-by: Alex Chi <iskyzh@gmail.com>

											
										
										
											2024-01-26 16:52:37 +08:00
+								            assert!(
-												consider mvcc iterator in compaction test

Signed-off-by: Alex Chi <iskyzh@gmail.com>

											
										
										
											2024-01-30 18:21:27 +08:00
+								                num_iters <= l0_sst_num + num_memtables + max_levels + extra_iterators,
-												improve compaction concat iterator tests

Signed-off-by: Alex Chi <iskyzh@gmail.com>

											
										
										
											2024-01-30 18:18:55 +08:00
+								                "we found {num_iters} iterators in your implementation, (l0_sst_num={l0_sst_num}, num_memtables={num_memtables}, max_levels={max_levels}) did you use concat iterators?"
-												implement mvcc compaction + snapshot

Signed-off-by: Alex Chi <iskyzh@gmail.com>

											
										
										
											2024-01-26 16:52:37 +08:00
+								            );
-												add compaction tests and fix bugs in compaction

Signed-off-by: Alex Chi <iskyzh@gmail.com>

											
										
										
											2024-01-25 15:25:23 +08:00
+								        }
 								        CompactionOptions::Tiered(TieredCompactionOptions {
 								            num_tiers,
 								            max_size_amplification_percent,
 								            size_ratio,
-												consider merge width for tiered trigger + mvcc compaction

Signed-off-by: Alex Chi <iskyzh@gmail.com>

											
										
										
											2024-01-25 23:38:26 +08:00
+								            min_merge_width,
-												fix: universal compaction condition (#97)

Signed-off-by: Alex Chi <iskyzh@gmail.com>
											
										
										
											2024-11-12 21:27:00 -05:00
+								            ..
-												add compaction tests and fix bugs in compaction

Signed-off-by: Alex Chi <iskyzh@gmail.com>

											
										
										
											2024-01-25 15:25:23 +08:00
+								        }) => {
 								            let size_ratio_trigger = (100.0 + size_ratio as f64) / 100.0;
 								            assert_eq!(l0_sst_num, 0);
 								            assert!(level_size.len() <= num_tiers);
 								            let mut sum_size = level_size[0];
 								            for idx in 1..level_size.len() {
 								                let this_size = level_size[idx];
-												consider merge width for tiered trigger + mvcc compaction

Signed-off-by: Alex Chi <iskyzh@gmail.com>

											
										
										
											2024-01-25 23:38:26 +08:00
+								                if level_size.len() > min_merge_width {
 								                    assert!(
 								                        sum_size as f64 / this_size as f64 <= size_ratio_trigger,
 								                        "violation of size ratio: sum(⬆️L{})/L{}, {}/{}>{}",
 								                        state.levels[idx - 1].0,
 								                        state.levels[idx].0,
 								                        sum_size,
 								                        this_size,
 								                        size_ratio_trigger
 								                    );
 								                }
-												add compaction tests and fix bugs in compaction

Signed-off-by: Alex Chi <iskyzh@gmail.com>

											
										
										
											2024-01-25 15:25:23 +08:00
+								                if idx + 1 == level_size.len() {
 								                    assert!(
 								                        sum_size as f64 / this_size as f64
 								                            <= max_size_amplification_percent as f64 / 100.0,
-												consider merge width for tiered trigger + mvcc compaction

Signed-off-by: Alex Chi <iskyzh@gmail.com>

											
										
										
											2024-01-25 23:38:26 +08:00
+								                        "violation of space amp: sum(⬆️L{})/L{}, {}/{}>{}%",
-												add compaction tests and fix bugs in compaction

Signed-off-by: Alex Chi <iskyzh@gmail.com>

											
										
										
											2024-01-25 15:25:23 +08:00
+								                        state.levels[idx - 1].0,
 								                        state.levels[idx].0,
 								                        sum_size,
 								                        this_size,
 								                        max_size_amplification_percent
 								                    );
 								                }
 								                sum_size += this_size;
 								            }
-												implement mvcc compaction + snapshot

Signed-off-by: Alex Chi <iskyzh@gmail.com>

											
										
										
											2024-01-26 16:52:37 +08:00
+								            assert!(
-												consider mvcc iterator in compaction test

Signed-off-by: Alex Chi <iskyzh@gmail.com>

											
										
										
											2024-01-30 18:21:27 +08:00
+								                num_iters <= num_memtables + num_tiers + extra_iterators,
-												improve compaction concat iterator tests

Signed-off-by: Alex Chi <iskyzh@gmail.com>

											
										
										
											2024-01-30 18:18:55 +08:00
+								                "we found {num_iters} iterators in your implementation, (num_memtables={num_memtables}, num_tiers={num_tiers}) did you use concat iterators?"
-												implement mvcc compaction + snapshot

Signed-off-by: Alex Chi <iskyzh@gmail.com>

											
										
										
											2024-01-26 16:52:37 +08:00
+								            );
-												add compaction tests and fix bugs in compaction

Signed-off-by: Alex Chi <iskyzh@gmail.com>

											
										
										
											2024-01-25 15:25:23 +08:00
+								        }
 								    }
 								}
-												add week 2 day 5 + 6 tests

Signed-off-by: Alex Chi <iskyzh@gmail.com>

											
										
										
											2024-01-26 15:19:56 +08:00
 								/// Prints every entry of the directory `path` to stdout together with its size in KB.
 								///
 								/// Output starts with a `--- DIR DUMP ---` header followed by one line per directory entry.
 								///
 								/// # Panics
 								///
 								/// Panics if the directory cannot be read, or if an entry or its metadata cannot be obtained.
 								pub fn dump_files_in_dir(path: impl AsRef<Path>) {
 								    println!("--- DIR DUMP ---");
 								    let entries = path.as_ref().read_dir().unwrap();
 								    for entry in entries {
 								        let entry = entry.unwrap();
 								        print!("{}", entry.path().display());
 								        // The path is printed before the metadata lookup, so it is shown even if that fails.
 								        let size_in_kb = entry.metadata().unwrap().size() as f64 / 1024.0;
 								        println!(", size={:.3}KB", size_in_kb);
 								    }
 								}
-												add 3.4 tests

Signed-off-by: Alex Chi <iskyzh@gmail.com>

											
										
										
											2024-01-30 12:14:32 +08:00
 								/// Creates a `MergeIterator` over every SST referenced by `state`.
 								///
 								/// One `SsTableIterator`, positioned at its first entry, is created per SST. The iterators are
 								/// handed to `MergeIterator::create` in this order: all of `l0_sstables` first, then the files
 								/// of each entry in `levels`, in the order they are stored.
 								///
 								/// # Panics
 								///
 								/// Panics if a referenced SST id is missing from `state.sstables` or if an iterator cannot be
 								/// created.
 								pub fn construct_merge_iterator_over_storage(
 								    state: &LsmStorageState,
 								) -> MergeIterator<SsTableIterator> {
 								    let leveled_ids = state.levels.iter().flat_map(|(_, files)| files.iter());
 								    let iters: Vec<_> = state
 								        .l0_sstables
 								        .iter()
 								        .chain(leveled_ids)
 								        .map(|sst_id| {
 								            let table = state.sstables.get(sst_id).cloned().unwrap();
 								            Box::new(SsTableIterator::create_and_seek_to_first(table).unwrap())
 								        })
 								        .collect();
 								    MergeIterator::create(iters)
 								}