feat(code): add sst iterator / day 2
Signed-off-by: Alex Chi <iskyzh@gmail.com>
This commit is contained in:
1
Cargo.lock
generated
1
Cargo.lock
generated
@@ -175,6 +175,7 @@ checksum = "f051f77a7c8e6957c0696eac88f26b0117e54f52d3fc682ab19397a8812846a4"
|
|||||||
name = "mini-lsm"
|
name = "mini-lsm"
|
||||||
version = "0.1.0"
|
version = "0.1.0"
|
||||||
dependencies = [
|
dependencies = [
|
||||||
|
"anyhow",
|
||||||
"bytes",
|
"bytes",
|
||||||
]
|
]
|
||||||
|
|
||||||
|
|||||||
@@ -1,7 +1,14 @@
|
|||||||
# LSM in a Week
|
# LSM in a Week
|
||||||
|
|
||||||
|
[CI status](https://github.com/skyzh/mini-lsm/actions/workflows/main.yml)
|
||||||
|
|
||||||
Build a simple key-value storage engine in a week!
|
Build a simple key-value storage engine in a week!
|
||||||
|
|
||||||
|
## Tutorial
|
||||||
|
|
||||||
|
The tutorial is available at [https://skyzh.github.io/mini-lsm](https://skyzh.github.io/mini-lsm). You can use the provided starter
|
||||||
|
code to kick off your project, and follow the tutorial to implement the LSM tree.
|
||||||
|
|
||||||
## Development
|
## Development
|
||||||
|
|
||||||
```
|
```
|
||||||
|
|||||||
@@ -1 +1,2 @@
|
|||||||
pub mod block;
|
pub mod block;
|
||||||
|
pub mod table;
|
||||||
|
|||||||
1
mini-lsm-starter/src/table.rs
Normal file
1
mini-lsm-starter/src/table.rs
Normal file
@@ -0,0 +1 @@
|
|||||||
|
|
||||||
0
mini-lsm-starter/src/table/builder.rs
Normal file
0
mini-lsm-starter/src/table/builder.rs
Normal file
0
mini-lsm-starter/src/table/iterator.rs
Normal file
0
mini-lsm-starter/src/table/iterator.rs
Normal file
0
mini-lsm-starter/src/table/tests.rs
Normal file
0
mini-lsm-starter/src/table/tests.rs
Normal file
@@ -11,4 +11,5 @@ description = "A tutorial for building an LSM tree storage engine in a week."
|
|||||||
# See more keys and their definitions at https://doc.rust-lang.org/cargo/reference/manifest.html
|
# See more keys and their definitions at https://doc.rust-lang.org/cargo/reference/manifest.html
|
||||||
|
|
||||||
[dependencies]
|
[dependencies]
|
||||||
|
anyhow = "1"
|
||||||
bytes = "1"
|
bytes = "1"
|
||||||
|
|||||||
@@ -10,8 +10,8 @@ pub const SIZEOF_U16: usize = std::mem::size_of::<u16>();
|
|||||||
|
|
||||||
/// A block is the smallest unit of read and caching in LSM tree. It is a collection of sorted key-value pairs.
|
/// A block is the smallest unit of read and caching in LSM tree. It is a collection of sorted key-value pairs.
|
||||||
pub struct Block {
|
pub struct Block {
|
||||||
pub(self) data: Vec<u8>,
|
data: Vec<u8>,
|
||||||
pub(self) offsets: Vec<u16>,
|
offsets: Vec<u16>,
|
||||||
}
|
}
|
||||||
|
|
||||||
impl Block {
|
impl Block {
|
||||||
|
|||||||
@@ -6,16 +6,16 @@ use super::{Block, SIZEOF_U16};
|
|||||||
pub struct BlockBuilder {
|
pub struct BlockBuilder {
|
||||||
offsets: Vec<u16>,
|
offsets: Vec<u16>,
|
||||||
data: Vec<u8>,
|
data: Vec<u8>,
|
||||||
target_size: usize,
|
block_size: usize,
|
||||||
}
|
}
|
||||||
|
|
||||||
impl BlockBuilder {
|
impl BlockBuilder {
|
||||||
/// Creates a new block builder
|
/// Creates a new block builder
|
||||||
pub fn new(target_size: usize) -> Self {
|
pub fn new(block_size: usize) -> Self {
|
||||||
Self {
|
Self {
|
||||||
offsets: Vec::new(),
|
offsets: Vec::new(),
|
||||||
data: Vec::new(),
|
data: Vec::new(),
|
||||||
target_size,
|
block_size,
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
@@ -27,7 +27,8 @@ impl BlockBuilder {
|
|||||||
#[must_use]
|
#[must_use]
|
||||||
pub fn add(&mut self, key: &[u8], value: &[u8]) -> bool {
|
pub fn add(&mut self, key: &[u8], value: &[u8]) -> bool {
|
||||||
assert!(!key.is_empty(), "key must not be empty");
|
assert!(!key.is_empty(), "key must not be empty");
|
||||||
if self.estimated_size() + key.len() + value.len() + SIZEOF_U16 * 3 > self.target_size
|
assert!(!value.is_empty(), "value must not be empty");
|
||||||
|
if self.estimated_size() + key.len() + value.len() + SIZEOF_U16 * 3 > self.block_size
|
||||||
&& !self.is_empty()
|
&& !self.is_empty()
|
||||||
{
|
{
|
||||||
return false;
|
return false;
|
||||||
|
|||||||
@@ -51,10 +51,6 @@ impl BlockIterator {
|
|||||||
self.seek_to(0);
|
self.seek_to(0);
|
||||||
}
|
}
|
||||||
|
|
||||||
pub fn seek_to_last(&mut self) {
|
|
||||||
self.seek_to(self.block.offsets.len() - 1);
|
|
||||||
}
|
|
||||||
|
|
||||||
pub fn len(&self) -> usize {
|
pub fn len(&self) -> usize {
|
||||||
self.block.offsets.len()
|
self.block.offsets.len()
|
||||||
}
|
}
|
||||||
@@ -106,5 +102,6 @@ impl BlockIterator {
|
|||||||
std::cmp::Ordering::Equal => return,
|
std::cmp::Ordering::Equal => return,
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
self.seek_to(low);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|||||||
@@ -18,7 +18,7 @@ fn test_block_build_full() {
|
|||||||
}
|
}
|
||||||
|
|
||||||
fn key_of(idx: usize) -> Vec<u8> {
|
fn key_of(idx: usize) -> Vec<u8> {
|
||||||
format!("key_{:03}", idx).into_bytes()
|
format!("key_{:03}", idx * 5).into_bytes()
|
||||||
}
|
}
|
||||||
|
|
||||||
fn value_of(idx: usize) -> Vec<u8> {
|
fn value_of(idx: usize) -> Vec<u8> {
|
||||||
@@ -67,6 +67,7 @@ fn as_bytes(x: &[u8]) -> Bytes {
|
|||||||
fn test_block_iterator() {
|
fn test_block_iterator() {
|
||||||
let block = Arc::new(generate_block());
|
let block = Arc::new(generate_block());
|
||||||
let mut iter = BlockIterator::create_and_seek_to_first(block);
|
let mut iter = BlockIterator::create_and_seek_to_first(block);
|
||||||
|
for _ in 0..5 {
|
||||||
for i in 0..num_of_keys() {
|
for i in 0..num_of_keys() {
|
||||||
let key = iter.key();
|
let key = iter.key();
|
||||||
let value = iter.value();
|
let value = iter.value();
|
||||||
@@ -86,4 +87,34 @@ fn test_block_iterator() {
|
|||||||
);
|
);
|
||||||
iter.next();
|
iter.next();
|
||||||
}
|
}
|
||||||
|
iter.seek_to_first();
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
#[test]
|
||||||
|
fn test_block_seek_key() {
|
||||||
|
let block = Arc::new(generate_block());
|
||||||
|
let mut iter = BlockIterator::create_and_seek_to_key(block, &key_of(0));
|
||||||
|
for offset in 1..=5 {
|
||||||
|
for i in 0..num_of_keys() {
|
||||||
|
let key = iter.key();
|
||||||
|
let value = iter.value();
|
||||||
|
assert_eq!(
|
||||||
|
key,
|
||||||
|
key_of(i),
|
||||||
|
"expected key: {:?}, actual key: {:?}",
|
||||||
|
as_bytes(&key_of(i)),
|
||||||
|
as_bytes(key)
|
||||||
|
);
|
||||||
|
assert_eq!(
|
||||||
|
value,
|
||||||
|
value_of(i),
|
||||||
|
"expected value: {:?}, actual value: {:?}",
|
||||||
|
as_bytes(&value_of(i)),
|
||||||
|
as_bytes(value)
|
||||||
|
);
|
||||||
|
iter.seek_to_key(&format!("key_{:03}", i * 5 + offset).into_bytes());
|
||||||
|
}
|
||||||
|
iter.seek_to_key(b"k");
|
||||||
|
}
|
||||||
}
|
}
|
||||||
|
|||||||
@@ -1 +1,2 @@
|
|||||||
pub mod block;
|
pub mod block;
|
||||||
|
pub mod table;
|
||||||
|
|||||||
113
mini-lsm/src/table.rs
Normal file
113
mini-lsm/src/table.rs
Normal file
@@ -0,0 +1,113 @@
|
|||||||
|
mod builder;
|
||||||
|
mod iterator;
|
||||||
|
|
||||||
|
use std::{path::Path, sync::Arc};
|
||||||
|
|
||||||
|
pub use builder::SsTableBuilder;
|
||||||
|
use bytes::{Buf, BufMut, Bytes};
|
||||||
|
pub use iterator::SsTableIterator;
|
||||||
|
|
||||||
|
use crate::block::Block;
|
||||||
|
use anyhow::Result;
|
||||||
|
|
||||||
|
#[derive(Clone, Debug, PartialEq, Eq)]
|
||||||
|
pub struct BlockMeta {
|
||||||
|
pub offset: usize,
|
||||||
|
pub first_key: Bytes,
|
||||||
|
}
|
||||||
|
|
||||||
|
impl BlockMeta {
|
||||||
|
pub fn encode_block_meta(block_meta: &[BlockMeta], buf: &mut Vec<u8>) {
|
||||||
|
let mut estimated_size = 0;
|
||||||
|
for meta in block_meta {
|
||||||
|
estimated_size += std::mem::size_of::<u32>();
|
||||||
|
estimated_size += std::mem::size_of::<u16>();
|
||||||
|
estimated_size += meta.first_key.len();
|
||||||
|
}
|
||||||
|
buf.reserve(estimated_size);
|
||||||
|
let original_len = buf.len();
|
||||||
|
for meta in block_meta {
|
||||||
|
buf.put_u32(meta.offset as u32);
|
||||||
|
buf.put_u16(meta.first_key.len() as u16);
|
||||||
|
buf.put_slice(&meta.first_key);
|
||||||
|
}
|
||||||
|
assert_eq!(estimated_size, buf.len() - original_len);
|
||||||
|
}
|
||||||
|
|
||||||
|
pub fn decode_block_meta(mut buf: impl Buf) -> Vec<BlockMeta> {
|
||||||
|
let mut block_meta = Vec::new();
|
||||||
|
while buf.has_remaining() {
|
||||||
|
let offset = buf.get_u32() as usize;
|
||||||
|
let first_key_len = buf.get_u16() as usize;
|
||||||
|
let first_key = buf.copy_to_bytes(first_key_len);
|
||||||
|
block_meta.push(BlockMeta { offset, first_key });
|
||||||
|
}
|
||||||
|
block_meta
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
pub struct FileObject(Bytes);
|
||||||
|
|
||||||
|
impl FileObject {
|
||||||
|
pub fn read(&self, offset: u64, len: u64) -> Result<Vec<u8>> {
|
||||||
|
Ok(self.0[offset as usize..(offset + len) as usize].to_vec())
|
||||||
|
}
|
||||||
|
|
||||||
|
pub fn size(&self) -> u64 {
|
||||||
|
self.0.len() as u64
|
||||||
|
}
|
||||||
|
|
||||||
|
pub fn create(_path: &Path, data: Vec<u8>) -> Result<Self> {
|
||||||
|
Ok(FileObject(data.into()))
|
||||||
|
}
|
||||||
|
|
||||||
|
pub fn open(_path: &Path) -> Result<Self> {
|
||||||
|
unimplemented!()
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
pub struct SsTable {
|
||||||
|
file: FileObject,
|
||||||
|
block_metas: Vec<BlockMeta>,
|
||||||
|
block_meta_offset: usize,
|
||||||
|
}
|
||||||
|
|
||||||
|
impl SsTable {
|
||||||
|
pub fn open(file: FileObject) -> Result<Self> {
|
||||||
|
let len = file.size();
|
||||||
|
let raw_meta_offset = file.read(len - 4, 4)?;
|
||||||
|
let block_meta_offset = (&raw_meta_offset[..]).get_u32() as u64;
|
||||||
|
let raw_meta = file.read(block_meta_offset, len - 4 - block_meta_offset)?;
|
||||||
|
Ok(Self {
|
||||||
|
file,
|
||||||
|
block_metas: BlockMeta::decode_block_meta(&raw_meta[..]),
|
||||||
|
block_meta_offset: block_meta_offset as usize,
|
||||||
|
})
|
||||||
|
}
|
||||||
|
|
||||||
|
fn read_block(&self, block_idx: usize) -> Result<Arc<Block>> {
|
||||||
|
let offset = self.block_metas[block_idx].offset;
|
||||||
|
let offset_end = self
|
||||||
|
.block_metas
|
||||||
|
.get(block_idx + 1)
|
||||||
|
.map(|x| x.offset)
|
||||||
|
.unwrap_or(self.block_meta_offset);
|
||||||
|
let block_data = self
|
||||||
|
.file
|
||||||
|
.read(offset as u64, (offset_end - offset) as u64)?;
|
||||||
|
Ok(Arc::new(Block::decode(&block_data[..])))
|
||||||
|
}
|
||||||
|
|
||||||
|
fn find_block_idx(&self, key: &[u8]) -> usize {
|
||||||
|
self.block_metas
|
||||||
|
.partition_point(|meta| meta.first_key <= key)
|
||||||
|
.saturating_sub(1)
|
||||||
|
}
|
||||||
|
|
||||||
|
fn num_of_blocks(&self) -> usize {
|
||||||
|
self.block_metas.len()
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
#[cfg(test)]
|
||||||
|
mod tests;
|
||||||
75
mini-lsm/src/table/builder.rs
Normal file
75
mini-lsm/src/table/builder.rs
Normal file
@@ -0,0 +1,75 @@
|
|||||||
|
use anyhow::Result;
|
||||||
|
use bytes::BufMut;
|
||||||
|
use std::path::Path;
|
||||||
|
|
||||||
|
use super::{BlockMeta, FileObject, SsTable};
|
||||||
|
use crate::block::BlockBuilder;
|
||||||
|
|
||||||
|
pub struct SsTableBuilder {
|
||||||
|
builder: BlockBuilder,
|
||||||
|
first_key: Vec<u8>,
|
||||||
|
data: Vec<u8>,
|
||||||
|
pub(super) meta: Vec<BlockMeta>,
|
||||||
|
target_size: usize,
|
||||||
|
block_size: usize,
|
||||||
|
}
|
||||||
|
|
||||||
|
impl SsTableBuilder {
|
||||||
|
pub fn new(target_size: usize, block_size: usize) -> Self {
|
||||||
|
Self {
|
||||||
|
data: Vec::new(),
|
||||||
|
meta: Vec::new(),
|
||||||
|
first_key: Vec::new(),
|
||||||
|
target_size,
|
||||||
|
block_size,
|
||||||
|
builder: BlockBuilder::new(block_size),
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
#[must_use]
|
||||||
|
pub fn add(&mut self, key: &[u8], value: &[u8]) -> bool {
|
||||||
|
if self.data.len() > self.target_size {
|
||||||
|
return false;
|
||||||
|
}
|
||||||
|
|
||||||
|
if self.first_key.is_empty() {
|
||||||
|
self.first_key = key.to_vec();
|
||||||
|
}
|
||||||
|
|
||||||
|
if self.builder.add(key, value) {
|
||||||
|
return true;
|
||||||
|
}
|
||||||
|
// create a new block builder and append block data
|
||||||
|
self.finish_block();
|
||||||
|
|
||||||
|
// add the key-value pair to the next block
|
||||||
|
assert!(self.builder.add(key, value));
|
||||||
|
self.first_key = key.to_vec();
|
||||||
|
|
||||||
|
true
|
||||||
|
}
|
||||||
|
|
||||||
|
fn finish_block(&mut self) {
|
||||||
|
let builder = std::mem::replace(&mut self.builder, BlockBuilder::new(self.block_size));
|
||||||
|
let encoded_block = builder.build().encode();
|
||||||
|
self.meta.push(BlockMeta {
|
||||||
|
offset: self.data.len(),
|
||||||
|
first_key: std::mem::take(&mut self.first_key).into(),
|
||||||
|
});
|
||||||
|
self.data.extend(encoded_block);
|
||||||
|
}
|
||||||
|
|
||||||
|
pub fn build(mut self, path: impl AsRef<Path>) -> Result<SsTable> {
|
||||||
|
self.finish_block();
|
||||||
|
let mut buf = self.data;
|
||||||
|
let meta_offset = buf.len();
|
||||||
|
BlockMeta::encode_block_meta(&self.meta, &mut buf);
|
||||||
|
buf.put_u32(meta_offset as u32);
|
||||||
|
let file = FileObject::create(path.as_ref(), buf)?;
|
||||||
|
Ok(SsTable {
|
||||||
|
file,
|
||||||
|
block_metas: self.meta,
|
||||||
|
block_meta_offset: meta_offset,
|
||||||
|
})
|
||||||
|
}
|
||||||
|
}
|
||||||
91
mini-lsm/src/table/iterator.rs
Normal file
91
mini-lsm/src/table/iterator.rs
Normal file
@@ -0,0 +1,91 @@
|
|||||||
|
use anyhow::Result;
|
||||||
|
use std::sync::Arc;
|
||||||
|
|
||||||
|
use super::SsTable;
|
||||||
|
use crate::block::BlockIterator;
|
||||||
|
|
||||||
|
pub struct SsTableIterator {
|
||||||
|
table: Arc<SsTable>,
|
||||||
|
blk_iter: BlockIterator,
|
||||||
|
blk_idx: usize,
|
||||||
|
}
|
||||||
|
|
||||||
|
impl SsTableIterator {
|
||||||
|
fn seek_to_first_inner(table: &Arc<SsTable>) -> Result<(usize, BlockIterator)> {
|
||||||
|
Ok((
|
||||||
|
0,
|
||||||
|
BlockIterator::create_and_seek_to_first(table.read_block(0)?),
|
||||||
|
))
|
||||||
|
}
|
||||||
|
|
||||||
|
pub fn create_and_seek_to_first(table: Arc<SsTable>) -> Result<Self> {
|
||||||
|
let (blk_idx, blk_iter) = Self::seek_to_first_inner(&table)?;
|
||||||
|
let iter = Self {
|
||||||
|
blk_iter,
|
||||||
|
table,
|
||||||
|
blk_idx,
|
||||||
|
};
|
||||||
|
Ok(iter)
|
||||||
|
}
|
||||||
|
|
||||||
|
pub fn seek_to_first(&mut self) -> Result<()> {
|
||||||
|
let (blk_idx, blk_iter) = Self::seek_to_first_inner(&self.table)?;
|
||||||
|
self.blk_idx = blk_idx;
|
||||||
|
self.blk_iter = blk_iter;
|
||||||
|
Ok(())
|
||||||
|
}
|
||||||
|
|
||||||
|
fn seek_to_key_inner(table: &Arc<SsTable>, key: &[u8]) -> Result<(usize, BlockIterator)> {
|
||||||
|
let mut blk_idx = table.find_block_idx(key);
|
||||||
|
let mut blk_iter = BlockIterator::create_and_seek_to_key(table.read_block(blk_idx)?, key);
|
||||||
|
if !blk_iter.is_valid() {
|
||||||
|
blk_idx += 1;
|
||||||
|
if blk_idx < table.num_of_blocks() {
|
||||||
|
blk_iter = BlockIterator::create_and_seek_to_first(table.read_block(blk_idx)?);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
Ok((blk_idx, blk_iter))
|
||||||
|
}
|
||||||
|
|
||||||
|
pub fn create_and_seek_to_key(table: Arc<SsTable>, key: &[u8]) -> Result<Self> {
|
||||||
|
let (blk_idx, blk_iter) = Self::seek_to_key_inner(&table, key)?;
|
||||||
|
let iter = Self {
|
||||||
|
blk_iter,
|
||||||
|
table,
|
||||||
|
blk_idx,
|
||||||
|
};
|
||||||
|
Ok(iter)
|
||||||
|
}
|
||||||
|
|
||||||
|
pub fn seek_to_key(&mut self, key: &[u8]) -> Result<()> {
|
||||||
|
let (blk_idx, blk_iter) = Self::seek_to_key_inner(&self.table, key)?;
|
||||||
|
self.blk_iter = blk_iter;
|
||||||
|
self.blk_idx = blk_idx;
|
||||||
|
Ok(())
|
||||||
|
}
|
||||||
|
|
||||||
|
pub fn key(&self) -> &[u8] {
|
||||||
|
self.blk_iter.key()
|
||||||
|
}
|
||||||
|
|
||||||
|
pub fn value(&self) -> &[u8] {
|
||||||
|
self.blk_iter.value()
|
||||||
|
}
|
||||||
|
|
||||||
|
pub fn is_valid(&self) -> bool {
|
||||||
|
self.blk_iter.is_valid()
|
||||||
|
}
|
||||||
|
|
||||||
|
#[allow(clippy::should_implement_trait)]
|
||||||
|
pub fn next(&mut self) -> Result<()> {
|
||||||
|
self.blk_iter.next();
|
||||||
|
if !self.blk_iter.is_valid() {
|
||||||
|
self.blk_idx += 1;
|
||||||
|
if self.blk_idx < self.table.num_of_blocks() {
|
||||||
|
self.blk_iter =
|
||||||
|
BlockIterator::create_and_seek_to_first(self.table.read_block(self.blk_idx)?);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
Ok(())
|
||||||
|
}
|
||||||
|
}
|
||||||
134
mini-lsm/src/table/tests.rs
Normal file
134
mini-lsm/src/table/tests.rs
Normal file
@@ -0,0 +1,134 @@
|
|||||||
|
use std::sync::Arc;
|
||||||
|
|
||||||
|
use bytes::Bytes;
|
||||||
|
|
||||||
|
use crate::table::SsTableBuilder;
|
||||||
|
|
||||||
|
use super::{SsTable, SsTableIterator};
|
||||||
|
|
||||||
|
/// A table holding a single key-value pair can be built.
#[test]
fn test_sst_build_single_key() {
    let mut builder = SsTableBuilder::new(16, 16);
    let accepted = builder.add(b"233", b"233333");
    assert!(accepted);
    builder.build("").unwrap();
}
|
||||||
|
|
||||||
|
/// With a 16-byte block size, six small pairs must produce at least two
/// finished blocks before the table is built.
#[test]
fn test_sst_build_two_blocks() {
    let entries = [
        ("11", "11"),
        ("22", "22"),
        ("33", "11"),
        ("44", "22"),
        ("55", "11"),
        ("66", "22"),
    ];
    let mut builder = SsTableBuilder::new(1024, 16);
    for &(key, value) in entries.iter() {
        assert!(builder.add(key.as_bytes(), value.as_bytes()));
    }
    assert!(builder.meta.len() >= 2);
    builder.build("").unwrap();
}
|
||||||
|
|
||||||
|
/// With a 32-byte target size, the builder accepts four pairs and then
/// rejects the fifth.
#[test]
fn test_sst_build_full() {
    let accepted = [("11", "11"), ("22", "22"), ("33", "11"), ("44", "22")];
    let mut builder = SsTableBuilder::new(32, 16);
    for &(key, value) in accepted.iter() {
        assert!(builder.add(key.as_bytes(), value.as_bytes()));
    }
    let fifth_accepted = builder.add(b"55", b"11");
    assert!(!fifth_accepted);
    builder.build("").unwrap();
}
|
||||||
|
|
||||||
|
/// Returns the test key for `idx`: `key_` followed by `idx * 5`, zero-padded
/// to at least three digits.
fn key_of(idx: usize) -> Vec<u8> {
    let scaled = idx * 5;
    Vec::from(format!("key_{:03}", scaled))
}
|
||||||
|
|
||||||
|
/// Returns the test value for `idx`: `value_` followed by `idx`, zero-padded
/// to at least ten digits.
fn value_of(idx: usize) -> Vec<u8> {
    let text = format!("value_{:010}", idx);
    text.into_bytes()
}
|
||||||
|
|
||||||
|
/// Number of key-value pairs written into the generated test table.
fn num_of_keys() -> usize {
    const KEY_COUNT: usize = 100;
    KEY_COUNT
}
|
||||||
|
|
||||||
|
fn generate_sst() -> SsTable {
|
||||||
|
let mut builder = SsTableBuilder::new(65536, 128);
|
||||||
|
for idx in 0..num_of_keys() {
|
||||||
|
let key = key_of(idx);
|
||||||
|
let value = value_of(idx);
|
||||||
|
assert!(builder.add(&key[..], &value[..]));
|
||||||
|
}
|
||||||
|
builder.build("").unwrap()
|
||||||
|
}
|
||||||
|
|
||||||
|
/// Building the full generated table completes without panicking.
#[test]
fn test_sst_build_all() {
    let _table = generate_sst();
}
|
||||||
|
|
||||||
|
/// Re-opening a built table from its file yields the same block metadata.
#[test]
fn test_sst_decode() {
    let built = generate_sst();
    let expected_metas = built.block_metas.clone();
    let reopened = SsTable::open(built.file).unwrap();
    assert_eq!(reopened.block_metas, expected_metas);
}
|
||||||
|
|
||||||
|
fn as_bytes(x: &[u8]) -> Bytes {
|
||||||
|
Bytes::copy_from_slice(x)
|
||||||
|
}
|
||||||
|
|
||||||
|
/// Scans the whole table five times, rewinding to the first entry after each
/// pass, and checks every key and value along the way.
#[test]
fn test_sst_iterator() {
    let table = Arc::new(generate_sst());
    let mut iter = SsTableIterator::create_and_seek_to_first(table).unwrap();
    for _pass in 0..5 {
        for i in 0..num_of_keys() {
            let expected_key = key_of(i);
            let expected_value = value_of(i);
            let key = iter.key();
            let value = iter.value();
            assert_eq!(
                key,
                expected_key,
                "expected key: {:?}, actual key: {:?}",
                as_bytes(&expected_key),
                as_bytes(key)
            );
            assert_eq!(
                value,
                expected_value,
                "expected value: {:?}, actual value: {:?}",
                as_bytes(&expected_value),
                as_bytes(value)
            );
            iter.next().unwrap();
        }
        // Rewind so the next pass starts from the first entry again.
        iter.seek_to_first().unwrap();
    }
}
|
||||||
|
|
||||||
|
/// Walks the table by seeking instead of stepping: after checking entry `i`,
/// seeks to a key `offset` past it, which must land on entry `i + 1`.
#[test]
fn test_sst_seek_key() {
    let table = Arc::new(generate_sst());
    let mut iter = SsTableIterator::create_and_seek_to_key(table, &key_of(0)).unwrap();
    for offset in 1..=5 {
        for i in 0..num_of_keys() {
            let expected_key = key_of(i);
            let expected_value = value_of(i);
            let key = iter.key();
            let value = iter.value();
            assert_eq!(
                key,
                expected_key,
                "expected key: {:?}, actual key: {:?}",
                as_bytes(&expected_key),
                as_bytes(key)
            );
            assert_eq!(
                value,
                expected_value,
                "expected value: {:?}, actual value: {:?}",
                as_bytes(&expected_value),
                as_bytes(value)
            );
            // Stored keys are multiples of five, so this probe falls after
            // entry `i` and at or before entry `i + 1`.
            let probe = format!("key_{:03}", i * 5 + offset).into_bytes();
            iter.seek_to_key(&probe).unwrap();
        }
        // "k" sorts before every stored key, so this returns to the first entry.
        iter.seek_to_key(b"k").unwrap();
    }
}
|
||||||
Reference in New Issue
Block a user