2025-01-19 19:24:12 -05:00
|
|
|
// Copyright (c) 2022-2025 Alex Chi Z
|
|
|
|
//
|
|
|
|
// Licensed under the Apache License, Version 2.0 (the "License");
|
|
|
|
// you may not use this file except in compliance with the License.
|
|
|
|
// You may obtain a copy of the License at
|
|
|
|
//
|
|
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
//
|
|
|
|
// Unless required by applicable law or agreed to in writing, software
|
|
|
|
// distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
// See the License for the specific language governing permissions and
|
|
|
|
// limitations under the License.
|
|
|
|
|
2024-01-17 14:51:15 +08:00
|
|
|
use std::collections::HashMap;
|
|
|
|
|
2024-01-19 11:21:38 +08:00
|
|
|
use serde::{Deserialize, Serialize};
|
|
|
|
|
2024-01-18 17:51:24 +08:00
|
|
|
use crate::lsm_storage::LsmStorageState;
|
2024-01-16 16:30:01 +08:00
|
|
|
|
2024-01-19 16:10:18 +08:00
|
|
|
#[derive(Debug, Serialize, Deserialize)]
|
2024-01-16 16:30:01 +08:00
|
|
|
pub struct TieredCompactionTask {
|
2024-01-17 14:51:15 +08:00
|
|
|
pub tiers: Vec<(usize, Vec<usize>)>,
|
2024-01-18 19:40:05 +08:00
|
|
|
pub bottom_tier_included: bool,
|
2024-01-17 14:51:15 +08:00
|
|
|
}
|
|
|
|
|
2024-01-18 17:51:24 +08:00
|
|
|
#[derive(Debug, Clone)]
|
2024-01-17 14:51:15 +08:00
|
|
|
pub struct TieredCompactionOptions {
|
2024-01-18 19:40:05 +08:00
|
|
|
pub num_tiers: usize,
|
2024-01-17 14:51:15 +08:00
|
|
|
pub max_size_amplification_percent: usize,
|
|
|
|
pub size_ratio: usize,
|
|
|
|
pub min_merge_width: usize,
|
2024-11-12 21:27:00 -05:00
|
|
|
pub max_merge_width: Option<usize>,
|
2024-01-16 16:30:01 +08:00
|
|
|
}
|
|
|
|
|
2024-01-17 14:51:15 +08:00
|
|
|
pub struct TieredCompactionController {
|
|
|
|
options: TieredCompactionOptions,
|
|
|
|
}
|
2024-01-16 16:30:01 +08:00
|
|
|
|
|
|
|
impl TieredCompactionController {
|
2024-01-17 14:51:15 +08:00
|
|
|
pub fn new(options: TieredCompactionOptions) -> Self {
|
|
|
|
Self { options }
|
|
|
|
}
|
|
|
|
|
|
|
|
pub fn generate_compaction_task(
|
|
|
|
&self,
|
2024-01-18 17:51:24 +08:00
|
|
|
snapshot: &LsmStorageState,
|
2024-01-17 14:51:15 +08:00
|
|
|
) -> Option<TieredCompactionTask> {
|
|
|
|
assert!(
|
|
|
|
snapshot.l0_sstables.is_empty(),
|
|
|
|
"should not add l0 ssts in tiered compaction"
|
|
|
|
);
|
2024-01-18 19:40:05 +08:00
|
|
|
if snapshot.levels.len() < self.options.num_tiers {
|
2024-01-17 14:51:15 +08:00
|
|
|
return None;
|
|
|
|
}
|
|
|
|
// compaction triggered by space amplification ratio
|
|
|
|
let mut size = 0;
|
|
|
|
for id in 0..(snapshot.levels.len() - 1) {
|
|
|
|
size += snapshot.levels[id].1.len();
|
|
|
|
}
|
|
|
|
let space_amp_ratio =
|
|
|
|
(size as f64) / (snapshot.levels.last().unwrap().1.len() as f64) * 100.0;
|
|
|
|
if space_amp_ratio >= self.options.max_size_amplification_percent as f64 {
|
|
|
|
println!(
|
|
|
|
"compaction triggered by space amplification ratio: {}",
|
|
|
|
space_amp_ratio
|
|
|
|
);
|
|
|
|
return Some(TieredCompactionTask {
|
|
|
|
tiers: snapshot.levels.clone(),
|
2024-01-18 19:40:05 +08:00
|
|
|
bottom_tier_included: true,
|
2024-01-17 14:51:15 +08:00
|
|
|
});
|
|
|
|
}
|
|
|
|
let size_ratio_trigger = (100.0 + self.options.size_ratio as f64) / 100.0;
|
|
|
|
// compaction triggered by size ratio
|
|
|
|
let mut size = 0;
|
|
|
|
for id in 0..(snapshot.levels.len() - 1) {
|
|
|
|
size += snapshot.levels[id].1.len();
|
|
|
|
let next_level_size = snapshot.levels[id + 1].1.len();
|
2024-11-12 21:27:00 -05:00
|
|
|
let current_size_ratio = next_level_size as f64 / size as f64;
|
|
|
|
if current_size_ratio > size_ratio_trigger && id + 1 >= self.options.min_merge_width {
|
2024-01-17 14:51:15 +08:00
|
|
|
println!(
|
2024-11-12 21:27:00 -05:00
|
|
|
"compaction triggered by size ratio: {} > {}",
|
|
|
|
current_size_ratio * 100.0,
|
|
|
|
size_ratio_trigger * 100.0
|
2024-01-17 14:51:15 +08:00
|
|
|
);
|
|
|
|
return Some(TieredCompactionTask {
|
|
|
|
tiers: snapshot
|
|
|
|
.levels
|
|
|
|
.iter()
|
2024-11-12 21:27:00 -05:00
|
|
|
.take(id + 1)
|
2024-01-17 14:51:15 +08:00
|
|
|
.cloned()
|
|
|
|
.collect::<Vec<_>>(),
|
2025-06-07 07:27:52 -04:00
|
|
|
// Size ratio trigger will never include the bottom level
|
|
|
|
bottom_tier_included: false,
|
2024-01-17 14:51:15 +08:00
|
|
|
});
|
|
|
|
}
|
|
|
|
}
|
|
|
|
// trying to reduce sorted runs without respecting size ratio
|
2024-11-12 21:27:00 -05:00
|
|
|
let num_tiers_to_take = snapshot
|
|
|
|
.levels
|
|
|
|
.len()
|
|
|
|
.min(self.options.max_merge_width.unwrap_or(usize::MAX));
|
2024-01-17 14:51:15 +08:00
|
|
|
println!("compaction triggered by reducing sorted runs");
|
2024-12-09 00:23:03 -05:00
|
|
|
Some(TieredCompactionTask {
|
2024-01-17 14:51:15 +08:00
|
|
|
tiers: snapshot
|
|
|
|
.levels
|
|
|
|
.iter()
|
|
|
|
.take(num_tiers_to_take)
|
|
|
|
.cloned()
|
|
|
|
.collect::<Vec<_>>(),
|
2024-01-18 19:40:05 +08:00
|
|
|
bottom_tier_included: snapshot.levels.len() >= num_tiers_to_take,
|
2024-12-09 00:23:03 -05:00
|
|
|
})
|
2024-01-16 16:30:01 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
pub fn apply_compaction_result(
|
|
|
|
&self,
|
2024-01-18 17:51:24 +08:00
|
|
|
snapshot: &LsmStorageState,
|
2024-01-16 16:30:01 +08:00
|
|
|
task: &TieredCompactionTask,
|
|
|
|
output: &[usize],
|
2024-01-18 17:51:24 +08:00
|
|
|
) -> (LsmStorageState, Vec<usize>) {
|
2024-01-17 14:51:15 +08:00
|
|
|
assert!(
|
|
|
|
snapshot.l0_sstables.is_empty(),
|
|
|
|
"should not add l0 ssts in tiered compaction"
|
|
|
|
);
|
|
|
|
let mut snapshot = snapshot.clone();
|
|
|
|
let mut tier_to_remove = task
|
|
|
|
.tiers
|
|
|
|
.iter()
|
|
|
|
.map(|(x, y)| (*x, y))
|
|
|
|
.collect::<HashMap<_, _>>();
|
|
|
|
let mut levels = Vec::new();
|
|
|
|
let mut new_tier_added = false;
|
|
|
|
let mut files_to_remove = Vec::new();
|
|
|
|
for (tier_id, files) in &snapshot.levels {
|
|
|
|
if let Some(ffiles) = tier_to_remove.remove(tier_id) {
|
|
|
|
// the tier should be removed
|
|
|
|
assert_eq!(ffiles, files, "file changed after issuing compaction task");
|
|
|
|
files_to_remove.extend(ffiles.iter().copied());
|
|
|
|
} else {
|
|
|
|
// retain the tier
|
|
|
|
levels.push((*tier_id, files.clone()));
|
|
|
|
}
|
|
|
|
if tier_to_remove.is_empty() && !new_tier_added {
|
|
|
|
// add the compacted tier to the LSM tree
|
|
|
|
new_tier_added = true;
|
|
|
|
levels.push((output[0], output.to_vec()));
|
|
|
|
}
|
|
|
|
}
|
2024-01-17 15:49:43 +08:00
|
|
|
if !tier_to_remove.is_empty() {
|
|
|
|
unreachable!("some tiers not found??");
|
|
|
|
}
|
2024-01-17 14:51:15 +08:00
|
|
|
snapshot.levels = levels;
|
|
|
|
(snapshot, files_to_remove)
|
2024-01-16 16:30:01 +08:00
|
|
|
}
|
|
|
|
}
|