1mod block_size;
6mod compression;
7mod filter;
8mod hash_ratio;
9mod pinning;
10mod restart_interval;
11
12pub use block_size::BlockSizePolicy;
13pub use compression::CompressionPolicy;
14pub use filter::{BloomConstructionPolicy, FilterPolicy, FilterPolicyEntry};
15pub use hash_ratio::HashRatioPolicy;
16pub use pinning::PinningPolicy;
17pub use restart_interval::RestartIntervalPolicy;
18
19pub type PartioningPolicy = PinningPolicy;
21
22use crate::{
23 path::absolute_path, version::DEFAULT_LEVEL_COUNT, AnyTree, BlobTree, Cache, CompressionType,
24 DescriptorTable, Tree,
25};
26use std::{
27 path::{Path, PathBuf},
28 sync::Arc,
29};
30
/// Discriminates between the two kinds of tree: standard and blob.
///
/// The type converts to a one-byte tag through `From<TreeType> for u8` and back
/// through `TryFrom<u8> for TreeType`.
// NOTE(review): presumably mirrors the `AnyTree::Standard` / `AnyTree::Blob` split — confirm.
#[derive(Clone, Copy, Debug, Eq, PartialEq)]
pub enum TreeType {
    /// Standard tree (tag `0` in the `u8` conversion).
    Standard,

    /// Blob tree (tag `1` in the `u8` conversion).
    Blob,
}
40
41impl From<TreeType> for u8 {
42 fn from(val: TreeType) -> Self {
43 match val {
44 TreeType::Standard => 0,
45 TreeType::Blob => 1,
46 }
47 }
48}
49
50impl TryFrom<u8> for TreeType {
51 type Error = ();
52
53 fn try_from(value: u8) -> Result<Self, Self::Error> {
54 match value {
55 0 => Ok(Self::Standard),
56 1 => Ok(Self::Blob),
57 _ => Err(()),
58 }
59 }
60}
61
/// Relative folder name that `Config::default` resolves into its `path`
/// (it is passed through `absolute_path` there).
const DEFAULT_FILE_FOLDER: &str = ".lsm.data";
63
64#[derive(Clone, Debug, PartialEq)]
66pub struct KvSeparationOptions {
67 #[doc(hidden)]
69 pub compression: CompressionType,
70
71 #[doc(hidden)]
73 pub file_target_size: u64,
74
75 #[doc(hidden)]
77 pub separation_threshold: u32,
78
79 #[doc(hidden)]
80 pub staleness_threshold: f32,
81
82 #[doc(hidden)]
83 pub age_cutoff: f32,
84}
85
86impl Default for KvSeparationOptions {
87 fn default() -> Self {
88 Self {
89 #[cfg(feature="lz4")]
90 compression: CompressionType::Lz4,
91
92 #[cfg(not(feature="lz4"))]
93 compression: CompressionType::None,
94
95 file_target_size: 64 * 1_024 * 1_024,
96 separation_threshold: 1_024,
97
98 staleness_threshold: 0.33,
99 age_cutoff: 0.20,
100 }
101 }
102}
103
104impl KvSeparationOptions {
105 #[must_use]
107 pub fn compression(mut self, compression: CompressionType) -> Self {
108 self.compression = compression;
109 self
110 }
111
112 #[must_use]
122 pub fn file_target_size(mut self, bytes: u64) -> Self {
123 self.file_target_size = bytes;
124 self
125 }
126
127 #[must_use]
134 pub fn separation_threshold(mut self, bytes: u32) -> Self {
135 self.separation_threshold = bytes;
136 self
137 }
138
139 #[must_use]
146 pub fn staleness_threshold(mut self, ratio: f32) -> Self {
147 self.staleness_threshold = ratio;
148 self
149 }
150
151 #[must_use]
155 pub fn age_cutoff(mut self, ratio: f32) -> Self {
156 self.age_cutoff = ratio;
157 self
158 }
159}
160
161#[derive(Clone)]
162pub struct Config {
164 #[doc(hidden)]
166 pub path: PathBuf,
167
168 #[doc(hidden)]
170 pub cache: Arc<Cache>,
171
172 #[doc(hidden)]
174 pub descriptor_table: Arc<DescriptorTable>,
175
176 pub level_count: u8,
180
181 pub data_block_compression_policy: CompressionPolicy,
183
184 pub index_block_compression_policy: CompressionPolicy,
186
187 pub data_block_restart_interval_policy: RestartIntervalPolicy,
189
190 pub index_block_restart_interval_policy: RestartIntervalPolicy,
192
193 pub data_block_size_policy: BlockSizePolicy,
195
196 pub index_block_pinning_policy: PinningPolicy,
198
199 pub filter_block_pinning_policy: PinningPolicy,
201
202 pub top_level_index_block_pinning_policy: PinningPolicy,
204
205 pub top_level_filter_block_pinning_policy: PinningPolicy,
207
208 pub data_block_hash_ratio_policy: HashRatioPolicy,
210
211 pub index_block_partitioning_policy: PartioningPolicy,
213
214 pub filter_block_partitioning_policy: PartioningPolicy,
216
217 pub index_block_partition_size_policy: BlockSizePolicy,
219
220 pub filter_block_partition_size_policy: BlockSizePolicy,
222
223 pub(crate) expect_point_read_hits: bool,
226
227 pub filter_policy: FilterPolicy,
229
230 #[doc(hidden)]
231 pub kv_separation_opts: Option<KvSeparationOptions>,
232}
233
234impl Default for Config {
235 fn default() -> Self {
236 Self {
237 path: absolute_path(Path::new(DEFAULT_FILE_FOLDER)),
238 descriptor_table: Arc::new(DescriptorTable::new(256)),
239
240 cache: Arc::new(Cache::with_capacity_bytes(
241 16 * 1_024 * 1_024,
242 )),
243
244 data_block_restart_interval_policy: RestartIntervalPolicy::all(16),
245 index_block_restart_interval_policy: RestartIntervalPolicy::all(1),
246
247 level_count: DEFAULT_LEVEL_COUNT,
248
249 data_block_size_policy: BlockSizePolicy::default(),
250
251 index_block_pinning_policy: PinningPolicy::new(&[true, true, false]),
252 filter_block_pinning_policy: PinningPolicy::new(&[true, false]),
253
254 top_level_index_block_pinning_policy: PinningPolicy::all(true), top_level_filter_block_pinning_policy: PinningPolicy::all(true), index_block_partitioning_policy: PinningPolicy::new(&[false, false, false, true]),
258 filter_block_partitioning_policy: PinningPolicy::new(&[false, false, false, true]),
259
260 index_block_partition_size_policy: BlockSizePolicy::all(4_096), filter_block_partition_size_policy: BlockSizePolicy::all(4_096), data_block_compression_policy: CompressionPolicy::default(),
264 index_block_compression_policy: CompressionPolicy::all(CompressionType::None),
265
266 data_block_hash_ratio_policy: HashRatioPolicy::all(0.0),
267
268 filter_policy: FilterPolicy::default(),
269
270 expect_point_read_hits: false,
271
272 kv_separation_opts: None,
273 }
274 }
275}
276
277impl Config {
278 pub fn new<P: AsRef<Path>>(path: P) -> Self {
280 Self {
281 path: absolute_path(path.as_ref()),
282 ..Default::default()
283 }
284 }
285
286 #[must_use]
293 pub fn use_cache(mut self, cache: Arc<Cache>) -> Self {
294 self.cache = cache;
295 self
296 }
297
298 #[must_use]
299 #[doc(hidden)]
300 pub fn use_descriptor_table(mut self, descriptor_table: Arc<DescriptorTable>) -> Self {
301 self.descriptor_table = descriptor_table;
302 self
303 }
304
305 #[must_use]
310 pub fn expect_point_read_hits(mut self, b: bool) -> Self {
311 self.expect_point_read_hits = b;
312 self
313 }
314
315 #[must_use]
317 pub fn filter_block_partitioning_policy(mut self, policy: PinningPolicy) -> Self {
318 self.filter_block_partitioning_policy = policy;
319 self
320 }
321
322 #[must_use]
324 pub fn index_block_partitioning_policy(mut self, policy: PinningPolicy) -> Self {
325 self.index_block_partitioning_policy = policy;
326 self
327 }
328
329 #[must_use]
331 pub fn filter_block_pinning_policy(mut self, policy: PinningPolicy) -> Self {
332 self.filter_block_pinning_policy = policy;
333 self
334 }
335
336 #[must_use]
338 pub fn index_block_pinning_policy(mut self, policy: PinningPolicy) -> Self {
339 self.index_block_pinning_policy = policy;
340 self
341 }
342
343 #[must_use]
350 pub fn data_block_restart_interval_policy(mut self, policy: RestartIntervalPolicy) -> Self {
351 self.data_block_restart_interval_policy = policy;
352 self
353 }
354
355 #[must_use]
370 pub fn filter_policy(mut self, policy: FilterPolicy) -> Self {
371 self.filter_policy = policy;
372 self
373 }
374
375 #[must_use]
377 pub fn data_block_compression_policy(mut self, policy: CompressionPolicy) -> Self {
378 self.data_block_compression_policy = policy;
379 self
380 }
381
382 #[must_use]
384 pub fn index_block_compression_policy(mut self, policy: CompressionPolicy) -> Self {
385 self.index_block_compression_policy = policy;
386 self
387 }
388
389 #[must_use]
409 pub fn data_block_size_policy(mut self, policy: BlockSizePolicy) -> Self {
410 self.data_block_size_policy = policy;
411 self
412 }
413
414 #[must_use]
419 pub fn data_block_hash_ratio_policy(mut self, policy: HashRatioPolicy) -> Self {
420 self.data_block_hash_ratio_policy = policy;
421 self
422 }
423
424 #[must_use]
426 pub fn with_kv_separation(mut self, opts: Option<KvSeparationOptions>) -> Self {
427 self.kv_separation_opts = opts;
428 self
429 }
430
431 pub fn open(self) -> crate::Result<AnyTree> {
437 Ok(if self.kv_separation_opts.is_some() {
438 AnyTree::Blob(BlobTree::open(self)?)
439 } else {
440 AnyTree::Standard(Tree::open(self)?)
441 })
442 }
443}