1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
use idx_sized::IdxSized;
use std::cmp::Ordering;
use various_data_file::{DataAddress, VariousDataFile};
pub struct IdxBinary {
index: IdxSized<DataAddress>,
data: VariousDataFile,
}
impl IdxBinary {
pub fn new(path_prefix: &str) -> Result<Self, std::io::Error> {
let index = IdxSized::new(&(path_prefix.to_string() + ".i"))?;
let data = VariousDataFile::new(&(path_prefix.to_string() + ".d"))?;
Ok(IdxBinary { index, data })
}
pub unsafe fn bytes(&self, row: u32) -> &[u8] {
match self.index.triee().value(row) {
Some(word) => self.data.bytes(word),
None => b"",
}
}
pub unsafe fn str(&self, row: u32) -> &str {
std::str::from_utf8(self.bytes(row)).unwrap()
}
fn search(&self, target: &[u8]) -> (Ordering, u32) {
self.index
.triee()
.search_cb(|s| -> Ordering { target.cmp(unsafe { self.data.bytes(s) }) })
}
pub fn find_row(&self, target: &[u8]) -> Option<u32> {
let (ord, found_row) = self.search(target);
if ord == Ordering::Equal && found_row != 0 {
Some(found_row)
} else {
None
}
}
pub fn entry(&mut self, target: &[u8]) -> Result<u32, std::io::Error> {
let (ord, found_row) = self.search(target);
if ord == Ordering::Equal && found_row != 0 {
Ok(found_row)
} else {
let data = self.data.insert(target)?;
self.index
.insert_unique(data.address().clone(), found_row, ord, 0)
}
}
}
#[test]
fn test() {
let dir = "./ib-test";
if std::path::Path::new(dir).exists() {
std::fs::remove_dir_all(dir).unwrap();
std::fs::create_dir_all(dir).unwrap();
} else {
std::fs::create_dir_all(dir).unwrap();
}
if let Ok(mut s) = IdxBinary::new(&(dir.to_owned() + "/test")) {
s.entry(b"US").unwrap();
s.entry(b"US").unwrap();
s.entry(b"US").unwrap();
s.entry(b"US").unwrap();
s.entry(b"UK").unwrap();
s.entry(b"US").unwrap();
s.entry(b"US").unwrap();
s.entry(b"UK").unwrap();
}
}