use num_bigint::BigUint;
/// Integer identifier type (`u64`); judging by the name it identifies a vocabulary
/// entry -- TODO confirm at the use sites.
pub type VocabId = u64;
/// Element type of [`NormString`]; a single byte, so at most 256 distinct values.
pub type CharIndexType = u8;
/// Element type of the [`PRIMES`] table.
pub type CharType = u32;
/// A sequence of [`CharIndexType`] values; presumably a string re-encoded as
/// alphabet indices -- TODO confirm against the code that builds it.
pub type NormString = Vec<CharIndexType>;
/// All 168 prime numbers below 1000, in ascending order.
pub const PRIMES: &[CharType] = &[2, 3, 5, 7, 11, 13, 17, 19, 23, 29, 31, 37, 41, 43, 47, 53, 59, 61, 67, 71, 73, 79, 83, 89, 97, 101, 103, 107, 109, 113, 127, 131, 137, 139, 149, 151, 157, 163, 167, 173, 179, 181, 191, 193, 197, 199, 211, 223, 227, 229, 233, 239, 241, 251, 257, 263, 269, 271, 277, 281, 283, 293, 307, 311, 313, 317, 331, 337, 347, 349, 353, 359, 367, 373, 379, 383, 389, 397, 401, 409, 419, 421, 431, 433, 439, 443, 449, 457, 461, 463, 467, 479, 487, 491, 499, 503, 509, 521, 523, 541, 547, 557, 563, 569, 571, 577, 587, 593, 599, 601, 607, 613, 617, 619, 631, 641, 643, 647, 653, 659, 661, 673, 677, 683, 691, 701, 709, 719, 727, 733, 739, 743, 751, 757, 761, 769, 773, 787, 797, 809, 811, 821, 823, 827, 829, 839, 853, 857, 859, 863, 877, 881, 883, 887, 907, 911, 919, 929, 937, 941, 947, 953, 967, 971, 977, 983, 991, 997];
/// Arbitrary-precision unsigned integer (`num_bigint::BigUint`); the name suggests
/// it holds an "anagram value" -- TODO confirm how it is computed.
pub type AnaValue = BigUint;
/// A list of lists of strings; presumably each inner list groups the spellings
/// that share one alphabet position -- TODO confirm against the alphabet loader.
pub type Alphabet = Vec<Vec<String>>;
/// A set of seven `f64` weights, one per named component.
///
/// The field names parallel those of `Distance`; presumably each weight scales
/// the matching distance component when a score is computed -- TODO confirm
/// against the scoring code.
pub struct Weights {
    /// Weight of the `ld` component (presumably Levenshtein distance -- confirm).
    pub ld: f64,
    /// Weight of the `lcs` component (presumably longest common substring -- confirm).
    pub lcs: f64,
    /// Weight of the `freq` component (presumably frequency -- confirm).
    pub freq: f64,
    /// Weight of the `prefix` component.
    pub prefix: f64,
    /// Weight of the `suffix` component.
    pub suffix: f64,
    /// Weight of the `lex` component.
    pub lex: f64,
    /// Weight of the `case` component.
    pub case: f64,
}

impl Default for Weights {
    /// Builds the default weights: `0.2` for `case` and `1.0` for every other field.
    fn default() -> Self {
        let unit = 1.0;
        Weights {
            case: 0.2,
            lex: unit,
            suffix: unit,
            prefix: unit,
            freq: unit,
            lcs: unit,
            ld: unit,
        }
    }
}

impl Weights {
    /// Returns the total of all seven weights.
    pub fn sum(&self) -> f64 {
        // Accumulate in field-declaration order so the floating-point result is
        // the same as a single left-to-right `+` chain.
        let mut total = self.ld;
        total += self.lcs;
        total += self.freq;
        total += self.prefix;
        total += self.suffix;
        total += self.lex;
        total += self.case;
        total
    }
}
/// Plain data record whose fields parallel those of `Weights` (ld, lcs, prefix,
/// suffix, freq, lex, case); presumably the raw per-candidate measurements the
/// weights are applied to -- TODO confirm against the scoring code.
#[derive(Debug,Clone)]
pub struct Distance {
/// The `ld` measurement, stored as a `CharIndexType` (presumably Levenshtein distance -- confirm).
pub ld: CharIndexType,
/// The `lcs` measurement (presumably longest-common-substring length -- confirm).
pub lcs: u16,
/// Prefix length (presumably the length of the shared prefix -- confirm).
pub prefixlen: u16,
/// Suffix length (presumably the length of the shared suffix -- confirm).
pub suffixlen: u16,
/// The `freq` measurement (presumably a frequency count -- confirm).
pub freq: u32,
/// The `lex` measurement.
pub lex: f32,
/// Case flag; judging by the name, true when casing matches -- TODO confirm where it is set.
pub samecase: bool,
}
/// Selects when a search should stop.
///
/// The exact semantics of each mode are defined by the code that consumes this
/// enum; the accessors below only expose which mode is active and the `usize`
/// payload of the iterative modes.
#[derive(Debug, Clone, Copy)]
pub enum StopCriterion {
    /// No early stop and no iteration payload.
    Exhaustive,
    /// Stop once an exact match is found.
    StopAtExactMatch,
    /// Iterative mode carrying a `usize` payload (presumably a match count --
    /// TODO confirm with the search code).
    Iterative(usize),
    /// Iterative mode with the same `usize` payload that additionally stops at
    /// an exact match.
    IterativeStopAtExactMatch(usize),
}

impl StopCriterion {
    /// Returns `true` for the two variants that stop at an exact match
    /// (`StopAtExactMatch` and `IterativeStopAtExactMatch`), `false` otherwise.
    pub fn stop_at_exact_match(&self) -> bool {
        matches!(
            self,
            Self::StopAtExactMatch | Self::IterativeStopAtExactMatch(_)
        )
    }

    /// Returns the `usize` payload of the iterative variants, or `0` for the
    /// non-iterative ones.
    pub fn iterative(&self) -> usize {
        // Exhaustive on purpose: adding a variant must force a decision here
        // instead of silently falling into a wildcard arm.
        match *self {
            Self::Iterative(n) | Self::IterativeStopAtExactMatch(n) => n,
            Self::Exhaustive | Self::StopAtExactMatch => 0,
        }
    }
}