1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
use std::collections::HashMap;
use crate::{
UltraNLPResult,
UltraNLPError,
};
/// A dictionary that maps lowercased patterns to `u32` values.
///
/// Instances are built with [`Dictionary::new`], which assigns every pattern
/// its zero-based position in the input as its value.
#[derive(Debug, Clone)]
pub struct Dictionary {
    /// Lowercased pattern mapped to the value assigned at construction.
    pub(crate) map: HashMap<String, u32>,
}
impl Dictionary {
    /// Builds a dictionary from `patterns`.
    ///
    /// Every pattern is lowercased and stored together with its zero-based
    /// position in `patterns` (see `prepare_patterns_for_dictionary`).
    ///
    /// # Errors
    ///
    /// Returns an error when:
    /// - `patterns` yields no items,
    /// - two patterns are equal after lowercasing,
    /// - a pattern's position cannot be represented as a `u32`.
    pub fn new<T: AsRef<str>, I: IntoIterator<Item = T>>(
        patterns: I
    ) -> UltraNLPResult<Self> {
        let entries = prepare_patterns_for_dictionary(patterns)?;
        if entries.is_empty() {
            return Err(UltraNLPError::new("The patterns cannot be empty"));
        }

        // The final size is known up front, so allocate the table once.
        let mut map: HashMap<String, u32> = HashMap::with_capacity(entries.len());
        for (pattern, value) in entries {
            // `insert` returns the previous value when the key already exists,
            // which means two inputs collapsed to the same lowercase pattern.
            if map.insert(pattern, value).is_some() {
                return Err(UltraNLPError::new("The patterns are not unique"));
            }
        }

        Ok(Self { map })
    }
}
/// Pairs every pattern with a `u32` value derived from its position.
///
/// Each pattern is lowercased, and its value is the zero-based index at which
/// it was yielded by `patterns`. The returned vector keeps the input order.
///
/// # Errors
///
/// Returns an error as soon as an index does not fit in a `u32`; the error
/// message is the text of the failed integer conversion.
fn prepare_patterns_for_dictionary<T, I>(
    patterns: I,
) -> UltraNLPResult<Vec<(String, u32)>>
where
    T: AsRef<str>,
    I: IntoIterator<Item = T>,
{
    let mut prepared: Vec<(String, u32)> = Vec::new();

    for (position, raw) in patterns.into_iter().enumerate() {
        let lowered = raw.as_ref().to_lowercase();
        let value = match u32::try_from(position) {
            Ok(value) => value,
            Err(err) => return Err(UltraNLPError::new(err.to_string())),
        };
        prepared.push((lowered, value));
    }

    Ok(prepared)
}
#[cfg(test)]
mod tests {
    use crate::hashmap::Dictionary;

    /// An empty pattern list must be rejected.
    #[test]
    fn test_empty_patterns() {
        let patterns: Vec<&str> = vec![];

        assert!(Dictionary::new(patterns).is_err());
    }

    /// Distinct patterns build successfully and map to their input positions.
    #[test]
    fn test_patterns() {
        let patterns: Vec<&str> = vec!["foo", "bar"];

        let dictionary = Dictionary::new(patterns).unwrap();

        assert_eq!(dictionary.map.len(), 2);
        assert_eq!(dictionary.map.get("foo"), Some(&0));
        assert_eq!(dictionary.map.get("bar"), Some(&1));
    }

    /// Patterns that differ only by case collide after lowercasing.
    #[test]
    fn test_same_patterns() {
        let patterns: Vec<&str> = vec!["foo", "FOO"];

        assert!(Dictionary::new(patterns).is_err());
    }
}