1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
use regex::Regex;
use std::str;
use streamson_lib::Handler;
use streamson_lib::{error, path::Path};
/// A single replacement rule: the pattern to search for, the replacement text
/// (which may reference capture groups, e.g. `$1`), and the limit handed to
/// `Regex::replacen` (per the regex crate docs, a limit of 0 replaces all matches).
type Replacement = (Regex, String, usize);
/// Handler which converts matched data by running regex replacements over it.
#[derive(Debug, Default)]
pub struct RegexConverter {
/// Replacement rules, applied one after another in the order they were added.
replacements: Vec<Replacement>,
}
impl Handler for RegexConverter {
fn handle(
&mut self,
_path: &Path,
_matcher_idx: usize,
data: Option<&[u8]>,
) -> Result<Option<Vec<u8>>, error::Handler> {
let mut output: String = str::from_utf8(data.unwrap())
.map_err(|e| error::Handler::new(e.to_string()))?
.to_string();
for (regex, into, limit) in &self.replacements {
let str_to_replace: &str = &into;
output = regex.replacen(&output, *limit, str_to_replace).to_string();
}
Ok(Some(output.as_bytes().to_vec()))
}
fn use_path(&self) -> bool {
false
}
fn buffering_required(&self) -> bool {
true
}
}
impl RegexConverter {
    /// Creates a converter with no replacement rules registered.
    pub fn new() -> Self {
        Self {
            replacements: Vec::new(),
        }
    }

    /// Appends a replacement rule and returns the converter for further chaining.
    ///
    /// * `regex` - pattern to search for
    /// * `into` - replacement text
    /// * `limit` - limit passed to `Regex::replacen` when the rule is applied
    pub fn add_regex(self, regex: Regex, into: String, limit: usize) -> Self {
        let mut replacements = self.replacements;
        replacements.push((regex, into, limit));
        Self { replacements }
    }
}
#[cfg(test)]
mod tests {
    use super::RegexConverter;
    use regex::Regex;
    use std::sync::{Arc, Mutex};
    use streamson_lib::{matcher::Simple, strategy::Convert};

    /// With a limit of 1 only the first match inside each matched value is
    /// rewritten; values that already have the target form stay unchanged.
    #[test]
    fn regex_converter() {
        let handler = RegexConverter::new().add_regex(
            Regex::new("[Uu]ser([0-9]+)").unwrap(),
            "user$1".to_string(),
            1,
        );
        let name_matcher = Simple::new(r#"[]{"name"}"#).unwrap();

        let mut strategy = Convert::new();
        strategy.add_matcher(
            Box::new(name_matcher),
            vec![Arc::new(Mutex::new(handler))],
        );

        let input: &[u8] = br#"[{"name": "User1 User1"}, {"name": "user2"}]"#;
        let chunks = strategy.process(input).unwrap();
        let converted: Vec<u8> = chunks.into_iter().flatten().collect();

        assert_eq!(
            String::from_utf8(converted).unwrap(),
            r#"[{"name": "user1 User1"}, {"name": "user2"}]"#
        );
    }
}