1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
#![allow(dead_code)]
pub mod iterator;
pub mod iterator_html;
pub mod parser;
pub mod renderer;
use nom::error::Error;
use nom::error::ErrorKind;
use nom::error::ParseError;
use nom::Err;
use nom::IResult;
pub fn take_until_unbalanced(
opening_bracket: char,
closing_bracket: char,
) -> impl Fn(&str) -> IResult<&str, &str> {
move |i: &str| {
let mut index = 0;
let mut bracket_counter = 0;
while let Some(n) = &i[index..].find(&[opening_bracket, closing_bracket, '\\'][..]) {
index += n;
let mut it = i[index..].chars();
match it.next().unwrap_or_default() {
c if c == '\\' => {
index += '\\'.len_utf8();
let c = it.next().unwrap_or_default();
index += c.len_utf8();
}
c if c == opening_bracket => {
bracket_counter += 1;
index += opening_bracket.len_utf8();
}
c if c == closing_bracket => {
bracket_counter -= 1;
index += closing_bracket.len_utf8();
}
_ => unreachable!(),
};
if bracket_counter == -1 {
index -= closing_bracket.len_utf8();
return Ok((&i[index..], &i[0..index]));
};
}
if bracket_counter == 0 {
Ok(("", i))
} else {
Err(Err::Error(Error::from_error_kind(i, ErrorKind::TakeUntil)))
}
}
}
#[cfg(test)]
mod tests {
use super::*;
use nom::error::ErrorKind;
#[test]
fn test_take_until_unmatched() {
assert_eq!(take_until_unbalanced('(', ')')("abc"), Ok(("", "abc")));
assert_eq!(
take_until_unbalanced('(', ')')("url)abc"),
Ok((")abc", "url"))
);
assert_eq!(
take_until_unbalanced('(', ')')("u()rl)abc"),
Ok((")abc", "u()rl"))
);
assert_eq!(
take_until_unbalanced('(', ')')("u(())rl)abc"),
Ok((")abc", "u(())rl"))
);
assert_eq!(
take_until_unbalanced('(', ')')("u(())r()l)abc"),
Ok((")abc", "u(())r()l"))
);
assert_eq!(
take_until_unbalanced('(', ')')("u(())r()labc"),
Ok(("", "u(())r()labc"))
);
assert_eq!(
take_until_unbalanced('(', ')')(r#"u\((\))r()labc"#),
Ok(("", r#"u\((\))r()labc"#))
);
assert_eq!(
take_until_unbalanced('(', ')')("u(())r(labc"),
Err(nom::Err::Error(nom::error::Error::new(
"u(())r(labc",
ErrorKind::TakeUntil
)))
);
assert_eq!(
take_until_unbalanced('€', 'ü')("€uü€€üürlüabc"),
Ok(("üabc", "€uü€€üürl"))
);
}
}