1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
use std::borrow::Cow;
mod error;
mod reader;
pub mod tag;
pub use self::error::Error;
pub use self::tag::Tag;
#[doc(hidden)]
pub use self::reader::Reader;
/// A parser that walks over textual content and yields one [`Event`] per
/// angle-bracketed item via its `Iterator` implementation.
pub struct Parser<'l> {
    // Declared before `content` on purpose: struct fields are dropped in
    // declaration order, and the reader borrows from `content` (see
    // `Parser::new`), so the borrower has to be dropped before the owner.
    reader: Reader<'l>,
    // Never read directly; kept only so that the text the reader points into
    // stays alive for as long as the parser does.
    #[allow(dead_code)]
    content: Cow<'l, str>,
}
/// An event produced by `Parser` for each angle-bracketed item in the input.
pub enum Event {
/// The item was malformed: it was empty, lacked a closing angle bracket, or
/// could not be parsed as a tag.
Error(Error),
/// An item whose content starts with `!--`.
Comment,
/// An item whose content starts with `!` but not with `!--`.
Declaration,
/// An item whose content starts with `?`.
Instruction,
/// Any other item that was successfully parsed by `Tag::parse`.
Tag(Tag),
}
/// A result whose error type is this module's `Error`.
pub type Result<T> = ::std::result::Result<T, Error>;
impl<'l> Parser<'l> {
#[inline]
pub fn new<T>(content: T) -> Self where T: Into<Cow<'l, str>> {
let content = content.into();
let reader = unsafe { ::std::mem::transmute(Reader::new(&*content)) };
Parser { content: content, reader: reader }
}
}
/// Returns early from the enclosing function with `Some(Event::Error(..))`.
///
/// The error is created with `Error::new` from the current position of
/// `$parser.reader` and a message built from the remaining arguments, which
/// are forwarded verbatim to `format!`.
macro_rules! raise {
    ($parser:expr, $($argument:tt)*) => {
        // No trailing semicolon: the expansion is a plain `return` expression,
        // so the macro is usable both as a statement (`raise!(..);`) and in
        // expression position without relying on the compiler discarding a
        // stray `;`.
        return Some(Event::Error(Error::new(
            $parser.reader.position(),
            format!($($argument)*),
        )))
    };
}
impl<'l> Iterator for Parser<'l> {
type Item = Event;
fn next(&mut self) -> Option<Event> {
self.reader.consume_until_char('<');
if !self.reader.consume_char('<') {
return None;
}
let content = self.reader.capture(|reader| {
reader.consume_until_char('>');
}).and_then(|content| Some(String::from(content)));
if content.is_none() {
return raise!(self, "found an empty tag");
}
if !self.reader.consume_char('>') {
raise!(self, "missing a closing angle bracket");
}
let content = content.unwrap();
Some(if content.starts_with("!--") {
Event::Comment
} else if content.starts_with("!") {
Event::Declaration
} else if content.starts_with("?") {
Event::Instruction
} else {
match Tag::parse(&content) {
Ok(tag) => Event::Tag(tag),
Err(error) => Event::Error(error),
}
})
}
}
#[cfg(test)]
mod tests {
    use parser::{Event, Parser, Tag};

    /// Asserts that the first event parsed from `content` is a
    /// `Tag::Unknown` whose name equals `expected`.
    fn assert_first_tag(content: &str, expected: &str) {
        let mut parser = Parser::new(content);
        let first = parser.next().unwrap();
        match first {
            Event::Tag(Tag::Unknown(_, name, _)) => assert_eq!(&*name, expected),
            _ => unreachable!(),
        }
    }

    #[test]
    fn next() {
        // Each pair is (input, name of the first tag expected from it).
        let cases = [
            ("<foo>", "foo"),
            ("<foo/>", "foo"),
            (" <foo/>", "foo"),
            ("foo <bar>", "bar"),
            ("foo> <bar>", "bar"),
        ];
        for &(content, expected) in cases.iter() {
            assert_first_tag(content, expected);
        }
    }
}