iregex/ir/
alternation.rs

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
use std::{hash::Hash, ops::Deref};

use iregex_automata::{
	nfa::{BuildNFA, StateBuilder, Tags},
	Class, Map, Token, NFA,
};

use crate::{Atom, Boundary, CaptureTag, Concatenation};

/// Regular expression sequence disjunction.
///
/// Wraps the list of [`Concatenation`] alternatives, kept in the order in
/// which they were supplied. The alternatives are reachable as a slice
/// through `Deref` and by iteration.
///
/// `T` defaults to `char` and `B` to `()`. The struct itself places no
/// bounds on them; building an NFA requires `T: Token` and `B: Boundary<T>`.
#[derive(Debug, Clone)]
pub struct Alternation<T = char, B = ()>(Vec<Concatenation<T, B>>);

impl<T, B> Default for Alternation<T, B> {
	/// Creates an alternation holding no alternatives.
	///
	/// Implemented by hand so that no `Default` bound is placed on `T` or `B`.
	fn default() -> Self {
		let alternatives = Vec::new();
		Self(alternatives)
	}
}

impl<T, B> Alternation<T, B> {
	/// Creates an empty alternation; equivalent to the `Default` value.
	pub fn new() -> Self {
		Default::default()
	}
}

impl<T, B> From<Concatenation<T, B>> for Alternation<T, B> {
	/// Wraps a single concatenation as an alternation with exactly one
	/// alternative.
	fn from(value: Concatenation<T, B>) -> Self {
		Self(Vec::from([value]))
	}
}

impl<T, B> From<Atom<T, B>> for Alternation<T, B> {
	fn from(value: Atom<T, B>) -> Self {
		Self(vec![value.into()])
	}
}

impl<T, B> Deref for Alternation<T, B> {
	type Target = [Concatenation<T, B>];

	/// Borrows the alternatives as a slice.
	fn deref(&self) -> &Self::Target {
		&self.0[..]
	}
}

impl<'a, T, B> IntoIterator for &'a Alternation<T, B> {
	type Item = &'a Concatenation<T, B>;
	type IntoIter = std::slice::Iter<'a, Concatenation<T, B>>;

	/// Iterates over the alternatives by reference, in stored order.
	fn into_iter(self) -> Self::IntoIter {
		self.0.as_slice().iter()
	}
}

impl<T, B> IntoIterator for Alternation<T, B> {
	type IntoIter = std::vec::IntoIter<Concatenation<T, B>>;
	type Item = Concatenation<T, B>;

	fn into_iter(self) -> Self::IntoIter {
		self.0.into_iter()
	}
}

impl<T, B> FromIterator<Concatenation<T, B>> for Alternation<T, B> {
	/// Collects the yielded concatenations, in iteration order, as the
	/// alternatives of a new alternation.
	fn from_iter<I>(iter: I) -> Self
	where
		I: IntoIterator<Item = Concatenation<T, B>>,
	{
		Self(iter.into_iter().collect())
	}
}

impl<T, B, Q, C> BuildNFA<T, Q, C, CaptureTag> for Alternation<T, B>
where
	T: Token,
	B: Boundary<T, Class = C>,
	Q: Copy + Ord,
	C: Clone + Eq + Hash + Class<T>,
{
	/// Adds this alternation to `nfa`, returning its entry state together
	/// with a map of exit states keyed by class.
	///
	/// - A single alternative is built directly, with no extra states.
	/// - Otherwise a fresh entry state is requested from `state_builder` and
	///   linked to every alternative's entry state with a `None`-labelled
	///   transition (presumably an epsilon transition; confirm against
	///   `NFA::add`). Each alternative's exits are linked the same way to one
	///   shared exit state per class, requested from `state_builder` the
	///   first time that class is encountered.
	/// - With no alternatives, only the entry state is requested and the
	///   returned exit map is the `Default` one.
	///
	/// # Errors
	///
	/// Propagates any error returned by `state_builder` or by building one of
	/// the alternatives.
	fn build_nfa_from<S: StateBuilder<T, Q, C>>(
		&self,
		state_builder: &mut S,
		nfa: &mut NFA<Q, T>,
		tags: &mut Tags<Q, CaptureTag>,
		class: &C,
	) -> Result<(Q, C::Map<Q>), S::Error> {
		// A lone alternative needs no fork/join scaffolding around it.
		if let [only] = self.0.as_slice() {
			return only.build_nfa_from(state_builder, nfa, tags, class);
		}

		// Zero or several alternatives: fork from a common entry state. With
		// zero alternatives the loop below simply never runs.
		let entry = state_builder.next_state(nfa, class.clone())?;
		let mut exits: C::Map<Q> = Default::default();

		for branch in &self.0 {
			let (branch_entry, branch_exits) =
				branch.build_nfa_from(state_builder, nfa, tags, class)?;
			nfa.add(entry, None, branch_entry);

			for (exit_class, branch_exit) in branch_exits.into_entries() {
				// Reuse the shared exit for this class, creating it on first use.
				let shared_exit = *exits.get_or_try_insert_with(&exit_class, || {
					state_builder.next_state(nfa, exit_class.clone())
				})?;

				nfa.add(branch_exit, None, shared_exit);
			}
		}

		Ok((entry, exits))
	}
}