iregex/ir/
atom.rs

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
use std::hash::Hash;

use iregex_automata::{
	nfa::{BuildNFA, StateBuilder, Tags},
	Class, Map, RangeSet, Token, NFA,
};

use crate::{Boundary, CaptureTag};

use super::{Alternation, CaptureGroupId, Repeat};

#[derive(Debug, Clone)]
pub enum Atom<T = char, B = ()> {
	/// Boundary.
	Boundary(B),

	/// Token.
	Token(RangeSet<T>),

	/// Repetition.
	Repeat(Alternation<T, B>, Repeat),

	/// Capture group.
	Capture(CaptureGroupId, Alternation<T, B>),
}

impl<T, B> Atom<T, B> {
	pub fn alternation(alt: Alternation<T, B>) -> Self {
		Self::Repeat(alt, Repeat::ONCE)
	}

	pub fn star(inner: Alternation<T, B>) -> Self {
		Self::Repeat(inner, Repeat::STAR)
	}
}

impl<T, B, Q, C> BuildNFA<T, Q, C, CaptureTag> for Atom<T, B>
where
	T: Token,
	B: Boundary<T, Class = C>,
	Q: Copy + Ord,
	C: Clone + Eq + Hash + Class<T>,
{
	fn build_nfa_from<S: StateBuilder<T, Q, C>>(
		&self,
		state_builder: &mut S,
		nfa: &mut NFA<Q, T>,
		tags: &mut Tags<Q, CaptureTag>,
		class: &B::Class,
	) -> Result<(Q, C::Map<Q>), S::Error> {
		match self {
			Self::Boundary(boundary) => {
				let a = state_builder.next_state(nfa, class.clone())?;
				let mut output: C::Map<Q> = Default::default();
				if let Some(b_class) = boundary.apply(class) {
					let b = state_builder.next_state(nfa, b_class.clone())?;
					output.set(b_class, b);
				}
				Ok((a, output))
			}
			Self::Token(set) => {
				let a = state_builder.next_state(nfa, class.clone())?;
				let mut output: C::Map<Q> = Default::default();
				for (b_class, set) in class.classify(set).into_entries() {
					let b = state_builder.next_state(nfa, b_class.clone())?;
					nfa.add(a, Some(set.into_owned()), b);
					output.set(b_class, b);
				}

				Ok((a, output))
			}
			Self::Repeat(alt, r) => r.build_nfa_for(alt, state_builder, nfa, tags, class),
			Self::Capture(_, alt) => alt.build_nfa_from(state_builder, nfa, tags, class),
		}
	}
}