1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
use std::fmt::Debug;
use anyhow::Result;
use bitflags::bitflags;
pub use generic_matcher::GenericMatcher;
pub use multi_eps_matcher::{MultiEpsMatcher, MultiEpsMatcherFlags};
pub use sorted_matcher::SortedMatcher;
use crate::fst_traits::ExpandedFst;
use crate::semirings::Semiring;
use crate::{Label, StateId};
use crate::{Tr, EPS_LABEL, NO_LABEL};
use std::sync::Arc;
mod generic_matcher;
mod multi_eps_matcher;
mod sorted_matcher;
bitflags! {
    /// Bit set returned by `Matcher::flags`.
    ///
    /// Bits 1 to 3 are not assigned to any flag in this definition.
    /// NOTE(review): the flag names appear to mirror the OpenFst matcher /
    /// look-ahead flags; per-flag semantics are not visible here — confirm.
    pub struct MatcherFlags: u32 {
        /// Bit 0.
        const REQUIRE_MATCH = 0x0001;
        /// Bit 4.
        const INPUT_LOOKAHEAD_MATCHER = 0x0010;
        /// Bit 5.
        const OUTPUT_LOOKAHEAD_MATCHER = 0x0020;
        /// Bit 6.
        const LOOKAHEAD_WEIGHT = 0x0040;
        /// Bit 7.
        const LOOKAHEAD_PREFIX = 0x0080;
        /// Bit 8.
        const LOOKAHEAD_NON_EPSILONS = 0x0100;
        /// Bit 9.
        const LOOKAHEAD_EPSILONS = 0x0200;
        /// Bit 10.
        const LOOKAHEAD_NON_EPSILON_PREFIX = 0x0400;

        /// Union of every look-ahead related flag (bits 4 through 10).
        const LOOKAHEAD_FLAGS = Self::INPUT_LOOKAHEAD_MATCHER.bits
            | Self::OUTPUT_LOOKAHEAD_MATCHER.bits
            | Self::LOOKAHEAD_WEIGHT.bits
            | Self::LOOKAHEAD_PREFIX.bits
            | Self::LOOKAHEAD_NON_EPSILONS.bits
            | Self::LOOKAHEAD_EPSILONS.bits
            | Self::LOOKAHEAD_NON_EPSILON_PREFIX.bits;

        /// Input-side look-ahead mask: the input matcher bit plus the weight,
        /// prefix, epsilons and non-epsilon-prefix bits. It deliberately omits
        /// `OUTPUT_LOOKAHEAD_MATCHER` and `LOOKAHEAD_NON_EPSILONS`.
        const ILABEL_LOOKAHEAD_FLAGS = Self::INPUT_LOOKAHEAD_MATCHER.bits
            | Self::LOOKAHEAD_WEIGHT.bits
            | Self::LOOKAHEAD_PREFIX.bits
            | Self::LOOKAHEAD_EPSILONS.bits
            | Self::LOOKAHEAD_NON_EPSILON_PREFIX.bits;

        /// Output-side look-ahead mask: the output matcher bit plus the weight,
        /// prefix, epsilons and non-epsilon-prefix bits. It deliberately omits
        /// `INPUT_LOOKAHEAD_MATCHER` and `LOOKAHEAD_NON_EPSILONS`.
        const OLABEL_LOOKAHEAD_FLAGS = Self::OUTPUT_LOOKAHEAD_MATCHER.bits
            | Self::LOOKAHEAD_WEIGHT.bits
            | Self::LOOKAHEAD_PREFIX.bits
            | Self::LOOKAHEAD_EPSILONS.bits
            | Self::LOOKAHEAD_NON_EPSILON_PREFIX.bits;
    }
}
/// Largest representable priority value (`usize::MAX`).
///
/// NOTE(review): presumably returned by `Matcher::priority` to signal that a
/// matcher must be used — confirm against the callers.
pub static REQUIRE_PRIORITY: usize = usize::MAX;
/// Kind of matching a matcher performs.
///
/// The declaration order of the variants is significant: the derived
/// `PartialOrd` compares variants by that order, so it must not be changed.
///
/// `Eq` is derived alongside `PartialEq` because equality on this fieldless
/// enum is total; this lets the type satisfy `Eq` bounds.
///
/// NOTE(review): per-variant meanings below are inferred from the names and
/// from `eps_loop`, which only accepts `MatchInput` and `MatchOutput` — confirm.
#[derive(Copy, Clone, Debug, PartialEq, Eq, PartialOrd)]
pub enum MatchType {
    /// Presumably: match on the input side of transitions.
    MatchInput,
    /// Presumably: match on the output side of transitions.
    MatchOutput,
    /// Presumably: match on both sides.
    MatchBoth,
    /// Presumably: no matching is performed.
    MatchNone,
    /// Presumably: the match type has not been determined.
    MatchUnknown,
}
/// Item produced by a matcher iterator (see `Matcher::Iter`).
///
/// An item is either a concrete transition or a placeholder for an epsilon
/// loop; `into_tr` turns either form into a `Tr<W>`.
#[derive(Clone)]
pub enum IterItemMatcher<W: Semiring> {
/// A concrete transition.
Tr(Tr<W>),
/// Placeholder for an epsilon loop; the actual transition is only built on
/// demand by `eps_loop`, given a state and a match type.
EpsLoop,
}
impl<W: Semiring> IterItemMatcher<W> {
    /// Consumes the item and converts it into a concrete transition.
    ///
    /// A `Tr` item is returned unchanged. An `EpsLoop` item is materialised by
    /// calling `eps_loop(state, match_type)`; `state` and `match_type` are
    /// ignored for `Tr` items.
    ///
    /// # Errors
    ///
    /// Propagates the error from `eps_loop` when the item is `EpsLoop` and
    /// `match_type` is not supported by it.
    pub fn into_tr(self, state: StateId, match_type: MatchType) -> Result<Tr<W>> {
        match self {
            Self::EpsLoop => eps_loop(state, match_type),
            Self::Tr(concrete) => Ok(concrete),
        }
    }
}
/// Builds the epsilon-loop transition for `state`.
///
/// The transition carries weight `W::one()` and receives `state` as the last
/// argument of `Tr::new`. Its two labels depend on `match_type`:
///
/// * `MatchInput`  -> `(NO_LABEL, EPS_LABEL)`
/// * `MatchOutput` -> `(EPS_LABEL, NO_LABEL)`
///
/// NOTE(review): assumes `Tr::new` takes `(ilabel, olabel, weight, nextstate)`
/// in that order — confirm against `Tr`.
///
/// # Errors
///
/// Returns an error for `MatchBoth`, `MatchNone` and `MatchUnknown`.
pub fn eps_loop<W: Semiring>(state: StateId, match_type: MatchType) -> Result<Tr<W>> {
    // Only the label pair differs between the supported match types, so pick
    // it first and build the transition once.
    let (ilabel, olabel) = match match_type {
        MatchType::MatchInput => (NO_LABEL, EPS_LABEL),
        MatchType::MatchOutput => (EPS_LABEL, NO_LABEL),
        MatchType::MatchBoth | MatchType::MatchNone | MatchType::MatchUnknown => {
            bail!("Unsupported match_type : {:?}", match_type)
        }
    };
    Ok(Tr::new(ilabel, olabel, W::one(), state))
}
/// Interface implemented by every matcher over an FST with weights in `W`.
///
/// Implementors must be `Debug` and `Clone`. A matcher is built from a shared
/// (`Arc`) FST and exposes iteration over `IterItemMatcher` items for a given
/// state and label.
pub trait Matcher<W: Semiring>: Debug + Clone {
    /// Type of the FST this matcher works on.
    type F: ExpandedFst<W>;

    /// Iterator type returned by `iter`; it must be cloneable.
    type Iter: Iterator<Item = IterItemMatcher<W>> + Clone;

    /// Creates a matcher over `fst` for the requested `match_type`.
    ///
    /// # Errors
    ///
    /// Implementation-defined; returns an error when the matcher cannot be
    /// constructed.
    fn new(fst: Arc<Self::F>, match_type: MatchType) -> Result<Self>
    where
        Self: Sized;

    /// Returns an iterator over the items found for `label` at `state`.
    fn iter(&self, state: StateId, label: Label) -> Result<Self::Iter>;

    /// Returns the final weight of `state`, or `None` when there is none.
    fn final_weight(&self, state: StateId) -> Result<Option<W>>;

    /// Returns the match type of this matcher.
    ///
    /// NOTE(review): the meaning of `test` is not visible here; presumably it
    /// allows the implementation to run checks to determine the type — confirm.
    fn match_type(&self, test: bool) -> Result<MatchType>;

    /// Returns the flags describing this matcher.
    fn flags(&self) -> MatcherFlags;

    /// Returns the priority of this matcher at `state`.
    ///
    /// NOTE(review): presumably `REQUIRE_PRIORITY` is a special value here —
    /// confirm against implementors.
    fn priority(&self, state: StateId) -> Result<usize>;

    /// Returns the shared FST this matcher was built on.
    fn fst(&self) -> &Arc<Self::F>;
}