lexgen 0.16.0

A fully-featured lexer generator implemented as a proc macro
Documentation
use super::{State, StateIdx, DFA};
use crate::collections::Map;
use crate::nfa::AcceptingState;

#[derive(Debug)]
pub enum Trans<A> {
    Accept(Vec<AcceptingState<A>>),
    Trans(StateIdx),
}

/// Removes accepting states with no transitions, makes the transitions to those states accepting.
pub fn simplify<K, A: Clone>(
    dfa: DFA<StateIdx, A>,
    dfa_state_indices: &mut Map<K, StateIdx>,
) -> DFA<Trans<A>, A> {
    let mut empty_states: Vec<(StateIdx, Vec<AcceptingState<A>>)> = vec![];

    let mut non_empty_states: Vec<(StateIdx, State<StateIdx, A>)> = vec![];

    for (state_idx, state) in dfa.into_state_indices() {
        if state.has_no_transitions() && !state.initial {
            empty_states.push((state_idx, state.accepting));
        } else {
            non_empty_states.push((state_idx, state));
        }
    }

    for (_, t) in dfa_state_indices.iter_mut() {
        let idx = match empty_states.binary_search_by(|(state_idx, _)| state_idx.cmp(t)) {
            Ok(idx) | Err(idx) => idx,
        };
        *t = t.map(|i| i - idx);
    }

    let map_transition = |t: StateIdx| -> Trans<A> {
        match empty_states.binary_search_by(|(state_idx, _action)| state_idx.cmp(&t)) {
            Ok(idx) => Trans::Accept(empty_states[idx].1.clone()),
            Err(idx) => Trans::Trans(t.map(|i| i - idx)),
        }
    };

    let new_states: Vec<State<Trans<A>, A>> = non_empty_states
        .into_iter()
        .map(|(_state_idx, state)| {
            let State {
                initial,
                char_transitions,
                range_transitions,
                any_transition,
                end_of_input_transition,
                accepting,
                predecessors,
                backtrack,
            } = state;

            let char_transitions = char_transitions
                .into_iter()
                .map(|(char, next)| (char, map_transition(next)))
                .collect();

            let range_transitions = range_transitions.map(map_transition);

            let any_transition = any_transition.map(map_transition);

            let end_of_input_transition = end_of_input_transition.map(map_transition);

            let predecessors = predecessors
                .into_iter()
                .map(|pred| match map_transition(pred) {
                    Trans::Trans(pred) => pred,
                    _ => {
                        // This pass should only remove nodes without successors, so it's a bug if
                        // we remove a predecessor
                        panic!("Predecessor of a state is removed in simplification")
                    }
                })
                .collect();

            State {
                initial,
                char_transitions,
                range_transitions,
                any_transition,
                end_of_input_transition,
                accepting,
                predecessors,
                backtrack,
            }
        })
        .collect();

    DFA::from_states(new_states)
}