1
 2
 3
 4
 5
 6
 7
 8
 9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
// Copyright (c) 2016-2020 Fabian Schuiki

use moore_common::errors::DiagBuilder2;
use moore_common::grind::Grinder;

/// A grinder that categorizes characters into different groups as per the VHDL
/// language standard.
pub struct Categorizer<T> {
    inner: T,
}

impl<T> Categorizer<T>
where
    T: Grinder<Item = Option<(usize, char, u8)>, Error = DiagBuilder2>,
{
    /// Create a new categorizer.
    pub fn new(inner: T) -> Categorizer<T> {
        Categorizer { inner: inner }
    }
}

impl<T> Grinder for Categorizer<T>
where
    T: Grinder<Item = Option<(usize, char, u8)>, Error = DiagBuilder2>,
{
    type Item = Option<(usize, char, u8, Category)>;
    type Error = DiagBuilder2;

    fn emit(&mut self, err: Self::Error) {
        self.inner.emit(err);
    }

    fn next(&mut self) -> Self::Item {
        let (offset, c, sz) = match self.inner.next() {
            Some(v) => v,
            None => return None,
        };
        let cat = match c {
            '"' | '#' | '&' | '\'' | '(' | ')' | '*' | '+' | ',' | '-' | '.' | '/' | ':' | ';'
            | '<' | '=' | '>' | '?' | '@' | '[' | ']' | '_' | '`' | '|' => Category::Special,
            c if c.is_alphabetic() => Category::Letter,
            c if c.is_digit(10) => Category::Digit,
            c if c.is_whitespace() => Category::Space,
            _ => Category::Other,
        };
        Some((offset, c, sz, cat))
    }
}

/// A character category. Special means the special characters as defined by the
/// VHDL standard to be meaningful syntactically.
#[derive(Copy, Clone, PartialEq, Eq, Debug)]
pub enum Category {
    Letter,
    Digit,
    Special,
    Space,
    Other,
}