1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
use std::convert::TryFrom;

use crate::{shared::NomErrorReason, take_uint, IResult, NomErr};
use nom::{bytes::complete::take, character::complete::char, combinator::map_res, sequence::tuple};
use serde::{Deserialize, Serialize};
use thiserror::Error;

// Note: the radical letter is modelled by the `ShRadical` enum defined in this file.

/// Spahn & Hadamitzky descriptor code for a kanji, as found in the Kanji Dictionary (KANJIDIC).
/// The code reference can be found here: <http://www.edrdg.org/wiki/index.php/KANJIDIC_Project>
///
/// The textual form parsed by this module is
/// `<radical_strokes><radical><other_strokes>.<sequence>`, i.e. a number, one
/// radical letter, a number, a literal `.` and a final number.
///
/// When (de)serialized with serde the field names use camelCase.
#[derive(Debug, PartialEq, Eq, Clone, Copy, PartialOrd, Ord, Hash, Serialize, Deserialize)]
#[serde(rename_all = "camelCase")]
pub struct ShDesc {
    /// Number of strokes in the identifying radical.
    pub radical_strokes: u8,
    /// The letter for the radical in the identification system.
    pub radical: ShRadical,
    /// The number of strokes not included in the radical.
    pub other_strokes: u8,
    /// The position of the kanji in the sequence described
    /// by the other descriptor parts.
    pub sequence: u8,
}

/// An identifying radical in the Spahn and Hadamitzky classification system.
///
/// Each variant corresponds to one letter of the descriptor text; the
/// `TryFrom<char>` implementation maps the lowercase letters `a`..=`z` onto
/// `A`..=`Z`. With serde, variants are (de)serialized as their lowercase name.
///
/// The declaration order is significant: the derived `PartialOrd`/`Ord`
/// compare variants in the order they are listed here.
#[derive(Debug, PartialEq, Eq, Clone, Copy, PartialOrd, Ord, Hash, Serialize, Deserialize)]
#[serde(rename_all = "lowercase")]
pub enum ShRadical {
    A,
    B,
    C,
    D,
    E,
    F,
    G,
    H,
    I,
    J,
    K,
    L,
    M,
    N,
    O,
    P,
    Q,
    R,
    S,
    T,
    U,
    V,
    W,
    X,
    Y,
    Z,
}

/// Error returned when a character cannot be converted into an [`ShRadical`].
#[derive(Debug, Error, PartialEq, Eq)]
pub enum ShRadicalParseError {
    /// The character is not one of the lowercase letters `a`..=`z`.
    #[error("(ShRadical) Unknown radical")]
    UnknownChar,
}

impl TryFrom<char> for ShRadical {
    type Error = ShRadicalParseError;

    /// Converts a lowercase ASCII letter into the matching radical.
    ///
    /// # Errors
    ///
    /// Returns [`ShRadicalParseError::UnknownChar`] for any character other
    /// than `a`..=`z` (uppercase letters included).
    fn try_from(value: char) -> Result<Self, Self::Error> {
        // Radicals ordered by letter, so the offset from 'a' is the index.
        const BY_LETTER: [ShRadical; 26] = [
            ShRadical::A,
            ShRadical::B,
            ShRadical::C,
            ShRadical::D,
            ShRadical::E,
            ShRadical::F,
            ShRadical::G,
            ShRadical::H,
            ShRadical::I,
            ShRadical::J,
            ShRadical::K,
            ShRadical::L,
            ShRadical::M,
            ShRadical::N,
            ShRadical::O,
            ShRadical::P,
            ShRadical::Q,
            ShRadical::R,
            ShRadical::S,
            ShRadical::T,
            ShRadical::U,
            ShRadical::V,
            ShRadical::W,
            ShRadical::X,
            ShRadical::Y,
            ShRadical::Z,
        ];

        if !value.is_ascii_lowercase() {
            return Err(ShRadicalParseError::UnknownChar);
        }

        // `value` is within 'a'..='z' here, so the offset is always 0..=25.
        let offset = usize::from(value as u8 - b'a');
        Ok(BY_LETTER[offset])
    }
}

/// Error returned when text cannot be parsed into an [`ShDesc`].
#[derive(Debug, Error, PartialEq, Eq, Clone)]
pub enum ShParseError {
    /// The text did not match the descriptor format; carries the reason
    /// converted from the underlying parser error.
    #[error("(Spahn Hadamitzky) Format: {0}")]
    Format(NomErrorReason),
}

impl<'a> From<NomErr<'a>> for ShParseError {
    fn from(err: NomErr<'a>) -> Self {
        Self::Format(err.into())
    }
}

impl TryFrom<&str> for ShDesc {
    type Error = ShParseError;

    fn try_from(text: &str) -> Result<Self, Self::Error> {
        let (_i, (radical_strokes, radical, other_strokes, _, sequence)) = parts(text)?;
        Ok(Self {
            radical_strokes,
            radical,
            other_strokes,
            sequence,
        })
    }
}

/// Splits a descriptor into its raw components, in order: radical stroke
/// count, radical letter, remaining stroke count, the `.` separator and the
/// sequence number.
fn parts(s: &str) -> IResult<(u8, ShRadical, u8, char, u8)> {
    let separator = char('.');
    tuple((take_uint, radical, take_uint, separator, take_uint))(s)
}

/// Parses the single radical letter of a descriptor.
///
/// Takes one character from the input and converts it with
/// `ShRadical::try_from`; a character that is not a valid radical letter makes
/// the parser fail instead of producing a value.
fn radical(s: &str) -> IResult<ShRadical> {
    map_res(take(1u8), |letter: &str| {
        // `take(1)` should always hand over one character. Should the slice
        // ever be empty, fall back to NUL, which is not a radical letter, so
        // the conversion reports `UnknownChar` rather than panicking.
        ShRadical::try_from(letter.chars().next().unwrap_or('\0'))
    })(s)
}