vn-nlp 0.1.3

Vietnamese NLP library — tokenization, normalization, segmentation
Documentation
1
2
3
4
5
6
7
8
9
10
11
12
13
14
use vn_nlp::normalize;

/// Example entry point: prints two sample Vietnamese strings next to the
/// results of `normalize` and `normalize::strip_diacritics`.
fn main() {
    // Sample with leading, trailing and repeated inner spaces.
    // NOTE(review): presumably `normalize` tidies this whitespace — confirm
    // against the crate documentation.
    let text = "  Xin   chào   Việt   Nam  ";
    println!("Input:      \"{text}\"");
    let normalized = normalize(text);
    println!("Normalized: \"{}\"", normalized);

    // Sample containing Vietnamese diacritics; the result is labelled
    // "No accents" in the printed output.
    let vn = "Tiếng Việt rất đẹp";
    println!("\nInput:      \"{vn}\"");
    let without_accents = vn_nlp::normalize::strip_diacritics(vn);
    println!("No accents: \"{}\"", without_accents);
}