jayce
jayce is a tokenizer 🌌
Example
use jayce::{duos, Tokenizer};
use regex::Regex;
const SOURCE: &str = "Excalibur = 5000$; // Your own language!";
lazy_static::lazy_static! (
static ref DUOS: Vec<(&'static str, Regex)> = duos![
"whitespace", r"^[^\S\n]+",
"comment_line", r"^//(.*)",
"comment_block", r"^/\*(.|\n)*?\*/",
"newline", r"^\n",
"price", r"^[0-9]+\$",
"semicolon", r"^;",
"operator", r"^=",
"name", r"^[a-zA-Z_]+"
];
);
fn main() -> Result<(), Box<dyn std::error::Error>> {
let mut tokenizer = Tokenizer::new(SOURCE, &DUOS);
while let Some(token) = tokenizer.next()? {
println!("{:?}", token);
}
Ok(())
}
Result
Token { kind: "name", value: "Excalibur", pos: (1, 1) }
Token { kind: "whitespace", value: " ", pos: (1, 10) }
Token { kind: "operator", value: "=", pos: (1, 11) }
Token { kind: "whitespace", value: " ", pos: (1, 12) }
Token { kind: "price", value: "5000$", pos: (1, 13) }
Token { kind: "semicolon", value: ";", pos: (1, 18) }
Token { kind: "whitespace", value: " ", pos: (1, 19) }
Token { kind: "comment_line", value: "// Your own language!", pos: (1, 20) }
Info
next possible Result
Ok(Some(token)) Match is found
Ok(None) End of source
Err(error) An error occurs
tokenize_all possible Result
Ok(Vec<Tokens>) Tokens are found
Err(error) An error occurs
Performances
tokenization of 29 639 rust language tokens
Features
serialization
generic-simd
runtime-dispatch-simd enabled by default, to disable modify Cargo.toml as follows
jayce = { version = "X.X.X", default-features = false }