use parsitext::Parsitext;
/// Runs a sample sentence through a default `Parsitext` instance and prints
/// what came out.
///
/// The sample contains Latin digits (`1.5`) and a word with a letter repeated
/// several times in a row. After printing the `original` and `normalized`
/// fields of the processing result, three yes/no checks on the normalized
/// text are reported, followed by the output of `tokenize_only` on the same
/// input.
fn main() {
    let pt = Parsitext::default();
    let sample = "سلام داداش، چطوري؟ قيمتش حدود 1.5 میلیون تومنه، خيليييي گرونه!";
    let outcome = pt.process(sample);

    println!("Original : {}", outcome.original);
    println!("Normalized: {}", outcome.normalized);
    println!();

    // Character-presence checks on the normalized text.
    let has_persian_yeh = outcome.normalized.contains('ی');
    println!("Contains Persian yeh (ی): {}", has_persian_yeh);

    let has_persian_digit = outcome.normalized.contains('۱');
    println!("Contains Persian digit (۱): {}", has_persian_digit);

    // Slide a 3-wide window over the characters (not bytes) and look for any
    // window whose three characters are all identical.
    let normalized_chars = outcome.normalized.chars().collect::<Vec<_>>();
    let has_triple_run = normalized_chars
        .windows(3)
        .any(|run| run[0] == run[1] && run[1] == run[2]);
    println!(
        "Emphatic repetition reduced (no 3-in-a-row): {}",
        !has_triple_run
    );
    println!();

    // Tokenization is run on the raw sample, not on the normalized text.
    let tokens = pt.tokenize_only(sample);
    println!("Token count: {}", tokens.len());
    println!("Tokens : {:?}", tokens);
}