pub fn new_with_options(lang_config: &InfiLanguageConfig) -> Tokenizer