Skip to main content

Crate splintr

Crate splintr 

Source

Re-exports

pub use core::ByteLevelStreamingDecoder;
pub use core::SentencePieceError;
pub use core::SentencePieceTokenizer;
pub use core::StreamingDecoder;
pub use core::Tokenize;
pub use core::TokenizeError;
pub use core::Tokenizer;
pub use core::TokenizerError;
pub use core::WordPieceTokenizer;
pub use core::CL100K_BASE_PATTERN;
pub use core::GPT2_PATTERN;
pub use core::LLAMA3_PATTERN;
pub use core::O200K_BASE_PATTERN;
pub use core::SENTENCEPIECE_PATTERN;
pub use core::pretrained;
pub use core::whisper;
pub use core::bos_token_id;
pub use core::bos_token_id_by_name;
pub use core::cl100k_base_special_tokens;
pub use core::deepseek_v3_special_tokens;
pub use core::eos_token_id;
pub use core::eos_token_id_by_name;
pub use core::from_pretrained;
pub use core::from_vocab;
pub use core::llama3_special_tokens;
pub use core::o200k_base_special_tokens;
pub use core::pad_token_id;
pub use core::pattern;
pub use core::special_tokens;
pub use core::uses_byte_level;
pub use core::PretrainedVocab;
pub use core::whisper_special_tokens;
pub use core::WhisperVariant;
pub use core::from_json_bytes;
pub use core::from_json_path;
pub use core::AnyTokenizer;
pub use core::Backend;
pub use core::HfJsonError;
pub use core::PostProcessor;

Modules

core
Core tokenization engine for splintr.