wordchipper 0.9.2

HPC Rust LLM Tokenizer Library
Documentation
//! # Text Segmentation
//!
//! This module exists to factor out text spanners scanning.
//!
//! [`TextSpanningConfig`] describes the declarative needs of a tokenizer:
//! * `pattern` - the word/span split pattern.
//! * `specials` - a map of `{ Vec<u8> -> T }` special tokens to handle
//!   out-of-band.
//!
//! Most users will want to use the [`TextSpannerBuilder`] to construct a
//! [`TextSpanner`].

pub mod span_lexers;

mod spanner_builder;
mod spanning_config;
mod text_spanner;

#[doc(inline)]
pub use spanner_builder::*;
#[doc(inline)]
pub use spanning_config::*;
#[doc(inline)]
pub use text_spanner::*;