# riptoken 0.2.3
#
# Fast BPE tokenizer for LLMs — a faster, drop-in compatible reimplementation of tiktoken
# Documentation: https://docs.rs/riptoken
# Crate metadata. `name` and `version` lead; the remaining keys are
# alphabetical, with `description` last.
[package]
name = "riptoken"
version = "0.2.3"
authors = ["Dae Choi <daechoi70@gmail.com>"]
categories = ["text-processing", "science", "parser-implementations"]
documentation = "https://docs.rs/riptoken"
edition = "2024"
# Paths kept out of the packaged crate.
exclude = ["*.tiktoken", ".venv/", "dist/", "tests/python/", "scripts/"]
homepage = "https://github.com/daechoi/riptoken"
keywords = ["tokenizer", "bpe", "llm", "tiktoken", "nlp"]
license = "MIT"
readme = "README.md"
repository = "https://github.com/daechoi/riptoken"
# Minimum supported Rust toolchain.
rust-version = "1.85"
description = "Fast BPE tokenizer for LLMs — a faster, drop-in compatible reimplementation of tiktoken"

# Library target. Two artifact kinds are requested: `rlib` (a Rust library
# for other crates to link against) and `cdylib` (a C-ABI dynamic library).
# NOTE(review): the `cdylib` is presumably what the optional `python`
# feature's extension module is loaded from — confirm against the build setup.
[lib]
name = "riptoken"
crate-type = ["rlib", "cdylib"]

# Cargo features. Nothing is enabled by default.
[features]
default = []
# Opt-in: pulls in the optional `pyo3` dependency.
python = ["dep:pyo3"]

# Runtime dependencies, sorted alphabetically.
[dependencies]
fancy-regex = "0.17"
# Optional; only compiled in when the `python` feature is enabled.
pyo3 = { version = "0.27.2", default-features = false, features = ["extension-module", "macros"], optional = true }
rayon = "1.10"
regex = "1.11"
rustc-hash = "2"

# Dependencies used only by tests, examples, and benchmarks; they are not
# part of the library's normal dependency set.
[dev-dependencies]
base64 = "0.22"

# Benchmark target named `bpe`.
# NOTE(review): with no explicit `path`, Cargo should resolve this to
# `benches/bpe.rs` — confirm the file exists.
[[bench]]
name = "bpe"
# Turn off the built-in libtest harness so the benchmark supplies its own
# `main` (typical for external benchmarking frameworks).
harness = false

# Optimized build used for `--release`: maximum optimization level, "fat"
# link-time optimization, a single codegen unit, and stripped output.
[profile.release]
opt-level = 3
lto = "fat"
codegen-units = 1
strip = true

# Variant of `release` for profilers: same settings, but debug info is
# emitted (`debug = 2`) and stripping is turned off so it is kept.
# Select it with `--profile profiling`.
[profile.profiling]
inherits = "release"
strip = false
debug = 2