# Workspace layout: the root crate (".") plus the sub-packages that live
# under packages/.
[workspace]
members = [
    ".",
    "packages/python",
    "packages/wasm",
]

# Metadata for the root crate. Keys follow the usual Cargo ordering: name and
# version first, the remaining keys alphabetically, description last.
[package]
name = "chunk"
version = "0.9.2"
categories = ["text-processing", "algorithms"]
edition = "2024"
# Paths left out of the packaged crate: benchmark data, the workspace
# sub-packages, assets, scripts and image files.
exclude = [
    "benches/data/*",
    "packages/*",
    "assets/*",
    "scripts/*",
    "*.png",
    "*.svg",
]
keywords = ["chunking", "text", "simd", "nlp", "tokenization"]
license = "MIT OR Apache-2.0"
readme = "README.md"
repository = "https://github.com/chonkie-inc/chunk"
description = "The fastest semantic text chunking library — up to 1TB/s chunking throughput"

# Runtime dependencies, sorted alphabetically. A bare version string is a
# caret requirement, e.g. "2" accepts any semver-compatible 2.x release.
[dependencies]
daggrs = "0.1"
memchr = "2"

# Dependencies used only by tests, examples and benchmarks, sorted
# alphabetically. `kiru` and `text-splitter` share their names with bench
# targets declared in this manifest.
[dev-dependencies]
criterion = "0.5"
kiru = "0.1"
text-splitter = "0.18"

# Benchmark target `chunk`. `harness = false` turns off the built-in libtest
# bench harness, so the benchmark source must supply its own `main`
# (presumably via the criterion dev-dependency — confirm in the bench source).
[[bench]]
name = "chunk"
harness = false
# Benchmark target `kiru`, run without the built-in libtest harness.
# NOTE(review): presumably a comparison benchmark against the `kiru`
# dev-dependency — confirm in the bench source.
[[bench]]
name = "kiru"
harness = false
# Benchmark target `text_splitter`, run without the built-in libtest harness.
# NOTE(review): presumably a comparison benchmark against the `text-splitter`
# dev-dependency — confirm in the bench source.
[[bench]]
name = "text_splitter"
harness = false