# Crate metadata. Ordering follows the Cargo convention: name and version
# first, remaining keys alphabetical, description last.
[package]
name = "code-chunker"
version = "0.2.0"
authors = ["Arc <attobop@gmail.com>"]
categories = ["text-processing"]
edition = "2021"
# crates.io accepts at most five keywords; this list is at the limit.
keywords = ["chunking", "rag", "code", "tree-sitter", "embedding"]
license = "MIT OR Apache-2.0"
repository = "https://github.com/arclabs561/code-chunker"
# Minimum supported Rust version.
rust-version = "1.81"
description = "AST-aware code chunking and late chunking for RAG"

# Empty workspace table: makes this manifest the root of its own workspace,
# with no members or shared settings listed.
# NOTE(review): presumably here so the crate builds standalone even when its
# directory sits inside another workspace — confirm before removing.
[workspace]

# Runtime dependencies, sorted alphabetically. Everything marked `optional`
# is only compiled when a feature in [features] turns it on.
[dependencies]
# Enabled by the `serde` feature.
serde = { version = "1", features = ["derive"], optional = true }
thiserror = "2.0"
# tree-sitter runtime and language grammars; all enabled together by the
# `code` feature.
tree-sitter = { version = "0.24", optional = true }
tree-sitter-go = { version = "0.23", optional = true }
tree-sitter-python = { version = "0.23", optional = true }
tree-sitter-rust = { version = "0.23", optional = true }
tree-sitter-typescript = { version = "0.23", optional = true }
# Explicit range: accepts 1.11.x and 1.12.x, rejects 1.13 and later.
# NOTE(review): the reason for the upper bound is not recorded here
# (possibly an MSRV constraint) — confirm before widening.
unicode-segmentation = ">=1.11, <1.13"

# Opt-in functionality. The `dep:` prefix refers to an optional dependency
# without creating an implicit feature named after it.
[features]
# Nothing is enabled by default.
default = []
# Enables the tree-sitter runtime plus the Go, Python, Rust, and TypeScript
# grammar crates.
code = [
    "dep:tree-sitter",
    "dep:tree-sitter-go",
    "dep:tree-sitter-python",
    "dep:tree-sitter-rust",
    "dep:tree-sitter-typescript",
]
# Enables the optional `serde` dependency (declared with its `derive` feature).
serde = ["dep:serde"]

# Dependencies used only when building tests, examples, and benchmarks;
# they are not passed on to crates that depend on this one.
[dev-dependencies]
proptest = "1.9"

# Example target gated on the `code` feature: Cargo skips it unless that
# feature is enabled, e.g.
#   cargo run --example code_chunking --features code
[[example]]
name = "code_chunking"
required-features = ["code"]