# Runtime dependencies.
[dependencies]
# Optional: switched on only through the `parallelism` feature (`dep:rayon`).
rayon = { version = "1.11.0", optional = true }
thiserror = "2.0.17"
# Development-only dependencies; none of these are part of the library's
# normal dependency set declared under `dependencies`.
[dev-dependencies]
deunicode = "1.6.2"
hash32 = "1.0.0"
lazy_static = "1.5.0"
regex = "1.11.3"
rust-stemmers = "1.2.0"
stop-words = { version = "0.9.0", features = ["nltk"] }
unicode-segmentation = "1.12.0"
[features]
# Opt-in feature that enables the optional `rayon` dependency. The `dep:`
# prefix names the dependency itself rather than a feature called `rayon`.
parallelism = ["dep:rayon"]
# Library target, declared explicitly (the package sets `autolib = false`).
# The crate name uses an underscore where the package name uses a hyphen.
[lib]
name = "bm25_vectorizer"
path = "src/lib.rs"
[package]
name = "bm25-vectorizer"
version = "1.0.0"
edition = "2021"
authors = ["Tristan Everitt <tristan.ecwhz@9epochs.com>"]
license = "MIT"
readme = "README.md"
repository = "https://github.com/ep9io/bm25-vectorizer"
categories = ["text-processing"]
keywords = ["bm25", "sparse", "embed", "search", "nlp"]
# Automatic target discovery and build-script detection are all disabled;
# the only target is the library listed explicitly under [lib].
autobenches = false
autobins = false
autoexamples = false
autolib = false
autotests = false
build = false
description = "A minimal Rust library for creating sparse vector representations (embeddings) using the BM25 algorithm for information retrieval."