# Benchmark targets.
# Every entry sets `harness = false`, so each bench source file provides its
# own entry point instead of relying on the built-in libtest harness.

[[bench]]
name = "ane_bench"
path = "benches/ane_bench.rs"
harness = false

[[bench]]
name = "attention_bench"
path = "benches/attention_bench.rs"
harness = false

[[bench]]
name = "e2e_bench"
path = "benches/e2e_bench.rs"
harness = false

[[bench]]
name = "lora_bench"
path = "benches/lora_bench.rs"
harness = false

[[bench]]
name = "matmul_bench"
path = "benches/matmul_bench.rs"
harness = false

[[bench]]
name = "metal_bench"
path = "benches/metal_bench.rs"
harness = false

[[bench]]
name = "norm_bench"
path = "benches/norm_bench.rs"
harness = false

[[bench]]
name = "rlm_bench"
path = "benches/rlm_bench.rs"
harness = false

[[bench]]
name = "rope_bench"
path = "benches/rope_bench.rs"
harness = false

[[bench]]
name = "ruvltra_benchmark"
path = "benches/ruvltra_benchmark.rs"
harness = false

[[bench]]
name = "serving_bench"
path = "benches/serving_bench.rs"
harness = false
# Runtime dependencies, sorted alphabetically.
# Entries marked `optional = true` are only compiled when a feature in
# `[features]` enables them.
[dependencies]
anyhow = "1.0"
async-trait = "0.1"
bincode = { version = "2.0.0-rc.3", features = ["serde"] }
candle-core = { version = "0.8", optional = true }
candle-nn = { version = "0.8", optional = true }
candle-transformers = { version = "0.8", optional = true }
chrono = { version = "0.4", features = ["serde"] }
dashmap = "6.1"
dirs = "5.0"
futures-core = "0.3"
half = "2.4"
hf-hub = { version = "0.3", features = ["tokio"], optional = true }
lru = "0.12"
md5 = "0.7"
memmap2 = { version = "0.9", optional = true }
ndarray = "0.16"
once_cell = "1.20"
parking_lot = "0.12"
rand = "0.8"
rayon = { version = "1.10", optional = true }
regex = "1.10"
ruvector-attention = { version = "0.1.31", optional = true }
ruvector-core = { version = "0.1.31", default-features = false, features = ["storage", "hnsw", "parallel", "simd"] }
ruvector-gnn = { version = "0.1.31", optional = true }
ruvector-graph = { version = "0.1.31", default-features = false, optional = true }
ruvector-sona = { version = "0.1.4", default-features = false, features = ["serde-support"] }
serde = { version = "1.0", features = ["derive", "rc"] }
serde_json = "1.0"
sha2 = "0.10"
smallvec = "1.13"
thiserror = "2.0"
tokenizers = { version = "0.20", default-features = false, features = ["onig"], optional = true }
tokio = { version = "1.41", features = ["rt-multi-thread", "sync", "macros"], optional = true }
tokio-stream = { version = "0.1", optional = true }
tracing = "0.1"

# Each feature is listed exactly once. Cargo treats the list as a set, so
# repeated entries add nothing and only obscure what is actually enabled.
# NOTE(review): "js" is enabled for every target here, not just wasm32 —
# confirm that is intended.
[dependencies.uuid]
version = "1.11"
features = ["v4", "serde", "js"]
# Dependencies used only when building tests, examples and benchmarks.
[dev-dependencies]
criterion = { version = "0.5", features = ["html_reports"] }
tempfile = "3.13"
tracing-subscriber = { version = "0.3", features = ["env-filter"] }

# Example targets, declared explicitly.

[[example]]
name = "benchmark_model"
path = "examples/benchmark_model.rs"

[[example]]
name = "download_test_model"
path = "examples/download_test_model.rs"

[[example]]
name = "generate_claude_dataset"
path = "examples/generate_claude_dataset.rs"

[[example]]
name = "hub_cli"
path = "examples/hub_cli.rs"

# Only built when the `async-runtime` feature is enabled.
[[example]]
name = "run_eval"
path = "examples/run_eval.rs"
required-features = ["async-runtime"]

[[example]]
name = "train_contrastive"
path = "examples/train_contrastive.rs"

[features]
# Feature sets: `default` applies unless `--no-default-features` is passed.
default = ["async-runtime", "candle"]
minimal = ["async-runtime"]

# Pulls in the optional `tokio` and `tokio-stream` dependencies.
async-runtime = ["tokio", "tokio-stream"]

# Candle stack plus the tokenizer and Hugging Face hub client.
candle = [
    "candle-core",
    "candle-nn",
    "candle-transformers",
    "tokenizers",
    "hf-hub",
]

# Accelerator backends forwarded to the Candle crates. Note that `metal`
# here is the Candle backend feature; the `metal` crate itself is enabled
# through `metal-compute`.
cuda = ["candle-core/cuda", "candle-nn/cuda", "candle-transformers/cuda"]
metal = ["candle-core/metal", "candle-nn/metal", "candle-transformers/metal"]

# Convenience bundles combining Candle with one backend.
inference-cuda = ["candle", "cuda"]
inference-metal = ["candle", "metal"]
inference-metal-native = ["candle", "metal", "metal-compute"]

# Native bindings enabled through optional dependencies.
metal-compute = ["dep:metal", "dep:objc"]
coreml = [
    "dep:objc2",
    "dep:objc2-foundation",
    "dep:objc2-core-ml",
    "dep:block2",
]
hybrid-ane = ["metal-compute", "coreml"]

# Optional Ruvector crates, individually and as a bundle.
attention = ["dep:ruvector-attention"]
gnn = ["dep:ruvector-gnn"]
graph = ["dep:ruvector-graph"]
ruvector-full = ["attention", "graph", "gnn"]

# Memory mapping and data parallelism.
mmap = ["dep:memmap2"]
gguf-mmap = ["mmap"]
parallel = ["dep:rayon"]

# RLM feature family; `rlm-wasm` additionally enables the wasm-bindgen stack.
rlm-core = []
rlm-full = ["rlm-core", "async-runtime"]
rlm-wasm = [
    "rlm-core",
    "wasm",
    "dep:wasm-bindgen",
    "dep:wasm-bindgen-futures",
    "dep:js-sys",
    "dep:web-sys",
]

# Flag-only features: they enable no dependencies or other features.
accelerate = []
wasm = []

# Library target: built as a plain Rust library (`rlib`) from `src/lib.rs`.
[lib]
name = "ruvllm"
path = "src/lib.rs"
crate-type = ["rlib"]

[package]
name = "ruvllm"
version = "2.0.1"
authors = ["Ruvector Team"]
edition = "2021"
rust-version = "1.77"
license = "MIT"
readme = "README.md"
repository = "https://github.com/ruvnet/ruvector"
# Target auto-discovery is switched off: the library, benches, examples and
# tests are all declared explicitly in this manifest.
autobenches = false
autobins = false
autoexamples = false
autolib = false
autotests = false
# No build script is run for this package.
build = false
description = "LLM serving runtime with Ruvector integration - Paged attention, KV cache, and SONA learning"

# Platform-specific dependencies.
#
# wasm32: JavaScript/browser bindings. The optional ones are enabled by the
# `rlm-wasm` feature.

[target.'cfg(target_arch = "wasm32")'.dependencies.getrandom]
version = "0.2"
features = ["js"]

[target.'cfg(target_arch = "wasm32")'.dependencies.js-sys]
version = "0.3"
optional = true

[target.'cfg(target_arch = "wasm32")'.dependencies.wasm-bindgen]
version = "0.2"
optional = true

[target.'cfg(target_arch = "wasm32")'.dependencies.wasm-bindgen-futures]
version = "0.4"
optional = true

[target.'cfg(target_arch = "wasm32")'.dependencies.web-sys]
version = "0.3"
features = ["console", "Performance", "Window"]
optional = true

# macOS: Objective-C, Core ML and Metal bindings. These are enabled by the
# `coreml` and `metal-compute` features (and `hybrid-ane`, which needs both),
# so they must live under the same target as `metal`/`objc`; declaring the
# Objective-C crates for wasm32 would leave `coreml` without its dependencies
# on macOS.
# NOTE(review): widen the cfg if other Apple targets must be supported.

[target.'cfg(target_os = "macos")'.dependencies.block2]
version = "0.6"
optional = true

[target.'cfg(target_os = "macos")'.dependencies.metal]
version = "0.29"
optional = true

[target.'cfg(target_os = "macos")'.dependencies.objc]
version = "0.2"
optional = true

[target.'cfg(target_os = "macos")'.dependencies.objc2]
version = "0.6"
optional = true

[target.'cfg(target_os = "macos")'.dependencies.objc2-core-ml]
version = "0.3"
features = [
    "MLModel",
    "MLModelConfiguration",
    "MLFeatureProvider",
    "MLFeatureValue",
    "MLMultiArray",
    "MLPredictionOptions",
    "MLModelDescription",
    "MLFeatureDescription",
    "MLDictionaryFeatureProvider",
    "MLModelError",
]
optional = true

[target.'cfg(target_os = "macos")'.dependencies.objc2-foundation]
version = "0.3"
features = ["NSString", "NSError", "NSURL", "NSArray", "NSDictionary", "NSData"]
optional = true

# Integration test targets, declared explicitly (one per file under `tests/`
# listed here).

[[test]]
name = "adapter_integration"
path = "tests/adapter_integration.rs"

[[test]]
name = "ane_integration"
path = "tests/ane_integration.rs"

[[test]]
name = "ane_test_utils"
path = "tests/ane_test_utils.rs"

[[test]]
name = "autodetect_integration"
path = "tests/autodetect_integration.rs"

[[test]]
name = "backend_integration"
path = "tests/backend_integration.rs"

[[test]]
name = "cross_platform"
path = "tests/cross_platform.rs"

[[test]]
name = "cross_platform_v21"
path = "tests/cross_platform_v21.rs"

[[test]]
name = "e2e_integration"
path = "tests/e2e_integration.rs"

[[test]]
name = "e2e_integration_test"
path = "tests/e2e_integration_test.rs"

[[test]]
name = "gguf_integration"
path = "tests/gguf_integration.rs"

[[test]]
name = "gguf_loader_test"
path = "tests/gguf_loader_test.rs"

[[test]]
name = "kernel_integration"
path = "tests/kernel_integration.rs"

[[test]]
name = "lora_integration"
path = "tests/lora_integration.rs"

[[test]]
name = "mistral_backend_test"
path = "tests/mistral_backend_test.rs"

[[test]]
name = "model_arch_integration"
path = "tests/model_arch_integration.rs"

[[test]]
name = "real_model_test"
path = "tests/real_model_test.rs"

[[test]]
name = "rlm_integration"
path = "tests/rlm_integration.rs"

[[test]]
name = "ruvltra_e2e"
path = "tests/ruvltra_e2e.rs"

[[test]]
name = "ruvltra_tests"
path = "tests/ruvltra_tests.rs"

[[test]]
name = "serving_integration"
path = "tests/serving_integration.rs"

[[test]]
name = "sona_integration"
path = "tests/sona_integration.rs"

[[test]]
name = "speculative_integration"
path = "tests/speculative_integration.rs"