[package]
edition = "2024"
name = "spnl"
version = "0.17.0"
build = false
include = [
"src/**/*",
"Cargo.toml",
"README.md",
"docker/**/*",
]
autolib = false
autobins = false
autoexamples = false
autotests = false
autobenches = false
description = "A Span Query is a declarative way to specify which portions of a generative AI (GenAI) program should be run directly on model serving components."
readme = "README.md"
license = "Apache-2.0"
repository = "https://github.com/IBM/spnl"
[features]
cli_support = [
"print",
"dep:ptree",
]
cuda = [
"local",
"mistralrs/cuda",
]
cuda-flash-attn = [
"cuda",
"mistralrs/flash-attn",
]
cuda-flash-attn-v3 = [
"cuda",
"dep:mistralrs-core",
"mistralrs-core/flash-attn-v3",
]
default = [
"cli_support",
"lisp",
"run",
"ollama",
"openai",
"gemini",
"pull",
"yaml",
]
ffi = []
gce = [
"vllm",
"dep:google-cloud-compute-v1",
"dep:google-cloud-lro",
"dep:google-cloud-storage",
"dep:tokio",
"dep:base64",
"dep:flate2",
"dep:uuid",
"dep:rustls",
"dep:sha2",
"yaml",
"dep:russh",
"dep:russh-keys",
"dep:async-trait",
"dep:tabled",
]
gemini = ["openai"]
k8s = [
"vllm",
"dep:kube",
"dep:k8s-openapi",
"dep:schemars",
"dep:rustls",
"dep:uuid",
"dep:tokio-stream",
"dep:tokio",
"dep:futures",
]
lisp = ["dep:serde-lexpr"]
local = [
"run",
"dep:mistralrs",
"dep:tokio",
"dep:uuid",
"dep:indexmap",
"dep:either",
]
metal = [
"local",
"mistralrs/metal",
]
ollama = ["openai"]
openai = [
"dep:async-openai",
"dep:tokio",
]
openssl-vendored = ["dep:openssl"]
print = []
pull = [
"dep:reqwest",
"dep:tokio-util",
]
pypi = [
"ffi",
"tok",
"dep:pyo3",
"pyo3/extension-module",
"dep:thiserror",
]
rag = [
"run",
"dep:sha2",
"dep:lancedb",
"dep:tracing",
"dep:arrow-schema",
"dep:arrow-array",
"dep:itertools",
"dep:pdf-extract",
"dep:async-recursion",
"dep:regex",
"dep:rand",
]
rag-deep-debug = []
run = [
"dep:futures",
"dep:indicatif",
"dep:async-recursion",
"dep:thiserror",
"dep:tabled",
]
run_py = [
"run",
"pypi",
"pyo3/experimental-async",
"run",
"ollama",
"openai",
"gemini",
"dep:tokio",
"tokio/rt-multi-thread",
]
spnl-api = [
"dep:futures",
"dep:reqwest",
]
tok = [
"dep:pyo3",
"dep:itertools",
"dep:moka",
"dep:tokenizers",
]
vllm = [
"yaml",
"dep:flate2",
]
yaml = ["dep:serde_yaml2"]
[lib]
name = "spnl"
path = "src/lib.rs"
[dependencies.anyhow]
version = "1.0.98"
[dependencies.arrow-array]
version = "57.3"
optional = true
[dependencies.arrow-schema]
version = "57.3"
optional = true
[dependencies.async-openai]
version = "0.32.0"
features = [
"embedding",
"chat-completion",
"completions",
"_api",
]
optional = true
[dependencies.async-recursion]
version = "1.1.1"
optional = true
[dependencies.async-trait]
version = "0.1"
optional = true
[dependencies.base64]
version = "0.22"
optional = true
[dependencies.clap]
version = "4.5.45"
features = [
"derive",
"env",
]
[dependencies.derive_builder]
version = "0.20.2"
[dependencies.either]
version = "1.13"
optional = true
[dependencies.flate2]
version = "1.0"
optional = true
[dependencies.futures]
version = "0.3.31"
optional = true
[dependencies.google-cloud-compute-v1]
version = "2.1.0"
features = [
"instances",
"images",
]
optional = true
[dependencies.google-cloud-lro]
version = "1.3.0"
optional = true
[dependencies.google-cloud-storage]
version = "1"
optional = true
[dependencies.hf-hub]
version = "0.4.3"
features = ["tokio"]
optional = true
[dependencies.indexmap]
version = "2.7.0"
optional = true
[dependencies.indicatif]
version = "0.18.0"
optional = true
[dependencies.itertools]
version = "0.14.0"
optional = true
[dependencies.k8s-openapi]
version = "0.27.0"
features = [
"latest",
"schemars",
]
optional = true
[dependencies.kube]
version = "3.0.0"
features = [
"client",
"runtime",
"rustls-tls",
"ring",
"ws",
]
optional = true
default-features = false
[dependencies.lancedb]
version = "0.26.0"
optional = true
default-features = false
[dependencies.mistralrs]
version = "0.7.0"
optional = true
[dependencies.mistralrs-core]
version = "0.7.0"
optional = true
default-features = false
[dependencies.moka]
version = "0.12.10"
features = ["sync"]
optional = true
[dependencies.openssl]
version = "0.10"
features = ["vendored"]
optional = true
[dependencies.pdf-extract]
version = "0.10.0"
optional = true
[dependencies.ptree]
version = "0.5.2"
features = ["ansi"]
optional = true
default-features = false
[dependencies.pyo3]
version = "0.28.0"
features = ["macros"]
optional = true
[dependencies.rand]
version = "0.9.2"
features = ["os_rng"]
optional = true
[dependencies.regex]
version = "1.11.1"
optional = true
[dependencies.reqwest]
version = "0.12.20"
features = [
"json",
"stream",
]
optional = true
[dependencies.russh]
version = "0.57"
optional = true
[dependencies.russh-keys]
version = "0.49"
optional = true
[dependencies.rustls]
version = "0.23.36"
features = ["ring"]
optional = true
default-features = false
[dependencies.schemars]
version = "1"
optional = true
[dependencies.serde]
version = "1.0.219"
features = ["derive"]
[dependencies.serde-lexpr]
version = "0.1.3"
optional = true
[dependencies.serde_json]
version = "1.0.140"
[dependencies.serde_yaml2]
version = "0.1.3"
optional = true
[dependencies.sha2]
version = "0.10.9"
optional = true
[dependencies.tabled]
version = "0.20"
optional = true
[dependencies.thiserror]
version = "2.0.14"
optional = true
[dependencies.tokenizers]
version = "0.22.0"
features = [
"onig",
"esaxx_fast",
"hf-hub",
"http",
]
optional = true
default-features = false
[dependencies.tokio]
version = "1.44.1"
features = [
"io-std",
"io-util",
"signal",
]
optional = true
[dependencies.tokio-stream]
version = "0.1.18"
features = ["net"]
optional = true
[dependencies.tokio-util]
version = "0.7.16"
optional = true
[dependencies.tracing]
version = "0.1.41"
optional = true
[dependencies.uuid]
version = "1.19.0"
features = ["v4"]
optional = true
[dev-dependencies.cargo-husky]
version = "1"
features = ["user-hooks"]
default-features = false
[dev-dependencies.http]
version = "1.0"
[dev-dependencies.tower-test]
version = "0.4"