# Package metadata for the `mistralrs-quant` crate.
[package]
name = "mistralrs-quant"
version = "0.7.0"
authors = ["Eric Buehler"]
# Target auto-discovery is switched off for every target kind; the only
# target declared explicitly in this manifest is the `[lib]` table.
autobenches = false
autobins = false
autoexamples = false
autolib = false
autotests = false
# Build script run by Cargo before the crate itself is compiled.
build = "build.rs"
categories = ["science"]
edition = "2021"
homepage = "https://github.com/EricLBuehler/mistral.rs"
keywords = ["machine-learning"]
license = "MIT"
readme = "README.md"
repository = "https://github.com/EricLBuehler/mistral.rs"
# Minimum supported Rust toolchain version.
rust-version = "1.88"
description = "Fast, flexible LLM inference."
# Cargo features. No `default` feature is declared in this table, so nothing
# listed here is enabled unless a dependent crate asks for it.
[features]
# Backend features: each forwards to the same-named feature of candle-core
# and candle-nn.
accelerate = ["candle-core/accelerate", "candle-nn/accelerate"]
# `cuda` also activates the optional `bindgen_cuda` build-dependency.
cuda = ["candle-core/cuda", "candle-nn/cuda", "dep:bindgen_cuda"]
# `metal` also activates the three optional Metal-related dependencies.
metal = [
    "candle-core/metal",
    "candle-nn/metal",
    "dep:objc2-metal",
    "dep:objc2-foundation",
    "dep:candle-metal-kernels",
]
# `nccl` implies `cuda` and enables candle-core's `nccl` feature.
nccl = ["cuda", "candle-core/nccl"]
# Empty flag: enables no dependency or other feature from this manifest.
# NOTE(review): presumably read through `cfg(feature = "ring")` in the crate
# sources — confirm.
ring = []
# Empty flags, one per version tag. They enable nothing by themselves.
# NOTE(review): the names look like CUDA toolkit versions (e.g. 12080 for
# 12.8), presumably consumed by build.rs or `cfg` checks — confirm.
cuda-11040 = []
cuda-11050 = []
cuda-11060 = []
cuda-11070 = []
cuda-11080 = []
cuda-12000 = []
cuda-12010 = []
cuda-12020 = []
cuda-12030 = []
cuda-12040 = []
cuda-12050 = []
cuda-12060 = []
cuda-12080 = []
cuda-12090 = []
cuda-13000 = []
# Explicit library target. `[package]` sets `autolib = false`, so the library
# is declared here rather than auto-discovered. The crate name uses an
# underscore, whereas the package name is `mistralrs-quant`.
[lib]
name = "mistralrs_quant"
path = "src/lib.rs"
# Runtime dependencies, sorted alphabetically. Entries that carry only a
# version use the short string form; the rest use one-line inline tables.
[dependencies]
byteorder = "1.5.0"
candle-core = "0.9.2"
# Optional: activated by the `metal` feature through `dep:candle-metal-kernels`.
candle-metal-kernels = { version = "0.9.2", optional = true }
candle-nn = "0.9.2"
float8 = "0.6.0"
half = "2.7.1"
# Default features are turned off; only the three listed features are enabled.
hf-hub = { version = "0.4.3", default-features = false, features = ["ureq", "tokio", "rustls-tls"] }
lazy_static = "1.5"
memmap2 = "0.9.9"
# Optional: both objc2 crates are activated by the `metal` feature.
objc2-foundation = { version = "0.3.2", optional = true }
objc2-metal = { version = "0.3.2", optional = true }
paste = "1.0.15"
rayon = "1.11.0"
regex = "1.12.2"
safetensors = "0.7.0"
serde = "1.0.228"
serde_json = "1.0.149"
thiserror = "2.0.18"
# NOTE(review): tokio documents `full` as already including `rt-multi-thread`,
# so the second entry looks redundant — confirm before removing it.
tokio = { version = "1.49.0", features = ["full", "rt-multi-thread"] }
tracing = "0.1.44"
yoke = { version = "0.8.1", features = ["derive"] }
# Build-script dependencies. `bindgen_cuda` is optional and is activated by
# the `cuda` feature through `dep:bindgen_cuda`.
[build-dependencies]
bindgen_cuda = { version = "0.1.5", optional = true }