# mistralrs-quant 0.7.0
#
# Fast, flexible LLM inference.
# Documentation
# THIS FILE IS AUTOMATICALLY GENERATED BY CARGO
#
# When uploading crates to the registry Cargo will automatically
# "normalize" Cargo.toml files for maximal compatibility
# with all versions of Cargo and also rewrite `path` dependencies
# to registry (e.g., crates.io) dependencies.
#
# If you are reading this file be aware that the original Cargo.toml
# will likely look very different (and much more reasonable).
# See Cargo.toml.orig for the original contents.

[package]
name = "mistralrs-quant"
version = "0.7.0"
authors = ["Eric Buehler"]
# Automatic target discovery is switched off for every target kind; the
# library target is declared explicitly in the [lib] table.
autobenches = false
autobins = false
autoexamples = false
autolib = false
autotests = false
# Build script run before the crate itself is compiled.
build = "build.rs"
categories = ["science"]
edition = "2021"
homepage = "https://github.com/EricLBuehler/mistral.rs"
keywords = ["machine-learning"]
license = "MIT"
readme = "README.md"
repository = "https://github.com/EricLBuehler/mistral.rs"
# Minimum supported Rust toolchain version.
rust-version = "1.88"
description = "Fast, flexible LLM inference."

[features]
# Forwards the `accelerate` feature to both candle crates.
accelerate = ["candle-core/accelerate", "candle-nn/accelerate"]
# Forwards `cuda` to both candle crates and activates the optional
# `bindgen_cuda` build dependency.
cuda = ["candle-core/cuda", "candle-nn/cuda", "dep:bindgen_cuda"]
# Marker features: each one enables no dependency and no other feature.
# NOTE(review): presumably these encode a CUDA toolkit version
# (e.g. `cuda-12040` for 12.4) -- confirm against the crate sources.
cuda-11040 = []
cuda-11050 = []
cuda-11060 = []
cuda-11070 = []
cuda-11080 = []
cuda-12000 = []
cuda-12010 = []
cuda-12020 = []
cuda-12030 = []
cuda-12040 = []
cuda-12050 = []
cuda-12060 = []
cuda-12080 = []
cuda-12090 = []
cuda-13000 = []
# Forwards `metal` to both candle crates and activates the three optional
# Metal-related dependencies.
metal = [
    "candle-core/metal",
    "candle-nn/metal",
    "dep:objc2-metal",
    "dep:objc2-foundation",
    "dep:candle-metal-kernels",
]
# Implies the `cuda` feature above and adds candle-core's `nccl` feature.
nccl = ["cuda", "candle-core/nccl"]
# Enables nothing in this manifest.
# NOTE(review): presumably gates code via `cfg(feature = "ring")` -- confirm.
ring = []

# Explicit library target (automatic discovery is disabled in [package]).
[lib]
path = "src/lib.rs"
name = "mistralrs_quant"

# Runtime dependencies. A bare string is a version requirement; an inline
# table is used where extra keys (features, optional, ...) are needed.
[dependencies]
byteorder = "1.5.0"
candle-core = "0.9.2"
# Optional: activated by the `metal` feature.
candle-metal-kernels = { version = "0.9.2", optional = true }
candle-nn = "0.9.2"
float8 = "0.6.0"
half = "2.7.1"
# Default features are turned off; only the listed features are enabled.
hf-hub = { version = "0.4.3", default-features = false, features = ["ureq", "tokio", "rustls-tls"] }
lazy_static = "1.5"
memmap2 = "0.9.9"
# Optional: activated by the `metal` feature.
objc2-foundation = { version = "0.3.2", optional = true }
# Optional: activated by the `metal` feature.
objc2-metal = { version = "0.3.2", optional = true }
paste = "1.0.15"
rayon = "1.11.0"
regex = "1.12.2"
safetensors = "0.7.0"
serde = "1.0.228"
serde_json = "1.0.149"
thiserror = "2.0.18"
# NOTE(review): tokio documents `full` as already including
# `rt-multi-thread`, so listing both looks redundant -- confirm before trimming.
tokio = { version = "1.49.0", features = ["full", "rt-multi-thread"] }
tracing = "0.1.44"
yoke = { version = "0.8.1", features = ["derive"] }

# Build-script dependencies.
[build-dependencies]
# Optional: only pulled in when the `cuda` feature enables `dep:bindgen_cuda`.
bindgen_cuda = { version = "0.1.5", optional = true }