# Crate metadata. `name` and `version` lead, the remaining keys are sorted
# alphabetically, and `description` closes the table.
[package]
name = "hanzo-quant"
version = "0.6.1"
authors = ["Hanzo AI"]
# Target auto-discovery is switched off for every target kind; the library
# target is declared explicitly in the [lib] table.
autobenches = false
autobins = false
autoexamples = false
autolib = false
autotests = false
build = "build.rs"
categories = ["science", "api-bindings", "text-processing"]
edition = "2021"
homepage = "https://github.com/hanzoai/engine"
keywords = ["llm", "inference", "machine-learning", "ai", "transformers"]
license = "MIT"
readme = "README.md"
repository = "https://github.com/hanzoai/engine"
# Minimum supported Rust toolchain.
rust-version = "1.88"
description = "Hanzo Engine - fast, flexible LLM inference engine written in Rust."
# Feature flags. A "crate/feature" entry forwards to that dependency's feature;
# a "dep:name" entry switches on the optional dependency `name`.
[features]
# Backend features: each forwards to the matching hanzo-ml / hanzo-nn feature.
accelerate = ["hanzo-ml/accelerate", "hanzo-nn/accelerate"]
# `cuda` additionally enables the optional `cudaforge` build-dependency.
cuda = ["hanzo-ml/cuda", "hanzo-nn/cuda", "dep:cudaforge"]
# `metal` additionally enables the optional Objective-C / Metal crates.
metal = [
    "hanzo-ml/metal",
    "hanzo-nn/metal",
    "dep:objc2-metal",
    "dep:objc2-foundation",
    "dep:dispatch2",
    "dep:hanzo-metal-kernels",
]
# `nccl` implies `cuda` and is forwarded to hanzo-ml only.
nccl = ["cuda", "hanzo-ml/nccl"]
rocm = ["hanzo-ml/rocm", "hanzo-nn/rocm"]
vulkan = ["hanzo-ml/vulkan", "hanzo-nn/vulkan"]

# Flags that enable nothing in this manifest.
# NOTE(review): presumably checked via cfg(feature = "...") in the sources or
# build.rs - confirm.
arm-nightly-feat = []
ring = []

# Empty per-version markers.
# NOTE(review): the numeric suffix looks like a CUDA toolkit version
# (e.g. 12040 -> 12.4) - confirm against build.rs.
cuda-11040 = []
cuda-11050 = []
cuda-11060 = []
cuda-11070 = []
cuda-11080 = []
cuda-12000 = []
cuda-12010 = []
cuda-12020 = []
cuda-12030 = []
cuda-12040 = []
cuda-12050 = []
cuda-12060 = []
cuda-12080 = []
cuda-12090 = []
cuda-13000 = []
# The library target, declared explicitly because `autolib` is false in
# [package].
[lib]
path = "src/lib.rs"
name = "hanzo_quant"
# Runtime dependencies, one table per crate, sorted by crate name.
# Key order inside each table: version, default-features, features, optional,
# package.

[dependencies.byteorder]
version = "1.5.0"

# Optional: switched on by the `metal` feature.
[dependencies.dispatch2]
version = "0.3.0"
default-features = false
features = ["block2"]
optional = true

[dependencies.float8]
version = "0.7.0"

[dependencies.half]
version = "2.7.1"

# Optional: switched on by the `metal` feature.
[dependencies.hanzo-metal-kernels]
version = "0.10.2"
optional = true
package = "hanzo-metal-kernels"

[dependencies.hanzo-ml]
version = "0.10.2"
package = "hanzo-ml"

[dependencies.hanzo-nn]
version = "0.10.2"
package = "hanzo-nn"

# Default features are disabled; only the listed ones are enabled.
[dependencies.hf-hub]
version = "0.4.3"
default-features = false
features = ["ureq", "tokio", "rustls-tls"]

[dependencies.lazy_static]
version = "1.5"

[dependencies.memmap2]
version = "0.9.9"

# Optional: switched on by the `metal` feature.
[dependencies.objc2-foundation]
version = "0.3.2"
optional = true

# Optional: switched on by the `metal` feature.
[dependencies.objc2-metal]
version = "0.3.2"
optional = true

[dependencies.paste]
version = "1.0.15"

[dependencies.rayon]
version = "1.11.0"

[dependencies.regex]
version = "1.12.2"

[dependencies.safetensors]
version = "0.7.0"

[dependencies.serde]
version = "1.0.228"

[dependencies.serde_json]
version = "1.0.149"

[dependencies.thiserror]
version = "2.0.18"
# Async runtime. tokio's `full` feature already includes `rt-multi-thread`
# (it enables every tokio feature except `test-util` and `tracing`), so the
# multi-threaded runtime does not need to be requested separately.
[dependencies.tokio]
version = "1.49.0"
features = ["full"]
# Remaining runtime dependencies, continuing the alphabetical order.

[dependencies.tracing]
version = "0.1.44"

# Enabled with its `derive` feature.
[dependencies.yoke]
version = "0.8.1"
features = ["derive"]
# Build-script dependency. Optional: it is only pulled in when the `cuda`
# feature activates it through "dep:cudaforge".
[build-dependencies.cudaforge]
optional = true
version = "0.1.2"