llama-rs 0.16.1

A high-performance Rust implementation of llama.cpp - LLM inference engine with full GGUF support

//! Quantization formats and dequantization functions

mod blocks;
mod dequant;
mod gpu_quantize;
mod iq_grids;
mod iq_quants;

pub use blocks::*;
pub use dequant::*;
pub use gpu_quantize::*;
pub use iq_quants::*;