pub enum QuantizationStrategy {
Show 16 variants
None,
Dynamic,
Static,
PostTraining,
QAT,
AWQ,
GPTQ,
SmoothQuant,
LLMInt8,
QLoRA,
GGML,
AdaptiveBitwidth,
OutlierAware,
HQQ,
SpQR,
AQLM,
}
Expand description
Quantization strategies
Variants§
None
No quantization
Dynamic
Dynamic quantization - quantize weights only
Static
Static quantization - quantize weights and activations
PostTraining
Post-training quantization
QAT
Quantization-aware training (requires pre-quantized model)
AWQ
AWQ (Activation-aware Weight Quantization) - preserves important weights
GPTQ
GPTQ (post-training quantization for generative pre-trained transformers) - uses approximate second-order information
SmoothQuant
SmoothQuant - balances quantization difficulty between weights and activations
LLMInt8
LLM.int8() - mixed-precision quantization for large models
QLoRA
QLoRA - Quantized Low-Rank Adaptation
GGML
GGML-style quantization for efficient inference
AdaptiveBitwidth
Adaptive bitwidth quantization with dynamic allocation
OutlierAware
Outlier-aware quantization for handling activation spikes
HQQ
HQQ (Half-Quadratic Quantization) - superior quality quantization using half-quadratic optimization
SpQR
SpQR (Sparse-Quantized Representation) - ultra-sparse models with mixed precision
AQLM
AQLM (Additive Quantization for Language Models) - additive quantization for transformers
Trait Implementations§
Source§impl Clone for QuantizationStrategy
impl Clone for QuantizationStrategy
Source§fn clone(&self) -> QuantizationStrategy
fn clone(&self) -> QuantizationStrategy
1.0.0 · Source§fn clone_from(&mut self, source: &Self)
fn clone_from(&mut self, source: &Self)
Performs copy-assignment from source. Read more
Source§impl Debug for QuantizationStrategy
impl Debug for QuantizationStrategy
Source§impl<'de> Deserialize<'de> for QuantizationStrategy
impl<'de> Deserialize<'de> for QuantizationStrategy
Source§fn deserialize<__D>(__deserializer: __D) -> Result<Self, __D::Error>
where
__D: Deserializer<'de>,
fn deserialize<__D>(__deserializer: __D) -> Result<Self, __D::Error>
where
__D: Deserializer<'de>,
Source§impl From<QuantizationStrategy> for JsValue
impl From<QuantizationStrategy> for JsValue
Source§fn from(value: QuantizationStrategy) -> Self
fn from(value: QuantizationStrategy) -> Self
Source§impl FromWasmAbi for QuantizationStrategy
impl FromWasmAbi for QuantizationStrategy
Source§impl IntoWasmAbi for QuantizationStrategy
impl IntoWasmAbi for QuantizationStrategy
Source§impl PartialEq for QuantizationStrategy
impl PartialEq for QuantizationStrategy
Source§impl Serialize for QuantizationStrategy
impl Serialize for QuantizationStrategy
Source§impl VectorFromWasmAbi for QuantizationStrategy
impl VectorFromWasmAbi for QuantizationStrategy
type Abi = <Box<[JsValue]> as FromWasmAbi>::Abi
unsafe fn vector_from_abi(js: Self::Abi) -> Box<[QuantizationStrategy]>
Source§impl VectorIntoWasmAbi for QuantizationStrategy
impl VectorIntoWasmAbi for QuantizationStrategy
type Abi = <Box<[JsValue]> as IntoWasmAbi>::Abi
fn vector_into_abi(vector: Box<[QuantizationStrategy]>) -> Self::Abi
Source§impl WasmDescribeVector for QuantizationStrategy
impl WasmDescribeVector for QuantizationStrategy
impl Copy for QuantizationStrategy
impl Eq for QuantizationStrategy
impl StructuralPartialEq for QuantizationStrategy
Auto Trait Implementations§
impl Freeze for QuantizationStrategy
impl RefUnwindSafe for QuantizationStrategy
impl Send for QuantizationStrategy
impl Sync for QuantizationStrategy
impl Unpin for QuantizationStrategy
impl UnsafeUnpin for QuantizationStrategy
impl UnwindSafe for QuantizationStrategy
Blanket Implementations§
Source§impl<T> BorrowMut<T> for T
where
T: ?Sized,
impl<T> BorrowMut<T> for T
where
T: ?Sized,
Source§fn borrow_mut(&mut self) -> &mut T
fn borrow_mut(&mut self) -> &mut T
Source§impl<T> CloneToUninit for T
where
T: Clone,
impl<T> CloneToUninit for T
where
T: Clone,
Source§impl<T> ReturnWasmAbi for T
where
T: IntoWasmAbi,
impl<T> ReturnWasmAbi for T
where
T: IntoWasmAbi,
Source§type Abi = <T as IntoWasmAbi>::Abi
type Abi = <T as IntoWasmAbi>::Abi
Same as IntoWasmAbi::Abi
Source§fn return_abi(self) -> <T as ReturnWasmAbi>::Abi
fn return_abi(self) -> <T as ReturnWasmAbi>::Abi
Same as IntoWasmAbi::into_abi, except that it may throw and never
return in the case of Err.