pub fn quantize_4bit(
tensor: &Tensor,
config: &BitsAndBytesConfig,
) -> Result<QuantState>

4-bit quantization (NF4/FP4)
pub fn quantize_4bit(
tensor: &Tensor,
config: &BitsAndBytesConfig,
) -> Result<QuantState>

4-bit quantization (NF4/FP4)