pub struct QuantizationParams {
pub scale: f32,
pub zero_point: i32,
pub dtype: DType,
pub qmin: i32,
pub qmax: i32,
}
Expand description
Quantization parameters for symmetric and asymmetric quantization
Fields§
§scale: f32
Scale factor for quantization (real_value = scale * quantized_value + zero_point)
zero_point: i32
Zero point for asymmetric quantization (usually 0 for symmetric)
dtype: DType
Quantized data type (Int8 or Int4)
qmin: i32
Minimum quantized value (e.g., -128 for INT8)
qmax: i32
Maximum quantized value (e.g., 127 for INT8)
Implementations§
Source§impl QuantizationParams
impl QuantizationParams
Sourcepub fn symmetric_int8(scale: f32) -> Self
pub fn symmetric_int8(scale: f32) -> Self
Create symmetric INT8 quantization parameters
Sourcepub fn asymmetric_int8(scale: f32, zero_point: i32) -> Self
pub fn asymmetric_int8(scale: f32, zero_point: i32) -> Self
Create asymmetric INT8 quantization parameters
Sourcepub fn symmetric_int4(scale: f32) -> Self
pub fn symmetric_int4(scale: f32) -> Self
Create symmetric INT4 quantization parameters
Sourcepub fn asymmetric_int4(scale: f32, zero_point: i32) -> Self
pub fn asymmetric_int4(scale: f32, zero_point: i32) -> Self
Create asymmetric INT4 quantization parameters
Trait Implementations§
Source§impl Clone for QuantizationParams
impl Clone for QuantizationParams
Source§fn clone(&self) -> QuantizationParams
fn clone(&self) -> QuantizationParams
Returns a duplicate of the value. Read more
1.0.0 · Source§fn clone_from(&mut self, source: &Self)
fn clone_from(&mut self, source: &Self)
Performs copy-assignment from source. Read more
Auto Trait Implementations§
impl Freeze for QuantizationParams
impl RefUnwindSafe for QuantizationParams
impl Send for QuantizationParams
impl Sync for QuantizationParams
impl Unpin for QuantizationParams
impl UnsafeUnpin for QuantizationParams
impl UnwindSafe for QuantizationParams
Blanket Implementations§
Source§impl<T> BorrowMut<T> for T where
T: ?Sized,
impl<T> BorrowMut<T> for T where
T: ?Sized,
Source§fn borrow_mut(&mut self) -> &mut T
fn borrow_mut(&mut self) -> &mut T
Mutably borrows from an owned value. Read more
Source§impl<T> CloneToUninit for T where
T: Clone,
impl<T> CloneToUninit for T where
T: Clone,
Source§impl<T> IntoEither for T
impl<T> IntoEither for T
Source§fn into_either(self, into_left: bool) -> Either<Self, Self>
fn into_either(self, into_left: bool) -> Either<Self, Self>
Converts self into a Left variant of Either<Self, Self> if into_left is true. Converts self into a Right variant of Either<Self, Self> otherwise. Read more
Source§fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
Converts self into a Left variant of Either<Self, Self> if into_left(&self) returns true. Converts self into a Right variant of Either<Self, Self> otherwise. Read more