pub struct QuantizationConfig {
pub scheme: QuantizationScheme,
pub granularity: QuantizationGranularity,
pub symmetric: bool,
pub calibration: CalibrationMethod,
}
Expand description
Quantization configuration
Fields§
scheme: QuantizationScheme — Quantization scheme (INT4, INT8, etc.)
granularity: QuantizationGranularity — Quantization granularity
symmetric: bool — Use symmetric quantization (zero_point = 0)
calibration: CalibrationMethod — Calibration method for determining scale/zero-point
Implementations§
Source§impl QuantizationConfig
impl QuantizationConfig
Sourcepub fn int8_symmetric() -> Self
pub fn int8_symmetric() -> Self
Create INT8 symmetric per-tensor quantization config
Sourcepub fn int8_asymmetric() -> Self
pub fn int8_asymmetric() -> Self
Create INT8 asymmetric per-tensor quantization config
Sourcepub fn int8_per_channel(num_channels: usize) -> Self
pub fn int8_per_channel(num_channels: usize) -> Self
Create INT8 per-channel quantization config
Sourcepub fn int4_symmetric() -> Self
pub fn int4_symmetric() -> Self
Create INT4 symmetric per-tensor quantization config
Sourcepub fn int4_per_channel(num_channels: usize) -> Self
pub fn int4_per_channel(num_channels: usize) -> Self
Create INT4 per-channel quantization config
Trait Implementations§
Source§impl Clone for QuantizationConfig
impl Clone for QuantizationConfig
Source§fn clone(&self) -> QuantizationConfig
fn clone(&self) -> QuantizationConfig
Returns a duplicate of the value. Read more
1.0.0 · Source§fn clone_from(&mut self, source: &Self)
fn clone_from(&mut self, source: &Self)
Performs copy-assignment from source. Read more
Source§impl Debug for QuantizationConfig
impl Debug for QuantizationConfig
Source§impl<'de> Deserialize<'de> for QuantizationConfig
impl<'de> Deserialize<'de> for QuantizationConfig
Source§fn deserialize<__D>(__deserializer: __D) -> Result<Self, __D::Error> where
__D: Deserializer<'de>,
fn deserialize<__D>(__deserializer: __D) -> Result<Self, __D::Error> where
__D: Deserializer<'de>,
Deserialize this value from the given Serde deserializer. Read more
Auto Trait Implementations§
impl Freeze for QuantizationConfig
impl RefUnwindSafe for QuantizationConfig
impl Send for QuantizationConfig
impl Sync for QuantizationConfig
impl Unpin for QuantizationConfig
impl UnwindSafe for QuantizationConfig
Blanket Implementations§
Source§impl<T> BorrowMut<T> for T where
T: ?Sized,
impl<T> BorrowMut<T> for T where
T: ?Sized,
Source§fn borrow_mut(&mut self) -> &mut T
fn borrow_mut(&mut self) -> &mut T
Mutably borrows from an owned value. Read more
Source§impl<T> CloneToUninit for T where
T: Clone,
impl<T> CloneToUninit for T where
T: Clone,
Source§impl<T> Instrument for T
impl<T> Instrument for T
Source§fn instrument(self, span: Span) -> Instrumented<Self>
fn instrument(self, span: Span) -> Instrumented<Self>
Source§fn in_current_span(self) -> Instrumented<Self>
fn in_current_span(self) -> Instrumented<Self>
Source§impl<T> IntoEither for T
impl<T> IntoEither for T
Source§fn into_either(self, into_left: bool) -> Either<Self, Self>
fn into_either(self, into_left: bool) -> Either<Self, Self>
Converts self into a Left variant of Either<Self, Self> if into_left is true.
Converts self into a Right variant of Either<Self, Self> otherwise. Read more
Source§fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
Converts self into a Left variant of Either<Self, Self> if into_left(&self) returns true.
Converts self into a Right variant of Either<Self, Self> otherwise. Read more