pub struct QuantizationConfig {
pub default_qtype: QuantizationType,
pub mode: QuantizationMode,
pub granularity: QuantizationGranularity,
pub symmetry: QuantizationSymmetry,
pub calibration: CalibrationStrategy,
pub calibration_samples: usize,
pub skip_ops: Vec<OpType>,
pub node_overrides: HashMap<NodeId, QuantizationType>,
}
Quantization configuration for a graph or model.
Fields§
default_qtype: QuantizationType — Default quantization type.
mode: QuantizationMode — Quantization mode.
granularity: QuantizationGranularity — Quantization granularity.
symmetry: QuantizationSymmetry — Symmetry mode.
calibration: CalibrationStrategy — Calibration strategy (for post-training quantization, PTQ).
calibration_samples: usize — Number of calibration samples.
skip_ops: Vec<OpType> — Operations for which quantization is skipped.
node_overrides: HashMap<NodeId, QuantizationType> — Per-node quantization overrides.
Implementations§
Source§impl QuantizationConfig
impl QuantizationConfig
Sourcepub fn qat(qtype: QuantizationType) -> Self
pub fn qat(qtype: QuantizationType) -> Self
Create a configuration for quantization-aware training.
Sourcepub fn per_channel(self, axis: usize) -> Self
pub fn per_channel(self, axis: usize) -> Self
Enable per-channel quantization.
Sourcepub fn asymmetric(self) -> Self
pub fn asymmetric(self) -> Self
Enable asymmetric quantization.
Sourcepub fn with_calibration(self, strategy: CalibrationStrategy) -> Self
pub fn with_calibration(self, strategy: CalibrationStrategy) -> Self
Set calibration strategy.
Trait Implementations§
Source§impl Clone for QuantizationConfig
impl Clone for QuantizationConfig
Source§fn clone(&self) -> QuantizationConfig
fn clone(&self) -> QuantizationConfig
Returns a duplicate of the value. Read more
1.0.0 · Source§fn clone_from(&mut self, source: &Self)
fn clone_from(&mut self, source: &Self)
Performs copy-assignment from source. Read more
Source§impl Debug for QuantizationConfig
impl Debug for QuantizationConfig
Source§impl Default for QuantizationConfig
impl Default for QuantizationConfig
Source§impl<'de> Deserialize<'de> for QuantizationConfig
impl<'de> Deserialize<'de> for QuantizationConfig
Source§fn deserialize<__D>(__deserializer: __D) -> Result<Self, __D::Error>
where
__D: Deserializer<'de>,
fn deserialize<__D>(__deserializer: __D) -> Result<Self, __D::Error>
where
__D: Deserializer<'de>,
Deserialize this value from the given Serde deserializer. Read more
Auto Trait Implementations§
impl Freeze for QuantizationConfig
impl RefUnwindSafe for QuantizationConfig
impl Send for QuantizationConfig
impl Sync for QuantizationConfig
impl Unpin for QuantizationConfig
impl UnwindSafe for QuantizationConfig
Blanket Implementations§
Source§impl<T> BorrowMut<T> for T
where
T: ?Sized,
impl<T> BorrowMut<T> for T
where
T: ?Sized,
Source§fn borrow_mut(&mut self) -> &mut T
fn borrow_mut(&mut self) -> &mut T
Mutably borrows from an owned value. Read more