pub struct QuantizationConfig {
pub target_precision: MobilePrecision,
pub enable_mixed_precision: bool,
pub dynamic_strategy: DynamicQuantizationStrategy,
pub hardware_aware: bool,
pub granularity: QuantizationGranularity,
pub quality_threshold: f32,
pub memory_constraint_mb: usize,
pub enable_gradient_quantization: bool,
pub kl_threshold: f32,
pub enable_ptq: bool,
pub enable_qat: bool,
}Expand description
Mobile quantization configuration
Fields§
§target_precision: MobilePrecisionTarget quantization precision
enable_mixed_precision: boolEnable mixed-precision quantization
dynamic_strategy: DynamicQuantizationStrategyDynamic quantization strategy
hardware_aware: boolHardware-aware optimizations
granularity: QuantizationGranularityQuantization granularity
quality_threshold: f32Quality preservation threshold
memory_constraint_mb: usizeMemory constraint (MB)
enable_gradient_quantization: boolEnable gradient-based quantization
kl_threshold: f32KL-divergence threshold for calibration
enable_ptq: boolEnable post-training quantization
enable_qat: boolEnable quantization-aware training
Trait Implementations§
Source§impl Clone for QuantizationConfig
impl Clone for QuantizationConfig
Source§fn clone(&self) -> QuantizationConfig
fn clone(&self) -> QuantizationConfig
Returns a duplicate of the value. Read more
1.0.0 · Source§fn clone_from(&mut self, source: &Self)
fn clone_from(&mut self, source: &Self)
Performs copy-assignment from
source. Read moreSource§impl Debug for QuantizationConfig
impl Debug for QuantizationConfig
Source§impl Default for QuantizationConfig
impl Default for QuantizationConfig
Source§impl<'de> Deserialize<'de> for QuantizationConfig
impl<'de> Deserialize<'de> for QuantizationConfig
Source§fn deserialize<__D>(__deserializer: __D) -> Result<Self, __D::Error>where
__D: Deserializer<'de>,
fn deserialize<__D>(__deserializer: __D) -> Result<Self, __D::Error>where
__D: Deserializer<'de>,
Deserialize this value from the given Serde deserializer. Read more
Auto Trait Implementations§
impl Freeze for QuantizationConfig
impl RefUnwindSafe for QuantizationConfig
impl Send for QuantizationConfig
impl Sync for QuantizationConfig
impl Unpin for QuantizationConfig
impl UnsafeUnpin for QuantizationConfig
impl UnwindSafe for QuantizationConfig
Blanket Implementations§
Source§impl<T> BorrowMut<T> for Twhere
T: ?Sized,
impl<T> BorrowMut<T> for Twhere
T: ?Sized,
Source§fn borrow_mut(&mut self) -> &mut T
fn borrow_mut(&mut self) -> &mut T
Mutably borrows from an owned value. Read more
Source§impl<T> CloneToUninit for Twhere
T: Clone,
impl<T> CloneToUninit for Twhere
T: Clone,
Source§impl<T> ConfigSerializable for Twhere
T: Serialize + for<'de> Deserialize<'de>,
impl<T> ConfigSerializable for Twhere
T: Serialize + for<'de> Deserialize<'de>,
Source§fn save_to_file(&self, path: &Path) -> Result<(), TrustformersError>
fn save_to_file(&self, path: &Path) -> Result<(), TrustformersError>
Save to file
Source§fn load_from_file(path: &Path) -> Result<Self, TrustformersError>where
Self: Sized,
fn load_from_file(path: &Path) -> Result<Self, TrustformersError>where
Self: Sized,
Load from file
Source§impl<T> Instrument for T
impl<T> Instrument for T
Source§fn instrument(self, span: Span) -> Instrumented<Self>
fn instrument(self, span: Span) -> Instrumented<Self>
Source§fn in_current_span(self) -> Instrumented<Self>
fn in_current_span(self) -> Instrumented<Self>
Source§impl<T> IntoEither for T
impl<T> IntoEither for T
Source§fn into_either(self, into_left: bool) -> Either<Self, Self>
fn into_either(self, into_left: bool) -> Either<Self, Self>
Converts
self into a Left variant of Either<Self, Self>
if into_left is true.
Converts self into a Right variant of Either<Self, Self>
otherwise. Read moreSource§fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
Converts
self into a Left variant of Either<Self, Self>
if into_left(&self) returns true.
Converts self into a Right variant of Either<Self, Self>
otherwise. Read more