Struct FakeQuantize

Source

pub struct FakeQuantize {
    pub bits: u32,
    pub symmetric: bool,
    pub scale: f32,
    pub zero_point: i32,
    pub enabled: bool,
}

Expand description

Fake quantization operator for quantization-aware training (QAT).

Maintains the current scale and zero-point that are updated during calibration / training via an associated observer.

Fields§

§bits: u32

Quantization bit-width.

§symmetric: bool

Whether to use symmetric quantization (zero-point fixed at 0).

§scale: f32

Current quantization scale (must be > 0).

§zero_point: i32

Current zero-point.

§enabled: bool

Whether fake quantization is enabled. When disabled, forward returns the input unchanged.

Implementations§

Source §

impl FakeQuantize

Source

pub fn new( bits: u32, symmetric: bool, scale: f32, zero_point: i32, ) -> QuantResult<Self>

Create a new fake quantizer with the given scale and zero-point.

§Errors

QuantError::InvalidBitWidth — bits is 0 or > 16.
QuantError::InvalidScale — scale is ≤ 0 or non-finite.

Source

pub fn with_defaults(bits: u32, symmetric: bool) -> QuantResult<Self>

Create a fake quantizer for the given bit-width with default parameters: scale = 1.0 and zero_point = 0.

§Errors

QuantError::InvalidBitWidth — bits is 0 or > 16.

Source

pub fn update_params(&mut self, scale: f32, zero_point: i32) -> QuantResult<()>

Update scale and zero-point (e.g., from an observer).

§Errors

QuantError::InvalidScale — scale is ≤ 0 or non-finite.

Source

pub fn quant_range(&self) -> (i32, i32)

Integer quantization bounds [q_min, q_max].

Source

pub fn float_range(&self) -> (f32, f32)

Float clipping bounds [x_min, x_max] corresponding to the integer range.

Source

pub fn forward(&self, x: &[f32]) -> Vec<f32>

Forward pass: quantize-then-dequantize.

If enabled = false, returns the input unchanged.

Source

pub fn backward(&self, grad_output: &[f32], x: &[f32]) -> QuantResult<Vec<f32>>

Backward pass (Straight-Through Estimator).

Passes grad_output through where x is inside the representable float range; zeros the gradient where x is clipped.

§Errors

QuantError::DimensionMismatch — grad_output and x lengths differ.

Source

pub fn quantization_noise(&self, x: &[f32]) -> f32

Estimate quantization noise (MSE between input and fake-quantized output).

Useful for measuring quantization error at the current scale/zp.

Trait Implementations§

Source §

impl Clone for FakeQuantize

Source §

fn clone(&self) -> FakeQuantize

Returns a duplicate of the value. Read more

1.0.0 · Source§

fn clone_from(&mut self, source: &Self)

Performs copy-assignment from source. Read more

Source §

impl Debug for FakeQuantize

Source §

fn fmt(&self, f: &mut Formatter<'_>) -> Result

Formats the value using the given formatter. Read more

Auto Trait Implementations§

§

impl UnwindSafe for FakeQuantize

Blanket Implementations§

Source §

impl<T> Any for T
where T: 'static + ?Sized,

Source §

fn type_id(&self) -> TypeId

Gets the TypeId of self. Read more

Source §

impl<T> Borrow<T> for T
where T: ?Sized,

Source §

fn borrow(&self) -> &T

Immutably borrows from an owned value. Read more

Source §

impl<T> BorrowMut<T> for T
where T: ?Sized,

Source §

fn borrow_mut(&mut self) -> &mut T

Mutably borrows from an owned value. Read more

Source §

impl<T> CloneToUninit for T
where T: Clone,

Source §

unsafe fn clone_to_uninit(&self, dest: *mut u8)

🔬 This is a nightly-only experimental API. (clone_to_uninit)

Performs copy-assignment from self to dest. Read more

Source §

impl<T> From<T> for T

Source §

fn from(t: T) -> T

Returns the argument unchanged.

Source §

impl<T, U> Into<U> for T
where U: From<T>,

Source §

fn into(self) -> U

Calls U::from(self).

That is, this conversion is whatever the implementation of From<T> for U chooses to do.

Source §

impl<T> ToOwned for T
where T: Clone,

Source §

type Owned = T

The resulting type after obtaining ownership.

Source §

fn to_owned(&self) -> T

Creates owned data from borrowed data, usually by cloning. Read more

Source §

fn clone_into(&self, target: &mut T)

Uses borrowed data to replace owned data, usually by cloning. Read more

Source §

impl<T, U> TryFrom<U> for T
where U: Into<T>,

Source §

type Error = Infallible

The type returned in the event of a conversion error.

Source §

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

Performs the conversion.

Source §

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,

Source §

type Error = <U as TryFrom<T>>::Error

The type returned in the event of a conversion error.

Source §

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

Performs the conversion.

Struct FakeQuantize Copy item path

Fields§

Implementations§

impl FakeQuantize

pub fn new( bits: u32, symmetric: bool, scale: f32, zero_point: i32, ) -> QuantResult<Self>

§Errors

pub fn with_defaults(bits: u32, symmetric: bool) -> QuantResult<Self>

§Errors

pub fn update_params(&mut self, scale: f32, zero_point: i32) -> QuantResult<()>

§Errors

pub fn quant_range(&self) -> (i32, i32)

pub fn float_range(&self) -> (f32, f32)

pub fn forward(&self, x: &[f32]) -> Vec<f32>

pub fn backward(&self, grad_output: &[f32], x: &[f32]) -> QuantResult<Vec<f32>>

§Errors

pub fn quantization_noise(&self, x: &[f32]) -> f32

Trait Implementations§

impl Clone for FakeQuantize

fn clone(&self) -> FakeQuantize

fn clone_from(&mut self, source: &Self)

impl Debug for FakeQuantize

fn fmt(&self, f: &mut Formatter<'_>) -> Result

Auto Trait Implementations§

impl Freeze for FakeQuantize

impl RefUnwindSafe for FakeQuantize

impl Send for FakeQuantize

impl Sync for FakeQuantize

impl Unpin for FakeQuantize

impl UnsafeUnpin for FakeQuantize

impl UnwindSafe for FakeQuantize

Blanket Implementations§

impl<T> Any for T where T: 'static + ?Sized,

fn type_id(&self) -> TypeId

impl<T> Borrow<T> for T where T: ?Sized,

fn borrow(&self) -> &T

impl<T> BorrowMut<T> for T where T: ?Sized,

fn borrow_mut(&mut self) -> &mut T

impl<T> CloneToUninit for T where T: Clone,

unsafe fn clone_to_uninit(&self, dest: *mut u8)

impl<T> From<T> for T

fn from(t: T) -> T

impl<T, U> Into<U> for T where U: From<T>,

fn into(self) -> U

impl<T> ToOwned for T where T: Clone,

type Owned = T

fn to_owned(&self) -> T

fn clone_into(&self, target: &mut T)

impl<T, U> TryFrom<U> for T where U: Into<T>,

type Error = Infallible

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

impl<T, U> TryInto<U> for T where U: TryFrom<T>,

type Error = <U as TryFrom<T>>::Error

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

Struct FakeQuantize

impl<T> Any for T
where T: 'static + ?Sized,

impl<T> Borrow<T> for T
where T: ?Sized,

impl<T> BorrowMut<T> for T
where T: ?Sized,

impl<T> CloneToUninit for T
where T: Clone,

impl<T, U> Into<U> for T
where U: From<T>,

impl<T> ToOwned for T
where T: Clone,

impl<T, U> TryFrom<U> for T
where U: Into<T>,

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,