Struct QuantizationParams 

pub struct QuantizationParams {
    pub dtype: QuantizedDType,
    pub scheme: QuantizationScheme,
    pub scale: Vec<f32>,
    pub zero_point: Vec<i32>,
    pub block_size: Option<usize>,
    pub min_val: Option<f32>,
    pub max_val: Option<f32>,
}

Quantization parameters

Contains all the parameters needed to quantize and dequantize tensors, including scale factors, zero points, and metadata about the quantization scheme being used.

Fields

dtype: QuantizedDType

Quantization data type

Specifies the target quantized data type (e.g., Int8, UInt8, Int4)

scheme: QuantizationScheme

Quantization scheme

Defines how the quantization mapping is performed (linear, symmetric, etc.)

scale: Vec<f32>

Scale factor(s)

Maps quantized values back to floating-point range. For per-channel quantization, contains one scale per channel. Formula: float_val = scale * (quantized_val - zero_point)
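The mapping in both directions can be sketched in plain Rust, independent of this crate (the function names here are illustrative, not part of the API):

```rust
// Affine (asymmetric) quantization round-trip for a single value,
// following the formula: float_val = scale * (quantized_val - zero_point)
fn dequantize(q: i32, scale: f32, zero_point: i32) -> f32 {
    scale * (q - zero_point) as f32
}

fn quantize(x: f32, scale: f32, zero_point: i32) -> i32 {
    // Round to nearest, then clamp to the INT8 range.
    ((x / scale).round() as i32 + zero_point).clamp(-128, 127)
}

fn main() {
    let (scale, zero_point) = (0.05, 0);
    let q = quantize(1.0, scale, zero_point);
    // The round trip recovers the value to within half a quantization step.
    assert!((dequantize(q, scale, zero_point) - 1.0).abs() <= scale / 2.0);
    println!("q = {q}");
}
```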

zero_point: Vec<i32>

Zero point(s)

The quantized value that corresponds to floating-point zero. For per-channel quantization, contains one zero point per channel. For symmetric quantization, this is always 0.

block_size: Option<usize>

Block size for block-wise quantization

When using block-wise quantization, specifies the size of each block that gets its own quantization parameters. None for other schemes.

min_val: Option<f32>

Minimum value observed during calibration

Used for parameter calculation and validation. Set during calibration or when computing parameters from statistics.

max_val: Option<f32>

Maximum value observed during calibration

Used for parameter calculation and validation. Set during calibration or when computing parameters from statistics.

Implementations

impl QuantizationParams

pub fn int8_symmetric() -> Self

Create parameters for INT8 symmetric quantization

INT8 symmetric quantization is commonly used for weights in neural networks due to its simplicity and good hardware support. The zero point is always 0, and the range is symmetric around zero.

Examples
use torsh_backend::quantization::QuantizationParams;

let params = QuantizationParams::int8_symmetric();
assert_eq!(params.zero_point[0], 0);

pub fn new(scale: f32, zero_point: i32) -> Self

Create basic quantization parameters with custom scale and zero point

This is a general-purpose constructor for creating quantization parameters with custom scale and zero point values. Useful for benchmarking and testing with specific parameter configurations.

Arguments
  • scale - Scale factor for the quantization
  • zero_point - Zero point for the quantization
Examples
use torsh_backend::quantization::QuantizationParams;

let params = QuantizationParams::new(255.0, 128);
assert_eq!(params.scale[0], 255.0);
assert_eq!(params.zero_point[0], 128);

pub fn uint8_asymmetric() -> Self

Create parameters for UINT8 asymmetric quantization

UInt8 asymmetric quantization is commonly used for activations, especially after ReLU layers where values are non-negative. The zero point is typically set to 128 for balanced range utilization.

Examples
use torsh_backend::quantization::QuantizationParams;

let params = QuantizationParams::uint8_asymmetric();
assert_eq!(params.zero_point[0], 128);

pub fn int4_symmetric() -> Self

Create parameters for INT4 symmetric quantization

INT4 quantization provides extreme compression at the cost of accuracy. Symmetric INT4 is often used for weights in models where 4-bit precision is sufficient.

Examples
use torsh_backend::quantization::QuantizationParams;

let params = QuantizationParams::int4_symmetric();
assert_eq!(params.dtype.bits(), 4);

pub fn channel_wise(num_channels: usize, dtype: QuantizedDType) -> Self

Create parameters for channel-wise quantization

Channel-wise quantization applies different quantization parameters to each channel, providing better accuracy for models with varying channel sensitivities at the cost of increased parameter storage.

Arguments
  • num_channels - Number of channels in the tensor
  • dtype - Quantization data type to use
Examples
use torsh_backend::quantization::{QuantizationParams, QuantizedDType};

let params = QuantizationParams::channel_wise(64, QuantizedDType::Int8);
assert_eq!(params.scale.len(), 64);
assert_eq!(params.zero_point.len(), 64);

pub fn block_wise(block_size: usize, dtype: QuantizedDType) -> Self

Create parameters for block-wise quantization

Block-wise quantization divides the tensor into blocks and applies different quantization parameters to each block. This can provide better accuracy than tensor-wise quantization while being more memory-efficient than channel-wise quantization.

Arguments
  • block_size - Size of each quantization block
  • dtype - Quantization data type to use
Examples
use torsh_backend::quantization::{QuantizationParams, QuantizedDType};

let params = QuantizationParams::block_wise(128, QuantizedDType::Int8);
assert_eq!(params.block_size, Some(128));

pub fn from_statistics(&mut self, min_val: f32, max_val: f32) -> BackendResult<()>

Calculate quantization parameters from input statistics

Computes the optimal scale and zero point parameters based on the observed minimum and maximum values in the data. The calculation depends on the quantization scheme being used.

Arguments
  • min_val - Minimum value observed in the data
  • max_val - Maximum value observed in the data
Returns

Returns Ok(()) if parameters were calculated successfully, or an error if the statistics are invalid.

Examples
use torsh_backend::quantization::QuantizationParams;

let mut params = QuantizationParams::int8_symmetric();
params.from_statistics(-2.0, 2.0).unwrap();
// Scale will be calculated to map [-2.0, 2.0] to [-128, 127]
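As an illustration of what a symmetric INT8 calculation typically computes, here is a standalone sketch under the assumption that the crate follows the common max-magnitude rule; its exact formula may differ:

```rust
// Typical symmetric INT8 scale: map the largest observed magnitude onto 127,
// so that max(|min_val|, |max_val|) dequantizes from the extreme code.
fn symmetric_int8_scale(min_val: f32, max_val: f32) -> f32 {
    min_val.abs().max(max_val.abs()) / 127.0
}

fn main() {
    let scale = symmetric_int8_scale(-2.0, 2.0);
    // With range [-2.0, 2.0], the value 2.0 lands exactly on code 127.
    assert_eq!((2.0_f32 / scale).round() as i32, 127);
    println!("scale = {scale}");
}
```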

pub fn validate(&self) -> BackendResult<()>

Validate that the parameters are consistent and usable

Checks that all parameter vectors have consistent lengths, scale factors are positive, and zero points are within valid ranges.
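The checks described can be sketched in standalone Rust. This is a simplified assumption of the rules; validate itself takes no arguments and reads the struct's own fields:

```rust
// Simplified consistency checks: matching vector lengths and positive,
// finite scale factors. The crate's validate may check more than this.
fn validate(scale: &[f32], zero_point: &[i32]) -> Result<(), String> {
    if scale.len() != zero_point.len() {
        return Err("scale/zero_point length mismatch".into());
    }
    if scale.iter().any(|&s| s <= 0.0 || !s.is_finite()) {
        return Err("scale factors must be positive and finite".into());
    }
    Ok(())
}

fn main() {
    assert!(validate(&[0.05, 0.1], &[0, 0]).is_ok());
    assert!(validate(&[0.05], &[0, 0]).is_err()); // length mismatch
    assert!(validate(&[-1.0], &[0]).is_err());    // non-positive scale
    println!("ok");
}
```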


pub fn num_parameter_sets(&self) -> usize

Get the effective number of quantization parameter sets

Returns the number of independent parameter sets (scale/zero_point pairs) that this configuration represents. For tensor-wise quantization this is 1, for channel-wise it’s the number of channels.
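The counting logic can be sketched as follows. This is an assumption based on the description above, with illustrative parameters rather than the struct's fields:

```rust
// Number of independent (scale, zero_point) pairs per granularity:
// channel-wise -> one per channel; block-wise -> one per block (rounded up);
// tensor-wise -> a single pair.
fn param_sets(num_elements: usize, num_channels: Option<usize>, block_size: Option<usize>) -> usize {
    match (num_channels, block_size) {
        (Some(c), _) => c,
        (None, Some(b)) => num_elements.div_ceil(b),
        (None, None) => 1,
    }
}

fn main() {
    assert_eq!(param_sets(4096, None, None), 1);        // tensor-wise
    assert_eq!(param_sets(4096, Some(64), None), 64);   // channel-wise
    assert_eq!(param_sets(4096, None, Some(128)), 32);  // block-wise
    println!("ok");
}
```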


pub fn is_per_channel(&self) -> bool

Check if this configuration uses per-channel parameters


pub fn quantization_error_bound(&self) -> f32

Get the quantization error bound for this configuration

Returns the maximum possible quantization error (in the original floating-point scale) for this quantization configuration.
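Assuming the bound is the usual half-step of round-to-nearest quantization (scale / 2; the crate may also account for clipping), a standalone sketch:

```rust
// Worst-case rounding error for round-to-nearest is half a quantization step.
fn error_bound(scale: f32) -> f32 {
    scale / 2.0
}

fn main() {
    let scale = 2.0 / 127.0; // e.g. symmetric INT8 over [-2.0, 2.0]
    let bound = error_bound(scale);
    // Empirical check: values across the range round-trip within the bound.
    for i in -200..=200 {
        let x = i as f32 * 0.01; // covers [-2.0, 2.0], no clipping occurs
        let q = (x / scale).round().clamp(-128.0, 127.0);
        assert!((q * scale - x).abs() <= bound + 1e-6);
    }
    println!("bound = {bound}");
}
```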


pub fn compression_ratio(&self) -> f32

Calculate the compression ratio achieved by this quantization

Returns the ratio of original size to quantized size. Assumes the original data was 32-bit floating point.
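For 32-bit float sources the ratio reduces to 32 / bits, ignoring the overhead of storing scales and zero points. A standalone sketch:

```rust
// Compression ratio relative to f32 storage: 32 bits / quantized bits.
// (Ignores the metadata cost of scales and zero points.)
fn compression_ratio(bits: u32) -> f32 {
    32.0 / bits as f32
}

fn main() {
    assert_eq!(compression_ratio(8), 4.0); // INT8: 4x smaller
    assert_eq!(compression_ratio(4), 8.0); // INT4: 8x smaller
    println!("ok");
}
```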

Trait Implementations

impl Clone for QuantizationParams

fn clone(&self) -> QuantizationParams

Returns a duplicate of the value.

fn clone_from(&mut self, source: &Self)

Performs copy-assignment from source.

impl Debug for QuantizationParams

fn fmt(&self, f: &mut Formatter<'_>) -> Result

Formats the value using the given formatter.

impl Default for QuantizationParams

fn default() -> Self

Default quantization parameters

Creates parameters for UInt8 linear quantization with scale=1.0 and zero_point=0, suitable for testing and initialization.
