Enum QuantizationArguments

Source

/// Arguments controlling how a floating-point tensor is quantized into an
/// integer representation.
///
/// Every variant follows the same conceptual formula,
/// `result = (tensor / scale) + zero_point`; the variants differ in whether
/// the scale and zero-point are supplied as scalars or as tensors, and in
/// whether the scaling is applied per-axis.
pub enum QuantizationArguments<'a> {
    /// Quantize using a scalar scale and a scalar zero-point.
    ScaleZeroPointDataType {
        /// Scale scalar parameter.
        scale: f64,
        /// Bias scalar parameter (converted to the data type of the result tensor).
        zero_point: i64,
        /// Integer data type of the result tensor.
        data_type: DataType,
    },
    /// Quantize using a per-axis scale tensor and a scalar zero-point.
    ScaleTensorZeroPointDataTypeAxis {
        /// 1D scale tensor with size == `tensor.shape[axis]`.
        scale_tensor: &'a Tensor,
        /// Bias scalar parameter (converted to the data type of the result tensor).
        // NOTE(review): this is `f64` while the scalar-only variant takes an
        // `i64` zero-point — confirm the difference is intentional.
        zero_point: f64,
        /// Integer data type of the result tensor.
        data_type: DataType,
        /// Axis along which the 1D scale values are broadcast.
        axis: i64,
    },
    /// Quantize using a per-axis scale tensor and a per-axis zero-point tensor.
    ScaleTensorZeroPointTensorDataTypeAxis {
        /// Scalar or 1D scale tensor with size == `tensor.shape[axis]`.
        scale_tensor: &'a Tensor,
        /// Scalar or 1D bias tensor with size == `tensor.shape[axis]`.
        zero_point_tensor: &'a Tensor,
        /// Integer data type of the result tensor.
        data_type: DataType,
        /// Axis along which the 1D scale values are broadcast.
        axis: i64,
    },
}

Expand description

Arguments controlling how a floating-point tensor is quantized into an integer representation.

All variants follow the same conceptual formula but differ in whether the scale and zero-point are provided as scalars or tensors and whether the scaling is applied per-axis.

Variants§

§

ScaleZeroPointDataType

Quantize using scalar scale / zero_point.

§Details

Formula: result = (tensor / scale) + zero_point.

Fields

§scale: f64

Scale scalar parameter

§zero_point: i64

Bias scalar parameter (converted to the data_type of the result tensor)

§data_type: DataType

Integer data type of the result tensor.

§

ScaleTensorZeroPointDataTypeAxis

Quantize using a per-axis scale_tensor and scalar zero_point.

§Details

Formula: result = (tensor / scale_tensor) + zero_point.

Fields

§scale_tensor: &'a Tensor

Scale 1D Tensor parameter with size == tensor.shape[axis]

§zero_point: f64

Bias scalar parameter (converted to the data_type of the result tensor)

§data_type: DataType

Integer data type of the result tensor.

§axis: i64

Axis along which the 1D scale values are broadcast

§

ScaleTensorZeroPointTensorDataTypeAxis

Quantize using per-axis scale_tensor and zero_point_tensor.

§Details

Formula: result = (tensor / scale_tensor) + zero_point_tensor.

Fields

§scale_tensor: &'a Tensor

Scale scalar or 1D Tensor parameter with size == tensor.shape[axis]

§zero_point_tensor: &'a Tensor

Bias scalar or 1D Tensor parameter with size == tensor.shape[axis]

§data_type: DataType

Integer data type of the result tensor.

§axis: i64

Axis along which the 1D scale and zero-point values are broadcast

Auto Trait Implementations§

§

impl<'a> UnsafeUnpin for QuantizationArguments<'a>

Blanket Implementations§

Source §

impl<T> Any for T
where T: 'static + ?Sized,

Source §

fn type_id(&self) -> TypeId

Gets the TypeId of self. Read more

Source §

impl<T> AutoreleaseSafe for T
where T: ?Sized,

Source §

impl<T> Borrow<T> for T
where T: ?Sized,

Source §

fn borrow(&self) -> &T

Immutably borrows from an owned value. Read more

Source §

impl<T> BorrowMut<T> for T
where T: ?Sized,

Source §

fn borrow_mut(&mut self) -> &mut T

Mutably borrows from an owned value. Read more

Source §

impl<T> From<T> for T

Source §

fn from(t: T) -> T

Returns the argument unchanged.

Source §

impl<T, U> Into<U> for T
where U: From<T>,

Source §

fn into(self) -> U

Calls U::from(self).

That is, this conversion is whatever the implementation of From<T> for U chooses to do.

Source §

impl<T, U> TryFrom<U> for T
where U: Into<T>,

Source §

type Error = Infallible

The type returned in the event of a conversion error.

Source §

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

Performs the conversion.

Source §

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,

Source §

type Error = <U as TryFrom<T>>::Error

The type returned in the event of a conversion error.

Source §

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

Performs the conversion.

QuantizationArguments

Enum QuantizationArguments

Variants§

ScaleZeroPointDataType

§Details

Fields

ScaleTensorZeroPointDataTypeAxis

§Details

Fields

ScaleTensorZeroPointTensorDataTypeAxis

§Details

Fields

Auto Trait Implementations§

impl<'a> !RefUnwindSafe for QuantizationArguments<'a>

impl<'a> !Send for QuantizationArguments<'a>

impl<'a> !Sync for QuantizationArguments<'a>

impl<'a> !UnwindSafe for QuantizationArguments<'a>

impl<'a> Freeze for QuantizationArguments<'a>

impl<'a> Unpin for QuantizationArguments<'a>

impl<'a> UnsafeUnpin for QuantizationArguments<'a>

Blanket Implementations§

impl<T> Any for T
where T: 'static + ?Sized,

fn type_id(&self) -> TypeId

impl<T> AutoreleaseSafe for T
where T: ?Sized,

impl<T> Borrow<T> for T
where T: ?Sized,

fn borrow(&self) -> &T

impl<T> BorrowMut<T> for T
where T: ?Sized,

fn borrow_mut(&mut self) -> &mut T

impl<T> From<T> for T

fn from(t: T) -> T

impl<T, U> Into<U> for T
where U: From<T>,

fn into(self) -> U

impl<T, U> TryFrom<U> for T
where U: Into<T>,

type Error = Infallible

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,

type Error = <U as TryFrom<T>>::Error

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

QuantizationArguments

Enum QuantizationArguments

Variants§

ScaleZeroPointDataType

§Details

Fields

ScaleTensorZeroPointDataTypeAxis

§Details

Fields

ScaleTensorZeroPointTensorDataTypeAxis

§Details

Fields

Auto Trait Implementations§

impl<'a> !RefUnwindSafe for QuantizationArguments<'a>

impl<'a> !Send for QuantizationArguments<'a>

impl<'a> !Sync for QuantizationArguments<'a>

impl<'a> !UnwindSafe for QuantizationArguments<'a>

impl<'a> Freeze for QuantizationArguments<'a>

impl<'a> Unpin for QuantizationArguments<'a>

impl<'a> UnsafeUnpin for QuantizationArguments<'a>

Blanket Implementations§

impl<T> Any for T where T: 'static + ?Sized,

fn type_id(&self) -> TypeId

impl<T> AutoreleaseSafe for T where T: ?Sized,

impl<T> Borrow<T> for T where T: ?Sized,

fn borrow(&self) -> &T

impl<T> BorrowMut<T> for T where T: ?Sized,

fn borrow_mut(&mut self) -> &mut T

impl<T> From<T> for T

fn from(t: T) -> T

impl<T, U> Into<U> for T where U: From<T>,

fn into(self) -> U

impl<T, U> TryFrom<U> for T where U: Into<T>,

type Error = Infallible

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

impl<T, U> TryInto<U> for T where U: TryFrom<T>,

type Error = <U as TryFrom<T>>::Error

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

Enum QuantizationArguments

impl<T> Any for T
where T: 'static + ?Sized,

impl<T> AutoreleaseSafe for T
where T: ?Sized,

impl<T> Borrow<T> for T
where T: ?Sized,

impl<T> BorrowMut<T> for T
where T: ?Sized,

impl<T, U> Into<U> for T
where U: From<T>,

impl<T, U> TryFrom<U> for T
where U: Into<T>,

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,