pub struct QuantizedLinear { /* private fields */ }
Quantized Linear Layer
Performs matrix multiplication in INT8: output = (input @ weights^T + bias) * scale
Implementations§
impl QuantizedLinear
pub fn from_fp32(linear: &Linear, input_scale: f32) -> Self
Creates a QuantizedLinear from an FP32 Linear layer.
§Arguments
linear - FP32 linear layer to quantize
input_scale - Expected input activation scale
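The crate's quantization scheme is not shown on this page; a common choice for a `from_fp32`-style conversion is symmetric per-tensor quantization of the weights into the i8 range. The sketch below is an assumption of that scheme (the function name and the use of a single per-tensor scale are illustrative, not the crate's actual internals):

```rust
/// Symmetric per-tensor quantization sketch: maps FP32 weights to i8
/// so that the largest-magnitude weight lands on ±127.
fn quantize_weights(weights: &[f32]) -> (Vec<i8>, f32) {
    let max_abs = weights.iter().fold(0.0f32, |m, &w| m.max(w.abs()));
    // Guard against an all-zero weight tensor.
    let scale = if max_abs == 0.0 { 1.0 } else { max_abs / 127.0 };
    let q = weights
        .iter()
        .map(|&w| (w / scale).round().clamp(-127.0, 127.0) as i8)
        .collect();
    (q, scale)
}

fn main() {
    // -1.0 has the largest magnitude, so it maps to -127.
    let (q, scale) = quantize_weights(&[0.5, -1.0, 0.25]);
    println!("{q:?} scale={scale}");
}
```

Dequantizing a stored i8 weight is then just `w_q as f32 * scale`, which is what makes the `* scale` term in the layer's output formula work.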
pub fn forward_int8(
    &self,
    input: &[u8],
    batch_size: usize,
    input_scale: f32,
    input_zero_point: u8,
) -> CnnResult<Tensor>
Forward pass with INT8 computation
§Arguments
input - Quantized u8 input tensor [batch, in_features]
batch_size - Batch size
input_scale - Input quantization scale
input_zero_point - Input quantization zero point
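A minimal sketch of what an INT8 forward pass with a zero point typically computes for one output feature, following the formula above (`output = (input @ weights^T + bias) * scale` with `scale = input_scale * weight_scale`). All names here are assumptions for illustration; the real layer operates on whole `[batch, in_features]` tensors and stores its own quantized weights:

```rust
/// Illustrative single-output INT8 linear step (not the crate's code).
/// `weights` and `bias_q` stand in for the layer's stored quantized
/// parameters; `weight_scale` is an assumed per-tensor scale.
fn forward_one(
    input: &[u8],        // quantized activations for one sample
    input_scale: f32,
    input_zero_point: u8,
    weights: &[i8],      // quantized weights for one output feature
    weight_scale: f32,
    bias_q: i32,         // bias pre-quantized into the accumulator domain
) -> f32 {
    // Accumulate in i32 so the u8 × i8 products cannot overflow.
    let acc: i32 = input
        .iter()
        .zip(weights)
        .map(|(&x, &w)| (x as i32 - input_zero_point as i32) * w as i32)
        .sum();
    // (input @ weights^T + bias) * scale
    (acc + bias_q) as f32 * input_scale * weight_scale
}

fn main() {
    // Centered inputs are [2, -2]; dot with [3, 1] gives 4, plus bias 5,
    // rescaled by 0.5 * 0.1 → approximately 0.45.
    let y = forward_one(&[130, 126], 0.5, 128, &[3, 1], 0.1, 5);
    println!("{y}");
}
```

Subtracting `input_zero_point` before the multiply is what lets an unsigned `u8` activation represent signed values; skipping it would silently shift every output.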
pub fn in_features(&self) -> usize
Returns the number of input features.
pub fn out_features(&self) -> usize
Returns the number of output features.
Trait Implementations§
impl Clone for QuantizedLinear
fn clone(&self) -> QuantizedLinear
Returns a duplicate of the value.
fn clone_from(&mut self, source: &Self)
Performs copy-assignment from source.
Auto Trait Implementations§
impl Freeze for QuantizedLinear
impl RefUnwindSafe for QuantizedLinear
impl Send for QuantizedLinear
impl Sync for QuantizedLinear
impl Unpin for QuantizedLinear
impl UnsafeUnpin for QuantizedLinear
impl UnwindSafe for QuantizedLinear
Blanket Implementations§
impl<T> BorrowMut<T> for T
where
    T: ?Sized,
fn borrow_mut(&mut self) -> &mut T
Mutably borrows from an owned value.