Struct QuantizedTensor

Source

pub struct QuantizedTensor {
    pub data: Vec<u8>,
    pub shape: Vec<usize>,
    pub params: QuantizationParams,
    pub device: Device,
}

Expand description

Quantized tensor representation

Represents a tensor that has been quantized to a lower-precision format. The data is stored as raw bytes with associated quantization parameters that define how to interpret and convert the data back to floating-point.

Fields§

§data: Vec<u8>

Quantized data stored as raw bytes

The data layout depends on the quantization type:

- For 8-bit and 16-bit types: one value per element
- For 4-bit types: two values packed per byte
- For binary: eight values packed per byte

§shape: Vec<usize>

Original tensor shape

Maintains the logical shape of the tensor for operations. The total number of elements is the product of all dimensions.

§params: QuantizationParams

Quantization parameters

Contains all information needed to convert between quantized and floating-point representations, including scale factors, zero points, and metadata about the quantization scheme.

§device: Device

Device where tensor is stored

Indicates whether the tensor data resides in CPU memory, GPU memory, or other accelerator memory.

Struct QuantizedTensor

Fields§

Implementations§

impl QuantizedTensor

pub fn new( shape: Vec<usize>, params: QuantizationParams, device: Device, ) -> Self

§Arguments

§Examples

pub fn from_data( data: Vec<u8>, shape: Vec<usize>, params: QuantizationParams, device: Device, ) -> BackendResult<Self>

§Arguments

§Returns

pub fn num_elements(&self) -> usize

§Examples

pub fn memory_usage(&self) -> usize

§Examples

pub fn shape(&self) -> &[usize]

pub fn ndim(&self) -> usize

pub fn is_empty(&self) -> bool

pub fn size(&self, dim: usize) -> BackendResult<usize>

pub fn reshape(&self, new_shape: Vec<usize>) -> BackendResult<QuantizedTensor>

§Arguments

§Returns

pub fn view( &self, new_shape: Vec<usize>, ) -> BackendResult<QuantizedTensorView<'_>>

pub fn to_device(&self, device: Device) -> BackendResult<QuantizedTensor>

pub fn data_slice(&self, start: usize, len: usize) -> BackendResult<&[u8]>

§Arguments

§Safety

pub fn data_slice_mut( &mut self, start: usize, len: usize, ) -> BackendResult<&mut [u8]>

§Arguments

§Safety

pub fn storage_efficiency(&self) -> f32

pub fn compression_ratio(&self) -> f32

pub fn validate(&self) -> BackendResult<()>

Trait Implementations§

impl Clone for QuantizedTensor

fn clone(&self) -> QuantizedTensor

fn clone_from(&mut self, source: &Self)

impl Debug for QuantizedTensor

fn fmt(&self, f: &mut Formatter<'_>) -> Result

Auto Trait Implementations§

impl Freeze for QuantizedTensor

impl RefUnwindSafe for QuantizedTensor

impl Send for QuantizedTensor

impl Sync for QuantizedTensor

impl Unpin for QuantizedTensor

impl UnsafeUnpin for QuantizedTensor

impl UnwindSafe for QuantizedTensor

Blanket Implementations§

impl<T> Any for T where T: 'static + ?Sized,

fn type_id(&self) -> TypeId

impl<T> Borrow<T> for T where T: ?Sized,

fn borrow(&self) -> &T

impl<T> BorrowMut<T> for T where T: ?Sized,

fn borrow_mut(&mut self) -> &mut T

impl<T> CloneToUninit for T where T: Clone,

unsafe fn clone_to_uninit(&self, dest: *mut u8)

impl<T> From<T> for T

fn from(t: T) -> T

impl<T, U> Into<U> for T where U: From<T>,

fn into(self) -> U

impl<T> IntoEither for T

fn into_either(self, into_left: bool) -> Either<Self, Self>

fn into_either_with<F>(self, into_left: F) -> Either<Self, Self> where F: FnOnce(&Self) -> bool,

impl<T> Pointable for T

const ALIGN: usize

type Init = T

unsafe fn init(init: <T as Pointable>::Init) -> usize

unsafe fn deref<'a>(ptr: usize) -> &'a T

unsafe fn deref_mut<'a>(ptr: usize) -> &'a mut T

unsafe fn drop(ptr: usize)

impl<T> ToOwned for T where T: Clone,

type Owned = T

fn to_owned(&self) -> T

fn clone_into(&self, target: &mut T)

impl<T, U> TryFrom<U> for T where U: Into<T>,

type Error = Infallible

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

impl<T, U> TryInto<U> for T where U: TryFrom<T>,

type Error = <U as TryFrom<T>>::Error

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

impl<V, T> VZip<V> for T where V: MultiLane<T>,

Struct QuantizedTensor

impl<T> Any for T
where T: 'static + ?Sized,

impl<T> Borrow<T> for T
where T: ?Sized,

impl<T> BorrowMut<T> for T
where T: ?Sized,

impl<T> CloneToUninit for T
where T: Clone,

impl<T, U> Into<U> for T
where U: From<T>,

fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
where F: FnOnce(&Self) -> bool,

impl<T> ToOwned for T
where T: Clone,

impl<T, U> TryFrom<U> for T
where U: Into<T>,

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,

impl<V, T> VZip<V> for T
where V: MultiLane<T>,