Struct QuantizationMetadata

Source

pub struct QuantizationMetadata {
    pub scheme: QuantizationScheme,
    pub group_size: u32,
    pub scale_bits: u16,
    pub zero_point: i8,
    pub has_per_group_scales: bool,
}

Expand description

Quantization metadata for HCT v2.

Contains information needed to dequantize INT4/INT8 weights.

Fields§

§scheme: QuantizationScheme

Quantization scheme used.

§group_size: u32

Group size for group-wise quantization (0 = per-tensor).

§scale_bits: u16

Global scale factor (f16 stored as u16 bits).

§zero_point: i8

Global zero point (for asymmetric quantization).

§has_per_group_scales: bool

Whether per-group scales are stored after compressed data.

Implementations§

Source §

impl QuantizationMetadata

Source

pub const SIZE: usize = 8

Size of quantization metadata in bytes.

Source

pub fn to_bytes(&self) -> [u8; 8]

Serialize to bytes.

Source

pub fn from_bytes(buf: &[u8; 8]) -> Result<Self>

Parse from bytes.

Trait Implementations§

Source §

impl Clone for QuantizationMetadata

Source §

fn clone(&self) -> QuantizationMetadata

Returns a duplicate of the value. Read more

1.0.0 · Source§

fn clone_from(&mut self, source: &Self)

Performs copy-assignment from source. Read more

Source §

impl Debug for QuantizationMetadata

Source §

fn fmt(&self, f: &mut Formatter<'_>) -> Result

Formats the value using the given formatter. Read more

Source §

impl Default for QuantizationMetadata

Source §

fn default() -> QuantizationMetadata

Returns the “default value” for a type. Read more

Source §

impl PartialEq for QuantizationMetadata

Source §

fn eq(&self, other: &QuantizationMetadata) -> bool

Tests for self and other values to be equal, and is used by ==.

1.0.0 · Source§

fn ne(&self, other: &Rhs) -> bool

Tests for !=. The default implementation is almost always sufficient, and should not be overridden without very good reason.

Source §

impl StructuralPartialEq for QuantizationMetadata

Auto Trait Implementations§

§

impl UnwindSafe for QuantizationMetadata

Blanket Implementations§

Source §

impl<T> Any for T
where T: 'static + ?Sized,

Source §

fn type_id(&self) -> TypeId

Gets the TypeId of self. Read more

Source §

impl<T> Borrow<T> for T
where T: ?Sized,

Source §

fn borrow(&self) -> &T

Immutably borrows from an owned value. Read more

Source §

impl<T> BorrowMut<T> for T
where T: ?Sized,

Source §

fn borrow_mut(&mut self) -> &mut T

Mutably borrows from an owned value. Read more

Source §

impl<T> CloneToUninit for T
where T: Clone,

Source §

unsafe fn clone_to_uninit(&self, dest: *mut u8)

🔬This is a nightly-only experimental API. (clone_to_uninit)

Performs copy-assignment from self to dest. Read more

Source §

impl<T> From<T> for T

Source §

fn from(t: T) -> T

Returns the argument unchanged.

Source §

impl<T, U> Into<U> for T
where U: From<T>,

Source §

fn into(self) -> U

Calls U::from(self).

That is, this conversion is whatever the implementation of From<T> for U chooses to do.

Source §

impl<T> ToOwned for T
where T: Clone,

Source §

type Owned = T

The resulting type after obtaining ownership.

Source §

fn to_owned(&self) -> T

Creates owned data from borrowed data, usually by cloning. Read more

Source §

fn clone_into(&self, target: &mut T)

Uses borrowed data to replace owned data, usually by cloning. Read more

Source §

impl<T, U> TryFrom<U> for T
where U: Into<T>,

Source §

type Error = Infallible

The type returned in the event of a conversion error.

Source §

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

Performs the conversion.

Source §

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,

Source §

type Error = <U as TryFrom<T>>::Error

The type returned in the event of a conversion error.

Source §

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

Performs the conversion.

Struct QuantizationMetadata Copy item path

Fields§

Implementations§

impl QuantizationMetadata

pub const SIZE: usize = 8

pub fn to_bytes(&self) -> [u8; 8]

pub fn from_bytes(buf: &[u8; 8]) -> Result<Self>

Trait Implementations§

impl Clone for QuantizationMetadata

fn clone(&self) -> QuantizationMetadata

fn clone_from(&mut self, source: &Self)

impl Debug for QuantizationMetadata

fn fmt(&self, f: &mut Formatter<'_>) -> Result

impl Default for QuantizationMetadata

fn default() -> QuantizationMetadata

impl PartialEq for QuantizationMetadata

fn eq(&self, other: &QuantizationMetadata) -> bool

fn ne(&self, other: &Rhs) -> bool

impl StructuralPartialEq for QuantizationMetadata

Auto Trait Implementations§

impl Freeze for QuantizationMetadata

impl RefUnwindSafe for QuantizationMetadata

impl Send for QuantizationMetadata

impl Sync for QuantizationMetadata

impl Unpin for QuantizationMetadata

impl UnwindSafe for QuantizationMetadata

Blanket Implementations§

impl<T> Any for T where T: 'static + ?Sized,

fn type_id(&self) -> TypeId

impl<T> Borrow<T> for T where T: ?Sized,

fn borrow(&self) -> &T

impl<T> BorrowMut<T> for T where T: ?Sized,

fn borrow_mut(&mut self) -> &mut T

impl<T> CloneToUninit for T where T: Clone,

unsafe fn clone_to_uninit(&self, dest: *mut u8)

impl<T> From<T> for T

fn from(t: T) -> T

impl<T, U> Into<U> for T where U: From<T>,

fn into(self) -> U

impl<T> ToOwned for T where T: Clone,

type Owned = T

fn to_owned(&self) -> T

fn clone_into(&self, target: &mut T)

impl<T, U> TryFrom<U> for T where U: Into<T>,

type Error = Infallible

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

impl<T, U> TryInto<U> for T where U: TryFrom<T>,

type Error = <U as TryFrom<T>>::Error

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

Struct QuantizationMetadata

impl<T> Any for T
where T: 'static + ?Sized,

impl<T> Borrow<T> for T
where T: ?Sized,

impl<T> BorrowMut<T> for T
where T: ?Sized,

impl<T> CloneToUninit for T
where T: Clone,

impl<T, U> Into<U> for T
where U: From<T>,

impl<T> ToOwned for T
where T: Clone,

impl<T, U> TryFrom<U> for T
where U: Into<T>,

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,