Struct QuantizedMatmulIdParams

Source

pub struct QuantizedMatmulIdParams {
    pub m: u32,
    pub k: u32,
    pub n: u32,
    pub group_size: u32,
    pub bits: u32,
    pub n_expert_used: u32,
    pub num_experts: u32,
}

Expand description

Parameters describing the expert-routed quantized matmul dimensions.

Fields§

§m: u32

Number of input rows (tokens).

§k: u32

Inner dimension (shared between input and weight).

§n: u32

Number of output columns per expert.

§group_size: u32

Number of consecutive values sharing one scale/bias pair.

§bits: u32

Quantization bit width (4, 6, or 8).

§n_expert_used: u32

Number of experts each token is routed to (top-k).

§num_experts: u32

Total number of experts in the weight tensor.

Trait Implementations§

Source §

impl Clone for QuantizedMatmulIdParams

Source §

fn clone(&self) -> QuantizedMatmulIdParams

Returns a duplicate of the value. Read more

1.0.0 · Source§

fn clone_from(&mut self, source: &Self)

Performs copy-assignment from source. Read more

Source §

impl Debug for QuantizedMatmulIdParams

Source §

fn fmt(&self, f: &mut Formatter<'_>) -> Result

Formats the value using the given formatter. Read more

Source §

impl Copy for QuantizedMatmulIdParams

Auto Trait Implementations§

§

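impl Freeze for QuantizedMatmulIdParams

§

impl RefUnwindSafe for QuantizedMatmulIdParams

§

impl Send for QuantizedMatmulIdParams

§

impl Sync for QuantizedMatmulIdParams

§

impl Unpin for QuantizedMatmulIdParams

§

impl UnsafeUnpin for QuantizedMatmulIdParams

§

impl UnwindSafe for QuantizedMatmulIdParams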

Blanket Implementations§

Source §

impl<T> Any for T
where T: 'static + ?Sized,

Source §

fn type_id(&self) -> TypeId

Gets the TypeId of self. Read more

Source §

impl<T> Borrow<T> for T
where T: ?Sized,

Source §

fn borrow(&self) -> &T

Immutably borrows from an owned value. Read more

Source §

impl<T> BorrowMut<T> for T
where T: ?Sized,

Source §

fn borrow_mut(&mut self) -> &mut T

Mutably borrows from an owned value. Read more

Source §

impl<T> CloneToUninit for T
where T: Clone,

Source §

unsafe fn clone_to_uninit(&self, dest: *mut u8)

🔬This is a nightly-only experimental API. (clone_to_uninit)

Performs copy-assignment from self to dest. Read more

Source §

impl<T> From<T> for T

Source §

fn from(t: T) -> T

Returns the argument unchanged.

Source §

impl<T, U> Into<U> for T
where U: From<T>,

Source §

fn into(self) -> U

Calls U::from(self).

That is, this conversion is whatever the implementation of From<T> for U chooses to do.

Source §

impl<T> ToOwned for T
where T: Clone,

Source §

type Owned = T

The resulting type after obtaining ownership.

Source §

fn to_owned(&self) -> T

Creates owned data from borrowed data, usually by cloning. Read more

Source §

fn clone_into(&self, target: &mut T)

Uses borrowed data to replace owned data, usually by cloning. Read more

Source §

impl<T, U> TryFrom<U> for T
where U: Into<T>,

Source §

type Error = Infallible

The type returned in the event of a conversion error.

Source §

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

Performs the conversion.

Source §

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,

Source §

type Error = <U as TryFrom<T>>::Error

The type returned in the event of a conversion error.

Source §

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

Performs the conversion.

QuantizedMatmulIdParams

Struct QuantizedMatmulIdParams Copy item path

Fields§

Trait Implementations§

impl Clone for QuantizedMatmulIdParams

fn clone(&self) -> QuantizedMatmulIdParams

fn clone_from(&mut self, source: &Self)

impl Debug for QuantizedMatmulIdParams

fn fmt(&self, f: &mut Formatter<'_>) -> Result

impl Copy for QuantizedMatmulIdParams

Auto Trait Implementations§

impl Freeze for QuantizedMatmulIdParams

impl RefUnwindSafe for QuantizedMatmulIdParams

impl Send for QuantizedMatmulIdParams

impl Sync for QuantizedMatmulIdParams

impl Unpin for QuantizedMatmulIdParams

impl UnsafeUnpin for QuantizedMatmulIdParams

impl UnwindSafe for QuantizedMatmulIdParams

Blanket Implementations§

impl<T> Any for T where T: 'static + ?Sized,

fn type_id(&self) -> TypeId

impl<T> Borrow<T> for T where T: ?Sized,

fn borrow(&self) -> &T

impl<T> BorrowMut<T> for T where T: ?Sized,

fn borrow_mut(&mut self) -> &mut T

impl<T> CloneToUninit for T where T: Clone,

unsafe fn clone_to_uninit(&self, dest: *mut u8)

impl<T> From<T> for T

fn from(t: T) -> T

impl<T, U> Into<U> for T where U: From<T>,

fn into(self) -> U

impl<T> ToOwned for T where T: Clone,

type Owned = T

fn to_owned(&self) -> T

fn clone_into(&self, target: &mut T)

impl<T, U> TryFrom<U> for T where U: Into<T>,

type Error = Infallible

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

impl<T, U> TryInto<U> for T where U: TryFrom<T>,

type Error = <U as TryFrom<T>>::Error

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

Struct QuantizedMatmulIdParams

impl<T> Any for T
where T: 'static + ?Sized,

impl<T> Borrow<T> for T
where T: ?Sized,

impl<T> BorrowMut<T> for T
where T: ?Sized,

impl<T> CloneToUninit for T
where T: Clone,

impl<T, U> Into<U> for T
where U: From<T>,

impl<T> ToOwned for T
where T: Clone,

impl<T, U> TryFrom<U> for T
where U: Into<T>,

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,