Enum Dtype

Source

/// Element dtype tag.
///
/// Each variant names one element type; the widths stated below come from the
/// per-variant documentation of this type.
pub enum Dtype {
    /// 32-bit IEEE float. Default activation / weight dtype on the CPU path;
    /// fallback for backends without F16 hardware support.
    F32,
    /// 16-bit IEEE half. Hot-path dtype on CUDA + Metal
    /// (decode q, K/V, GEMM outputs).
    F16,
    /// 32-bit unsigned integer. Block tables, context lens, sorted token ids,
    /// args buffers — anything previously tunneled through an FP buffer via
    /// `alloc_u32` / `write_u32`.
    U32,
    /// 32-bit signed integer. Expert ids, position offsets, `cu_seqlens_q`,
    /// tpe (tokens-per-expert). Same byte width as `U32`; kept as a separate
    /// variant so kernel signatures (`device const int*` vs
    /// `device const uint*`) can stay type-honest at runtime.
    I32,
    /// 8-bit signed integer. INT8 quantized KV cache cells. Used by the paged
    /// stores of `KvCacheQuant<B, KvInt8>`.
    I8,
}

Variants§

§

F32

32-bit IEEE float. Default activation / weight dtype on the CPU path; fallback for backends without F16 hardware support.

§

F16

16-bit IEEE half. Hot-path dtype on CUDA + Metal (decode q, K/V, GEMM outputs).

§

U32

32-bit unsigned integer. Block tables, context lens, sorted token ids, args buffers — anything previously tunneled through an FP buffer via alloc_u32 / write_u32.

§

I32

32-bit signed integer. Expert ids, position offsets, cu_seqlens_q, tpe (tokens-per-expert). Same byte width as U32; separate variant so kernel signatures (device const int* vs device const uint*) can stay type-honest at runtime.

§

I8

8-bit signed integer. INT8 quantized KV cache cells. Used by KvCacheQuant<B, KvInt8>’s paged stores.

Enum Dtype Copy item path

Variants§

F32

F16

U32

I32

I8

Implementations§

impl Dtype

pub const fn bytes_per_elem(self) -> usize

pub const fn name(self) -> &'static str

Trait Implementations§

impl Clone for Dtype

fn clone(&self) -> Dtype

fn clone_from(&mut self, source: &Self)

impl Copy for Dtype

impl Debug for Dtype

fn fmt(&self, f: &mut Formatter<'_>) -> Result

impl Eq for Dtype

impl Hash for Dtype

fn hash<__H: Hasher>(&self, state: &mut __H)

fn hash_slice<H>(data: &[Self], state: &mut H) where H: Hasher, Self: Sized,

impl PartialEq for Dtype

fn eq(&self, other: &Dtype) -> bool

fn ne(&self, other: &Rhs) -> bool

impl StructuralPartialEq for Dtype

Auto Trait Implementations§

impl Freeze for Dtype

impl RefUnwindSafe for Dtype

impl Send for Dtype

impl Sync for Dtype

impl Unpin for Dtype

impl UnsafeUnpin for Dtype

impl UnwindSafe for Dtype

Blanket Implementations§

impl<T> Any for T where T: 'static + ?Sized,

fn type_id(&self) -> TypeId

impl<T> Borrow<T> for T where T: ?Sized,

fn borrow(&self) -> &T

impl<T> BorrowMut<T> for T where T: ?Sized,

fn borrow_mut(&mut self) -> &mut T

impl<T> CloneToUninit for T where T: Clone,

unsafe fn clone_to_uninit(&self, dest: *mut u8)

impl<T> From<T> for T

fn from(t: T) -> T

impl<T> Instrument for T

fn instrument(self, span: Span) -> Instrumented<Self>

fn in_current_span(self) -> Instrumented<Self>

impl<T, U> Into<U> for T where U: From<T>,

fn into(self) -> U

impl<T> Same for T

type Output = T

impl<T> ToOwned for T where T: Clone,

type Owned = T

fn to_owned(&self) -> T

fn clone_into(&self, target: &mut T)

impl<T, U> TryFrom<U> for T where U: Into<T>,

type Error = Infallible

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

impl<T, U> TryInto<U> for T where U: TryFrom<T>,

type Error = <U as TryFrom<T>>::Error

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

impl<V, T> VZip<V> for T where V: MultiLane<T>,

fn vzip(self) -> V

impl<T> WithSubscriber for T

fn with_subscriber<S>(self, subscriber: S) -> WithDispatch<Self> where S: Into<Dispatch>,

fn with_current_subscriber(self) -> WithDispatch<Self>

Enum Dtype

fn hash<H: Hasher>(&self, state: &mut H)

fn hash_slice<H>(data: &[Self], state: &mut H)
where H: Hasher, Self: Sized,

impl<T> Any for T
where T: 'static + ?Sized,

impl<T> Borrow<T> for T
where T: ?Sized,

impl<T> BorrowMut<T> for T
where T: ?Sized,

impl<T> CloneToUninit for T
where T: Clone,

impl<T, U> Into<U> for T
where U: From<T>,

impl<T> ToOwned for T
where T: Clone,

impl<T, U> TryFrom<U> for T
where U: Into<T>,

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,

impl<V, T> VZip<V> for T
where V: MultiLane<T>,

fn with_subscriber<S>(self, subscriber: S) -> WithDispatch<Self>
where S: Into<Dispatch>,