Struct Fp8E4M3

Source

#[repr(transparent)]
pub struct Fp8E4M3(pub u8);

Expand description

8-bit floating-point, E4M3 encoding (1 sign + 4 exponent + 3 mantissa, exponent bias 7).

#[repr(transparent)] around u8 storage — bit-compatible with __nv_fp8_storage_t on the CUDA side and with float8::F8E4M3 on the host side. A DeviceBuffer<u8> (byte substrate) can be reinterpreted as DeviceBuffer<Fp8E4M3> via view_as without copying.

Numerical range: ±448 (max finite). One NaN encoding only (S.1111.111); E4M3 has no infinities. The conversion path matches NVIDIA’s __nv_cvt_float_to_fp8(x, __NV_SATFINITE, __NV_E4M3): round-half-to-even, saturating-to-max-finite on overflow.

Routes through Ada Lovelace FP8 tensor cores (mma.sync.aligned.m16n8k32.row.col.f32.e4m3.e4m3.f32) with F32 accumulation and float alpha / beta scaling. First landed in baracuda-kernels Phase 2.

Tuple Fields§

§0: u8

Struct Fp8E4M3 Copy item path

Tuple Fields§

Implementations§

impl Fp8E4M3

pub fn from_f32(x: f32) -> Fp8E4M3

pub fn to_f32(self) -> f32

Trait Implementations§

impl Clone for Fp8E4M3

fn clone(&self) -> Fp8E4M3

fn clone_from(&mut self, source: &Self)

impl Copy for Fp8E4M3

impl Debug for Fp8E4M3

fn fmt(&self, f: &mut Formatter<'_>) -> Result<(), Error>

impl Default for Fp8E4M3

fn default() -> Fp8E4M3

impl DeviceRepr for Fp8E4M3

impl Eq for Fp8E4M3

impl FpElement for Fp8E4M3

impl Hash for Fp8E4M3

fn hash<__H>(&self, state: &mut __H) where __H: Hasher,

fn hash_slice<H>(data: &[Self], state: &mut H) where H: Hasher, Self: Sized,

impl KernelDtype for Fp8E4M3

const KIND: ElementKind = ElementKind::Fp8E4M3

impl Ord for Fp8E4M3

fn cmp(&self, other: &Fp8E4M3) -> Ordering

fn max(self, other: Self) -> Self where Self: Sized,

fn min(self, other: Self) -> Self where Self: Sized,

fn clamp(self, min: Self, max: Self) -> Self where Self: Sized,

impl PartialEq for Fp8E4M3

fn eq(&self, other: &Fp8E4M3) -> bool

fn ne(&self, other: &Rhs) -> bool

impl PartialOrd for Fp8E4M3

fn partial_cmp(&self, other: &Fp8E4M3) -> Option<Ordering>

fn lt(&self, other: &Rhs) -> bool

fn le(&self, other: &Rhs) -> bool

fn gt(&self, other: &Rhs) -> bool

fn ge(&self, other: &Rhs) -> bool

impl StructuralPartialEq for Fp8E4M3

Auto Trait Implementations§

impl Freeze for Fp8E4M3

impl RefUnwindSafe for Fp8E4M3

impl Send for Fp8E4M3

impl Sync for Fp8E4M3

impl Unpin for Fp8E4M3

impl UnsafeUnpin for Fp8E4M3

impl UnwindSafe for Fp8E4M3

Blanket Implementations§

impl<T> Any for T where T: 'static + ?Sized,

fn type_id(&self) -> TypeId

impl<T> Borrow<T> for T where T: ?Sized,

fn borrow(&self) -> &T

impl<T> BorrowMut<T> for T where T: ?Sized,

fn borrow_mut(&mut self) -> &mut T

impl<T> CloneToUninit for T where T: Clone,

unsafe fn clone_to_uninit(&self, dest: *mut u8)

impl<T> From<T> for T

fn from(t: T) -> T

impl<T, U> Into<U> for T where U: From<T>,

fn into(self) -> U

impl<T> ToOwned for T where T: Clone,

type Owned = T

fn to_owned(&self) -> T

fn clone_into(&self, target: &mut T)

impl<T, U> TryFrom<U> for T where U: Into<T>,

type Error = Infallible

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

impl<T, U> TryInto<U> for T where U: TryFrom<T>,

type Error = <U as TryFrom<T>>::Error

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

Struct Fp8E4M3

fn hash<__H>(&self, state: &mut __H)
where __H: Hasher,

fn hash_slice<H>(data: &[Self], state: &mut H)
where H: Hasher, Self: Sized,

fn max(self, other: Self) -> Self
where Self: Sized,

fn min(self, other: Self) -> Self
where Self: Sized,

fn clamp(self, min: Self, max: Self) -> Self
where Self: Sized,

impl<T> Any for T
where T: 'static + ?Sized,

impl<T> Borrow<T> for T
where T: ?Sized,

impl<T> BorrowMut<T> for T
where T: ?Sized,

impl<T> CloneToUninit for T
where T: Clone,

impl<T, U> Into<U> for T
where U: From<T>,

impl<T> ToOwned for T
where T: Clone,

impl<T, U> TryFrom<U> for T
where U: Into<T>,

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,