Struct GemmPlan

Source

pub struct GemmPlan<T>
where
    T: Element,
{ /* private fields */ }

Expand description

Selected GEMM kernel and the host-side metadata needed to launch it.

Plans are cheap to construct, hold no device memory, and are Send + Sync (whenever T is) for the same reason — they’re pure host data. The Phase-30 cuBLAS fast-path adds no per-plan state: cuBLAS handles live in a thread-local cache, so the plan itself stays trivially thread-safe.

See the crate root for usage; key methods:

select — pick a kernel for a problem shape.
can_implement — host-side validation.
workspace_size — bytes of scratch needed.
run — launch on a stream.
sku — identity of the chosen kernel.
backend — which backend (CUTLASS / cuBLAS) was picked. Phase 30 added the cuBLAS fast-path for f16/bf16 low-M decode shapes; the heuristic is documented on should_use_cublas_for_fp.

Struct GemmPlan Copy item path

Implementations§

impl<T> GemmPlan<T> where T: Element,

pub fn select( stream: &Stream, desc: &GemmDescriptor, pref: PlanPreference, ) -> Result<GemmPlan<T>, Error>

pub fn backend(&self) -> BackendKind

pub fn can_implement(&self, args: &GemmArgs<'_, T>) -> Result<(), Error>

pub fn workspace_size(&self) -> usize

pub fn sku(&self) -> GemmSku

pub fn precision_guarantee(&self) -> PrecisionGuarantee

pub fn run( &self, stream: &Stream, workspace: Workspace<'_>, args: GemmArgs<'_, T>, ) -> Result<(), Error>

Trait Implementations§

impl<T> Debug for GemmPlan<T> where T: Debug + Element,

fn fmt(&self, f: &mut Formatter<'_>) -> Result<(), Error>

Auto Trait Implementations§

impl<T> Freeze for GemmPlan<T>

impl<T> RefUnwindSafe for GemmPlan<T> where T: RefUnwindSafe,

impl<T> Send for GemmPlan<T> where T: Send,

impl<T> Sync for GemmPlan<T> where T: Sync,

impl<T> Unpin for GemmPlan<T> where T: Unpin,

impl<T> UnsafeUnpin for GemmPlan<T>

impl<T> UnwindSafe for GemmPlan<T> where T: UnwindSafe,

Blanket Implementations§

impl<T> Any for T where T: 'static + ?Sized,

fn type_id(&self) -> TypeId

impl<T> Borrow<T> for T where T: ?Sized,

fn borrow(&self) -> &T

impl<T> BorrowMut<T> for T where T: ?Sized,

fn borrow_mut(&mut self) -> &mut T

impl<T> From<T> for T

fn from(t: T) -> T

impl<T, U> Into<U> for T where U: From<T>,

fn into(self) -> U

impl<T, U> TryFrom<U> for T where U: Into<T>,

type Error = Infallible

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

impl<T, U> TryInto<U> for T where U: TryFrom<T>,

type Error = <U as TryFrom<T>>::Error

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

Struct GemmPlan

impl<T> GemmPlan<T>
where T: Element,

impl<T> Debug for GemmPlan<T>
where T: Debug + Element,

impl<T> RefUnwindSafe for GemmPlan<T>
where T: RefUnwindSafe,

impl<T> Send for GemmPlan<T>
where T: Send,

impl<T> Sync for GemmPlan<T>
where T: Sync,

impl<T> Unpin for GemmPlan<T>
where T: Unpin,

impl<T> UnwindSafe for GemmPlan<T>
where T: UnwindSafe,

impl<T> Any for T
where T: 'static + ?Sized,

impl<T> Borrow<T> for T
where T: ?Sized,

impl<T> BorrowMut<T> for T
where T: ?Sized,

impl<T, U> Into<U> for T
where U: From<T>,

impl<T, U> TryFrom<U> for T
where U: Into<T>,

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,