FastDivmod

Enum FastDivmod 

Source
/// A divisor prepared for repeated division and modulo operations.
///
/// Per the type's description, some values are precalculated on the host so
/// that division and modulo on the GPU are faster; when the fast path is not
/// supported, a regular fallback is used instead.
pub enum FastDivmod<I: FastDivmodInt> {
    /// Fast path: the divisor together with its precalculated helper values.
    Fast {
        /// The divisor itself.
        divisor: I,
        /// Precalculated multiplier for this divisor.
        // NOTE(review): presumably the "magic" constant of a multiply-and-shift
        // division scheme, as in the referenced ONNX Runtime header — confirm
        // against the constructor.
        multiplier: I,
        /// Precalculated right-shift amount for this divisor.
        // NOTE(review): presumably applied after the multiplication — confirm
        // against the `div` implementation.
        shift_right: u32,
    },
    /// Regular fallback: only the divisor is stored, with no precalculated
    /// values.
    Fallback {
        /// The divisor itself.
        divisor: I,
    },
}
Expand description

A fast-divmod object if supported, or a regular fallback if not. Certain values are precalculated on the host, in exchange for making division and modulo operations on the GPU much faster. Only u32 is supported right now, to allow for a simpler algorithm; since this type is mostly used for indices, that is rarely a limitation.

Implementation based on ONNX Runtime's fast_divmod.h: https://github.com/microsoft/onnxruntime/blob/main/onnxruntime/core/providers/cuda/shared_inc/fast_divmod.h

Variants§

§

Fast

Fields

§divisor: I
§multiplier: I
§shift_right: u32
§

Fallback

Fields

§divisor: I

Implementations§

Source§

impl<I: FastDivmodInt> FastDivmod<I>

Source

pub fn new_Fast(divisor: I, multiplier: I, shift_right: u32) -> Self

Source

pub fn __expand_new_Fast( _: &mut Scope, divisor: <I as CubeType>::ExpandType, multiplier: <I as CubeType>::ExpandType, shift_right: <u32 as CubeType>::ExpandType, ) -> FastDivmodExpand<I>

Source

pub fn new_Fallback(divisor: I) -> Self

Source

pub fn __expand_new_Fallback( _: &mut Scope, divisor: <I as CubeType>::ExpandType, ) -> FastDivmodExpand<I>

Source§

impl<I: FastDivmodInt> FastDivmod<I>

Source

pub fn div(&self, dividend: I) -> I

Source

pub fn modulo(&self, dividend: I) -> I

Source

pub fn div_mod(&self, dividend: I) -> (I, I)

Source

pub fn __expand_div( scope: &mut Scope, this: <Self as CubeType>::ExpandType, dividend: <I as CubeType>::ExpandType, ) -> <I as CubeType>::ExpandType

Source

pub fn __expand_modulo( scope: &mut Scope, this: <Self as CubeType>::ExpandType, dividend: <I as CubeType>::ExpandType, ) -> <I as CubeType>::ExpandType

Source

pub fn __expand_div_mod( scope: &mut Scope, this: <Self as CubeType>::ExpandType, dividend: <I as CubeType>::ExpandType, ) -> <(I, I) as CubeType>::ExpandType

Trait Implementations§

Source§

impl<I: Clone + FastDivmodInt> Clone for FastDivmod<I>

Source§

fn clone(&self) -> FastDivmod<I>

Returns a duplicate of the value. Read more
1.0.0 · Source§

fn clone_from(&mut self, source: &Self)

Performs copy-assignment from source. Read more
Source§

impl<I: FastDivmodInt> CubeDebug for FastDivmod<I>

Source§

fn set_debug_name(&self, scope: &mut Scope, name: &'static str)

Set the debug name of this type’s expansion. Should do nothing for types that don’t appear at runtime.
Source§

impl<I: FastDivmodInt> CubeType for FastDivmod<I>

Source§

type ExpandType = FastDivmodExpand<I>

Source§

fn into_mut(scope: &mut Scope, expand: Self::ExpandType) -> Self::ExpandType

Wrapper around the init method, necessary for type inference.
Source§

impl<I: FastDivmodInt> LaunchArg for FastDivmod<I>

Source§

type RuntimeArg<'a, R: Runtime> = FastDivmodArgs<I>

The runtime argument for the kernel.
Source§

type CompilationArg = FastDivmodCompilationArg<I>

Compilation argument.
Source§

fn compilation_arg<'a, R: Runtime>( runtime_arg: &Self::RuntimeArg<'a, R>, ) -> Self::CompilationArg

Source§

fn expand( arg: &Self::CompilationArg, builder: &mut KernelBuilder, ) -> <Self as CubeType>::ExpandType

Register an input variable during compilation that fills the KernelBuilder.
Source§

fn expand_output( arg: &Self::CompilationArg, builder: &mut KernelBuilder, ) -> <Self as CubeType>::ExpandType

Register an output variable during compilation that fills the KernelBuilder.
Source§

impl<I: Copy + FastDivmodInt> Copy for FastDivmod<I>

Auto Trait Implementations§

§

impl<I> Freeze for FastDivmod<I>
where I: Freeze,

§

impl<I> RefUnwindSafe for FastDivmod<I>
where I: RefUnwindSafe,

§

impl<I> Send for FastDivmod<I>

§

impl<I> Sync for FastDivmod<I>

§

impl<I> Unpin for FastDivmod<I>
where I: Unpin,

§

impl<I> UnwindSafe for FastDivmod<I>
where I: UnwindSafe,

Blanket Implementations§

Source§

impl<T> Any for T
where T: 'static + ?Sized,

Source§

fn type_id(&self) -> TypeId

Gets the TypeId of self. Read more
Source§

impl<T> Borrow<T> for T
where T: ?Sized,

Source§

fn borrow(&self) -> &T

Immutably borrows from an owned value. Read more
Source§

impl<T> BorrowMut<T> for T
where T: ?Sized,

Source§

fn borrow_mut(&mut self) -> &mut T

Mutably borrows from an owned value. Read more
Source§

impl<T> CloneToUninit for T
where T: Clone,

Source§

unsafe fn clone_to_uninit(&self, dest: *mut u8)

🔬This is a nightly-only experimental API. (clone_to_uninit)
Performs copy-assignment from self to dest. Read more
Source§

impl<T> From<T> for T

Source§

fn from(t: T) -> T

Returns the argument unchanged.

Source§

impl<T, U> Into<U> for T
where U: From<T>,

Source§

fn into(self) -> U

Calls U::from(self).

That is, this conversion is whatever the implementation of From<T> for U chooses to do.

Source§

impl<T> IntoComptime for T

Source§

fn comptime(self) -> Self

Source§

impl<T> ToOwned for T
where T: Clone,

Source§

type Owned = T

The resulting type after obtaining ownership.
Source§

fn to_owned(&self) -> T

Creates owned data from borrowed data, usually by cloning. Read more
Source§

fn clone_into(&self, target: &mut T)

Uses borrowed data to replace owned data, usually by cloning. Read more
Source§

impl<T, U> TryFrom<U> for T
where U: Into<T>,

Source§

type Error = Infallible

The type returned in the event of a conversion error.
Source§

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

Performs the conversion.
Source§

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,

Source§

type Error = <U as TryFrom<T>>::Error

The type returned in the event of a conversion error.
Source§

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

Performs the conversion.
Source§

impl<V, T> VZip<V> for T
where V: MultiLane<T>,

Source§

fn vzip(self) -> V