Enum FastDivmod

Source
/// Precomputed divisor state for `u32` division and modulo.
///
/// Certain values are precalculated on the host so that division and modulo
/// on the GPU are faster; a regular fallback is used when the fast path is
/// not supported.
pub enum FastDivmod {
    /// Fast path: the divisor together with a precomputed multiplier and a
    /// right-shift amount.
    // NOTE(review): presumably the multiply-then-shift scheme from the
    // referenced ONNX Runtime `fast_divmod.h` — confirm against `div`.
    Fast {
        divisor: u32,
        multiplier: u32,
        shift_right: u32,
    },
    /// Variant carrying a shift amount and a bit mask.
    // NOTE(review): presumably division is `dividend >> shift` and modulo is
    // `dividend & mask` for power-of-two divisors — confirm against `div`/`modulo`.
    PowerOfTwo {
        shift: u32,
        mask: u32,
    },
    /// Regular fallback: only the divisor is stored, nothing is precomputed.
    Fallback {
        divisor: u32,
    },
}
Expand description

Create a fast-divmod object if supported, or a regular fallback if not. This precalculates certain values on the host, in exchange for making division and modulo operations on the GPU much faster. Only supports u32 right now to allow for a simpler algorithm. It’s mostly used for indices regardless.

Implementation based on ONNX Runtime: https://github.com/microsoft/onnxruntime/blob/main/onnxruntime/core/providers/cuda/shared_inc/fast_divmod.h

Variants§

§

Fast

Fields

§divisor: u32
§multiplier: u32
§shift_right: u32
§

PowerOfTwo

Fields

§shift: u32
§mask: u32
§

Fallback

Fields

§divisor: u32

Implementations§

Source§

impl FastDivmod

Source

pub fn new_Fast(divisor: u32, multiplier: u32, shift_right: u32) -> Self

Source

pub fn __expand_new_Fast( _: &mut Scope, divisor: <u32 as CubeType>::ExpandType, multiplier: <u32 as CubeType>::ExpandType, shift_right: <u32 as CubeType>::ExpandType, ) -> FastDivmodExpand

Source

pub fn new_PowerOfTwo(shift: u32, mask: u32) -> Self

Source

pub fn __expand_new_PowerOfTwo( _: &mut Scope, shift: <u32 as CubeType>::ExpandType, mask: <u32 as CubeType>::ExpandType, ) -> FastDivmodExpand

Source

pub fn new_Fallback(divisor: u32) -> Self

Source

pub fn __expand_new_Fallback( _: &mut Scope, divisor: <u32 as CubeType>::ExpandType, ) -> FastDivmodExpand

Source§

impl FastDivmod

Source

pub fn div(&self, dividend: u32) -> u32

Source

pub fn modulo(&self, dividend: u32) -> u32

Source

pub fn div_mod(&self, dividend: u32) -> (u32, u32)

Source

pub fn __expand_div( scope: &mut Scope, this: <Self as CubeType>::ExpandType, dividend: <u32 as CubeType>::ExpandType, ) -> <u32 as CubeType>::ExpandType

Source

pub fn __expand_modulo( scope: &mut Scope, this: <Self as CubeType>::ExpandType, dividend: <u32 as CubeType>::ExpandType, ) -> <u32 as CubeType>::ExpandType

Source

pub fn __expand_div_mod( scope: &mut Scope, this: <Self as CubeType>::ExpandType, dividend: <u32 as CubeType>::ExpandType, ) -> <(u32, u32) as CubeType>::ExpandType

Trait Implementations§

Source§

impl Clone for FastDivmod

Source§

fn clone(&self) -> FastDivmod

Returns a duplicate of the value. Read more
1.0.0 · Source§

fn clone_from(&mut self, source: &Self)

Performs copy-assignment from source. Read more
Source§

impl CubeDebug for FastDivmod

Source§

fn set_debug_name(&self, scope: &mut Scope, name: &'static str)

Set the debug name of this type’s expansion. Should do nothing for types that don’t appear at runtime
Source§

impl CubeType for FastDivmod

Source§

type ExpandType = FastDivmodExpand

Source§

fn into_mut(scope: &mut Scope, expand: Self::ExpandType) -> Self::ExpandType

Wrapper around the init method, necessary for type inference.
Source§

impl LaunchArg for FastDivmod

Source§

type RuntimeArg<'a, R: Runtime> = FastDivmodArgs<'a, R>

The runtime argument for the kernel.
Source§

fn compilation_arg<'a, R: Runtime>( runtime_arg: &Self::RuntimeArg<'a, R>, ) -> Self::CompilationArg

Source§

impl LaunchArgExpand for FastDivmod

Source§

type CompilationArg = FastDivmodCompilationArg

Compilation argument.
Source§

fn expand( arg: &Self::CompilationArg, builder: &mut KernelBuilder, ) -> <Self as CubeType>::ExpandType

Register an input variable during compilation that fills the KernelBuilder.
Source§

fn expand_output( arg: &Self::CompilationArg, builder: &mut KernelBuilder, ) -> <Self as CubeType>::ExpandType

Register an output variable during compilation that fills the KernelBuilder.
Source§

impl Copy for FastDivmod

Auto Trait Implementations§

Blanket Implementations§

Source§

impl<T> Any for T
where T: 'static + ?Sized,

Source§

fn type_id(&self) -> TypeId

Gets the TypeId of self. Read more
Source§

impl<T> Borrow<T> for T
where T: ?Sized,

Source§

fn borrow(&self) -> &T

Immutably borrows from an owned value. Read more
Source§

impl<T> BorrowMut<T> for T
where T: ?Sized,

Source§

fn borrow_mut(&mut self) -> &mut T

Mutably borrows from an owned value. Read more
Source§

impl<T> CloneToUninit for T
where T: Clone,

Source§

unsafe fn clone_to_uninit(&self, dest: *mut u8)

🔬This is a nightly-only experimental API. (clone_to_uninit)
Performs copy-assignment from self to dest. Read more
Source§

impl<T> From<T> for T

Source§

fn from(t: T) -> T

Returns the argument unchanged.

Source§

impl<T, U> Into<U> for T
where U: From<T>,

Source§

fn into(self) -> U

Calls U::from(self).

That is, this conversion is whatever the implementation of From<T> for U chooses to do.

Source§

impl<T> ToOwned for T
where T: Clone,

Source§

type Owned = T

The resulting type after obtaining ownership.
Source§

fn to_owned(&self) -> T

Creates owned data from borrowed data, usually by cloning. Read more
Source§

fn clone_into(&self, target: &mut T)

Uses borrowed data to replace owned data, usually by cloning. Read more
Source§

impl<T, U> TryFrom<U> for T
where U: Into<T>,

Source§

type Error = Infallible

The type returned in the event of a conversion error.
Source§

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

Performs the conversion.
Source§

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,

Source§

type Error = <U as TryFrom<T>>::Error

The type returned in the event of a conversion error.
Source§

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

Performs the conversion.
Source§

impl<V, T> VZip<V> for T
where V: MultiLane<T>,

Source§

fn vzip(self) -> V

Source§

impl<T> CubeLaunch for T