CuBlas

Struct CuBlas 

Source
pub struct CuBlas { /* private fields */ }
Expand description

cuBLAS handle wrapper

Implementations§

Source§

impl CuBlas

Source

pub fn new() -> CudaResult<Self>

Creates a new cuBLAS handle.

Source

pub fn set_stream(&self, stream: &CudaStream) -> CudaResult<()>

Sets the stream used for cuBLAS operations issued through this handle.

Source

pub fn sgemm( &self, trans_a: bool, trans_b: bool, m: i32, n: i32, k: i32, alpha: f32, a: *const f32, lda: i32, b: *const f32, ldb: i32, beta: f32, c: *mut f32, ldc: i32, ) -> CudaResult<()>

SGEMM: C = alpha * op(A) * op(B) + beta * C

This is the core matrix multiplication operation.

§Arguments
  • trans_a - Whether to transpose A
  • trans_b - Whether to transpose B
  • m - Number of rows of op(A) and C
  • n - Number of columns of op(B) and C
  • k - Number of columns of op(A) and rows of op(B)
  • alpha - Scalar multiplier for the product op(A) * op(B)
  • a - Matrix A
  • lda - Leading dimension of A
  • b - Matrix B
  • ldb - Leading dimension of B
  • beta - Scalar multiplier applied to the existing contents of C
  • c - Matrix C (read as input, scaled by beta, and overwritten with the result)
  • ldc - Leading dimension of C
Source

pub fn saxpy( &self, n: i32, alpha: f32, x: *const f32, incx: i32, y: *mut f32, incy: i32, ) -> CudaResult<()>

SAXPY: y = alpha * x + y

Source

pub fn sdot( &self, n: i32, x: *const f32, incx: i32, y: *const f32, incy: i32, ) -> CudaResult<f32>

SDOT: result = x · y (dot product of x and y)

Source

pub fn snrm2(&self, n: i32, x: *const f32, incx: i32) -> CudaResult<f32>

SNRM2: result = ||x||_2 (Euclidean norm of x)

Source

pub fn sscal( &self, n: i32, alpha: f32, x: *mut f32, incx: i32, ) -> CudaResult<()>

SSCAL: x = alpha * x

Source

pub fn matmul(&self, a: &CudaTensor, b: &CudaTensor) -> CudaResult<CudaTensor>

Matrix multiplication for CudaTensors

Trait Implementations§

Source§

impl Drop for CuBlas

Source§

fn drop(&mut self)

Executes the destructor for this type. Read more
Source§

impl Send for CuBlas

Source§

impl Sync for CuBlas

Auto Trait Implementations§

Blanket Implementations§

Source§

impl<T> Any for T
where T: 'static + ?Sized,

Source§

fn type_id(&self) -> TypeId

Gets the TypeId of self. Read more
Source§

impl<T> Borrow<T> for T
where T: ?Sized,

Source§

fn borrow(&self) -> &T

Immutably borrows from an owned value. Read more
Source§

impl<T> BorrowMut<T> for T
where T: ?Sized,

Source§

fn borrow_mut(&mut self) -> &mut T

Mutably borrows from an owned value. Read more
Source§

impl<T> From<T> for T

Source§

fn from(t: T) -> T

Returns the argument unchanged.

Source§

impl<T, U> Into<U> for T
where U: From<T>,

Source§

fn into(self) -> U

Calls U::from(self).

That is, this conversion is whatever the implementation of From<T> for U chooses to do.

Source§

impl<T> IntoEither for T

Source§

fn into_either(self, into_left: bool) -> Either<Self, Self>

Converts self into a Left variant of Either<Self, Self> if into_left is true. Converts self into a Right variant of Either<Self, Self> otherwise. Read more
Source§

fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
where F: FnOnce(&Self) -> bool,

Converts self into a Left variant of Either<Self, Self> if into_left(&self) returns true. Converts self into a Right variant of Either<Self, Self> otherwise. Read more
Source§

impl<T> Pointable for T

Source§

const ALIGN: usize

The alignment of pointer.
Source§

type Init = T

The type for initializers.
Source§

unsafe fn init(init: <T as Pointable>::Init) -> usize

Initializes a value with the given initializer. Read more
Source§

unsafe fn deref<'a>(ptr: usize) -> &'a T

Dereferences the given pointer. Read more
Source§

unsafe fn deref_mut<'a>(ptr: usize) -> &'a mut T

Mutably dereferences the given pointer. Read more
Source§

unsafe fn drop(ptr: usize)

Drops the object pointed to by the given pointer. Read more
Source§

impl<T, U> TryFrom<U> for T
where U: Into<T>,

Source§

type Error = Infallible

The type returned in the event of a conversion error.
Source§

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

Performs the conversion.
Source§

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,

Source§

type Error = <U as TryFrom<T>>::Error

The type returned in the event of a conversion error.
Source§

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

Performs the conversion.
Source§

impl<V, T> VZip<V> for T
where V: MultiLane<T>,

Source§

fn vzip(self) -> V