Struct CudaTensor

Source

pub struct CudaTensor { /* private fields */ }

Expand description

Tensor stored on CUDA device

Implementations§

Source §

impl CudaTensor

Source

pub fn new(shape: &[usize], dtype: DType, device_id: i32) -> CudaResult<Self>

Create new CUDA tensor with given shape (uninitialized)

Source

pub fn from_tensor(tensor: &Tensor, device_id: i32) -> CudaResult<Self>

Create CUDA tensor from CPU tensor (copies data to GPU)

Source

pub fn from_tensor_async( tensor: &Tensor, device_id: i32, stream: &CudaStream, ) -> CudaResult<Self>

Create CUDA tensor from CPU tensor (async copy)

Source

pub fn to_tensor(&self) -> CudaResult<Tensor>

Copy back to CPU tensor

Source

pub fn to_tensor_async(&self, stream: &CudaStream) -> CudaResult<Vec<f32>>

Copy data back to the CPU (async); returns the elements as a Vec<f32> rather than a Tensor

Source

pub fn shape(&self) -> &Shape

Get shape

Source

pub fn dims(&self) -> &[usize]

Get dimensions

Source

pub fn numel(&self) -> usize

Get number of elements

Source

pub fn dtype(&self) -> DType

Get data type

Source

pub fn device_id(&self) -> i32

Get device ID

Source

pub fn as_ptr(&self) -> *const f32

Get raw buffer pointer

Source

pub fn as_mut_ptr(&mut self) -> *mut f32

Get mutable raw buffer pointer

Source

pub fn size_bytes(&self) -> usize

Get buffer size in bytes

Source

pub fn zeros(shape: &[usize], device_id: i32) -> CudaResult<Self>

Create zeros tensor

Source

pub fn ones(shape: &[usize], device_id: i32) -> CudaResult<Self>

Create ones tensor

Source

pub fn full(shape: &[usize], value: f32, device_id: i32) -> CudaResult<Self>

Create tensor filled with value

Source

pub fn reshape(&self, new_shape: &[usize]) -> CudaResult<Self>

Reshape tensor

Source

pub fn transpose(&self, dim0: usize, dim1: usize) -> CudaResult<Self>

Transpose dimensions

Source

pub fn is_contiguous(&self) -> bool

Check if tensor is contiguous

Source

pub fn clone_tensor(&self) -> CudaResult<Self>

Deep clone

Source

pub fn add(&self, other: &CudaTensor) -> CudaResult<CudaTensor>

Element-wise addition

Source

pub fn sub(&self, other: &CudaTensor) -> CudaResult<CudaTensor>

Element-wise subtraction

Source

pub fn mul_scalar(&self, scalar: f32) -> CudaResult<CudaTensor>

Scalar multiplication

Source

pub fn matmul(&self, other: &CudaTensor) -> CudaResult<CudaTensor>

Matrix multiplication

Source

pub fn dot(&self, other: &CudaTensor) -> CudaResult<f32>

Dot product

Source

pub fn norm(&self) -> CudaResult<f32>

L2 norm

Source

pub fn sum(&self) -> CudaResult<f32>

Sum all elements

Source

pub fn mean(&self) -> CudaResult<f32>

Mean of all elements

Source

pub fn max(&self) -> CudaResult<f32>

Max element

Source

pub fn min(&self) -> CudaResult<f32>

Min element

Source

pub fn relu(&self) -> CudaResult<CudaTensor>

ReLU activation (in-place capable)

Source

pub fn sigmoid(&self) -> CudaResult<CudaTensor>

Sigmoid activation

Source

pub fn gelu(&self) -> CudaResult<CudaTensor>

GELU activation

Source

pub fn softmax(&self, dim: i32) -> CudaResult<CudaTensor>

Softmax

Source

pub fn exp(&self) -> CudaResult<CudaTensor>

Exponential

Source

pub fn log(&self) -> CudaResult<CudaTensor>

Natural logarithm

Source

pub fn sqrt(&self) -> CudaResult<CudaTensor>

Square root

Source

pub fn pow(&self, exp: f32) -> CudaResult<CudaTensor>

Power

Trait Implementations§

Source §

impl Clone for CudaTensor

Source §

fn clone(&self) -> Self

Returns a duplicate of the value. Read more

1.0.0 · Source§

fn clone_from(&mut self, source: &Self)

Performs copy-assignment from source. Read more

Source §

impl Debug for CudaTensor

Source §

fn fmt(&self, f: &mut Formatter<'_>) -> Result

Formats the value using the given formatter. Read more

Auto Trait Implementations§

§

impl UnwindSafe for CudaTensor

Blanket Implementations§

Source §

impl<T> Any for T
where T: 'static + ?Sized,

Source §

fn type_id(&self) -> TypeId

Gets the TypeId of self. Read more

Source §

impl<T> Borrow<T> for T
where T: ?Sized,

Source §

fn borrow(&self) -> &T

Immutably borrows from an owned value. Read more

Source §

impl<T> BorrowMut<T> for T
where T: ?Sized,

Source §

fn borrow_mut(&mut self) -> &mut T

Mutably borrows from an owned value. Read more

Source §

impl<T> CloneToUninit for T
where T: Clone,

Source §

unsafe fn clone_to_uninit(&self, dest: *mut u8)

🔬This is a nightly-only experimental API. (clone_to_uninit)

Performs copy-assignment from self to dest. Read more

Source §

impl<T> From<T> for T

Source §

fn from(t: T) -> T

Returns the argument unchanged.

Source §

impl<T, U> Into<U> for T
where U: From<T>,

Source §

fn into(self) -> U

Calls U::from(self).

That is, this conversion is whatever the implementation of From<T> for U chooses to do.

Source §

impl<T> IntoEither for T

Source §

fn into_either(self, into_left: bool) -> Either<Self, Self>

Converts self into a Left variant of Either<Self, Self> if into_left is true. Converts self into a Right variant of Either<Self, Self> otherwise. Read more

Source §

fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
where F: FnOnce(&Self) -> bool,

Converts self into a Left variant of Either<Self, Self> if into_left(&self) returns true. Converts self into a Right variant of Either<Self, Self> otherwise. Read more

Source §

impl<T> Pointable for T

Source §

const ALIGN: usize

The alignment of pointer.

Source §

type Init = T

The type for initializers.

Source §

unsafe fn init(init: <T as Pointable>::Init) -> usize

Initializes a value with the given initializer. Read more

Source §

unsafe fn deref<'a>(ptr: usize) -> &'a T

Dereferences the given pointer. Read more

Source §

unsafe fn deref_mut<'a>(ptr: usize) -> &'a mut T

Mutably dereferences the given pointer. Read more

Source §

unsafe fn drop(ptr: usize)

Drops the object pointed to by the given pointer. Read more

Source §

impl<T> ToOwned for T
where T: Clone,

Source §

type Owned = T

The resulting type after obtaining ownership.

Source §

fn to_owned(&self) -> T

Creates owned data from borrowed data, usually by cloning. Read more

Source §

fn clone_into(&self, target: &mut T)

Uses borrowed data to replace owned data, usually by cloning. Read more

Source §

impl<T, U> TryFrom<U> for T
where U: Into<T>,

Source §

type Error = Infallible

The type returned in the event of a conversion error.

Source §

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

Performs the conversion.

Source §

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,

Source §

type Error = <U as TryFrom<T>>::Error

The type returned in the event of a conversion error.

Source §

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

Performs the conversion.

Source §

impl<V, T> VZip<V> for T
where V: MultiLane<T>,

Source §

CudaTensor

Struct CudaTensor Copy item path

Implementations§

impl CudaTensor

pub fn new(shape: &[usize], dtype: DType, device_id: i32) -> CudaResult<Self>

pub fn from_tensor(tensor: &Tensor, device_id: i32) -> CudaResult<Self>

pub fn from_tensor_async( tensor: &Tensor, device_id: i32, stream: &CudaStream, ) -> CudaResult<Self>

pub fn to_tensor(&self) -> CudaResult<Tensor>

pub fn to_tensor_async(&self, stream: &CudaStream) -> CudaResult<Vec<f32>>

pub fn shape(&self) -> &Shape

pub fn dims(&self) -> &[usize]

pub fn numel(&self) -> usize

pub fn dtype(&self) -> DType

pub fn device_id(&self) -> i32

pub fn as_ptr(&self) -> *const f32

pub fn as_mut_ptr(&mut self) -> *mut f32

pub fn size_bytes(&self) -> usize

pub fn zeros(shape: &[usize], device_id: i32) -> CudaResult<Self>

pub fn ones(shape: &[usize], device_id: i32) -> CudaResult<Self>

pub fn full(shape: &[usize], value: f32, device_id: i32) -> CudaResult<Self>

pub fn reshape(&self, new_shape: &[usize]) -> CudaResult<Self>

pub fn transpose(&self, dim0: usize, dim1: usize) -> CudaResult<Self>

pub fn is_contiguous(&self) -> bool

pub fn clone_tensor(&self) -> CudaResult<Self>

pub fn add(&self, other: &CudaTensor) -> CudaResult<CudaTensor>

pub fn sub(&self, other: &CudaTensor) -> CudaResult<CudaTensor>

pub fn mul_scalar(&self, scalar: f32) -> CudaResult<CudaTensor>

pub fn matmul(&self, other: &CudaTensor) -> CudaResult<CudaTensor>

pub fn dot(&self, other: &CudaTensor) -> CudaResult<f32>

pub fn norm(&self) -> CudaResult<f32>

pub fn sum(&self) -> CudaResult<f32>

pub fn mean(&self) -> CudaResult<f32>

pub fn max(&self) -> CudaResult<f32>

pub fn min(&self) -> CudaResult<f32>

pub fn relu(&self) -> CudaResult<CudaTensor>

pub fn sigmoid(&self) -> CudaResult<CudaTensor>

pub fn gelu(&self) -> CudaResult<CudaTensor>

pub fn softmax(&self, dim: i32) -> CudaResult<CudaTensor>

pub fn exp(&self) -> CudaResult<CudaTensor>

pub fn log(&self) -> CudaResult<CudaTensor>

pub fn sqrt(&self) -> CudaResult<CudaTensor>

pub fn pow(&self, exp: f32) -> CudaResult<CudaTensor>

Trait Implementations§

impl Clone for CudaTensor

fn clone(&self) -> Self

fn clone_from(&mut self, source: &Self)

impl Debug for CudaTensor

fn fmt(&self, f: &mut Formatter<'_>) -> Result

Auto Trait Implementations§

impl Freeze for CudaTensor

impl RefUnwindSafe for CudaTensor

impl !Send for CudaTensor

impl !Sync for CudaTensor

impl Unpin for CudaTensor

impl UnwindSafe for CudaTensor

Blanket Implementations§

impl<T> Any for T where T: 'static + ?Sized,

fn type_id(&self) -> TypeId

impl<T> Borrow<T> for T where T: ?Sized,

fn borrow(&self) -> &T

impl<T> BorrowMut<T> for T where T: ?Sized,

fn borrow_mut(&mut self) -> &mut T

impl<T> CloneToUninit for T where T: Clone,

unsafe fn clone_to_uninit(&self, dest: *mut u8)

impl<T> From<T> for T

fn from(t: T) -> T

impl<T, U> Into<U> for T where U: From<T>,

fn into(self) -> U

impl<T> IntoEither for T

fn into_either(self, into_left: bool) -> Either<Self, Self>

fn into_either_with<F>(self, into_left: F) -> Either<Self, Self> where F: FnOnce(&Self) -> bool,

impl<T> Pointable for T

const ALIGN: usize

type Init = T

unsafe fn init(init: <T as Pointable>::Init) -> usize

unsafe fn deref<'a>(ptr: usize) -> &'a T

unsafe fn deref_mut<'a>(ptr: usize) -> &'a mut T

unsafe fn drop(ptr: usize)

impl<T> ToOwned for T where T: Clone,

type Owned = T

Struct CudaTensor

impl<T> Any for T
where T: 'static + ?Sized,

impl<T> Borrow<T> for T
where T: ?Sized,

impl<T> BorrowMut<T> for T
where T: ?Sized,

impl<T> CloneToUninit for T
where T: Clone,

impl<T, U> Into<U> for T
where U: From<T>,

fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
where F: FnOnce(&Self) -> bool,

impl<T> ToOwned for T
where T: Clone,

impl<T, U> TryFrom<U> for T
where U: Into<T>,

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,

impl<V, T> VZip<V> for T
where V: MultiLane<T>,