Struct GpuContext

Source

pub struct GpuContext { /* private fields */ }

Expand description

GPU context for managing GPU resources and operations

Implementations§

Source §

impl GpuContext

Source

pub fn new(backend: GpuBackend) -> Result<GpuContext, GpuError>

Create a new GPU context with the specified backend

Source

pub fn backend(&self) -> GpuBackend

Get the backend type

Source

pub fn backend_name(&self) -> &str

Get the backend name

Source

pub fn create_buffer<T>(&self, size: usize) -> GpuBuffer<T>
where T: GpuDataType,

Create a buffer with the given size

Source

pub fn create_buffer_from_slice<T>(&self, data: &[T]) -> GpuBuffer<T>
where T: GpuDataType,

Create a buffer from a slice

Source

pub fn execute<F, R>(&self, f: F) -> R
where F: FnOnce(&GpuCompiler) -> R,

Execute a function with a compiler

Source

pub fn get_kernel(&self, name: &str) -> Result<GpuKernelHandle, GpuError>

Get a kernel from the registry

Source

pub fn get_specialized_kernel( &self, name: &str, params: &KernelParams, ) -> Result<GpuKernelHandle, GpuError>

Get a specialized kernel from the registry

Source

pub fn get_available_memory(&self) -> Option<usize>

Get available memory on the device

Source

pub fn get_total_memory(&self) -> Option<usize>

Get total memory on the device

Source

pub fn launch_kernel( &self, kernel_name: &str, grid_size: (usize, usize, usize), block_size: (usize, usize, usize), args: &[DynamicKernelArg], ) -> Result<(), GpuError>

Launch a kernel with the given parameters

Source

pub fn transfer_async_host_to_device<T>( &self, ptr: &GpuPtr<T>, data: &[T], ) -> Result<(), GpuError>
where T: GpuDataType,

Transfer data from host to device asynchronously

Source

pub fn transfer_host_to_device<T>( &self, ptr: &GpuPtr<T>, data: &[T], ) -> Result<(), GpuError>
where T: GpuDataType,

Transfer data from host to device synchronously

Source

pub fn transfer_async_device_to_host<T>( &self, ptr: &GpuPtr<T>, data: &mut [T], ) -> Result<(), GpuError>
where T: GpuDataType,

Transfer data from device to host asynchronously

Source

pub fn transfer_device_to_host<T>( &self, ptr: &GpuPtr<T>, data: &mut [T], ) -> Result<(), GpuError>
where T: GpuDataType,

Transfer data from device to host synchronously

Source

pub fn execute_kernel( &self, source: &str, buffers: &[GpuBuffer<f32>], work_groups: (u32, u32, u32), int_params: &[u32], float_params: &[f32], ) -> Result<(), GpuError>

Execute a kernel with dynamic compilation and parameter passing. This method is expected by scirs2-vision for GPU operations.

Source

pub fn read_buffer<T>(&self, buffer: &GpuBuffer<T>) -> Result<Vec<T>, GpuError>
where T: GpuDataType,

Read data from a GPU buffer. This method is expected by scirs2-vision for reading GPU results.

Source

pub fn sum_all<T>( &self, buffer: &GpuBuffer<T>, ) -> Result<GpuBuffer<T>, GpuError>
where T: GpuDataType,

Global sum reduction

Source

pub fn mean_all<T>( &self, buffer: &GpuBuffer<T>, ) -> Result<GpuBuffer<T>, GpuError>
where T: GpuDataType,

Global mean reduction

Source

pub fn max_all<T>( &self, buffer: &GpuBuffer<T>, ) -> Result<GpuBuffer<T>, GpuError>
where T: GpuDataType,

Global max reduction

Source

pub fn min_all<T>( &self, buffer: &GpuBuffer<T>, ) -> Result<GpuBuffer<T>, GpuError>
where T: GpuDataType,

Global min reduction

Source

pub fn sum_axis<T>( &self, buffer: &GpuBuffer<T>, shape: &[usize], axis: usize, ) -> Result<GpuBuffer<T>, GpuError>
where T: GpuDataType,

Sum reduction along an axis

Source

pub fn mean_axis<T>( &self, buffer: &GpuBuffer<T>, shape: &[usize], axis: usize, ) -> Result<GpuBuffer<T>, GpuError>
where T: GpuDataType,

Mean reduction along an axis

Source

pub fn max_axis<T>( &self, buffer: &GpuBuffer<T>, shape: &[usize], axis: usize, ) -> Result<GpuBuffer<T>, GpuError>
where T: GpuDataType,

Max reduction along an axis

Source

pub fn min_axis<T>( &self, buffer: &GpuBuffer<T>, shape: &[usize], axis: usize, ) -> Result<GpuBuffer<T>, GpuError>
where T: GpuDataType,

Min reduction along an axis

Source

pub fn broadcast<T>( &self, buffer: &GpuBuffer<T>, from_shape: &[usize], to_shape: &[usize], ) -> Result<GpuBuffer<T>, GpuError>
where T: GpuDataType,

Broadcast a buffer to a different shape

Source

pub fn scale<T>( &self, buffer: &GpuBuffer<T>, scalar: T, ) -> Result<GpuBuffer<T>, GpuError>
where T: GpuDataType,

Scale a buffer by a scalar value

Source

pub fn gemm<T>( &self, a: &GpuBuffer<T>, b: &GpuBuffer<T>, m: usize, k: usize, n: usize, ) -> Result<GpuBuffer<T>, GpuError>
where T: GpuDataType,

General matrix multiplication: C = A @ B

Source

pub fn gemm_transpose_b<T>( &self, a: &GpuBuffer<T>, b: &GpuBuffer<T>, m: usize, k: usize, n: usize, ) -> Result<GpuBuffer<T>, GpuError>
where T: GpuDataType,

GEMM with transposed B: C = A @ B^T

Source

pub fn gemm_transpose_a<T>( &self, a: &GpuBuffer<T>, b: &GpuBuffer<T>, m: usize, k: usize, n: usize, ) -> Result<GpuBuffer<T>, GpuError>
where T: GpuDataType,

GEMM with transposed A: C = A^T @ B

Source

pub fn relu<T>(&self, input: &GpuBuffer<T>) -> Result<GpuBuffer<T>, GpuError>
where T: GpuDataType,

ReLU activation forward pass

Source

pub fn relu_backward<T>( &self, grad_output: &GpuBuffer<T>, input: &GpuBuffer<T>, ) -> Result<GpuBuffer<T>, GpuError>
where T: GpuDataType,

ReLU backward pass

Source

pub fn sigmoid<T>(&self, input: &GpuBuffer<T>) -> Result<GpuBuffer<T>, GpuError>
where T: GpuDataType,

Sigmoid activation forward pass

Source

pub fn sigmoid_backward<T>( &self, grad_output: &GpuBuffer<T>, input: &GpuBuffer<T>, ) -> Result<GpuBuffer<T>, GpuError>
where T: GpuDataType,

Sigmoid backward pass

Source

pub fn tanh<T>(&self, input: &GpuBuffer<T>) -> Result<GpuBuffer<T>, GpuError>
where T: GpuDataType,

Tanh activation forward pass

Source

pub fn tanh_backward<T>( &self, grad_output: &GpuBuffer<T>, input: &GpuBuffer<T>, ) -> Result<GpuBuffer<T>, GpuError>
where T: GpuDataType,

Tanh backward pass

Source

pub fn gelu<T>(&self, input: &GpuBuffer<T>) -> Result<GpuBuffer<T>, GpuError>
where T: GpuDataType,

GELU activation forward pass

Source

pub fn gelu_backward<T>( &self, grad_output: &GpuBuffer<T>, input: &GpuBuffer<T>, ) -> Result<GpuBuffer<T>, GpuError>
where T: GpuDataType,

GELU backward pass

Trait Implementations§

Source §

impl Debug for GpuContext

Source §

fn fmt(&self, f: &mut Formatter<'_>) -> Result<(), Error>

Formats the value using the given formatter. Read more

Auto Trait Implementations§

§

impl !UnwindSafe for GpuContext

Blanket Implementations§

Source §

impl<T> Any for T
where T: 'static + ?Sized,

Source §

fn type_id(&self) -> TypeId

Gets the TypeId of self. Read more

Source §

impl<T> Borrow<T> for T
where T: ?Sized,

Source §

fn borrow(&self) -> &T

Immutably borrows from an owned value. Read more

Source §

impl<T> BorrowMut<T> for T
where T: ?Sized,

Source §

fn borrow_mut(&mut self) -> &mut T

Mutably borrows from an owned value. Read more

Source §

impl<T> From<T> for T

Source §

fn from(t: T) -> T

Returns the argument unchanged.

Source §

impl<T, U> Into<U> for T
where U: From<T>,

Source §

fn into(self) -> U

Calls U::from(self).

That is, this conversion is whatever the implementation of From<T> for U chooses to do.

Source §

impl<T> IntoEither for T

Source §

fn into_either(self, into_left: bool) -> Either<Self, Self>

Converts self into a Left variant of Either<Self, Self> if into_left is true. Converts self into a Right variant of Either<Self, Self> otherwise. Read more

Source §

fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
where F: FnOnce(&Self) -> bool,

Converts self into a Left variant of Either<Self, Self> if into_left(&self) returns true. Converts self into a Right variant of Either<Self, Self> otherwise. Read more

Source §

impl<T> Pointable for T

Source §

const ALIGN: usize

The alignment of pointer.

Source §

type Init = T

The type for initializers.

Source §

unsafe fn init(init: <T as Pointable>::Init) -> usize

Initializes an object with the given initializer. Read more

Source §

unsafe fn deref<'a>(ptr: usize) -> &'a T

Dereferences the given pointer. Read more

Source §

unsafe fn deref_mut<'a>(ptr: usize) -> &'a mut T

Mutably dereferences the given pointer. Read more

Source §

unsafe fn drop(ptr: usize)

Drops the object pointed to by the given pointer. Read more

Source §

impl<T, U> TryFrom<U> for T
where U: Into<T>,

Source §

type Error = Infallible

The type returned in the event of a conversion error.

Source §

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

Performs the conversion.

Source §

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,

Source §

type Error = <U as TryFrom<T>>::Error

The type returned in the event of a conversion error.

Source §

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

Performs the conversion.

Source §

impl<V, T> VZip<V> for T
where V: MultiLane<T>,

Source §

GpuContext

Struct GpuContext Copy item path

Implementations§

impl GpuContext

pub fn new(backend: GpuBackend) -> Result<GpuContext, GpuError>

pub fn backend(&self) -> GpuBackend

pub fn backend_name(&self) -> &str

pub fn create_buffer<T>(&self, size: usize) -> GpuBuffer<T> where T: GpuDataType,

pub fn create_buffer_from_slice<T>(&self, data: &[T]) -> GpuBuffer<T> where T: GpuDataType,

pub fn execute<F, R>(&self, f: F) -> R where F: FnOnce(&GpuCompiler) -> R,

pub fn get_kernel(&self, name: &str) -> Result<GpuKernelHandle, GpuError>

pub fn get_specialized_kernel( &self, name: &str, params: &KernelParams, ) -> Result<GpuKernelHandle, GpuError>

pub fn get_available_memory(&self) -> Option<usize>

pub fn get_total_memory(&self) -> Option<usize>

pub fn launch_kernel( &self, kernel_name: &str, grid_size: (usize, usize, usize), block_size: (usize, usize, usize), args: &[DynamicKernelArg], ) -> Result<(), GpuError>

pub fn transfer_async_host_to_device<T>( &self, ptr: &GpuPtr<T>, data: &[T], ) -> Result<(), GpuError> where T: GpuDataType,

pub fn transfer_host_to_device<T>( &self, ptr: &GpuPtr<T>, data: &[T], ) -> Result<(), GpuError> where T: GpuDataType,

pub fn transfer_async_device_to_host<T>( &self, ptr: &GpuPtr<T>, data: &mut [T], ) -> Result<(), GpuError> where T: GpuDataType,

pub fn transfer_device_to_host<T>( &self, ptr: &GpuPtr<T>, data: &mut [T], ) -> Result<(), GpuError> where T: GpuDataType,

pub fn execute_kernel( &self, source: &str, buffers: &[GpuBuffer<f32>], work_groups: (u32, u32, u32), int_params: &[u32], float_params: &[f32], ) -> Result<(), GpuError>

pub fn read_buffer<T>(&self, buffer: &GpuBuffer<T>) -> Result<Vec<T>, GpuError> where T: GpuDataType,

pub fn sum_all<T>( &self, buffer: &GpuBuffer<T>, ) -> Result<GpuBuffer<T>, GpuError> where T: GpuDataType,

pub fn mean_all<T>( &self, buffer: &GpuBuffer<T>, ) -> Result<GpuBuffer<T>, GpuError> where T: GpuDataType,

pub fn max_all<T>( &self, buffer: &GpuBuffer<T>, ) -> Result<GpuBuffer<T>, GpuError> where T: GpuDataType,

pub fn min_all<T>( &self, buffer: &GpuBuffer<T>, ) -> Result<GpuBuffer<T>, GpuError> where T: GpuDataType,

pub fn sum_axis<T>( &self, buffer: &GpuBuffer<T>, shape: &[usize], axis: usize, ) -> Result<GpuBuffer<T>, GpuError> where T: GpuDataType,

pub fn mean_axis<T>( &self, buffer: &GpuBuffer<T>, shape: &[usize], axis: usize, ) -> Result<GpuBuffer<T>, GpuError> where T: GpuDataType,

pub fn max_axis<T>( &self, buffer: &GpuBuffer<T>, shape: &[usize], axis: usize, ) -> Result<GpuBuffer<T>, GpuError> where T: GpuDataType,

pub fn min_axis<T>( &self, buffer: &GpuBuffer<T>, shape: &[usize], axis: usize, ) -> Result<GpuBuffer<T>, GpuError> where T: GpuDataType,

pub fn broadcast<T>( &self, buffer: &GpuBuffer<T>, from_shape: &[usize], to_shape: &[usize], ) -> Result<GpuBuffer<T>, GpuError> where T: GpuDataType,

pub fn scale<T>( &self, buffer: &GpuBuffer<T>, scalar: T, ) -> Result<GpuBuffer<T>, GpuError> where T: GpuDataType,

pub fn gemm<T>( &self, a: &GpuBuffer<T>, b: &GpuBuffer<T>, m: usize, k: usize, n: usize, ) -> Result<GpuBuffer<T>, GpuError> where T: GpuDataType,

pub fn gemm_transpose_b<T>( &self, a: &GpuBuffer<T>, b: &GpuBuffer<T>, m: usize, k: usize, n: usize, ) -> Result<GpuBuffer<T>, GpuError> where T: GpuDataType,

pub fn gemm_transpose_a<T>( &self, a: &GpuBuffer<T>, b: &GpuBuffer<T>, m: usize, k: usize, n: usize, ) -> Result<GpuBuffer<T>, GpuError> where T: GpuDataType,

pub fn relu<T>(&self, input: &GpuBuffer<T>) -> Result<GpuBuffer<T>, GpuError> where T: GpuDataType,

pub fn relu_backward<T>( &self, grad_output: &GpuBuffer<T>, input: &GpuBuffer<T>, ) -> Result<GpuBuffer<T>, GpuError> where T: GpuDataType,

pub fn sigmoid<T>(&self, input: &GpuBuffer<T>) -> Result<GpuBuffer<T>, GpuError> where T: GpuDataType,

pub fn sigmoid_backward<T>( &self, grad_output: &GpuBuffer<T>, input: &GpuBuffer<T>, ) -> Result<GpuBuffer<T>, GpuError> where T: GpuDataType,

pub fn tanh<T>(&self, input: &GpuBuffer<T>) -> Result<GpuBuffer<T>, GpuError> where T: GpuDataType,

pub fn tanh_backward<T>( &self, grad_output: &GpuBuffer<T>, input: &GpuBuffer<T>, ) -> Result<GpuBuffer<T>, GpuError> where T: GpuDataType,

pub fn gelu<T>(&self, input: &GpuBuffer<T>) -> Result<GpuBuffer<T>, GpuError> where T: GpuDataType,

pub fn gelu_backward<T>( &self, grad_output: &GpuBuffer<T>, input: &GpuBuffer<T>, ) -> Result<GpuBuffer<T>, GpuError> where T: GpuDataType,

Trait Implementations§

impl Debug for GpuContext

fn fmt(&self, f: &mut Formatter<'_>) -> Result<(), Error>

Auto Trait Implementations§

impl Freeze for GpuContext

impl !RefUnwindSafe for GpuContext

impl Send for GpuContext

impl Sync for GpuContext

impl Unpin for GpuContext

impl UnsafeUnpin for GpuContext

impl !UnwindSafe for GpuContext

Blanket Implementations§

impl<T> Any for T where T: 'static + ?Sized,

fn type_id(&self) -> TypeId

impl<T> Borrow<T> for T where T: ?Sized,

fn borrow(&self) -> &T

impl<T> BorrowMut<T> for T where T: ?Sized,

fn borrow_mut(&mut self) -> &mut T

impl<T> From<T> for T

fn from(t: T) -> T

impl<T, U> Into<U> for T where U: From<T>,

fn into(self) -> U

impl<T> IntoEither for T

fn into_either(self, into_left: bool) -> Either<Self, Self>

fn into_either_with<F>(self, into_left: F) -> Either<Self, Self> where F: FnOnce(&Self) -> bool,

impl<T> Pointable for T

const ALIGN: usize

type Init = T

unsafe fn init(init: <T as Pointable>::Init) -> usize

unsafe fn deref<'a>(ptr: usize) -> &'a T

unsafe fn deref_mut<'a>(ptr: usize) -> &'a mut T

unsafe fn drop(ptr: usize)

impl<T, U> TryFrom<U> for T where U: Into<T>,

type Error = Infallible

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

impl<T, U> TryInto<U> for T where U: TryFrom<T>,

type Error = <U as TryFrom<T>>::Error

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

Struct GpuContext

pub fn create_buffer<T>(&self, size: usize) -> GpuBuffer<T>
where T: GpuDataType,

pub fn create_buffer_from_slice<T>(&self, data: &[T]) -> GpuBuffer<T>
where T: GpuDataType,

pub fn execute<F, R>(&self, f: F) -> R
where F: FnOnce(&GpuCompiler) -> R,

pub fn transfer_async_host_to_device<T>( &self, ptr: &GpuPtr<T>, data: &[T], ) -> Result<(), GpuError>
where T: GpuDataType,

pub fn transfer_host_to_device<T>( &self, ptr: &GpuPtr<T>, data: &[T], ) -> Result<(), GpuError>
where T: GpuDataType,

pub fn transfer_async_device_to_host<T>( &self, ptr: &GpuPtr<T>, data: &mut [T], ) -> Result<(), GpuError>
where T: GpuDataType,

pub fn transfer_device_to_host<T>( &self, ptr: &GpuPtr<T>, data: &mut [T], ) -> Result<(), GpuError>
where T: GpuDataType,

pub fn read_buffer<T>(&self, buffer: &GpuBuffer<T>) -> Result<Vec<T>, GpuError>
where T: GpuDataType,

pub fn sum_all<T>( &self, buffer: &GpuBuffer<T>, ) -> Result<GpuBuffer<T>, GpuError>
where T: GpuDataType,

pub fn mean_all<T>( &self, buffer: &GpuBuffer<T>, ) -> Result<GpuBuffer<T>, GpuError>
where T: GpuDataType,

pub fn max_all<T>( &self, buffer: &GpuBuffer<T>, ) -> Result<GpuBuffer<T>, GpuError>
where T: GpuDataType,

pub fn min_all<T>( &self, buffer: &GpuBuffer<T>, ) -> Result<GpuBuffer<T>, GpuError>
where T: GpuDataType,

pub fn sum_axis<T>( &self, buffer: &GpuBuffer<T>, shape: &[usize], axis: usize, ) -> Result<GpuBuffer<T>, GpuError>
where T: GpuDataType,

pub fn mean_axis<T>( &self, buffer: &GpuBuffer<T>, shape: &[usize], axis: usize, ) -> Result<GpuBuffer<T>, GpuError>
where T: GpuDataType,

pub fn max_axis<T>( &self, buffer: &GpuBuffer<T>, shape: &[usize], axis: usize, ) -> Result<GpuBuffer<T>, GpuError>
where T: GpuDataType,

pub fn min_axis<T>( &self, buffer: &GpuBuffer<T>, shape: &[usize], axis: usize, ) -> Result<GpuBuffer<T>, GpuError>
where T: GpuDataType,

pub fn broadcast<T>( &self, buffer: &GpuBuffer<T>, from_shape: &[usize], to_shape: &[usize], ) -> Result<GpuBuffer<T>, GpuError>
where T: GpuDataType,

pub fn scale<T>( &self, buffer: &GpuBuffer<T>, scalar: T, ) -> Result<GpuBuffer<T>, GpuError>
where T: GpuDataType,

pub fn gemm<T>( &self, a: &GpuBuffer<T>, b: &GpuBuffer<T>, m: usize, k: usize, n: usize, ) -> Result<GpuBuffer<T>, GpuError>
where T: GpuDataType,

pub fn gemm_transpose_b<T>( &self, a: &GpuBuffer<T>, b: &GpuBuffer<T>, m: usize, k: usize, n: usize, ) -> Result<GpuBuffer<T>, GpuError>
where T: GpuDataType,

pub fn gemm_transpose_a<T>( &self, a: &GpuBuffer<T>, b: &GpuBuffer<T>, m: usize, k: usize, n: usize, ) -> Result<GpuBuffer<T>, GpuError>
where T: GpuDataType,

pub fn relu<T>(&self, input: &GpuBuffer<T>) -> Result<GpuBuffer<T>, GpuError>
where T: GpuDataType,

pub fn relu_backward<T>( &self, grad_output: &GpuBuffer<T>, input: &GpuBuffer<T>, ) -> Result<GpuBuffer<T>, GpuError>
where T: GpuDataType,

pub fn sigmoid<T>(&self, input: &GpuBuffer<T>) -> Result<GpuBuffer<T>, GpuError>
where T: GpuDataType,

pub fn sigmoid_backward<T>( &self, grad_output: &GpuBuffer<T>, input: &GpuBuffer<T>, ) -> Result<GpuBuffer<T>, GpuError>
where T: GpuDataType,

pub fn tanh<T>(&self, input: &GpuBuffer<T>) -> Result<GpuBuffer<T>, GpuError>
where T: GpuDataType,

pub fn tanh_backward<T>( &self, grad_output: &GpuBuffer<T>, input: &GpuBuffer<T>, ) -> Result<GpuBuffer<T>, GpuError>
where T: GpuDataType,

pub fn gelu<T>(&self, input: &GpuBuffer<T>) -> Result<GpuBuffer<T>, GpuError>
where T: GpuDataType,

pub fn gelu_backward<T>( &self, grad_output: &GpuBuffer<T>, input: &GpuBuffer<T>, ) -> Result<GpuBuffer<T>, GpuError>
where T: GpuDataType,

impl<T> Any for T
where T: 'static + ?Sized,

impl<T> Borrow<T> for T
where T: ?Sized,

impl<T> BorrowMut<T> for T
where T: ?Sized,

impl<T, U> Into<U> for T
where U: From<T>,

fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
where F: FnOnce(&Self) -> bool,

impl<T, U> TryFrom<U> for T
where U: Into<T>,

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,

impl<V, T> VZip<V> for T
where V: MultiLane<T>,