Struct CudaAllocator

Source

pub struct CudaAllocator { /* private fields */ }

Expand description

A caching GPU memory allocator with block pools, splitting, coalescing, and stream-aware reuse.

Wraps a GpuDevice and maintains two block pools (small and large). Allocation requests are served from cached free blocks when possible; only on cache miss does the allocator call through to the CUDA driver. Freed blocks are returned to the pool and coalesced with neighbors to reduce fragmentation.

Struct CudaAllocator Copy item path

§CL-323

Implementations§

impl CudaAllocator

pub fn new(device: Arc<GpuDevice>) -> Self

pub fn alloc_zeros<T>(&self, count: usize) -> GpuResult<CudaBuffer<T>> where T: DeviceRepr + ValidAsZeroBits,

§Errors

pub fn alloc_copy<T>(&self, data: &[T]) -> GpuResult<CudaBuffer<T>> where T: DeviceRepr,

§Errors

pub fn free<T>(&self, buffer: CudaBuffer<T>)

pub fn memory_allocated(&self) -> usize

pub fn max_memory_allocated(&self) -> usize

pub fn memory_reserved(&self) -> usize

pub fn reset_peak_stats(&self)

pub fn empty_cache(&self)

§CL-323

pub fn device(&self) -> &GpuDevice

pub fn record_stream_on_block(&self, block_idx: usize, stream: StreamId)

§CL-323

pub fn block_count(&self) -> usize

pub fn free_block_count(&self) -> usize

pub fn cache_stats(&self) -> (usize, usize)

pub fn cached_bytes(&self) -> usize

pub fn cache_find( &self, size: usize, stream: StreamId, ) -> Option<(usize, usize)>

§CL-323

pub fn cache_insert( &self, requested_size: usize, driver_alloc_size: usize, ptr: usize, stream: StreamId, ) -> (usize, usize)

§CL-323

pub fn cache_free(&self, block_idx: usize)

§CL-323

pub fn driver_alloc_size(size: usize) -> usize

Trait Implementations§

impl Debug for CudaAllocator

fn fmt(&self, f: &mut Formatter<'_>) -> Result

Auto Trait Implementations§

impl !Freeze for CudaAllocator

impl RefUnwindSafe for CudaAllocator

impl Send for CudaAllocator

impl Sync for CudaAllocator

impl Unpin for CudaAllocator

impl UnsafeUnpin for CudaAllocator

impl UnwindSafe for CudaAllocator

Blanket Implementations§

impl<T> Any for T where T: 'static + ?Sized,

fn type_id(&self) -> TypeId

impl<T> Borrow<T> for T where T: ?Sized,

fn borrow(&self) -> &T

impl<T> BorrowMut<T> for T where T: ?Sized,

fn borrow_mut(&mut self) -> &mut T

impl<T> ByRef<T> for T

fn by_ref(&self) -> &T

impl<T> DistributionExt for T where T: ?Sized,

fn rand<T>(&self, rng: &mut (impl Rng + ?Sized)) -> T where Self: Distribution<T>,

impl<T> From<T> for T

fn from(t: T) -> T

impl<T, U> Into<U> for T where U: From<T>,

fn into(self) -> U

impl<T> IntoEither for T

fn into_either(self, into_left: bool) -> Either<Self, Self>

fn into_either_with<F>(self, into_left: F) -> Either<Self, Self> where F: FnOnce(&Self) -> bool,

impl<T> Pointable for T

const ALIGN: usize

type Init = T

unsafe fn init(init: <T as Pointable>::Init) -> usize

unsafe fn deref<'a>(ptr: usize) -> &'a T

unsafe fn deref_mut<'a>(ptr: usize) -> &'a mut T

unsafe fn drop(ptr: usize)

impl<T, U> TryFrom<U> for T where U: Into<T>,

type Error = Infallible

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

impl<T, U> TryInto<U> for T where U: TryFrom<T>,

type Error = <U as TryFrom<T>>::Error

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

impl<V, T> VZip<V> for T where V: MultiLane<T>,

fn vzip(self) -> V

impl<T, U> Imply<T> for U where T: ?Sized, U: ?Sized,

Struct CudaAllocator

pub fn alloc_zeros<T>(&self, count: usize) -> GpuResult<CudaBuffer<T>>
where T: DeviceRepr + ValidAsZeroBits,

pub fn alloc_copy<T>(&self, data: &[T]) -> GpuResult<CudaBuffer<T>>
where T: DeviceRepr,

impl<T> Any for T
where T: 'static + ?Sized,

impl<T> Borrow<T> for T
where T: ?Sized,

impl<T> BorrowMut<T> for T
where T: ?Sized,

impl<T> DistributionExt for T
where T: ?Sized,

fn rand<T>(&self, rng: &mut (impl Rng + ?Sized)) -> T
where Self: Distribution<T>,

impl<T, U> Into<U> for T
where U: From<T>,

fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
where F: FnOnce(&Self) -> bool,

impl<T, U> TryFrom<U> for T
where U: Into<T>,

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,

impl<V, T> VZip<V> for T
where V: MultiLane<T>,

impl<T, U> Imply<T> for U
where T: ?Sized, U: ?Sized,