pub fn cuda_malloc(size: usize) -> CudaRtResult<DevicePtr>
Allocates device memory of the requested `size` and returns a `DevicePtr` to it on success (mirrors the CUDA runtime's `cudaMalloc`).
cudaMalloc