pub unsafe extern "C" fn cuda_memcpy_async_to_gpu( dest: *mut c_void, src: *const c_void, size: u64, stream: *mut c_void, gpu_index: u32, )