cublas-hgemm 0.1.0

HGEMM kernels with Tensor Core support built on cuda-oxide
Documentation
1
2
3
4
5
// Public submodules of the crate. Their bodies live in separate files that are
// not visible from here, so the notes below describe only what this file shows.

/// NOTE(review): presumably half-precision (f16) support for the HGEMM kernels,
/// judging by the module name only — confirm against the module's contents.
pub mod half;
/// Module that defines `hgemm_tensor_core`, the item re-exported at the crate
/// root as `hgemm`.
pub mod tensor_core;

// Re-export the Tensor Core variant under the short name `hgemm`, making it the
// crate's default entry point (chosen for best performance). The original path
// `tensor_core::hgemm_tensor_core` stays public as well, because the
// `tensor_core` module itself is `pub`.
pub use tensor_core::hgemm_tensor_core as hgemm;