numr 0.5.2

High-performance numerical computing with multi-backend GPU acceleration (CPU/CUDA/WebGPU)
Documentation
1
2
3
4
5
6
7
8
9
10
//! CUDA GEMM epilogue kernels and launchers.
//!
//! The launcher functions are defined in two private submodules and are
//! re-exported from this module, so callers import them from here rather
//! than from the submodules themselves.

mod bwd_launcher;
mod launcher;

// Re-exports from `bwd_launcher`: the `_bwd` launchers (presumably the
// backward pass of `gemm_bias_act` -- confirm against that submodule).
pub use bwd_launcher::launch_gemm_bias_act_bwd_batched_kernel;
pub use bwd_launcher::launch_gemm_bias_act_bwd_kernel;

// Re-exports from `launcher`: the `gemm_bias_act` and `gemm_bias_residual`
// launchers, each listed next to its `_batched` counterpart.
pub use launcher::launch_gemm_bias_act_batched_kernel;
pub use launcher::launch_gemm_bias_act_kernel;
pub use launcher::launch_gemm_bias_residual_batched_kernel;
pub use launcher::launch_gemm_bias_residual_kernel;