use crate::error::{BlasError, BlasResult};
use crate::handle::BlasHandle;
use crate::types::{FillMode, GpuFloat, MatrixDesc, MatrixDescMut, Transpose};
use super::syrk_tc;
/// Symmetric rank-k update, carried out by forwarding to GEMM with `a` supplied
/// as both input operands.
///
/// The transpose flags handed to GEMM are derived from `trans`:
/// `NoTrans` becomes `(NoTrans, Trans)` and `Trans` becomes `(Trans, NoTrans)`.
///
/// Note that `fill_mode` is only consulted by the tensor-core applicability
/// check inside this function; it is not passed on to the GEMM call.
///
/// # Errors
///
/// * [`BlasError::InvalidArgument`] when `trans` is `Transpose::ConjTrans`.
/// * [`BlasError::InvalidDimension`] when `c` is not square.
/// * [`BlasError::DimensionMismatch`] when the row count of op(A) differs from
///   the order of `c`.
/// * Any error returned by the underlying GEMM call.
///
/// Returns `Ok(())` without calling GEMM when `c` has zero rows.
pub fn syrk<T: GpuFloat>(
    handle: &BlasHandle,
    fill_mode: FillMode,
    trans: Transpose,
    alpha: T,
    a: &MatrixDesc<T>,
    beta: T,
    c: &mut MatrixDescMut<T>,
) -> BlasResult<()> {
    // Everything that depends on `trans` is resolved in a single exhaustive
    // match: the row count of op(A) and the two transpose flags for GEMM.
    // `ConjTrans` is rejected here, before any dimension check runs.
    let (a_n, trans_left, trans_right) = match trans {
        Transpose::NoTrans => (a.rows, Transpose::NoTrans, Transpose::Trans),
        Transpose::Trans => (a.cols, Transpose::Trans, Transpose::NoTrans),
        Transpose::ConjTrans => {
            return Err(BlasError::InvalidArgument(
                "SYRK: use HERK for conjugate-transpose; ConjTrans is not valid here".into(),
            ));
        }
    };

    // The output must be square; its order `n` drives the remaining checks.
    let n = c.rows;
    if n != c.cols {
        return Err(BlasError::InvalidDimension(format!(
            "SYRK: output C must be square, got {}x{}",
            c.rows, c.cols
        )));
    }

    if n != a_n {
        return Err(BlasError::DimensionMismatch(format!(
            "SYRK: op(A) has {a_n} rows but C is {n}x{n}"
        )));
    }

    // Nothing to compute for an empty output.
    if n == 0 {
        return Ok(());
    }

    // Tensor-core path: a tile configuration is selected and PTX is generated,
    // but the result is bound to an underscore-prefixed name and is not used
    // afterwards in this function.
    let sm_ver = handle.sm_version();
    let tc_eligible = syrk_tc::is_tc_applicable(sm_ver, n) && fill_mode != FillMode::Full;
    if tc_eligible {
        let tiling = syrk_tc::syrk_tc_tile_config(sm_ver, n);
        let tc_config = syrk_tc::SyrkTcConfig::new(
            tiling.tile_m,
            tiling.tile_n,
            tiling.tile_k,
            sm_ver,
            fill_mode,
        );
        let _tc_kernel = syrk_tc::generate_syrk_tc_ptx(&tc_config);
    }

    // The actual computation is delegated to GEMM, with `a` as both operands.
    super::gemm_api::gemm(handle, trans_left, trans_right, alpha, a, a, beta, c)
}
#[cfg(test)]
mod tests {
    use super::*;

    // These tests build `BlasError` values and transpose pairs directly; they
    // do not call `syrk` itself.

    /// The rendered `InvalidArgument` error carries the "HERK" hint.
    #[test]
    fn syrk_rejects_conj_trans() {
        let rendered = BlasError::InvalidArgument("SYRK: use HERK".into()).to_string();
        assert!(rendered.contains("HERK"));
    }

    /// The rendered `InvalidDimension` error mentions that C must be square.
    #[test]
    fn syrk_validates_square_c() {
        let rendered =
            BlasError::InvalidDimension("SYRK: output C must be square, got 3x5".into())
                .to_string();
        assert!(rendered.contains("square"));
    }

    /// `NoTrans` maps to the `(NoTrans, Trans)` pair.
    #[test]
    fn trans_choices() {
        let pair = match Transpose::NoTrans {
            Transpose::NoTrans => (Transpose::NoTrans, Transpose::Trans),
            _ => (Transpose::Trans, Transpose::NoTrans),
        };
        assert_eq!(pair.0, Transpose::NoTrans);
        assert_eq!(pair.1, Transpose::Trans);
    }
}