pub fn mse_loss<const N: usize>( output: &[Float; N], target: &[Float; N], grad: &mut [Float; N], ) -> Float