use std::ops::{Add, AddAssign};
use crate::Group;
use utils::xor_inplace;
#[derive(Debug, Clone, PartialEq, Eq)]
pub struct ByteGroup<const LAMBDA: usize>(pub [u8; LAMBDA]);
impl<const LAMBDA: usize> Add for ByteGroup<LAMBDA> {
type Output = Self;
fn add(mut self, rhs: Self) -> Self::Output {
xor_inplace(&mut self.0, &[&rhs.0]);
self
}
}
impl<const LAMBDA: usize> AddAssign for ByteGroup<LAMBDA> {
fn add_assign(&mut self, rhs: Self) {
xor_inplace(&mut self.0, &[&rhs.0])
}
}
impl<const LAMBDA: usize> Group<LAMBDA> for ByteGroup<LAMBDA> {
fn zero() -> Self {
ByteGroup([0; LAMBDA])
}
fn add_inverse(self) -> Self {
self
}
}
impl<const LAMBDA: usize> From<[u8; LAMBDA]> for ByteGroup<LAMBDA> {
fn from(value: [u8; LAMBDA]) -> Self {
Self(value)
}
}
impl<const LAMBDA: usize> From<ByteGroup<LAMBDA>> for [u8; LAMBDA] {
fn from(value: ByteGroup<LAMBDA>) -> Self {
value.0
}
}
pub mod utils {
use std::simd::{u8x16, u8x32, u8x64};
pub fn xor<const LAMBDA: usize>(xs: &[&[u8; LAMBDA]]) -> [u8; LAMBDA] {
let mut res = [0; LAMBDA];
xor_inplace(&mut res, xs);
res
}
pub fn xor_inplace<const LAMBDA: usize>(lhs: &mut [u8; LAMBDA], rhss: &[&[u8; LAMBDA]]) {
rhss.iter().fold(lhs, |lhs, &rhs| {
let mut i = 0;
while i < LAMBDA {
let left = LAMBDA - i;
if left >= 64 {
let lhs_simd = u8x64::from_slice(&lhs[i..i + 64]);
let rhs_simd = u8x64::from_slice(&rhs[i..i + 64]);
lhs[i..i + 64].copy_from_slice((lhs_simd ^ rhs_simd).as_array());
i += 64;
} else if left >= 32 {
let lhs_simd = u8x32::from_slice(&lhs[i..i + 32]);
let rhs_simd = u8x32::from_slice(&rhs[i..i + 32]);
lhs[i..i + 32].copy_from_slice((lhs_simd ^ rhs_simd).as_array());
i += 32;
} else if left >= 16 {
let lhs_simd = u8x16::from_slice(&lhs[i..i + 16]);
let rhs_simd = u8x16::from_slice(&rhs[i..i + 16]);
lhs[i..i + 16].copy_from_slice((lhs_simd ^ rhs_simd).as_array());
i += 16;
} else {
lhs[i..]
.iter_mut()
.zip(&rhs[i..])
.for_each(|(l, r)| *l ^= r);
break;
}
}
lhs
});
}
}