#[cfg(target_arch = "x86_64")]
use std::is_x86_feature_detected;
pub fn distance_naive(x: &[u8], y: &[u8]) -> u64 {
assert_eq!(x.len(), y.len());
let mut distance = x
.chunks_exact(8)
.zip(y.chunks_exact(8))
.map(|(x_chunk, y_chunk)| {
let x_val = u64::from_ne_bytes(x_chunk.try_into().unwrap());
let y_val = u64::from_ne_bytes(y_chunk.try_into().unwrap());
(x_val ^ y_val).count_ones() as u64
})
.sum::<u64>();
if x.len() % 8 != 0 {
distance += x
.chunks_exact(8)
.remainder()
.iter()
.zip(y.chunks_exact(8).remainder())
.map(|(x_byte, y_byte)| (x_byte ^ y_byte).count_ones() as u64)
.sum::<u64>();
}
distance
}
pub fn weight_naive(x: &[u8]) -> u64 {
let mut accum: u64 = 0;
for byte in x.iter() {
accum += byte.count_ones() as u64;
}
accum
}
pub fn distance(x: &[u8], y: &[u8]) -> u64 {
assert_eq!(x.len(), y.len());
#[cfg(target_arch = "x86_64")]
unsafe {
if is_x86_feature_detected!("avx2") && x.len() >= 1024 {
return lib_avx2::distance_vect(x, y);
}
}
distance_naive(x, y)
}
pub fn weight(x: &[u8]) -> u64 {
#[cfg(target_arch = "x86_64")]
unsafe {
if is_x86_feature_detected!("avx2") {
return lib_avx2::weight_vect(x);
}
}
weight_naive(x)
}
#[cfg(target_arch = "x86_64")]
pub mod lib_avx2;
pub mod utils;
#[cfg(test)]
pub mod lib_test;