use super::*;
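// Layout: with AVX-512F the whole vector lives in one 512-bit register;
// otherwise it is modeled as two i64x4 halves (`a` holds lanes 0..=3, `b`
// holds lanes 4..=7) and every operation is applied to each half.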
pick! {
if #[cfg(target_feature="avx512f")] {
#[derive(Default, Clone, Copy, PartialEq, Eq)]
#[repr(C, align(64))]
pub struct i64x8 { pub(crate) avx512: m512i }
} else {
#[derive(Default, Clone, Copy, PartialEq, Eq)]
#[repr(C, align(64))]
pub struct i64x8 { pub(crate) a : i64x4, pub(crate) b : i64x4 }
}
}
int_uint_consts!(i64, 8, i64x8, 512);
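// `int_uint_consts!` supplies the shared integer constants (e.g. `ZERO`,
// `ONE`, `MAX`, `MIN`) for i64x8.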
unsafe impl Zeroable for i64x8 {}
unsafe impl Pod for i64x8 {}
impl AlignTo for i64x8 {
type Elem = i64;
}
impl Add for i64x8 {
type Output = Self;
#[inline]
fn add(self, rhs: Self) -> Self::Output {
pick! {
if #[cfg(target_feature="avx512f")] {
Self { avx512: add_i64_m512i(self.avx512, rhs.avx512) }
} else {
Self {
a : self.a.add(rhs.a),
b : self.b.add(rhs.b),
}
}
}
}
}
impl Sub for i64x8 {
type Output = Self;
#[inline]
fn sub(self, rhs: Self) -> Self::Output {
pick! {
if #[cfg(target_feature="avx512f")] {
Self { avx512: sub_i64_m512i(self.avx512, rhs.avx512) }
} else {
Self {
a : self.a.sub(rhs.a),
b : self.b.sub(rhs.b),
}
}
}
}
}
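// x86 has no packed 64-bit multiply below AVX-512DQ (`vpmullq`), so even the
// AVX-512F build multiplies lane by lane with wrapping semantics.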
impl Mul for i64x8 {
type Output = Self;
#[inline]
fn mul(self, rhs: Self) -> Self::Output {
pick! {
if #[cfg(target_feature="avx512f")] {
let arr1: [i64; 8] = cast(self);
let arr2: [i64; 8] = cast(rhs);
cast([
arr1[0].wrapping_mul(arr2[0]),
arr1[1].wrapping_mul(arr2[1]),
arr1[2].wrapping_mul(arr2[2]),
arr1[3].wrapping_mul(arr2[3]),
arr1[4].wrapping_mul(arr2[4]),
arr1[5].wrapping_mul(arr2[5]),
arr1[6].wrapping_mul(arr2[6]),
arr1[7].wrapping_mul(arr2[7]),
])
} else {
Self { a: self.a.mul(rhs.a), b: self.b.mul(rhs.b) }
}
}
}
}
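// Lane-wise shifts: each lane is shifted by the corresponding lane of `rhs`.
// `wrapping_shr`/`wrapping_shl` mask the count to 0..=63, and `>>` on i64 is
// an arithmetic (sign-extending) shift.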
impl Shr for i64x8 {
type Output = Self;
#[inline]
fn shr(self, rhs: Self) -> Self::Output {
pick! {
if #[cfg(target_feature="avx512f")] {
let a: [i64; 8] = cast(self);
let r: [i64; 8] = cast(rhs);
cast([
a[0].wrapping_shr(r[0] as u32),
a[1].wrapping_shr(r[1] as u32),
a[2].wrapping_shr(r[2] as u32),
a[3].wrapping_shr(r[3] as u32),
a[4].wrapping_shr(r[4] as u32),
a[5].wrapping_shr(r[5] as u32),
a[6].wrapping_shr(r[6] as u32),
a[7].wrapping_shr(r[7] as u32),
])
} else {
Self {
a: self.a.shr(rhs.a),
b: self.b.shr(rhs.b),
}
}
}
}
}
impl Shl for i64x8 {
type Output = Self;
#[inline]
fn shl(self, rhs: Self) -> Self::Output {
pick! {
if #[cfg(target_feature="avx512f")] {
let a: [i64; 8] = cast(self);
let r: [i64; 8] = cast(rhs);
cast([
a[0].wrapping_shl(r[0] as u32),
a[1].wrapping_shl(r[1] as u32),
a[2].wrapping_shl(r[2] as u32),
a[3].wrapping_shl(r[3] as u32),
a[4].wrapping_shl(r[4] as u32),
a[5].wrapping_shl(r[5] as u32),
a[6].wrapping_shl(r[6] as u32),
a[7].wrapping_shl(r[7] as u32),
])
} else {
Self {
a: self.a.shl(rhs.a),
b: self.b.shl(rhs.b),
}
}
}
}
}
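// Vector-scalar forms: splat the scalar and reuse the vector operator.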
impl Add<i64> for i64x8 {
type Output = Self;
#[inline]
fn add(self, rhs: i64) -> Self::Output {
self.add(Self::splat(rhs))
}
}
impl Sub<i64> for i64x8 {
type Output = Self;
#[inline]
fn sub(self, rhs: i64) -> Self::Output {
self.sub(Self::splat(rhs))
}
}
impl Mul<i64> for i64x8 {
type Output = Self;
#[inline]
fn mul(self, rhs: i64) -> Self::Output {
self.mul(Self::splat(rhs))
}
}
impl Add<i64x8> for i64 {
type Output = i64x8;
#[inline]
fn add(self, rhs: i64x8) -> Self::Output {
i64x8::splat(self).add(rhs)
}
}
impl Sub<i64x8> for i64 {
type Output = i64x8;
#[inline]
fn sub(self, rhs: i64x8) -> Self::Output {
i64x8::splat(self).sub(rhs)
}
}
impl Mul<i64x8> for i64 {
type Output = i64x8;
#[inline]
fn mul(self, rhs: i64x8) -> Self::Output {
i64x8::splat(self).mul(rhs)
}
}
impl BitAnd for i64x8 {
type Output = Self;
#[inline]
fn bitand(self, rhs: Self) -> Self::Output {
pick! {
if #[cfg(target_feature="avx512f")] {
Self { avx512: bitand_m512i(self.avx512, rhs.avx512) }
} else {
Self {
a : self.a.bitand(rhs.a),
b : self.b.bitand(rhs.b),
}
}
}
}
}
impl BitOr for i64x8 {
type Output = Self;
#[inline]
fn bitor(self, rhs: Self) -> Self::Output {
pick! {
if #[cfg(target_feature="avx512f")] {
Self { avx512: bitor_m512i(self.avx512, rhs.avx512) }
} else {
Self {
a : self.a.bitor(rhs.a),
b : self.b.bitor(rhs.b),
}
}
}
}
}
impl BitXor for i64x8 {
type Output = Self;
#[inline]
fn bitxor(self, rhs: Self) -> Self::Output {
pick! {
if #[cfg(target_feature="avx512f")] {
Self { avx512: bitxor_m512i(self.avx512, rhs.avx512) }
} else {
Self {
a : self.a.bitxor(rhs.a),
b : self.b.bitxor(rhs.b),
}
}
}
}
}
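// Shifts by a scalar integer apply one shift amount to every lane. On the
// AVX-512 path the count is passed in the low 64 bits of the shift operand
// (`cast([rhs as u64, 0])`).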
macro_rules! impl_shl_t_for_i64x8 {
($($shift_type:ty),+ $(,)?) => {
$(impl Shl<$shift_type> for i64x8 {
type Output = Self;
#[inline]
fn shl(self, rhs: $shift_type) -> Self::Output {
pick! {
if #[cfg(target_feature="avx512f")] {
        let shift = cast([rhs as u64, 0]);
Self { avx512: shl_all_u64_m512i(self.avx512, shift) }
} else {
Self {
a : self.a.shl(rhs),
b : self.b.shl(rhs),
}
}
}
}
})+
};
}
impl_shl_t_for_i64x8!(i8, u8, i16, u16, i32, u32, i64, u64, i128, u128);
macro_rules! impl_shr_t_for_i64x8 {
($($shift_type:ty),+ $(,)?) => {
$(impl Shr<$shift_type> for i64x8 {
type Output = Self;
#[inline]
fn shr(self, rhs: $shift_type) -> Self::Output {
pick! {
if #[cfg(target_feature="avx512f")] {
        let shift = cast([rhs as u64, 0]);
Self { avx512: shr_all_i64_m512i(self.avx512, shift) }
} else {
Self {
a : self.a.shr(rhs),
b : self.b.shr(rhs),
}
}
}
}
})+
};
}
impl_shr_t_for_i64x8!(i8, u8, i16, u16, i32, u32, i64, u64, i128, u128);
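// The CmpEq/CmpGt/CmpLt trait impls forward to the inherent methods below.
// `Self::simd_eq` resolves to the inherent fn (inherent impls take precedence
// over trait methods), so there is no recursion.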
impl CmpEq for i64x8 {
type Output = Self;
#[inline]
fn simd_eq(self, rhs: Self) -> Self::Output {
Self::simd_eq(self, rhs)
}
}
impl CmpGt for i64x8 {
type Output = Self;
#[inline]
fn simd_gt(self, rhs: Self) -> Self::Output {
Self::simd_gt(self, rhs)
}
}
impl CmpLt for i64x8 {
type Output = Self;
#[inline]
fn simd_lt(self, rhs: Self) -> Self::Output {
Self::simd_lt(self, rhs)
}
}
impl i64x8 {
#[inline]
#[must_use]
pub const fn new(array: [i64; 8]) -> Self {
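    // Safety: `[i64; 8]` and `i64x8` are both 64 bytes with `repr(C)` layout,
    // so the by-value transmute is sound for any bit pattern.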
unsafe { core::mem::transmute(array) }
}
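  // The comparison methods return a lane mask: every bit of a lane is set
  // (-1) where the predicate holds and clear (0) where it does not.
  //
  // Sketch of typical use (illustrative only):
  //   let m = a.simd_gt(b);   // -1 in lanes where a > b
  //   let hi = m.blend(a, b); // per-lane max via the mask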
#[inline]
#[must_use]
pub fn simd_eq(self, rhs: Self) -> Self {
pick! {
if #[cfg(target_feature="avx512f")] {
Self { avx512: cmp_op_mask_i64_m512i::<{cmp_int_op!(Eq)}>(self.avx512, rhs.avx512) }
} else {
Self {
a : self.a.simd_eq(rhs.a),
b : self.b.simd_eq(rhs.b),
}
}
}
}
#[inline]
#[must_use]
pub fn simd_gt(self, rhs: Self) -> Self {
pick! {
if #[cfg(target_feature="avx512f")] {
Self { avx512: cmp_op_mask_i64_m512i::<{cmp_int_op!(Nle)}>(self.avx512, rhs.avx512) }
} else {
Self {
a : self.a.simd_gt(rhs.a),
b : self.b.simd_gt(rhs.b),
}
}
}
}
#[inline]
#[must_use]
pub fn simd_lt(self, rhs: Self) -> Self {
pick! {
if #[cfg(target_feature="avx512f")] {
Self { avx512: cmp_op_mask_i64_m512i::<{cmp_int_op!(Lt)}>(self.avx512, rhs.avx512) }
} else {
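        // a < b is the same as b > a, so reuse the halves' simd_gt with the
        // operands swapped.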
Self {
a : rhs.a.simd_gt(self.a),
b : rhs.b.simd_gt(self.b),
}
}
}
}
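  // `self` acts as the mask: a lane of all ones selects the lane from `t`, a
  // lane of all zeros selects from `f`. Use masks produced by the comparison
  // methods above; lanes with mixed bits give platform-dependent results.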
#[inline]
#[must_use]
pub fn blend(self, t: Self, f: Self) -> Self {
pick! {
if #[cfg(target_feature="avx512f")] {
      Self { avx512: blend_varying_i8_m512i(f.avx512, t.avx512, movepi8_mask_m512i(self.avx512)) }
} else {
Self {
a : self.a.blend(t.a, f.a),
b : self.b.blend(t.b, f.b),
}
}
}
}
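  // `wrapping_abs` leaves i64::MIN unchanged (it has no positive counterpart
  // in i64); `unsigned_abs` below avoids that edge case by returning u64x8,
  // where i64::MIN maps to 2^63.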
#[inline]
#[must_use]
pub fn abs(self) -> Self {
pick! {
if #[cfg(target_feature="avx512f")] {
let arr: [i64; 8] = cast(self);
cast(
[
arr[0].wrapping_abs(),
arr[1].wrapping_abs(),
arr[2].wrapping_abs(),
arr[3].wrapping_abs(),
arr[4].wrapping_abs(),
arr[5].wrapping_abs(),
arr[6].wrapping_abs(),
arr[7].wrapping_abs(),
])
} else {
Self {
a : self.a.abs(),
b : self.b.abs(),
}
}
}
}
#[inline]
#[must_use]
pub fn unsigned_abs(self) -> u64x8 {
pick! {
if #[cfg(target_feature="avx512f")] {
let arr: [i64; 8] = cast(self);
cast(
[
arr[0].unsigned_abs(),
arr[1].unsigned_abs(),
arr[2].unsigned_abs(),
arr[3].unsigned_abs(),
arr[4].unsigned_abs(),
arr[5].unsigned_abs(),
arr[6].unsigned_abs(),
arr[7].unsigned_abs(),
])
} else {
u64x8 {
a : self.a.unsigned_abs(),
b : self.b.unsigned_abs(),
}
}
}
}
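  // i64 -> f64 conversion: f64 has a 53-bit mantissa, so magnitudes above
  // 2^53 may round to the nearest representable double.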
#[inline]
#[must_use]
pub fn round_float(self) -> f64x8 {
let arr: [i64; 8] = cast(self);
cast([
arr[0] as f64,
arr[1] as f64,
arr[2] as f64,
arr[3] as f64,
arr[4] as f64,
arr[5] as f64,
arr[6] as f64,
arr[7] as f64,
])
}
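  // Packs the sign bit of each lane into the low 8 bits of the result: bit i
  // is lane i. The split fallback combines two 4-lane masks, so `b`'s mask is
  // shifted left by 4.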
#[inline]
#[must_use]
pub fn to_bitmask(self) -> u32 {
pick! {
if #[cfg(target_feature="avx512dq")] {
movepi64_mask_m512d(cast(self.avx512)) as u32
} else {
        self.a.to_bitmask() | (self.b.to_bitmask() << 4)
}
}
}
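  // `any`/`all` treat each lane's sign bit as its boolean value.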
#[inline]
#[must_use]
pub fn any(self) -> bool {
pick! {
if #[cfg(target_feature="avx512f")] {
movepi64_mask_m512d(cast(self.avx512)) != 0
} else {
(self.a | self.b).any()
}
}
}
#[inline]
#[must_use]
pub fn all(self) -> bool {
pick! {
if #[cfg(target_feature="avx512bw")] {
movepi64_mask_m512d(cast(self.avx512)) == 0b11111111
} else {
(self.a & self.b).all()
}
}
}
#[inline]
#[must_use]
pub fn none(self) -> bool {
!self.any()
}
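  // Zero-cost reinterpretations between the vector and a plain array,
  // justified by the `Pod` impl above.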
#[inline]
pub fn to_array(self) -> [i64; 8] {
cast(self)
}
#[inline]
pub fn as_array(&self) -> &[i64; 8] {
cast_ref(self)
}
#[inline]
pub fn as_mut_array(&mut self) -> &mut [i64; 8] {
cast_mut(self)
}
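  // AVX-512F is the first x86 extension with packed 64-bit integer min/max;
  // older targets delegate to the i64x4 halves.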
#[inline]
#[must_use]
pub fn min(self, rhs: Self) -> Self {
pick! {
if #[cfg(target_feature="avx512f")] {
Self { avx512: min_i64_m512i(self.avx512, rhs.avx512) }
} else {
Self {
a: self.a.min(rhs.a),
b: self.b.min(rhs.b),
}
}
}
}
#[inline]
#[must_use]
pub fn max(self, rhs: Self) -> Self {
pick! {
if #[cfg(target_feature="avx512f")] {
Self { avx512: max_i64_m512i(self.avx512, rhs.avx512) }
} else {
Self {
a: self.a.max(rhs.a),
b: self.b.max(rhs.b),
}
}
}
}
}
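// Bitwise NOT: XOR with an all-ones vector flips every bit.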
impl Not for i64x8 {
type Output = Self;
#[inline]
fn not(self) -> Self::Output {
pick! {
if #[cfg(target_feature="avx512f")] {
Self { avx512: bitxor_m512i(self.avx512, set_splat_i64_m512i(-1)) }
} else {
Self {
a : self.a.not(),
b : self.b.not(),
}
}
}
}
}