// flacenc 0.5.1 - Docs.rs

// Copyright 2023-2024 Google LLC
// Copyright 2025- flacenc-rs developers
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//      http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

//! Fake SIMD module is a minimal subset of `std::simd` from the
//! `portable_simd` feature of nightly Rust. This module only implements the
//! functions that are used in flacenc.

use num_traits::NumCast;
use std::array;

// ===
// TYPE DEFINITION
// ===
/// Fixed-size vector of `LANES` elements of type `T`, standing in for
/// `std::simd::Simd`.
///
/// This is a plain newtype over `[T; LANES]`; `#[repr(transparent)]` gives it
/// the same layout as the wrapped array.
#[derive(Clone, Copy, Debug, Eq, PartialEq, PartialOrd)]
#[repr(transparent)]
pub struct Simd<T: SimdElement, const LANES: usize>([T; LANES]);

/// Per-lane boolean mask associated with `Simd<T, LANES>`.
///
/// The element type `T` is carried only at the type level; the stored data is
/// one `bool` per lane.
#[derive(Clone, Copy, Debug, Eq, PartialEq, PartialOrd)]
pub struct Mask<T: SimdElement, const LANES: usize> {
    /// One flag per lane.
    mask: [bool; LANES],
    /// Ties the mask to the element type `T` without storing a `T`.
    phantom_data: std::marker::PhantomData<T>,
}

// ===
// SIMD ELEMENT TRAITS and `SupportedLaneCount`
// ===
/// Scalar types that can be used as lanes of [`Simd`].
///
/// The two methods are the per-lane primitives that the `Add` and `Sub`
/// operators of [`Simd`] delegate to, so each element type decides how its
/// own addition and subtraction behave.
pub trait SimdElement: Copy + std::fmt::Debug {
    /// Associated mask element type.
    ///
    /// NOTE(review): every impl in this file sets it to `Self` and nothing
    /// visible in this module reads it — confirm the intended use.
    type Mask;

    /// Returns the sum of `self` and `rhs` for a single lane.
    fn simd_element_add(self, rhs: Self) -> Self;
    /// Returns the difference `self - rhs` for a single lane.
    fn simd_element_sub(self, rhs: Self) -> Self;
}

impl SimdElement for i8 {
    type Mask = Self;

    fn simd_element_add(self, rhs: Self) -> Self {
        self.wrapping_add(rhs)
    }
    fn simd_element_sub(self, rhs: Self) -> Self {
        self.wrapping_sub(rhs)
    }
}

impl SimdElement for i16 {
    type Mask = Self;

    fn simd_element_add(self, rhs: Self) -> Self {
        self.wrapping_add(rhs)
    }
    fn simd_element_sub(self, rhs: Self) -> Self {
        self.wrapping_sub(rhs)
    }
}

impl SimdElement for i32 {
    type Mask = Self;

    fn simd_element_add(self, rhs: Self) -> Self {
        self.wrapping_add(rhs)
    }
    fn simd_element_sub(self, rhs: Self) -> Self {
        self.wrapping_sub(rhs)
    }
}

impl SimdElement for u32 {
    type Mask = Self;

    fn simd_element_add(self, rhs: Self) -> Self {
        self.wrapping_add(rhs)
    }
    fn simd_element_sub(self, rhs: Self) -> Self {
        self.wrapping_sub(rhs)
    }
}

impl SimdElement for u64 {
    type Mask = Self;

    fn simd_element_add(self, rhs: Self) -> Self {
        self.wrapping_add(rhs)
    }
    fn simd_element_sub(self, rhs: Self) -> Self {
        self.wrapping_sub(rhs)
    }
}

impl SimdElement for i64 {
    type Mask = Self;

    fn simd_element_add(self, rhs: Self) -> Self {
        self.wrapping_add(rhs)
    }
    fn simd_element_sub(self, rhs: Self) -> Self {
        self.wrapping_sub(rhs)
    }
}

impl SimdElement for f32 {
    type Mask = Self;

    fn simd_element_add(self, rhs: Self) -> Self {
        self + rhs
    }
    fn simd_element_sub(self, rhs: Self) -> Self {
        self - rhs
    }
}

impl SimdElement for f64 {
    type Mask = Self;

    fn simd_element_add(self, rhs: Self) -> Self {
        self + rhs
    }
    fn simd_element_sub(self, rhs: Self) -> Self {
        self - rhs
    }
}

/// Marker trait implemented by [`LaneCount`] for each lane count that this
/// module declares as supported.
pub trait SupportedLaneCount {}

/// Type-level carrier of a lane count.
pub struct LaneCount<const LANES: usize>;

// Marks every listed lane count as supported.
macro_rules! mark_supported_lane_counts {
    ($($lanes:literal),+ $(,)?) => {
        $(
            impl SupportedLaneCount for LaneCount<{ $lanes }> {}
        )+
    };
}

mark_supported_lane_counts!(1, 2, 4, 8, 16, 32, 64);

/// Element types usable as the target of a lane-wise `cast`: any
/// [`SimdElement`] that also implements `num_traits::NumCast`.
pub trait SimdCast: SimdElement + NumCast {}
// Blanket impl: every type satisfying both bounds is a `SimdCast`.
impl<T: SimdElement + NumCast> SimdCast for T {}

// ===
// SIMD OP TRAITS
// ===
/// Horizontal (across-lane) reductions for integer vectors.
pub trait SimdUint {
    /// Type of a single lane, and of every reduction result.
    type Scalar;
    /// Returns the largest lane value.
    fn reduce_max(self) -> Self::Scalar;
    /// Returns the smallest lane value.
    fn reduce_min(self) -> Self::Scalar;
    /// Returns the sum of all lanes.
    fn reduce_sum(self) -> Self::Scalar;
}

/// Lane-wise and horizontal operations for signed integer vectors.
#[allow(dead_code)]
pub trait SimdInt {
    /// Type of a single lane.
    type Scalar;
    /// Vector type produced by [`SimdInt::cast`] for target element type `T`.
    type Cast<T: SimdElement>;
    /// Returns the lane-wise absolute value.
    #[allow(clippy::return_self_not_must_use)]
    fn abs(self) -> Self;
    /// Returns the lane-wise sign of each lane.
    #[allow(clippy::return_self_not_must_use)]
    fn signum(self) -> Self;
    /// Returns the sum of all lanes.
    fn reduce_sum(self) -> Self::Scalar;
    /// Converts every lane to the element type `T`.
    ///
    /// The implementation in this module unwraps the result of a
    /// `NumCast` conversion, so it panics when a lane value cannot be
    /// represented in `T`.
    fn cast<T: SimdCast>(self) -> Self::Cast<T>;
}

/// Horizontal sum and element conversion for floating-point vectors.
pub trait SimdFloat {
    /// Type of a single lane.
    type Scalar;
    /// Vector type produced by [`SimdFloat::cast`] for target element type `T`.
    type Cast<T: SimdElement>;
    /// Returns the sum of all lanes.
    fn reduce_sum(self) -> Self::Scalar;
    /// Converts every lane to the element type `T`.
    ///
    /// The implementation in this module unwraps the result of a
    /// `NumCast` conversion, so it panics when a lane value cannot be
    /// represented in `T`.
    #[allow(dead_code)]
    fn cast<T: SimdCast>(self) -> Self::Cast<T>;
}

/// Method-less marker trait for floating-point vectors.
///
/// NOTE(review): presumably exists so that code importing `StdFloat` from
/// `std::simd` also compiles against this module — confirm.
#[allow(dead_code)]
pub trait StdFloat {}

/// Lane-wise equality comparison.
#[allow(dead_code)]
pub trait SimdPartialEq {
    /// Mask type holding one comparison result per lane.
    type Mask;
    /// Returns a mask whose lane `i` is set when lane `i` of `self` equals
    /// lane `i` of `other`.
    fn simd_eq(self, other: Self) -> Self::Mask;
}

/// Lane-wise ordering comparisons.
#[allow(dead_code)]
pub trait SimdPartialOrd {
    /// Mask type holding one comparison result per lane.
    type Mask;
    /// Returns a mask whose lane `i` is set when `self[i] <= other[i]`.
    fn simd_le(self, other: Self) -> Self::Mask;
    /// Returns a mask whose lane `i` is set when `self[i] < other[i]`.
    fn simd_lt(self, other: Self) -> Self::Mask;
}

/// Lane-wise minimum and maximum of two vectors.
pub trait SimdOrd {
    /// Returns a vector whose lane `i` is the smaller of `self[i]` and
    /// `other[i]`.
    #[allow(clippy::return_self_not_must_use)]
    fn simd_min(self, other: Self) -> Self;

    /// Returns a vector whose lane `i` is the larger of `self[i]` and
    /// `other[i]`.
    #[allow(clippy::return_self_not_must_use)]
    fn simd_max(self, other: Self) -> Self;
}

// ===
// TYPE ALIASES
// ===
/// Single-lane vector of `i8`.
///
/// The element type matches the alias name, as it does for every other alias
/// in this module and for the same-named alias in `std::simd`.
#[allow(non_camel_case_types)]
#[allow(dead_code)] // only for tests currently.
pub type i8x1 = Simd<i8, 1>;

/// Four-lane vector of `i16`.
#[allow(non_camel_case_types)]
#[allow(dead_code)] // only for tests currently.
pub type i16x4 = Simd<i16, 4>;

/// 32-lane vector of `i16`.
#[allow(non_camel_case_types)]
pub type i16x32 = Simd<i16, 32>;

/// 16-lane vector of `i32`.
#[allow(non_camel_case_types)]
#[allow(dead_code)] // not used currently.
pub type i32x16 = Simd<i32, 16>;

/// 16-lane vector of `u32`.
#[allow(non_camel_case_types)]
pub type u32x16 = Simd<u32, 16>;

/// 64-lane vector of `u64`.
#[allow(non_camel_case_types)]
#[allow(dead_code)] // only for tests currently.
pub type u64x64 = Simd<u64, 64>;

/// 32-lane vector of `f32`.
#[allow(non_camel_case_types)]
#[allow(dead_code)]
pub type f32x32 = Simd<f32, 32>;

// ===
// IMPLEMENTATION OF `fakesimd::Simd` (non-trait methods)
// ===
impl<T, const N: usize> Simd<T, N>
where
    T: SimdElement,
{
    /// Wraps `array` as a vector; lane `i` holds `array[i]`.
    #[inline]
    pub const fn from_array(array: [T; N]) -> Self {
        Self(array)
    }

    /// Builds a vector from the first `N` elements of `slice`.
    ///
    /// # Panics
    ///
    /// Panics if `slice` holds fewer than `N` elements.
    #[inline]
    pub fn from_slice(slice: &[T]) -> Self {
        // One up-front check gives a clear message instead of an
        // index-out-of-bounds panic from inside the closure.
        assert!(
            slice.len() >= N,
            "slice length must be at least the number of elements"
        );
        Self::from_array(array::from_fn(|d| slice[d]))
    }

    /// Borrows the lanes as an array.
    #[inline]
    pub fn as_array(&self) -> &[T; N] {
        &self.0
    }

    /// Mutably borrows the lanes as an array.
    #[inline]
    pub fn as_mut_array(&mut self) -> &mut [T; N] {
        &mut self.0
    }

    /// Returns a vector with every lane set to `v`.
    #[inline]
    pub fn splat(v: T) -> Self {
        Self([v; N])
    }

    /// Rotates the lanes towards higher indices by `OFFSET` positions, so
    /// that lane `i` of the input ends up in lane `(i + OFFSET) % N`.
    ///
    /// `OFFSET` is taken modulo `N`, so offsets larger than the lane count
    /// are accepted.
    #[allow(clippy::return_self_not_must_use)]
    #[inline]
    pub fn rotate_elements_right<const OFFSET: usize>(self) -> Self {
        // Reducing OFFSET first keeps `N - ...` from underflowing when
        // OFFSET > N. The closure never runs for N == 0, so `% N` cannot
        // divide by zero.
        Self(array::from_fn(|i| self.0[(i + N - OFFSET % N) % N]))
    }

    /// Rotates the lanes towards lower indices by `OFFSET` positions, so
    /// that lane `(i + OFFSET) % N` of the input ends up in lane `i`.
    ///
    /// `OFFSET` is taken modulo `N`, so offsets larger than the lane count
    /// are accepted.
    #[allow(clippy::return_self_not_must_use)]
    #[inline]
    pub fn rotate_elements_left<const OFFSET: usize>(self) -> Self {
        // Reducing OFFSET first keeps `i + ...` from overflowing for very
        // large offsets; the result is unchanged for all other inputs.
        Self(array::from_fn(|i| self.0[(i + OFFSET % N) % N]))
    }
}

// ===
// IMPLEMENTATION OF `fakesimd::Mask`
// ===
impl<T, const N: usize> Mask<T, N>
where
    T: SimdElement,
{
    #[inline]
    pub fn select(self, true_values: Simd<T, N>, false_values: Simd<T, N>) -> Simd<T, N> {
        Simd(array::from_fn(|i| {
            if self.mask[i] {
                true_values.0[i]
            } else {
                false_values.0[i]
            }
        }))
    }
}

// ===
// IMPLEMENTATION OF SIMD-SPECIFIC OPS
// ===
impl<T, const N: usize> SimdInt for Simd<T, N>
where
    T: SimdElement + num_traits::PrimInt + num_traits::Signed + std::iter::Sum,
{
    type Scalar = T;
    type Cast<U: SimdElement> = Simd<U, N>;
    #[inline]
    fn abs(self) -> Self {
        Self(array::from_fn(|i| num_traits::sign::abs(self.0[i])))
    }

    #[inline]
    fn signum(self) -> Self {
        Self(array::from_fn(|i| num_traits::sign::signum(self.0[i])))
    }

    #[inline]
    fn reduce_sum(self) -> T {
        self.0.into_iter().sum()
    }

    #[inline]
    fn cast<U: SimdCast>(self) -> Simd<U, N> {
        Simd::<U, N>(array::from_fn(|i| U::from(self.0[i]).unwrap()))
    }
}

impl<T, const N: usize> SimdUint for Simd<T, N>
where
    T: SimdElement + num_traits::PrimInt + std::iter::Sum,
{
    type Scalar = T;

    /// Returns the largest lane.
    ///
    /// # Panics
    ///
    /// Panics if the vector has no lanes (`N == 0`).
    #[inline]
    fn reduce_max(self) -> T {
        let lanes = self.0.iter().copied();
        lanes
            .max()
            .expect("INTERNAL ERROR in `reduce_max` of fakesimd.")
    }

    /// Returns the smallest lane.
    ///
    /// # Panics
    ///
    /// Panics if the vector has no lanes (`N == 0`).
    #[inline]
    fn reduce_min(self) -> T {
        let lanes = self.0.iter().copied();
        lanes
            .min()
            .expect("INTERNAL ERROR in `reduce_min` of fakesimd.")
    }

    /// Adds up all lanes with the element type's `Sum` implementation.
    #[inline]
    fn reduce_sum(self) -> T {
        self.0.iter().copied().sum()
    }
}

impl<T, const N: usize> SimdFloat for Simd<T, N>
where
    T: SimdElement + num_traits::Float + std::iter::Sum,
{
    type Scalar = T;
    type Cast<U: SimdElement> = Simd<U, N>;
    #[inline]
    fn reduce_sum(self) -> T {
        self.0.into_iter().sum()
    }
    #[inline]
    fn cast<U: SimdCast>(self) -> Simd<U, N> {
        Simd::<U, N>(array::from_fn(|i| U::from(self.0[i]).unwrap()))
    }
}

impl<T, const N: usize> SimdPartialEq for Simd<T, N>
where
    T: SimdElement + PartialEq,
{
    type Mask = Mask<T, N>;
    #[inline]
    fn simd_eq(self, other: Self) -> Self::Mask {
        Mask {
            mask: array::from_fn(|i| self.0[i] == other.0[i]),
            phantom_data: std::marker::PhantomData,
        }
    }
}

impl<T, const N: usize> SimdPartialOrd for Simd<T, N>
where
    T: SimdElement + PartialOrd,
{
    type Mask = Mask<T, N>;
    #[inline]
    fn simd_le(self, other: Self) -> Self::Mask {
        Mask {
            mask: array::from_fn(|i| self.0[i] <= other.0[i]),
            phantom_data: std::marker::PhantomData,
        }
    }

    fn simd_lt(self, other: Self) -> Self::Mask {
        Mask {
            mask: array::from_fn(|i| self.0[i] < other.0[i]),
            phantom_data: std::marker::PhantomData,
        }
    }
}

impl<T, const N: usize> SimdOrd for Simd<T, N>
where
    T: SimdElement + Ord,
{
    #[inline]
    fn simd_min(self, other: Self) -> Self {
        Self(array::from_fn(|i| self.0[i].min(other.0[i])))
    }

    #[inline]
    fn simd_max(self, other: Self) -> Self {
        Self(array::from_fn(|i| self.0[i].max(other.0[i])))
    }
}

// `StdFloat` has no methods, so this only marks vectors whose element type
// implements `num_traits::Float`.
impl<T, const N: usize> StdFloat for Simd<T, N> where T: SimdElement + num_traits::Float {}

// ===
// IMPLEMENTATION OF OPERATOR OVERLOADS
// ===

// Generates `impl std::ops::$trait<Self> for Simd<T, N>` whose method
// `$fnname` evaluates `$body` once per lane and collects the results.
//
// `$var_x` and `$var_y` are the identifiers under which `$body` sees the
// left-hand and right-hand lane values. They are supplied by the caller so
// that the body expression, which is also written by the caller, can refer
// to them.
macro_rules! def_binop {
    ($trait:ident, $fnname:ident, $var_x:ident, $var_y:ident, $body:block) => {
        impl<T, const N: usize> std::ops::$trait<Self> for Simd<T, N>
        where
            // The element type itself must support the scalar operator.
            T: SimdElement + std::ops::$trait<T, Output = T>,
        {
            type Output = Self;

            #[inline]
            fn $fnname(self, rhs: Self) -> Self::Output {
                Self(array::from_fn(|i| {
                    let $var_x = self.0[i];
                    let $var_y = rhs.0[i];
                    $body
                }))
            }
        }
    };
}

// Generates the compound-assignment impl `std::ops::$trait<U> for Simd<T, N>`
// for any right-hand type `U` for which the by-value operator `$binop` is
// already implemented on `Simd<T, N>` with `Output = Self`.
//
// Inside `$body`, `$var_x` is bound to a copy of `*self` and `$var_y` to the
// right-hand operand; the value of `$body` is written back into `*self`.
macro_rules! def_binop_assign {
    ($trait:ident, $binop: ident, $fnname:ident, $var_x:ident, $var_y:ident, $body:block) => {
        impl<U, T, const N: usize> std::ops::$trait<U> for Simd<T, N>
        where
            T: SimdElement,
            Self: std::ops::$binop<U, Output = Self>,
        {
            #[inline]
            fn $fnname(&mut self, $var_y: U) {
                let $var_x = *self;
                *self = $body;
            }
        }
    };
}

// `Add` and `Sub` go through the `SimdElement` hooks, so the element type
// chooses the arithmetic (the integer impls in this file use wrapping
// operations). The remaining operators apply the scalar operator directly.
def_binop!(Add, add, x, y, { x.simd_element_add(y) });
def_binop!(Sub, sub, x, y, { x.simd_element_sub(y) });
def_binop!(Mul, mul, x, y, { x * y });
def_binop!(Div, div, x, y, { x / y });
def_binop!(BitAnd, bitand, x, y, { x & y });
def_binop!(BitOr, bitor, x, y, { x | y });
def_binop!(Shr, shr, x, y, { x >> y });
def_binop!(Shl, shl, x, y, { x << y });

// Compound assignments reuse the by-value operators defined above.
def_binop_assign!(AddAssign, Add, add_assign, x, y, { x + y });
def_binop_assign!(SubAssign, Sub, sub_assign, x, y, { x - y });
def_binop_assign!(MulAssign, Mul, mul_assign, x, y, { x * y });

impl<T, const N: usize> std::convert::AsRef<[T; N]> for Simd<T, N>
where
    T: SimdElement,
{
    /// Borrows the underlying lane array.
    #[inline]
    fn as_ref(&self) -> &[T; N] {
        let Self(lanes) = self;
        lanes
    }
}

impl<T, const N: usize> std::convert::From<Simd<T, N>> for [T; N]
where
    T: SimdElement,
{
    #[inline]
    fn from(t: Simd<T, N>) -> [T; N] {
        t.0
    }
}

impl<I, T, const N: usize> std::ops::Index<I> for Simd<T, N>
where
    T: SimdElement,
    I: std::slice::SliceIndex<[T]>,
{
    type Output = I::Output;

    /// Indexes the lanes exactly like a slice: a `usize` yields one lane, a
    /// range yields a sub-slice. Out-of-range indices panic as they do for
    /// slices.
    #[inline]
    fn index(&self, index: I) -> &Self::Output {
        let lanes: &[T] = self.0.as_slice();
        &lanes[index]
    }
}

impl<I, T, const N: usize> std::ops::IndexMut<I> for Simd<T, N>
where
    T: SimdElement,
    I: std::slice::SliceIndex<[T]>,
{
    /// Mutable counterpart of `Index`: gives write access to one lane or to
    /// a sub-slice of lanes.
    #[inline]
    fn index_mut(&mut self, index: I) -> &mut Self::Output {
        let lanes: &mut [T] = self.0.as_mut_slice();
        &mut lanes[index]
    }
}

impl<T, const N: usize> Default for Simd<T, N>
where
    T: SimdElement + Default,
    LaneCount<N>: SupportedLaneCount,
{
    /// Returns a vector with every lane set to `T::default()`.
    #[inline]
    fn default() -> Self {
        let fill = T::default();
        Self([fill; N])
    }
}

pub mod prelude {
    #[allow(unused_imports)]
    pub use super::SimdFloat;
    #[allow(unused_imports)]
    pub use super::SimdInt;
    #[allow(unused_imports)]
    pub use super::SimdOrd;
    #[allow(unused_imports)]
    pub use super::SimdPartialEq;
    #[allow(unused_imports)]
    pub use super::SimdPartialOrd;
    #[allow(unused_imports)]
    pub use super::SimdUint;
}