// slas 0.3.1 - Docs.rs

use crate::{backends::*, prelude::*};
use paste::paste;
use std::mem::transmute;

/// Shape of a tensor whose number of dimensions (`NDIM`) is fixed at compile time,
/// while the length of each dimension may still be dynamic.
/// To achieve a fully static shape, the trait should be const implemented.
pub trait Shape<const NDIM: usize> {
    /// Length of the `n`th dimension.
    ///
    /// For a matrix the height is specified before the width,
    /// but `axis_len(0)` should always be the width of a tensor.
    ///
    /// ## Example
    /// ```rust
    /// use slas::tensor::Shape;
    /// let s = slas::tensor::MatrixShape::<2, 3>;
    /// assert_eq!(s.axis_len(0), 3);
    /// ```
    fn axis_len(&self, n: usize) -> usize;

    /// Total number of elements in a tensor with this shape,
    /// i.e. the product of the lengths of all `NDIM` axes (`1` when `NDIM` is `0`).
    ///
    /// ## Example
    /// ```rust
    /// use slas::tensor::Shape;
    /// let s = slas::tensor::MatrixShape::<2, 3>;
    /// assert_eq!(s.volume(), 6);
    /// ```
    fn volume(&self) -> usize {
        let mut total = 1;
        for axis in 0..NDIM {
            total *= self.axis_len(axis);
        }
        total
    }

    /// The lengths of all axes as a reference to a fixed-size array.
    fn slice(&self) -> &[usize; NDIM];
}

/// An array of axis lengths is itself a shape: element `n` is the length of axis `n`.
impl<const LEN: usize> Shape<LEN> for [usize; LEN] {
    /// Returns element `n` of the array; panics if `n` is out of bounds.
    fn axis_len(&self, n: usize) -> usize {
        let dims: &[usize] = self;
        dims[n]
    }

    /// Returns the array itself.
    fn slice(&self) -> &[usize; LEN] {
        let dims: &[usize; LEN] = self;
        dims
    }
}

/// A reference to an array of axis lengths is a shape as well; it reads through to the array.
impl<const LEN: usize> Shape<LEN> for &[usize; LEN] {
    /// Returns element `n` of the referenced array; panics if `n` is out of bounds.
    fn axis_len(&self, n: usize) -> usize {
        let dims: &[usize; LEN] = self;
        dims[n]
    }

    /// Returns the referenced array.
    fn slice(&self) -> &[usize; LEN] {
        *self
    }
}

/// A dynamically sized slice of axis lengths can be used as a shape of any dimension count
/// `LEN`; the length is only verified when [`Shape::slice`] is called.
impl<const LEN: usize> Shape<LEN> for [usize] {
    /// Returns element `n` of the slice; panics if `n` is out of bounds.
    #[inline(always)]
    fn axis_len(&self, n: usize) -> usize {
        self[n]
    }

    /// Reinterprets the slice as an array of exactly `LEN` axis lengths.
    ///
    /// # Panics
    /// Panics if the slice does not contain exactly `LEN` elements.
    #[inline(always)]
    fn slice(&self) -> &[usize; LEN] {
        // Keep the explicit length assertion so the panic message is unchanged.
        assert_eq!(self.len(), LEN);
        // Safe standard-library conversion instead of a raw pointer cast.
        <&[usize; LEN] as std::convert::TryFrom<&[usize]>>::try_from(self)
            .expect("slice length was just checked to equal LEN")
    }
}

/// A `(height, width)` tuple used as a matrix shape.
/// Axis 0 is the second tuple element and axis 1 is the first.
impl Shape<2> for (usize, usize) {
    /// Length of axis `n`.
    ///
    /// # Panics
    /// Panics if `n` is greater than 1.
    #[inline(always)]
    fn axis_len(&self, n: usize) -> usize {
        match n {
            0 => self.1,
            1 => self.0,
            // Format straight into the panic instead of allocating a String first.
            _ => panic!(
                "Index {} out of range 2 (when trying to index into Shape)",
                n
            ),
        }
    }

    /// Not implemented for tuples.
    ///
    /// # Panics
    /// Always panics.
    #[inline(always)]
    fn slice(&self) -> &[usize; 2] {
        unimplemented!()
    }
}

/// Static matrix shape.
///
/// A zero-sized marker type whose dimensions live entirely in its const parameters:
/// `M` is the height (length of axis 1) and `K` is the width (length of axis 0).
#[derive(Clone, Copy)]
pub struct MatrixShape<const M: usize, const K: usize>;

/// Const implementation of [`Shape`] for the static matrix shape:
/// axis 0 has length `K` and axis 1 has length `M`.
impl<const M: usize, const K: usize> const Shape<2> for MatrixShape<M, K> {
    /// Length of axis `n`; panics for any `n` greater than 1.
    #[inline(always)]
    fn axis_len(&self, n: usize) -> usize {
        if n == 0 {
            K
        } else if n == 1 {
            M
        } else {
            panic!("Cannot get len of axis higher than 1, as a matrix only has 2 axies (rows and columns)")
        }
    }

    /// Number of elements in the matrix, computed directly from the const parameters.
    #[inline(always)]
    fn volume(&self) -> usize {
        K * M
    }

    /// The axis lengths in axis order, i.e. `[K, M]`.
    #[inline(always)]
    fn slice(&self) -> &[usize; 2] {
        &[K, M]
    }
}

/// Statically allocated tensor.
/// See [`StaticVec::reshape`] for constructing a tensor.
/// The use of `&'static dyn Shape<NDIM>` does not mean slower performance,
/// as long as Shape is [const implemented](https://github.com/rust-lang/rust/issues/67792) for the type of the shape instance.
///
/// NOTE(review): the struct as declared here stores the shape by value in a field of the
/// generic type `S` (defaulting to `[usize; NDIM]`), not as `&'static dyn Shape<NDIM>`;
/// the sentence above may describe an earlier design — confirm.
///
/// Type parameters: `T` is the element type, `U` the backing storage holding `LEN`
/// elements, `B` the backend, `NDIM` the number of dimensions and `S` the shape type.
#[derive(Clone, Copy)]
pub struct Tensor<
    T,
    U: StaticVec<T, LEN>,
    B: Backend<T>,
    const NDIM: usize,
    const LEN: usize,
    S: Shape<NDIM> = [usize; NDIM],
> {
    /// The element storage paired with its backend.
    pub data: WithStaticBackend<T, U, B, LEN>,
    /// The shape used to translate multi-dimensional indices into offsets into `data`.
    pub shape: S,
}

/// Accessors and conversions available on two-dimensional tensors.
impl<T, U: StaticVec<T, LEN>, B: Backend<T>, const LEN: usize, S: Shape<2>>
    Tensor<T, U, B, 2, LEN, S>
{
    /// Wraps this tensor in a [`Matrix`] that is not transposed.
    pub const fn matrix(self) -> Matrix<T, U, B, LEN, false, S> {
        Matrix(self)
    }
    /// Borrows the backend stored alongside the data.
    pub const fn backend(&self) -> &B {
        &self.data.backend
    }
    /// Borrows the underlying storage.
    pub const fn vec_ref(&self) -> &U {
        &self.data.data
    }
    /// Mutably borrows the underlying storage.
    pub const fn mut_vec_ref(&mut self) -> &mut U {
        &mut self.data.data
    }
}

//impl<T, U: StaticVec<T, LEN>, B: Backend<T>, const LEN: usize> const std::ops::Index<()>
//    for Tensor<T, U, B, 2, LEN>
//{
//    type Output = Matrix<T, U, B, LEN>;
//    fn index<'a>(&'a self, _: ()) -> &'a Self::Output {
//        unsafe { transmute(self) }
//    }
//}
//
//impl<T, U: StaticVec<T, LEN>, B: Backend<T>, const LEN: usize> const std::ops::IndexMut<()>
//    for Tensor<T, U, B, 2, LEN>
//{
//    fn index_mut<'a>(&'a mut self, _: ()) -> &'a mut Self::Output {
//        unsafe { transmute(self) }
//    }
//}

/// Prints a matrix one row per line, each row rendered as a debug list,
/// with the whole matrix wrapped in square brackets.
impl<
        T: Float + std::fmt::Debug,
        B: Backend<T>,
        S: Shape<2>,
        U: StaticVec<T, LEN>,
        const LEN: usize,
        const IS_TRANS: bool,
    > std::fmt::Debug for Matrix<T, U, B, LEN, IS_TRANS, S>
{
    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
        f.write_str("[\n")?;
        let (rows, cols) = (self.rows(), self.columns());
        debug_assert_eq!(rows * cols, LEN);

        for row in 0..rows {
            f.write_str("   ")?;
            // Build the row entry by entry; elements are read through the
            // transposition-aware `(row, column)` index.
            let mut list = f.debug_list();
            for col in 0..cols {
                list.entry(&self[(row, col)]);
            }
            list.finish()?;
            f.write_str(",\n")?;
        }
        f.write_str("]")
    }
}

/// Renders the axis lengths of `s` as a comma separated list, e.g. `"2, 3"`.
/// Used to build index-out-of-bounds messages.
fn debug_shape<const NDIM: usize>(s: &dyn Shape<NDIM>) -> String {
    let mut rendered = String::new();
    for axis in 0..NDIM {
        if axis > 0 {
            rendered.push_str(", ");
        }
        rendered.push_str(&s.axis_len(axis).to_string());
    }
    rendered
}

/// Converts the multi-dimensional index `o` into a flat offset for a tensor of shape `s`.
/// Axis 0 varies fastest: each coordinate is weighted by the product of the lengths of
/// all lower axes.
///
/// # Panics
/// Panics if any coordinate is not smaller than the length of its axis.
#[inline(always)]
fn tensor_index<T: Shape<NDIM>, const NDIM: usize>(s: &T, o: &[usize; NDIM]) -> usize {
    let mut offset = 0;
    let mut stride = 1;
    for (axis, &coord) in o.iter().enumerate() {
        let extent = s.axis_len(axis);
        assert!(
            coord < extent,
            "Index [{}] out of bounds [{}]",
            debug_shape(o),
            debug_shape(s)
        );
        offset += coord * stride;
        stride *= extent;
    }
    offset
}

/// Indexes a tensor with one coordinate per axis, given in axis order (axis 0 first).
/// Panics if any coordinate is out of bounds for the tensor's shape.
impl<
        T,
        U: StaticVec<T, LEN>,
        B: Backend<T>,
        S: Shape<NDIM>,
        const NDIM: usize,
        const LEN: usize,
    > std::ops::Index<[usize; NDIM]> for Tensor<T, U, B, NDIM, LEN, S>
{
    type Output = T;

    #[inline(always)]
    fn index(&self, i: [usize; NDIM]) -> &T {
        let flat = tensor_index(&self.shape, &i);
        // SAFETY: `tensor_index` checked every coordinate against the shape.
        // NOTE(review): this also relies on the shape's volume not exceeding the
        // storage length, which is not verified here — confirm.
        unsafe { self.data.data.get_unchecked(flat) }
    }
}
/// Mutable counterpart of indexing a tensor with one coordinate per axis.
/// Panics if any coordinate is out of bounds for the tensor's shape.
impl<
        T,
        U: StaticVec<T, LEN>,
        B: Backend<T>,
        S: Shape<NDIM>,
        const NDIM: usize,
        const LEN: usize,
    > std::ops::IndexMut<[usize; NDIM]> for Tensor<T, U, B, NDIM, LEN, S>
where
    T: Copy,
{
    fn index_mut(&mut self, i: [usize; NDIM]) -> &mut T {
        let flat = tensor_index(&self.shape, &i);
        // SAFETY: `tensor_index` checked every coordinate against the shape.
        // NOTE(review): this also relies on the shape's volume not exceeding the
        // storage length, which is not verified here — confirm.
        unsafe { self.data.data.get_unchecked_mut(flat) }
    }
}

/// Indexes a two-dimensional tensor with a `(row, column)` pair.
/// The pair is reordered to `[column, row]` because axis 0 is the width.
impl<T, U: StaticVec<T, LEN>, B: Backend<T>, S: Shape<2>, const LEN: usize>
    std::ops::Index<(usize, usize)> for Tensor<T, U, B, 2, LEN, S>
{
    type Output = T;

    #[inline(always)]
    fn index(&self, i: (usize, usize)) -> &T {
        let (row, col) = i;
        let flat = tensor_index(&self.shape, &[col, row]);
        // SAFETY: `tensor_index` checked both coordinates against the shape.
        // NOTE(review): this also relies on the shape's volume not exceeding the
        // storage length, which is not verified here — confirm.
        unsafe { self.data.data.get_unchecked(flat) }
    }
}
/// Mutably indexes a two-dimensional tensor with a `(row, column)` pair.
/// The pair is reordered to `[column, row]` because axis 0 is the width.
impl<T, U: StaticVec<T, LEN>, B: Backend<T>, S: Shape<2>, const LEN: usize>
    std::ops::IndexMut<(usize, usize)> for Tensor<T, U, B, 2, LEN, S>
where
    T: Copy,
{
    fn index_mut(&mut self, i: (usize, usize)) -> &mut T {
        // The shape is only read, so borrow it immutably like the other index impls.
        let flat = tensor_index(&self.shape, &[i.1, i.0]);
        // SAFETY: `tensor_index` checked both coordinates against the shape.
        // NOTE(review): this also relies on the shape's volume not exceeding the
        // storage length, which is not verified here — confirm.
        unsafe { self.data.data.get_unchecked_mut(flat) }
    }
}

/// Indexes a matrix with a `(row, column)` pair, taking lazy transposition into account:
/// for a transposed matrix the pair is used in the stored order, otherwise it is swapped
/// to `[column, row]`.
impl<
        T,
        U: StaticVec<T, LEN>,
        B: Backend<T>,
        S: Shape<2>,
        const IS_TRANS: bool,
        const LEN: usize,
    > std::ops::Index<(usize, usize)> for Matrix<T, U, B, LEN, IS_TRANS, S>
{
    type Output = T;

    #[inline(always)]
    fn index(&self, i: (usize, usize)) -> &T {
        let (row, col) = i;
        let coords = if IS_TRANS { [row, col] } else { [col, row] };
        let flat = tensor_index(&self.0.shape, &coords);
        // SAFETY: `tensor_index` checked both coordinates against the shape.
        // NOTE(review): this also relies on the shape's volume not exceeding the
        // storage length, which is not verified here — confirm.
        unsafe { self.0.data.data.get_unchecked(flat) }
    }
}
/// Mutably indexes a matrix with a `(row, column)` pair, taking lazy transposition into
/// account in the same way as the immutable index.
impl<
        T,
        U: StaticVec<T, LEN>,
        B: Backend<T>,
        S: Shape<2>,
        const IS_TRANS: bool,
        const LEN: usize,
    > std::ops::IndexMut<(usize, usize)> for Matrix<T, U, B, LEN, IS_TRANS, S>
where
    T: Copy,
{
    fn index_mut(&mut self, i: (usize, usize)) -> &mut T {
        let (row, col) = i;
        let coords = if IS_TRANS { [row, col] } else { [col, row] };
        let flat = tensor_index(&self.0.shape, &coords);
        // SAFETY: `tensor_index` checked both coordinates against the shape.
        // NOTE(review): this also relies on the shape's volume not exceeding the
        // storage length, which is not verified here — confirm.
        unsafe { self.0.data.data.get_unchecked_mut(flat) }
    }
}

// Generates `Tensor::index_slice` (invoked without arguments) or `Tensor::index_slice_mut`
// (invoked with `mut`).
//
// The generated method views the `i`th slice along the LAST axis (`NDIM - 1`) as a tensor
// with one dimension less: the data pointer is advanced by `i` times the volume of the
// remaining axes, and the new shape is made of the first `NDIM - 1` axis lengths.
//
// Panics if `NDIM` is not greater than 1 or if `i` is out of range for the last axis.
macro_rules! impl_index_slice {
	($($mut: tt)?) => {
		impl<'a, T, U: StaticVec<T, LEN> + 'a, S: Shape<NDIM>, B: Backend<T>, const NDIM: usize, const LEN: usize>
            Tensor<T, U, B, NDIM, LEN, S>
        where
            [(); NDIM - 1]: Sized,
            &'a $($mut)? U: StaticVec<T, LEN>,
        {
            paste!{pub fn [<index_slice $(_$mut)?>] (&'a $($mut)? self, i: usize) -> Tensor<T, &'a $($mut)? [T; LEN], B, { NDIM - 1 }, LEN> {
                assert!(NDIM > 1);
                // `i` selects a position along the last axis (see the offset computation
                // below), so it must be checked against that axis rather than axis 0.
                assert!(i < self.shape.axis_len(NDIM - 1));

                // NOTE(review): the returned reference is still typed as `[T; LEN]` even
                // though it starts `i` slices into the storage, so it nominally extends past
                // the end of the data for `i > 0` — confirm callers never read beyond the
                // reduced shape.
                unsafe {
                    transmute::<*const T, &'a $($mut)? [T; LEN]>(
                        self.data
                            .[< as $(_$mut)? _ptr>]()
                            .add(i * (self.shape.volume() / self.shape.axis_len(NDIM - 1))),
                    )
                    .[<reshape_unchecked_ref $(_$mut)? >](
                        *transmute::<*const usize, &[usize; NDIM - 1]>(
                            self.shape.slice()[0..NDIM - 1].as_ptr(),
                        ),
                        B::default(),
                    )
                }
            }}
        }
	};
}

impl_index_slice!();
impl_index_slice!(mut);

/// Matrix-matrix and matrix-vector products, dispatched to the backend `B`.
impl<
        T: Float + Sized,
        U: StaticVec<T, LEN>,
        B: Backend<T> + operations::MatrixMul<T>,
        const LEN: usize,
        const IS_TRANS_1: bool,
        S1: Shape<2>,
    > Matrix<T, U, B, LEN, IS_TRANS_1, S1>
{
    /// Multiplies `self` by `other` and writes the `self.rows()` by `other.columns()`
    /// result into `buffer`.
    ///
    /// # Panics
    /// Panics if the number of columns of `self` differs from the number of rows of
    /// `other`, if either shape's volume does not match the length of its storage,
    /// or if `buffer` does not hold exactly `self.rows() * other.columns()` elements.
    #[inline(always)]
    pub fn matrix_mul_buffer<
        U2: StaticVec<T, LEN2>,
        U3: StaticVec<T, OLEN>,
        const LEN2: usize,
        const OLEN: usize,
        const IS_TRANS_2: bool,
        S2: Shape<2>,
    >(
        &self,
        other: &Matrix<T, U2, B, LEN2, IS_TRANS_2, S2>,
        buffer: &mut U3,
    ) {
        let m = self.rows();
        let k = other.rows();
        let n = other.columns();

        // The inner dimensions must agree, otherwise the backend would be handed a `k`
        // that does not describe the left-hand operand.
        assert_eq!(
            self.columns(),
            k,
            "Matrix::matrix_mul_buffer expected the left-hand side to have {} columns, found {}",
            k,
            self.columns(),
        );

        // Leading dimensions are the stored (untransposed) widths of the operands.
        let lda = self.0.shape.axis_len(0);
        let ldb = other.0.shape.axis_len(0);
        let ldc = n;

        assert_eq!(self.0.shape.volume(), LEN);
        assert_eq!(other.0.shape.volume(), LEN2);
        assert_eq!(
            m * n,
            OLEN,
            "Matrix::matrix_mul_buffer expected buffer of {} elements, found one of {OLEN}",
            m * n,
        );

        <B as Backend<T>>::matrix_mul(
            &self.0.data.backend,
            &self.0.data.data,
            &other.0.data.data,
            buffer,
            m,
            n,
            k,
            lda,
            ldb,
            ldc,
            IS_TRANS_1,
            IS_TRANS_2,
        );
    }

    /// Multiplies `self` by the vector `other` and writes the result into `buffer`.
    ///
    /// # Panics
    /// Panics if `buffer` does not hold exactly `self.rows()` elements or if `other`
    /// does not hold exactly `self.columns()` elements.
    #[inline(always)]
    pub fn vector_mul_buffer<
        U2: StaticVec<T, LEN2>,
        U3: StaticVec<T, OLEN>,
        const LEN2: usize,
        const OLEN: usize,
    >(
        &self,
        other: &U2,
        buffer: &mut U3,
    ) {
        assert_eq!(
            self.rows(),
            OLEN,
            "Matrix::vector_mul_buffer expected buffer of {} elements, found one of {OLEN}",
            self.rows()
        );
        assert_eq!(LEN2, self.columns());

        // The backend receives the stored (untransposed) axis lengths together with the
        // transposition flag.
        <B as Backend<T>>::matrix_vector_mul(
            &self.0.data.backend,
            &self.0.data.data,
            other,
            buffer,
            self.0.shape.axis_len(0),
            self.0.shape.axis_len(1),
            self.0.shape.axis_len(0),
            IS_TRANS_1,
        );
    }

    /// Multiplies `self` by `other` and returns the result as a new array of `OLEN`
    /// elements. See [`Matrix::matrix_mul_buffer`] for the panic conditions.
    #[inline(always)]
    pub fn matrix_mul<
        U2: StaticVec<T, LEN2>,
        const LEN2: usize,
        const OLEN: usize,
        const IS_TRANS_2: bool,
        S2: Shape<2>,
    >(
        &self,
        other: &Matrix<T, U2, B, LEN2, IS_TRANS_2, S2>,
    ) -> [T; OLEN] {
        let mut buffer = [num!(0); OLEN];
        self.matrix_mul_buffer(other, &mut buffer);
        buffer
    }

    /// Multiplies `self` by the vector `other` and returns the result as a new array of
    /// `OLEN` elements. See [`Matrix::vector_mul_buffer`] for the panic conditions.
    #[inline(always)]
    pub fn vector_mul<U2: StaticVec<T, LEN2>, const LEN2: usize, const OLEN: usize>(
        &self,
        other: &U2,
    ) -> [T; OLEN] {
        let mut buffer = [num!(0); OLEN];
        self.vector_mul_buffer(other, &mut buffer);
        buffer
    }
}

/// Shorthand for a static matrix shape value: `m!(M, K)` expands to
/// `MatrixShape::<M, K>`, i.e. a shape with height `M` and width `K`.
///
/// The expansion names the type through `$crate`, so callers do not need to have
/// `MatrixShape` imported at the call site.
#[macro_export]
macro_rules! m {
    ($m: expr, $k: expr) => {
        $crate::tensor::MatrixShape::<$m, $k>
    };
}

/// A wrapper around a 2D tensor, which allows for lazy transposing.
///
/// Transposition is tracked in the type through the `IS_TRANS` const parameter:
/// `rows`, `columns` and `(row, column)` indexing swap the axes they use when it is
/// `true`, while the wrapped tensor itself is left as it is.
#[derive(Clone, Copy)]
pub struct Matrix<
    T,
    U: StaticVec<T, LEN>,
    B: Backend<T>,
    const LEN: usize,
    const IS_TRANS: bool = false,
    S: Shape<2> = [usize; 2],
>(Tensor<T, U, B, 2, LEN, S>);

/// Dimension queries and lazy transposition.
impl<
        T,
        U: StaticVec<T, LEN>,
        B: Backend<T>,
        S: Shape<2>,
        const LEN: usize,
        const IS_TRANS: bool,
    > Matrix<T, U, B, LEN, IS_TRANS, S>
{
    /// Number of rows, taking lazy transposition into account.
    #[inline(always)]
    pub fn rows(&self) -> usize {
        let axis = if IS_TRANS { 0 } else { 1 };
        self.0.shape.axis_len(axis)
    }

    /// Number of columns, taking lazy transposition into account.
    #[inline(always)]
    pub fn columns(&self) -> usize {
        let axis = if IS_TRANS { 1 } else { 0 };
        self.0.shape.axis_len(axis)
    }

    /// Lazily transposes the matrix: only the `IS_TRANS` flag in the type is flipped,
    /// the wrapped tensor is moved over unchanged.
    pub fn transpose(self) -> Matrix<T, U, B, LEN, { !IS_TRANS }, S> {
        let Self(tensor) = self;
        Matrix(tensor)
    }

    /// Reinterprets a shared reference to this matrix as a reference to its transpose.
    pub fn as_transposed(&self) -> &Matrix<T, U, B, LEN, { !IS_TRANS }, S> {
        // SAFETY: source and target differ only in the `IS_TRANS` const parameter and
        // wrap the same tensor type.
        // NOTE(review): the struct has no explicit `repr`, so identical layout is assumed
        // rather than guaranteed — confirm.
        unsafe { transmute(self) }
    }

    /// Reinterprets a mutable reference to this matrix as a reference to its transpose.
    pub fn as_transposed_mut(&mut self) -> &mut Matrix<T, U, B, LEN, { !IS_TRANS }, S> {
        // SAFETY: see `as_transposed`; the same layout assumption applies.
        unsafe { transmute(self) }
    }
}

/// Gives read access to the wrapped tensor.
///
/// # Panics
/// Panics when the matrix is lazily transposed, because the wrapped tensor would not
/// reflect the transposition.
impl<
        T,
        U: StaticVec<T, LEN>,
        B: Backend<T>,
        const LEN: usize,
        const IS_TRANS: bool,
        S: Shape<2>,
    > const std::ops::Deref for Matrix<T, U, B, LEN, IS_TRANS, S>
{
    type Target = Tensor<T, U, B, 2, LEN, S>;
    fn deref(&self) -> &Self::Target {
        // Guard: a transposed matrix cannot hand out its tensor immutably.
        if IS_TRANS {
            panic!("Cannot deref lazily transposed matrix immutably. Try using &self.deref_mut() instead");
        }
        &self.0
    }
}

/// Gives mutable access to the wrapped tensor.
///
/// For a lazily transposed matrix the data is first transposed in place and the two
/// axis lengths of the shape are swapped, so the tensor handed out reflects the
/// transposition.
///
/// NOTE(review): the `IS_TRANS` flag in the type is not changed by this, so every call
/// on a transposed matrix performs the in-place transposition again — confirm this is
/// the intended contract.
impl<T: Copy, U: StaticVec<T, LEN>, B: Backend<T>, const LEN: usize, const IS_TRANS: bool>
    std::ops::DerefMut for Matrix<T, U, B, LEN, IS_TRANS, [usize; 2]>
where
    crate::backends::Rust: crate::backends::Backend<T>,
{
    fn deref_mut(&mut self) -> &mut Self::Target {
        if IS_TRANS {
            // Materialise the transposition: the length of axis 1 is read before the
            // shape is updated.
            Rust.transpose_inplace(self.0.data.data.mut_moo_ref(), self.0.shape.axis_len(1));
            self.0.shape = [self.0.shape[1], self.0.shape[0]];
        }
        &mut self.0
    }
}

/// Wraps a 2D tensor in a [`Matrix`]; the tensor is stored as is, and the
/// transposition flag of the result is whatever `IS_TRANS` the target type names.
impl<
        T,
        U: StaticVec<T, LEN>,
        B: Backend<T>,
        const LEN: usize,
        const IS_TRANS: bool,
        S: Shape<2>,
    > const From<Tensor<T, U, B, 2, LEN, S>> for Matrix<T, U, B, LEN, IS_TRANS, S>
{
    fn from(tensor: Tensor<T, U, B, 2, LEN, S>) -> Self {
        Self(tensor)
    }
}