1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
use super::utils::move_tape_and_add_backward_op;
use crate::prelude::*;
pub fn sum_axis<T: Reduce1<I>, const I: isize>(t: T) -> T::Reduced {
let mut result = <T::Reduced as Tensor>::NoTape::zeros();
T::DeviceR::reduce_into(t.data(), result.mut_data(), |a, b| a + b);
move_tape_and_add_backward_op(t, result, move |t, result, grads| {
let (t_grad, result_grad) = grads.mut_and_ref(&t, &result);
T::DeviceR::foreach_br(t_grad, result_grad, &mut |l, r| {
*l += r;
})
})
}
macro_rules! sum_axis_impl {
($typename:ident, [$($Vs:tt),*]) => {
impl<$(const $Vs: usize, )* H: Tape> $typename<$($Vs, )* H> {
pub fn sum_axis<const I: isize>(self) -> <Self as Reduce1<I>>::Reduced
where
Self: Reduce1<I>
{
sum_axis::<Self, I>(self)
}
}
};
}
sum_axis_impl!(Tensor0D, []);
sum_axis_impl!(Tensor1D, [M]);
sum_axis_impl!(Tensor2D, [M, N]);
sum_axis_impl!(Tensor3D, [M, N, O]);
sum_axis_impl!(Tensor4D, [M, N, O, P]);
#[cfg(test)]
mod tests {
use super::*;
#[test]
fn test_valids_sum_axis() {
let _: Tensor0D = Tensor1D::<5>::zeros().sum_axis::<-1>();
let _: Tensor1D<3> = Tensor2D::<5, 3>::zeros().sum_axis::<0>();
let _: Tensor1D<5> = Tensor2D::<5, 3>::zeros().sum_axis::<-1>();
let _: Tensor2D<5, 3> = Tensor3D::<7, 5, 3>::zeros().sum_axis::<0>();
let _: Tensor2D<7, 3> = Tensor3D::<7, 5, 3>::zeros().sum_axis::<1>();
let _: Tensor2D<7, 5> = Tensor3D::<7, 5, 3>::zeros().sum_axis::<-1>();
let _: Tensor3D<7, 5, 3> = Tensor4D::<9, 7, 5, 3>::zeros().sum_axis::<0>();
let _: Tensor3D<9, 5, 3> = Tensor4D::<9, 7, 5, 3>::zeros().sum_axis::<1>();
let _: Tensor3D<9, 7, 3> = Tensor4D::<9, 7, 5, 3>::zeros().sum_axis::<2>();
let _: Tensor3D<9, 7, 5> = Tensor4D::<9, 7, 5, 3>::zeros().sum_axis::<-1>();
}
#[test]
fn test_sum_axis_0_2d() {
let t: Tensor2D<2, 3> = Tensor2D::new([[1.0, 2.0, 3.0], [-2.0, 4.0, -6.0]]);
let r = t.trace().sum_axis::<0>();
assert_eq!(r.data(), &[-1.0, 6.0, -3.0]);
let gradients = r.exp().mean().backward();
assert_eq!(
gradients.ref_gradient(&t),
&[[0.12262648, 134.47627, 0.01659569]; 2]
);
}
#[test]
fn test_sum_axis_1_2d() {
let t: Tensor2D<2, 3> = Tensor2D::new([[1.0, 2.0, 3.0], [-2.0, 4.0, -6.0]]);
let r = t.trace().sum_axis::<-1>();
assert_eq!(r.data(), &[6.0, -4.0]);
let gradients = r.exp().mean().backward();
assert_eq!(
gradients.ref_gradient(&t),
&[[201.7144; 3], [0.00915782; 3]]
);
}
}