#[cfg(test)]
use super::{assert_almost_equals, new_backward_input, new_input, new_tensor};
use super::{
expect_tensor, expect_tensor_mut, push_mat_vec_gradient, push_vec_mat_gradient, Backward, Data,
DotDim, Forward, Gradient, Overwrite, Tensor,
};
use ndarray::{linalg::general_mat_vec_mul, s, Ix1, Ix2, NewAxis};
use std::{
cell::{Cell, Ref, RefCell, RefMut},
fmt::{Debug, Display},
rc::Rc,
};
pub struct MatrixVectorMul<Lhs, Rhs>
where
Lhs: Data<Dim = Ix2>,
Rhs: Data<Dim = Ix1>,
{
left: Rc<Lhs>,
right: Rc<Rhs>,
data: RefCell<Tensor<Ix1>>,
computed: Cell<bool>,
}
impl<Lhs, Rhs> MatrixVectorMul<Lhs, Rhs>
where
Lhs: Data<Dim = Ix2>,
Rhs: Data<Dim = Ix1>,
{
pub fn new(left: Rc<Lhs>, right: Rc<Rhs>) -> Self {
let shape = DotDim::shape(left.data().raw_dim(), right.data().raw_dim());
let data = RefCell::new(Tensor::zeros(shape[0]));
Self {
left,
right,
data,
computed: Cell::new(false),
}
}
}
impl<Lhs, Rhs> Data for MatrixVectorMul<Lhs, Rhs>
where
Lhs: Data<Dim = Ix2>,
Rhs: Data<Dim = Ix1>,
{
type Dim = Ix1;
fn data(&self) -> Ref<Tensor<Self::Dim>> {
self.data.borrow()
}
fn data_mut(&self) -> RefMut<Tensor<Self::Dim>> {
self.data.borrow_mut()
}
}
impl<Lhs, Rhs> Forward for MatrixVectorMul<Lhs, Rhs>
where
Lhs: Data<Dim = Ix2>,
Rhs: Data<Dim = Ix1>,
{
fn forward(&self) {
if self.was_computed() {
return;
}
self.computed.set(true);
general_mat_vec_mul(
1.0,
&*self.left.data(),
&*self.right.data(),
0.0,
&mut *self.data.borrow_mut(),
);
}
fn was_computed(&self) -> bool {
self.computed.get()
}
fn reset_computation(&self) {
self.computed.set(false);
}
}
impl<Lhs, Rhs> Debug for MatrixVectorMul<Lhs, Rhs>
where
Lhs: Data<Dim = Ix2>,
Rhs: Data<Dim = Ix1>,
{
fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
f.debug_struct("MatrixVectorMul")
.field("data", &self.data.borrow())
.field("computed", &self.computed.get())
.finish()
}
}
impl<Lhs, Rhs> Display for MatrixVectorMul<Lhs, Rhs>
where
Lhs: Data<Dim = Ix2>,
Rhs: Data<Dim = Ix1>,
{
fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> Result<(), std::fmt::Error> {
write!(f, "{}", &self.data.borrow())
}
}
pub struct MatrixVectorMulBackward<LhsD, LhsG, RhsD, RhsG>
where
LhsD: Data<Dim = Ix2>,
RhsD: Data<Dim = Ix1>,
LhsG: Gradient<Dim = Ix2> + Overwrite,
RhsG: Gradient<Dim = Ix1> + Overwrite,
{
gradient: RefCell<Option<Tensor<Ix1>>>,
shape: Ix1,
overwrite: Cell<bool>,
left_data: Rc<LhsD>,
left_grad: Rc<LhsG>,
right_data: Rc<RhsD>,
right_grad: Rc<RhsG>,
}
impl<LhsD, LhsG, RhsD, RhsG> MatrixVectorMulBackward<LhsD, LhsG, RhsD, RhsG>
where
LhsD: Data<Dim = Ix2>,
RhsD: Data<Dim = Ix1>,
LhsG: Gradient<Dim = Ix2> + Overwrite,
RhsG: Gradient<Dim = Ix1> + Overwrite,
{
pub fn new(
left_data: Rc<LhsD>,
left_grad: Rc<LhsG>,
right_data: Rc<RhsD>,
right_grad: Rc<RhsG>,
) -> Self {
let shape = DotDim::shape(
left_grad.gradient().raw_dim(),
right_grad.gradient().raw_dim(),
);
Self {
gradient: RefCell::new(Some(Tensor::zeros(shape))),
shape,
overwrite: Cell::new(true),
left_data,
left_grad,
right_data,
right_grad,
}
}
}
impl<LhsD, LhsG, RhsD, RhsG> Gradient for MatrixVectorMulBackward<LhsD, LhsG, RhsD, RhsG>
where
LhsD: Data<Dim = Ix2>,
RhsD: Data<Dim = Ix1>,
LhsG: Gradient<Dim = Ix2> + Overwrite,
RhsG: Gradient<Dim = Ix1> + Overwrite,
{
type Dim = Ix1;
fn gradient(&self) -> Ref<Tensor<Self::Dim>> {
expect_tensor(&self.gradient)
}
fn gradient_mut(&self) -> RefMut<Tensor<Self::Dim>> {
expect_tensor_mut(&self.gradient)
}
}
impl<LhsD, LhsG, RhsD, RhsG> Overwrite for MatrixVectorMulBackward<LhsD, LhsG, RhsD, RhsG>
where
LhsD: Data<Dim = Ix2>,
RhsD: Data<Dim = Ix1>,
LhsG: Gradient<Dim = Ix2> + Overwrite,
RhsG: Gradient<Dim = Ix1> + Overwrite,
{
fn can_overwrite(&self) -> bool {
self.overwrite.get()
}
fn set_overwrite(&self, state: bool) {
self.overwrite.set(state);
}
}
impl<LhsD, LhsG, RhsD, RhsG> Backward for MatrixVectorMulBackward<LhsD, LhsG, RhsD, RhsG>
where
LhsD: Data<Dim = Ix2>,
RhsD: Data<Dim = Ix1>,
LhsG: Gradient<Dim = Ix2> + Overwrite,
RhsG: Gradient<Dim = Ix1> + Overwrite,
{
fn backward(&self) {
let gradient = self.gradient();
push_mat_vec_gradient(
&*self.left_grad,
&gradient.slice(s![.., NewAxis]),
&self.right_data.data(),
);
push_vec_mat_gradient(&*self.right_grad, &self.left_data.data().t(), &gradient);
}
fn no_grad(&self) {
*self.gradient.borrow_mut() = None;
}
fn with_grad(&self) {
*self.gradient.borrow_mut() = Some(Tensor::zeros(self.shape));
}
}
impl<LhsD, LhsG, RhsD, RhsG> Debug for MatrixVectorMulBackward<LhsD, LhsG, RhsD, RhsG>
where
LhsD: Data<Dim = Ix2>,
RhsD: Data<Dim = Ix1>,
LhsG: Gradient<Dim = Ix2> + Overwrite,
RhsG: Gradient<Dim = Ix1> + Overwrite,
{
fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
f.debug_struct("MatrixVectorMulBackward")
.field("gradient", &self.gradient.borrow())
.field("overwrite", &self.overwrite.get())
.finish()
}
}
impl<LhsD, LhsG, RhsD, RhsG> Display for MatrixVectorMulBackward<LhsD, LhsG, RhsD, RhsG>
where
LhsD: Data<Dim = Ix2>,
RhsD: Data<Dim = Ix1>,
LhsG: Gradient<Dim = Ix2> + Overwrite,
RhsG: Gradient<Dim = Ix1> + Overwrite,
{
fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> Result<(), std::fmt::Error> {
match &*self.gradient.borrow() {
Some(gradient) => write!(f, "{}", &gradient),
None => write!(f, "None"),
}
}
}
pub struct MatrixVectorMulBackwardLeft<LhsG, RhsD>
where
RhsD: Data<Dim = Ix1>,
LhsG: Gradient<Dim = Ix2> + Overwrite,
{
gradient: RefCell<Option<Tensor<Ix1>>>,
shape: Ix1,
overwrite: Cell<bool>,
left_grad: Rc<LhsG>,
right_data: Rc<RhsD>,
}
impl<LhsG, RhsD> MatrixVectorMulBackwardLeft<LhsG, RhsD>
where
RhsD: Data<Dim = Ix1>,
LhsG: Gradient<Dim = Ix2> + Overwrite,
{
pub fn new(left_grad: Rc<LhsG>, right_data: Rc<RhsD>) -> Self {
let shape = DotDim::shape(left_grad.gradient().raw_dim(), right_data.data().raw_dim());
Self {
gradient: RefCell::new(Some(Tensor::zeros(shape))),
shape,
overwrite: Cell::new(true),
left_grad,
right_data,
}
}
}
impl<LhsG, RhsD> Gradient for MatrixVectorMulBackwardLeft<LhsG, RhsD>
where
RhsD: Data<Dim = Ix1>,
LhsG: Gradient<Dim = Ix2> + Overwrite,
{
type Dim = Ix1;
fn gradient(&self) -> Ref<Tensor<Self::Dim>> {
expect_tensor(&self.gradient)
}
fn gradient_mut(&self) -> RefMut<Tensor<Self::Dim>> {
expect_tensor_mut(&self.gradient)
}
}
impl<LhsG, RhsD> Overwrite for MatrixVectorMulBackwardLeft<LhsG, RhsD>
where
RhsD: Data<Dim = Ix1>,
LhsG: Gradient<Dim = Ix2> + Overwrite,
{
fn can_overwrite(&self) -> bool {
self.overwrite.get()
}
fn set_overwrite(&self, state: bool) {
self.overwrite.set(state);
}
}
impl<LhsG, RhsD> Backward for MatrixVectorMulBackwardLeft<LhsG, RhsD>
where
RhsD: Data<Dim = Ix1>,
LhsG: Gradient<Dim = Ix2> + Overwrite,
{
fn backward(&self) {
push_mat_vec_gradient(
&*self.left_grad,
&self.gradient().slice(s![.., NewAxis]),
&self.right_data.data(),
);
}
fn no_grad(&self) {
*self.gradient.borrow_mut() = None;
}
fn with_grad(&self) {
*self.gradient.borrow_mut() = Some(Tensor::zeros(self.shape));
}
}
impl<LhsG, RhsD> Debug for MatrixVectorMulBackwardLeft<LhsG, RhsD>
where
RhsD: Data<Dim = Ix1>,
LhsG: Gradient<Dim = Ix2> + Overwrite,
{
fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
f.debug_struct("MatrixVectorMulBackwardLeft")
.field("gradient", &self.gradient.borrow())
.field("overwrite", &self.overwrite.get())
.finish()
}
}
impl<LhsG, RhsD> Display for MatrixVectorMulBackwardLeft<LhsG, RhsD>
where
RhsD: Data<Dim = Ix1>,
LhsG: Gradient<Dim = Ix2> + Overwrite,
{
fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> Result<(), std::fmt::Error> {
match &*self.gradient.borrow() {
Some(gradient) => write!(f, "{}", &gradient),
None => write!(f, "None"),
}
}
}
pub struct MatrixVectorMulBackwardRight<LhsD, RhsG>
where
LhsD: Data<Dim = Ix2>,
RhsG: Gradient<Dim = Ix1> + Overwrite,
{
gradient: RefCell<Option<Tensor<Ix1>>>,
shape: Ix1,
overwrite: Cell<bool>,
left_data: Rc<LhsD>,
right_grad: Rc<RhsG>,
}
impl<LhsD, RhsG> MatrixVectorMulBackwardRight<LhsD, RhsG>
where
LhsD: Data<Dim = Ix2>,
RhsG: Gradient<Dim = Ix1> + Overwrite,
{
pub fn new(left_data: Rc<LhsD>, right_grad: Rc<RhsG>) -> Self {
let shape = DotDim::shape(left_data.data().raw_dim(), right_grad.gradient().raw_dim());
Self {
gradient: RefCell::new(Some(Tensor::zeros(shape))),
shape,
overwrite: Cell::new(true),
left_data,
right_grad,
}
}
}
impl<LhsD, RhsG> Gradient for MatrixVectorMulBackwardRight<LhsD, RhsG>
where
LhsD: Data<Dim = Ix2>,
RhsG: Gradient<Dim = Ix1> + Overwrite,
{
type Dim = Ix1;
fn gradient(&self) -> Ref<Tensor<Self::Dim>> {
expect_tensor(&self.gradient)
}
fn gradient_mut(&self) -> RefMut<Tensor<Self::Dim>> {
expect_tensor_mut(&self.gradient)
}
}
impl<LhsD, RhsG> Overwrite for MatrixVectorMulBackwardRight<LhsD, RhsG>
where
LhsD: Data<Dim = Ix2>,
RhsG: Gradient<Dim = Ix1> + Overwrite,
{
fn can_overwrite(&self) -> bool {
self.overwrite.get()
}
fn set_overwrite(&self, state: bool) {
self.overwrite.set(state);
}
}
impl<LhsD, RhsG> Backward for MatrixVectorMulBackwardRight<LhsD, RhsG>
where
LhsD: Data<Dim = Ix2>,
RhsG: Gradient<Dim = Ix1> + Overwrite,
{
fn backward(&self) {
push_vec_mat_gradient(
&*self.right_grad,
&self.left_data.data().t(),
&self.gradient(),
);
}
fn no_grad(&self) {
*self.gradient.borrow_mut() = None;
}
fn with_grad(&self) {
*self.gradient.borrow_mut() = Some(Tensor::zeros(self.shape));
}
}
impl<LhsD, RhsG> Debug for MatrixVectorMulBackwardRight<LhsD, RhsG>
where
LhsD: Data<Dim = Ix2>,
RhsG: Gradient<Dim = Ix1> + Overwrite,
{
fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
f.debug_struct("MatrixVectorMulBackwardRight")
.field("gradient", &self.gradient.borrow())
.field("overwrite", &self.overwrite.get())
.finish()
}
}
impl<LhsD, RhsG> Display for MatrixVectorMulBackwardRight<LhsD, RhsG>
where
LhsD: Data<Dim = Ix2>,
RhsG: Gradient<Dim = Ix1> + Overwrite,
{
fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> Result<(), std::fmt::Error> {
match &*self.gradient.borrow() {
Some(gradient) => write!(f, "{}", &gradient),
None => write!(f, "None"),
}
}
}
#[cfg(test)]
mod test;