1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
use crate::internal::*;
use ndarray::*;
use tract_linalg::frame::Packer;
/// Operator that repacks one input tensor using a `tract_linalg` [`Packer`].
///
/// The two axes named by `k_axis` and `mn_axis` are dropped from the input
/// shape and replaced by one trailing dimension whose size is given by
/// `Packer::len` (see `output_shape`).
#[derive(Debug, Clone, PartialEq, Eq, Hash)]
pub struct MatMatMulPack {
// Packer that provides the buffer alignment, the packed length and the
// packing routine itself.
pub(crate) packer: Packer,
// Index, in the input shape, of the axis forwarded to the packer as `k`.
pub(crate) k_axis: usize,
// Index, in the input shape, of the axis forwarded to the packer as `mn`.
pub(crate) mn_axis: usize,
}
impl DynHash for MatMatMulPack {
    /// Feeds this operator into a type-erased hasher by delegating to the
    /// free `dyn_hash` helper, which relies on the derived `Hash` impl.
    fn dyn_hash(&self, state: &mut dyn std::hash::Hasher) {
        dyn_hash(self, state)
    }
}
impl Op for MatMatMulPack {
    /// Static, human-readable name of the operator.
    fn name(&self) -> Cow<str> {
        Cow::Borrowed("MatMatMulPack")
    }

    /// Returns `true` only when `other` is also a `MatMatMulPack` that
    /// compares equal to `self` (same packer and same axes).
    fn same_as(&self, other: &dyn Op) -> bool {
        other.downcast_ref::<Self>().map_or(false, |rhs| rhs == self)
    }

    op_as_typed_op!();
}
impl EvalOp for MatMatMulPack {
    /// Evaluation only depends on the inputs; no session state is kept.
    fn is_stateless(&self) -> bool {
        true
    }

    /// Packs the single input tensor and returns the packed tensor.
    ///
    /// The output has the shape computed by `output_shape`, the input's datum
    /// type, and the alignment requested by the packer. Every combination of
    /// the axes other than `k_axis` / `mn_axis` is visited once, and the
    /// matching slice of the input is packed into the matching prefix of the
    /// output.
    ///
    /// # Errors
    ///
    /// Fails if the input count is not exactly one, if the output buffer
    /// cannot be allocated, or if a prefix view on the output cannot be built.
    fn eval(&self, mut inputs: TVec<TValue>) -> TractResult<TVec<TValue>> {
        let b = args_1!(inputs);
        let dt = b.datum_type();
        let output_shape = self.output_shape(b.shape());

        // Iteration space: the input shape with the two packed axes collapsed
        // to 1, so each coordinate selects one (k, mn) slice of the input.
        let mut bc_shape: TVec<usize> = b.shape().into();
        bc_shape[self.k_axis] = 1;
        bc_shape[self.mn_axis] = 1;

        // Loop invariants, hoisted out of the per-slice loop.
        let item_size = dt.size_of() as isize;
        let outer_axis = self.k_axis.max(self.mn_axis);
        let inner_axis = self.k_axis.min(self.mn_axis);

        // SAFETY (review note): `packed` starts uninitialized, so this relies on
        // `Packer::pack` writing the whole prefix view it is given -- TODO
        // confirm against tract_linalg. `offset` is built from `b`'s own
        // strides with coordinates taken inside `b`'s shape, so it addresses
        // an element that belongs to `b`.
        unsafe {
            // Propagate allocation failures instead of panicking.
            let mut packed =
                Tensor::uninitialized_aligned_dt(dt, &output_shape, self.packer.alignment())?;
            for coord in indices(&*bc_shape) {
                // Byte offset of the slice start: element offset times element size.
                let offset = coord
                    .as_array_view()
                    .iter()
                    .zip(b.strides())
                    .map(|(x, s)| *x as isize * s)
                    .sum::<isize>()
                    * item_size;
                // Output prefix = coordinate without the two packed axes.
                // The higher index is removed first so the lower one stays valid.
                let mut prefix: TVec<usize> = coord.slice().into();
                prefix.remove(outer_axis);
                prefix.remove(inner_axis);
                self.packer.pack(
                    &mut packed.view_at_prefix_mut(&prefix)?,
                    TensorView::from_bytes(&b, offset, b.shape(), b.strides()),
                    self.k_axis,
                    self.mn_axis,
                );
            }
            Ok(tvec!(packed.into_tvalue()))
        }
    }
}
impl TypedOp for MatMatMulPack {
    /// Derives the single output fact: same datum type as the first input,
    /// with the shape produced by `output_shape` applied to that input's shape.
    fn output_facts(&self, inputs: &[&TypedFact]) -> TractResult<TVec<TypedFact>> {
        let input = inputs[0];
        let packed_shape = self.output_shape(&input.shape);
        let fact = input.datum_type.fact(packed_shape);
        Ok(tvec!(fact))
    }

    as_op!();
}
impl MatMatMulPack {
    /// Computes the packed shape for an input of shape `input`.
    ///
    /// The `k_axis` and `mn_axis` entries are dropped and a single trailing
    /// dimension is appended, sized by `Packer::len` from the original `k`
    /// and `mn` extents.
    fn output_shape<D: DimLike>(&self, input: &[D]) -> TVec<D> {
        let (higher, lower) = if self.mn_axis > self.k_axis {
            (self.mn_axis, self.k_axis)
        } else {
            (self.k_axis, self.mn_axis)
        };
        let mut dims: TVec<D> = input.iter().cloned().collect();
        // Drop the higher index first so the lower index is still valid.
        dims.remove(higher);
        dims.remove(lower);
        let k = input[self.k_axis].clone();
        let mn = input[self.mn_axis].clone();
        dims.push(self.packer.len(k, mn));
        dims
    }
}