pub fn inner_product_loop<T: TensorTrait<T>>( max_indices: Vec<i32>, f: fn(&mut Tensor<T>, &Tensor<T>, &Tensor<T>, &[i32]), t1: &Tensor<T>, t2: &Tensor<T>, t3: &mut Tensor<T>, )