#pragma once
#include "src/common/opr_delegate.h"
#include "src/naive/batched_matrix_mul/opr_impl.h"
namespace megdnn {
namespace fallback {
class BatchedMatrixMulForwardImpl : public naive::BatchedMatrixMulForwardImpl {
public:
using naive::BatchedMatrixMulForwardImpl::BatchedMatrixMulForwardImpl;
void exec(
_megdnn_tensor_in A, _megdnn_tensor_in B, _megdnn_tensor_out C,
_megdnn_workspace workspace) override;
size_t get_workspace_in_bytes(
const TensorLayout&, const TensorLayout&, const TensorLayout&) override;
bool is_thread_safe() const override { return true; }
class AlgoBase;
class AlgoDefault;
class AlgoPack;
static const AlgoPack& algo_pack() { return sm_algo_pack; }
Algorithm* get_algorithm_from_desc(const AlgorithmDesc&) override;
private:
std::vector<Algorithm*> get_all_algorithms(
const TensorLayout& , const TensorLayout& ,
const TensorLayout& ) override;
std::vector<Algorithm*> get_all_algorithms_safe(
const TensorLayout& , const TensorLayout& ,
const TensorLayout& ) override;
Algorithm* get_algorithm_heuristic(
const TensorLayout& , const TensorLayout& ,
const TensorLayout& , size_t ,
const AlgoAttribute& ,
const AlgoAttribute& ) override;
const char* get_algorithm_set_name() const override {
return "FALLBACK BATCHED MATMUL";
}
static AlgoPack sm_algo_pack;
};
} }