#pragma once
#include "megdnn/oprs.h"
namespace megdnn {
namespace rocm {
/**
 * ROCm-namespace implementation class for BatchedMatrixMulForward.
 *
 * This header only declares the interface; apart from the two trivial inline
 * members below, every member function is defined outside this class body.
 */
class BatchedMatrixMulForwardImpl : public BatchedMatrixMulForward {
public:
    // Inherit the base operator's constructors as-is.
    using BatchedMatrixMulForward::BatchedMatrixMulForward;

    // Nested algorithm types. Forward declarations only; their definitions
    // are not part of this class body.
    class AlgoBase;
    class AlgoBlas;
    class AlgoPack;

    // Operator entry point. A and B carry the input-tensor marker, C the
    // output-tensor marker; `workspace` is the caller-provided workspace.
    void exec(
            _megdnn_tensor_in A, _megdnn_tensor_in B, _megdnn_tensor_out C,
            _megdnn_workspace workspace) override;

    // Workspace size query, in bytes, for the given three layouts.
    // NOTE(review): the parameter names mirror exec(); confirm the A/B/C
    // ordering against the base-class declaration.
    size_t get_workspace_in_bytes(
            const TensorLayout& A, const TensorLayout& B,
            const TensorLayout& C) override;

    // This implementation always reports itself as thread safe.
    bool is_thread_safe() const override { return true; }

    // Read-only access to the class-wide AlgoPack instance.
    static const AlgoPack& algo_pack() { return sm_algo_pack; }

    // Maps an AlgorithmDesc to an Algorithm pointer.
    Algorithm* get_algorithm_from_desc(const AlgorithmDesc& desc) override;

private:
    // Algorithm-query overrides; declared here, defined out of line.
    // NOTE(review): parameter names below are assumed from exec() and from
    // the parameter types -- confirm against the base-class declaration.
    std::vector<Algorithm*> get_all_algorithms(
            const TensorLayout& A, const TensorLayout& B,
            const TensorLayout& C) override;

    std::vector<Algorithm*> get_all_algorithms_safe(
            const TensorLayout& A, const TensorLayout& B,
            const TensorLayout& C) override;

    Algorithm* get_algorithm_heuristic(
            const TensorLayout& A, const TensorLayout& B,
            const TensorLayout& C, size_t workspace_limit_in_bytes,
            const AlgoAttribute& positive_attr,
            const AlgoAttribute& negative_attr) override;

    // Fixed identifier string for this backend's algorithm set.
    const char* get_algorithm_set_name() const override { return "ROCM BATCHED MATMUL"; }

    // Single AlgoPack instance shared by all objects of this class; handed
    // out through algo_pack().
    static AlgoPack sm_algo_pack;
};
} }