#include "src/x86/matrix_mul/opr_impl.h"
#include "src/common/metahelper.h"
#include "src/x86/matrix_mul/algos.h"
using namespace megdnn;
using namespace x86;
//! Owns one instance of every x86 matrix-mul algorithm compiled into this
//! build and publishes them both as a list (in registration order) and as a
//! map keyed by each algorithm's descriptor.
class MatrixMulImpl::AlgoPack : NonCopyableObj {
    // Algorithm instances. Members wrapped in #if only exist when the
    // corresponding build option is enabled.
    AlgoF32Blas f32blas;
#if MEGDNN_X86_WITH_MKL && SUPPORT_MKL_PACKED_GEMM
    AlgoF32MKLPackA f32mkl_packa;
#endif
#if MEGDNN_X86_WITH_VNNI
    AlgoInt8x8x32Vnni algoint8x8x32vnni;
#endif
#if MEGDNN_X86_WITH_MKL_DNN
    AlgoInt8x8x32Mkldnn algoint8x8x32mkldnn;
#endif
    AlgoInt8x8x32AVX2M4N16K2 algoint8x8x32avx2_m4n16k2;
    AlgoInt8x8x32AVX2M2N4K16 algoint8x8x32avx2_m2n4k16;
    AlgoInt8x8x32SSEM4N8K2 algoint8x8x32sse_m4n8k2;
    AlgoInt8x8x16AVX2 algoint8x8x16avx2_m4n16k2;
    AlgoInt8x8x16SSE algoint8x8x16sse_m4n8k2;
    AlgoF32MK8_8x8 algof32mk8_8x8;
    AlgoFloatAVX2M6N16 algof32_6x16;

    // Non-owning pointers to the members above, in registration order.
    SmallVector<fallback::MatrixMulImpl::AlgoBase*> m_all_algos;
    // Same pointers, indexed by the descriptor from each algorithm's info().
    fallback::MatrixMulImpl::AlgoBase::Mapper m_all_algos_map;

public:
    //! Registers every available algorithm, then builds the descriptor map.
    AlgoPack() {
        // Appends a single algorithm to the ordered list.
        auto enroll = [this](fallback::MatrixMulImpl::AlgoBase* algo) {
            m_all_algos.emplace_back(algo);
        };

        // NOTE(review): the order of the calls below defines the order of
        // all_algos(); presumably callers treat it as a priority order, so
        // do not reorder without confirming.

        // The VNNI kernel is added only when it is compiled in AND
        // is_supported(SIMDType::VNNI) holds at construction time.
        if (is_supported(SIMDType::VNNI)) {
#if MEGDNN_X86_WITH_VNNI
            enroll(&algoint8x8x32vnni);
#endif
        }
        enroll(&algoint8x8x32avx2_m4n16k2);
        enroll(&algoint8x8x16avx2_m4n16k2);
        enroll(&algoint8x8x32avx2_m2n4k16);
        enroll(&algoint8x8x32sse_m4n8k2);
        enroll(&algoint8x8x16sse_m4n8k2);
        enroll(&algof32mk8_8x8);
#if MEGDNN_X86_WITH_MKL_DNN
        enroll(&algoint8x8x32mkldnn);
#endif
        enroll(&f32blas);
#if MEGDNN_X86_WITH_MKL && SUPPORT_MKL_PACKED_GEMM
        enroll(&f32mkl_packa);
#endif
        enroll(&algof32_6x16);

        // Index everything that was registered by its descriptor.
        for (auto* registered : m_all_algos) {
            m_all_algos_map.emplace(registered->info().desc, registered);
        }
    }

    //! All registered algorithms, in registration order.
    const SmallVector<fallback::MatrixMulImpl::AlgoBase*>& all_algos() const {
        return m_all_algos;
    }

    //! Descriptor -> algorithm lookup table for the registered algorithms.
    const AlgoBase::Mapper& all_algos_map() const { return m_all_algos_map; }
};
//! Returns the shared AlgoPack: a function-local static that is constructed
//! the first time this function is called and reused on every later call.
const MatrixMulImpl::AlgoPack& MatrixMulImpl::algo_pack() {
    static AlgoPack s_instance;
    return s_instance;
}
//! Looks up the algorithm registered in algo_pack() under \p desc.
//! The descriptor is asserted (megdnn_assert) to be present in the map
//! before the entry is fetched.
fallback::MatrixMulImpl::AlgoBase* MatrixMulImpl::get_algo_from_desc(
        const AlgorithmDesc& desc) {
    const auto& registry = algo_pack().all_algos_map();
    megdnn_assert(registry.find(desc) != registry.end());
    return registry.at(desc);
}
//! Returns the x86 algorithms followed by the fallback ones: the fallback
//! list is fetched first and the x86 algorithms from algo_pack() are
//! inserted at its front, keeping their registration order.
SmallVector<fallback::MatrixMulImpl::AlgoBase*> MatrixMulImpl::get_all_packed_algo() {
    // Hold the fallback list as a plain local (not a reference bound to a
    // temporary) so it can be returned by name and benefit from copy
    // elision / implicit move instead of an explicit std::move.
    auto algos = fallback::MatrixMulImpl::get_all_packed_algo();
    const auto& x86_algos = algo_pack().all_algos();
    algos.insert(algos.begin(), x86_algos.begin(), x86_algos.end());
    return algos;
}