#pragma once
#include "src/x86/conv_bias/opr_impl.h"
namespace megdnn {
namespace x86 {
/*!
 * \brief ConvBias algorithm reported under the name
 *        "X86_CONV_BIAS_CHANWISE_AVX2_INT8_STRIDE1".
 *
 * Only the interface is visible in this header: usable(), get_workspace(),
 * is_preferred(), get_kimpls() and get_bundle() are declared here and defined
 * elsewhere.
 */
class ConvBiasImpl::AlgoChanWiseAvx2Stride1Qint8 final : public AlgoBase {
    //! Produces the kernel list that dispatch_kerns() returns.
    SmallVector<NCBKern> get_kimpls(const NCBKernSizeParam& param) const;
    //! Workspace layout helper.
    //! NOTE(review): presumably the source of get_workspace()'s size; confirm
    //! against the out-of-line definition.
    static WorkspaceBundle get_bundle(const NCBKernSizeParam& param);

public:
    //! This algorithm advertises the REPRODUCIBLE attribute only.
    AlgoAttribute attribute() const override { return AlgoAttribute::REPRODUCIBLE; }

    //! Name string of this algorithm.
    const char* name() const override {
        return "X86_CONV_BIAS_CHANWISE_AVX2_INT8_STRIDE1";
    }

    //! Whether the algorithm can handle \p param under the given strategy.
    bool usable(
            const NCBKernSizeParam& param,
            AlgoSelectionStrategy algo_selection_strategy) const override;

    //! Workspace size, in bytes, requested for \p param.
    size_t get_workspace(const NCBKernSizeParam& param) const override;

    //! Forwards to get_kimpls(). `override` already implies virtual, so the
    //! redundant `virtual` keyword is not repeated here.
    SmallVector<NCBKern> dispatch_kerns(const NCBKernSizeParam& param) const override {
        return get_kimpls(param);
    }

    //! Preference hint for \p param; defined out of line.
    bool is_preferred(const NCBKernSizeParam& param) const override;

    //! Reports data type QINT8X8X32 and category DIRECT.
    ConvAlgoTypePack get_algo_type() const override {
        return {AlgoDataType::QINT8X8X32, AlgoCategory::DIRECT};
    }
    MEGDNN_DECL_ALGO_TYPE(X86_CHANWISE_AVX2_STRD1_QINT8)
};
/*!
 * \brief ConvBias algorithm reported under the name
 *        "X86_CONV_BIAS_CHANWISE_AVX2_INT8_STRIDE2".
 *
 * Only the interface is visible in this header: usable(), get_workspace(),
 * is_preferred(), get_kimpls() and get_bundle() are declared here and defined
 * elsewhere.
 */
class ConvBiasImpl::AlgoChanWiseAvx2Stride2Qint8 final : public AlgoBase {
    //! Produces the kernel list that dispatch_kerns() returns.
    SmallVector<NCBKern> get_kimpls(const NCBKernSizeParam& param) const;
    //! Workspace layout helper.
    //! NOTE(review): presumably the source of get_workspace()'s size; confirm
    //! against the out-of-line definition.
    static WorkspaceBundle get_bundle(const NCBKernSizeParam& param);

public:
    //! This algorithm advertises the REPRODUCIBLE attribute only.
    AlgoAttribute attribute() const override { return AlgoAttribute::REPRODUCIBLE; }

    //! Name string of this algorithm.
    const char* name() const override {
        return "X86_CONV_BIAS_CHANWISE_AVX2_INT8_STRIDE2";
    }

    //! Whether the algorithm can handle \p param under the given strategy.
    bool usable(
            const NCBKernSizeParam& param,
            AlgoSelectionStrategy algo_selection_strategy) const override;

    //! Workspace size, in bytes, requested for \p param.
    size_t get_workspace(const NCBKernSizeParam& param) const override;

    //! Forwards to get_kimpls(). `override` already implies virtual, so the
    //! redundant `virtual` keyword is not repeated here.
    SmallVector<NCBKern> dispatch_kerns(const NCBKernSizeParam& param) const override {
        return get_kimpls(param);
    }

    //! Preference hint for \p param; defined out of line.
    bool is_preferred(const NCBKernSizeParam& param) const override;

    //! Reports data type QINT8X8X32 and category DIRECT.
    ConvAlgoTypePack get_algo_type() const override {
        return {AlgoDataType::QINT8X8X32, AlgoCategory::DIRECT};
    }
    MEGDNN_DECL_ALGO_TYPE(X86_CHANWISE_AVX2_STRD2_QINT8)
};
/*!
 * \brief ConvBias algorithm reported under the name
 *        "X86_CONV_BIAS_DIRECT_AVX2_INT8_STRIDE1".
 *
 * Only the interface is visible in this header: usable(), get_workspace(),
 * is_preferred(), get_kimpls() and get_bundle() are declared here and defined
 * elsewhere.
 */
class ConvBiasImpl::AlgoDirectAvx2Stride1Int8 final : public AlgoBase {
    //! Produces the kernel list that dispatch_kerns() returns.
    SmallVector<NCBKern> get_kimpls(const NCBKernSizeParam& param) const;
    //! Workspace layout helper.
    //! NOTE(review): presumably the source of get_workspace()'s size; confirm
    //! against the out-of-line definition.
    static WorkspaceBundle get_bundle(const NCBKernSizeParam& param);

public:
    //! This algorithm advertises the REPRODUCIBLE attribute only.
    AlgoAttribute attribute() const override { return AlgoAttribute::REPRODUCIBLE; }

    //! Name string of this algorithm.
    const char* name() const override {
        return "X86_CONV_BIAS_DIRECT_AVX2_INT8_STRIDE1";
    }

    //! Whether the algorithm can handle \p param under the given strategy.
    bool usable(
            const NCBKernSizeParam& param,
            AlgoSelectionStrategy algo_selection_strategy) const override;

    //! Workspace size, in bytes, requested for \p param.
    size_t get_workspace(const NCBKernSizeParam& param) const override;

    //! Forwards to get_kimpls(). `override` already implies virtual, so the
    //! redundant `virtual` keyword is not repeated here.
    SmallVector<NCBKern> dispatch_kerns(const NCBKernSizeParam& param) const override {
        return get_kimpls(param);
    }

    //! Preference hint for \p param; defined out of line.
    bool is_preferred(const NCBKernSizeParam& param) const override;

    //! Reports data type QINT8X8X32 and category DIRECT.
    ConvAlgoTypePack get_algo_type() const override {
        return {AlgoDataType::QINT8X8X32, AlgoCategory::DIRECT};
    }
    MEGDNN_DECL_ALGO_TYPE(X86_DIRECT_AVX2_STRD1_INT8)
};
//! Interface of the ConvBias algorithm whose name() is
//! "X86_CONV_BIAS_DIRECT_AVX2_INT8_STRIDE2". Members without a body here are
//! defined outside this header.
class ConvBiasImpl::AlgoAVX2DirectConvStride2 final : public AlgoBase {
public:
    // ---- identification -------------------------------------------------
    const char* name() const override {
        return "X86_CONV_BIAS_DIRECT_AVX2_INT8_STRIDE2";
    }
    AlgoAttribute attribute() const override { return AlgoAttribute::REPRODUCIBLE; }
    //! Data type QINT8X8X32, category DIRECT.
    ConvAlgoTypePack get_algo_type() const override {
        return {AlgoDataType::QINT8X8X32, AlgoCategory::DIRECT};
    }

    // ---- selection ------------------------------------------------------
    bool usable(
            const NCBKernSizeParam& param,
            AlgoSelectionStrategy algo_selection_strategy) const override;
    bool is_preferred(const NCBKernSizeParam& param) const override;

    // ---- execution ------------------------------------------------------
    size_t get_workspace(const NCBKernSizeParam& param) const override;
    //! Thin wrapper: the kernel list comes straight from get_kimpls().
    SmallVector<NCBKern> dispatch_kerns(const NCBKernSizeParam& param) const override {
        return get_kimpls(param);
    }

    MEGDNN_DECL_ALGO_TYPE(X86_DIRECT_AVX2_STRD2_INT8)

private:
    //! Workspace layout helper; definition is not in this header.
    static WorkspaceBundle get_bundle(const NCBKernSizeParam& param);
    //! Supplies the kernels returned by dispatch_kerns().
    SmallVector<NCBKern> get_kimpls(const NCBKernSizeParam& param) const;
};
#if MEGDNN_X86_WITH_MKL_DNN
/*!
 * \brief ConvBias algorithm reported under the name "MKLDNN_INT8".
 *
 * Only compiled when MEGDNN_X86_WITH_MKL_DNN is set. The total workspace is
 * one get_bundle() worth of bytes per thread; dispatch_kerns() gives each
 * thread its own slice of that buffer before invoking the kernel.
 */
class ConvBiasImpl::AlgoMkldnnQint8 final : public AlgoBase {
    //! Kernel entry point invoked by the dispatched kernel; defined out of line.
    static void kern_mkldnn_s8x8x32(const NCBKernParam& param, const NCBKernIndex&);
    //! Workspace layout for a single thread (get_workspace() multiplies its
    //! size by the thread count).
    static WorkspaceBundle get_bundle(const NCBKernSizeParam& param);

public:
    AlgoMkldnnQint8() {}

    //! This algorithm advertises the REPRODUCIBLE attribute only.
    AlgoAttribute attribute() const override { return AlgoAttribute::REPRODUCIBLE; }

    //! Name string of this algorithm.
    const char* name() const override { return "MKLDNN_INT8"; }

    //! Whether the algorithm can handle \p param; defined out of line.
    bool usable(const NCBKernSizeParam& param, AlgoSelectionStrategy) const override;

    //! Per-thread bundle size times param.nr_threads, in bytes.
    size_t get_workspace(const NCBKernSizeParam& param) const override {
        const size_t nr_threads = param.nr_threads;
        return get_bundle(param).total_size_in_bytes() * nr_threads;
    }

    /*!
     * \brief Returns a single kernel with the index space {group, n, 1}.
     *
     * The kernel copies its NCBKernParam, moves workspace_ptr forward by
     * thread_id * workspace_per_thread bytes, and calls kern_mkldnn_s8x8x32
     * with the adjusted copy.
     */
    SmallVector<NCBKern> dispatch_kerns(const NCBKernSizeParam& param) const override {
        size_t group = param.filter_meta.group;
        size_t n = param.n;
        auto workspace_per_thread = get_bundle(param).total_size_in_bytes();
        // The lambda parameter is named kern_param so it does not shadow the
        // enclosing function's `param`.
        auto kern = [workspace_per_thread](
                            const NCBKernParam& kern_param,
                            const NCBKernIndex& ncb_index) {
            auto thread_param = kern_param;
            // Byte offset of this thread's slice inside the shared workspace.
            thread_param.workspace_ptr = reinterpret_cast<void*>(
                    reinterpret_cast<ptrdiff_t>(kern_param.workspace_ptr) +
                    ncb_index.thread_id * workspace_per_thread);
            // ncb_index is a const reference: std::move on it would be a
            // no-op cast, so it is passed through directly.
            kern_mkldnn_s8x8x32(thread_param, ncb_index);
        };
        return {{kern, {group, n, 1_z}}};
    }

    //! Preference hint for \p param; defined out of line.
    bool is_preferred(const NCBKernSizeParam& param) const override;

    //! Reports data type QINT8X8X32 and category DIRECT.
    ConvAlgoTypePack get_algo_type() const override {
        return {AlgoDataType::QINT8X8X32, AlgoCategory::DIRECT};
    }
    MEGDNN_DECL_ALGO_TYPE(X86_MKLDNN_QINT8)
};
//! Interface of the ConvBias algorithm whose name() is "MKLDNN_MATMUL_INT8".
//! Only compiled when MEGDNN_X86_WITH_MKL_DNN is set; members without a body
//! here are defined outside this header.
class ConvBiasImpl::AlgoMkldnnMatmulQint8 final : public AlgoBase {
public:
    // ---- identification -------------------------------------------------
    const char* name() const override { return "MKLDNN_MATMUL_INT8"; }
    AlgoAttribute attribute() const override { return AlgoAttribute::REPRODUCIBLE; }
    //! Data type QINT8X8X32, category IM2COL.
    ConvAlgoTypePack get_algo_type() const override {
        return {AlgoDataType::QINT8X8X32, AlgoCategory::IM2COL};
    }

    // ---- selection ------------------------------------------------------
    bool usable(const NCBKernSizeParam& param, AlgoSelectionStrategy) const override;
    bool is_preferred(const NCBKernSizeParam& param) const override;

    // ---- execution ------------------------------------------------------
    //! The workspace is exactly one bundle; it is not scaled by thread count.
    size_t get_workspace(const NCBKernSizeParam& param) const override {
        return get_bundle(param).total_size_in_bytes();
    }
    //! One kernel, kern_mkldnn_matmul_s8x8x32, with index space {group, 1, 1}.
    SmallVector<NCBKern> dispatch_kerns(const NCBKernSizeParam& param) const override {
        const size_t nr_groups = param.filter_meta.group;
        return {{kern_mkldnn_matmul_s8x8x32, {nr_groups, 1_z, 1_z}}};
    }

    MEGDNN_DECL_ALGO_TYPE(X86_MKLDNN_MATMUL_QINT8)

private:
    //! Workspace layout helper; definition is not in this header.
    static WorkspaceBundle get_bundle(const NCBKernSizeParam& param);
    //! Kernel entry point handed to dispatch_kerns(); defined out of line.
    static void kern_mkldnn_matmul_s8x8x32(
            const NCBKernParam& param, const NCBKernIndex&);
    //! NOTE(review): presumably yields the MatrixMul operator the kernel
    //! uses; confirm against the out-of-line definition.
    static MatrixMul* get_matmul_opr();
};
#endif
} }