megenginelite-sys 1.8.2

A safe megenginelite wrapper in Rust
Documentation
/**
 * \file dnn/src/arm_common/convolution/int8x8x32/algos.cpp
 * MegEngine is Licensed under the Apache License, Version 2.0 (the "License")
 *
 * Copyright (c) 2014-2021 Megvii Inc. All rights reserved.
 *
 * Unless required by applicable law or agreed to in writing,
 * software distributed under the License is distributed on an
 * "AS IS" BASIS, WITHOUT ARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 */

#include "src/arm_common/convolution/int8x8x32/algos.h"
#include "src/arm_common/convolution/img2col_helper.h"
#include "src/arm_common/convolution/int8x8x32/conv_backdata_stride1.h"
#include "src/arm_common/convolution/int8x8x32/conv_backdata_stride2.h"
#include "src/common/opr_delegate.h"

#include "midout.h"

MIDOUT_DECL(megdnn_arm_conv_int8832_kimpl)

using namespace megdnn;
using namespace arm_common;

#if MGB_ENABLE_DOT
/* ===================== ConvolutionBackwardData  ===================== */
/* ===================== direct stride 1 algo ===================== */
bool ConvolutionBackwardDataImpl::AlgoSdot8DirectStride1::usable(
        fallback::ConvolutionBackwardDataImpl*, const NCBKernSizeParam& param) const {
    if (!cpuinfo_has_arm_neon_dot()) {
        return false;
    }
    return deconv::can_stride1_int8x8x32_dot(param);
}

size_t ConvolutionBackwardDataImpl::AlgoSdot8DirectStride1::get_workspace(
        fallback::ConvolutionBackwardDataImpl*, const NCBKernSizeParam& param) const {
    MIDOUT_BEGIN(
            megdnn_arm_conv_int8832_kimpl,
            midout_iv("AlgoSdot8DirectStride1::get_workspace"_hash)) {
        return deconv::get_workspace_in_bytes_stride1_int8x8x32_dot(param);
    }
    MIDOUT_END();
    return 0;
}

ConvolutionBackwardDataImpl::ncb_kern_t ConvolutionBackwardDataImpl::
        AlgoSdot8DirectStride1::dispatch_kern(
                fallback::ConvolutionBackwardDataImpl*, const NCBKernSizeParam&) const {
    MIDOUT_BEGIN(
            megdnn_arm_conv_int8832_kimpl,
            midout_iv("AlgoSdot8DirectStride1::dispatch_kern"_hash)) {
        return deconv::stride1_int8x8x32_dot;
    }
    MIDOUT_END();
    return {};
}

/* ===================== direct stride 2 algo ===================== */
bool ConvolutionBackwardDataImpl::AlgoSdot8DirectStride2::usable(
        fallback::ConvolutionBackwardDataImpl*, const NCBKernSizeParam& param) const {
    if (!cpuinfo_has_arm_neon_dot()) {
        return false;
    }
    return deconv::can_stride2_int8x8x32_dot(param);
}

size_t ConvolutionBackwardDataImpl::AlgoSdot8DirectStride2::get_workspace(
        fallback::ConvolutionBackwardDataImpl*, const NCBKernSizeParam& param) const {
    MIDOUT_BEGIN(
            megdnn_arm_conv_int8832_kimpl,
            midout_iv("AlgoSdot8DirectStride2::get_workspace"_hash)) {
        return deconv::get_workspace_in_bytes_stride2_int8x8x32_dot(param);
    }
    MIDOUT_END();
    return 0;
}

ConvolutionBackwardDataImpl::ncb_kern_t ConvolutionBackwardDataImpl::
        AlgoSdot8DirectStride2::dispatch_kern(
                fallback::ConvolutionBackwardDataImpl*, const NCBKernSizeParam&) const {
    MIDOUT_BEGIN(
            megdnn_arm_conv_int8832_kimpl,
            midout_iv("AlgoSdot8DirectStride2::dispatch_kern"_hash)) {
        return deconv::stride2_int8x8x32_dot;
    }
    MIDOUT_END();
    return {};
}

#endif

// vim: syntax=cpp.doxygen