/** * \file dnn/src/arm_common/conv_bias/int8/algos.h * MegEngine is Licensed under the Apache License, Version 2.0 (the "License") * * Copyright (c) 2014-2020 Megvii Inc. All rights reserved. * * Unless required by applicable law or agreed to in writing, * software distributed under the License is distributed on an * "AS IS" BASIS, WITHOUT ARRANTIES OR CONDITIONS OF ANY KIND, either express or * implied. */ #pragma once #include "src/arm_common/conv_bias/opr_impl.h" namespace megdnn { namespace arm_common { class ConvBiasImpl::AlgoS8DirectStride1 final : public AlgoBase { bool m_large_group; public: AlgoS8DirectStride1(bool large_group) : m_large_group(large_group) {} bool is_reproducible() const override { return true; } const char* name() const override { return m_large_group ? "S8STRD1_LARGE_GROUP" : "S8STRD1_SMALL_GROUP"; } bool usable(fallback::ConvBiasImpl* opr, const NCBKernSizeParam& param, AlgoSelectionStrategy algo_selection_strategy) const override; size_t get_workspace(fallback::ConvBiasImpl*, const NCBKernSizeParam& param) const override; virtual SmallVector dispatch_kerns( fallback::ConvBiasImpl* opr, const NCBKernSizeParam& param) const override; bool is_preferred(megdnn::fallback::ConvBiasImpl*, const NCBKernSizeParam& param) const override; }; class ConvBiasImpl::AlgoS8DirectStride1NCHW44 final : public AlgoBase { public: AlgoS8DirectStride1NCHW44() {} bool is_reproducible() const override { return true; } const char* name() const override { return "S8_NCHW44_DIRECT_STRD1"; } bool usable(fallback::ConvBiasImpl* opr, const NCBKernSizeParam& param, AlgoSelectionStrategy algo_selection_strategy) const override; size_t get_workspace(fallback::ConvBiasImpl*, const NCBKernSizeParam& param) const override; virtual SmallVector dispatch_kerns( fallback::ConvBiasImpl* opr, const NCBKernSizeParam& param) const override; bool is_preferred(megdnn::fallback::ConvBiasImpl*, const NCBKernSizeParam& param) const override; }; class ConvBiasImpl::AlgoS8DirectStride2 final : public AlgoBase { bool m_large_group; public: AlgoS8DirectStride2(bool large_group) : m_large_group(large_group) {} bool is_reproducible() const override { return true; } const char* name() const override { return m_large_group ? "S8STRD2_LARGE_GROUP" : "S8STRD2_SMALL_GROUP"; } bool usable(fallback::ConvBiasImpl*, const NCBKernSizeParam& param, AlgoSelectionStrategy algo_selection_strategy) const override; size_t get_workspace(fallback::ConvBiasImpl*, const NCBKernSizeParam& param) const override; virtual SmallVector dispatch_kerns( fallback::ConvBiasImpl* opr, const NCBKernSizeParam& param) const override; }; class ConvBiasImpl::AlgoS8DirectStride2NCHW44 final : public AlgoBase { public: AlgoS8DirectStride2NCHW44() {} bool is_reproducible() const override { return true; } const char* name() const override { return "S8_NCHW44_DIRECT_STRD2"; } bool usable(fallback::ConvBiasImpl* opr, const NCBKernSizeParam& param, AlgoSelectionStrategy algo_selection_strategy) const override; size_t get_workspace(fallback::ConvBiasImpl*, const NCBKernSizeParam& param) const override; virtual SmallVector dispatch_kerns( fallback::ConvBiasImpl* opr, const NCBKernSizeParam& param) const override; bool is_preferred(megdnn::fallback::ConvBiasImpl*, const NCBKernSizeParam& param) const override; }; class ConvBiasImpl::AlgoS8DirectNCHWNCHW44 final : public AlgoBase { public: AlgoS8DirectNCHWNCHW44() {} bool is_reproducible() const override { return true; } const char* name() const override { return "S8_CONV_NCHW_NCHW44"; } bool usable(fallback::ConvBiasImpl*, const NCBKernSizeParam& param, AlgoSelectionStrategy algo_selection_strategy) const override; size_t get_workspace(fallback::ConvBiasImpl*, const NCBKernSizeParam& param) const override; virtual SmallVector dispatch_kerns( fallback::ConvBiasImpl* opr, const NCBKernSizeParam& param) const override; bool is_preferred(megdnn::fallback::ConvBiasImpl*, const NCBKernSizeParam& param) const override; }; class ConvBiasImpl::AlgoS8ChanWiseStride1NCHW44 final : public AlgoBase { public: bool is_reproducible() const override { return true; } const char* name() const override { return "S8_CHAN_WISE_STRD1_NCHW44"; } bool usable(fallback::ConvBiasImpl* opr, const NCBKernSizeParam& param, AlgoSelectionStrategy algo_selection_strategy) const override; size_t get_workspace(fallback::ConvBiasImpl*, const NCBKernSizeParam& param) const override; virtual SmallVector dispatch_kerns( fallback::ConvBiasImpl* opr, const NCBKernSizeParam& param) const override; }; class ConvBiasImpl::AlgoS8ChanWiseStride2NCHW44 final : public AlgoBase { public: bool is_reproducible() const override { return true; } const char* name() const override { return "S8_CHAN_WISE_STRD2_NCHW44"; } bool usable(fallback::ConvBiasImpl* opr, const NCBKernSizeParam& param, AlgoSelectionStrategy algo_selection_strategy) const override; size_t get_workspace(fallback::ConvBiasImpl*, const NCBKernSizeParam& param) const override; virtual SmallVector dispatch_kerns( fallback::ConvBiasImpl* opr, const NCBKernSizeParam& param) const override; }; #if __ARM_FEATURE_DOTPROD class ConvBiasImpl::AlgoDotS8DirectNCHWNCHW44 final : public AlgoBase { public: bool is_reproducible() const override { return true; } const char* name() const override { return "ARMDOTS8_NCHW_NCHW44"; } bool usable(FallbackConvBiasImpl*, const NCBKernSizeParam&, AlgoSelectionStrategy algo_selection_strategy) const override; size_t get_workspace(FallbackConvBiasImpl*, const NCBKernSizeParam&) const override; virtual SmallVector dispatch_kerns( fallback::ConvBiasImpl* opr, const NCBKernSizeParam& param) const override; }; class ConvBiasImpl::AlgoDotS8DirectStride1 final : public AlgoBase { bool m_large_group; public: AlgoDotS8DirectStride1(bool large_group) : m_large_group(large_group) {} bool is_reproducible() const override { return true; } const char* name() const override { return m_large_group ? "ARMDOTS8STRD1_LARGE_GROUP" : "ARMDOTS8STRD1_SMALL_GROUP"; } bool usable(FallbackConvBiasImpl*, const NCBKernSizeParam&, AlgoSelectionStrategy algo_selection_strategy) const override; size_t get_workspace(FallbackConvBiasImpl*, const NCBKernSizeParam&) const override; virtual SmallVector dispatch_kerns( fallback::ConvBiasImpl* opr, const NCBKernSizeParam& param) const override; }; class ConvBiasImpl::AlgoDotS8DirectStride2 final : public AlgoBase { bool m_large_group; public: AlgoDotS8DirectStride2(bool large_group) : m_large_group(large_group) {} bool is_reproducible() const override { return true; } const char* name() const override { return m_large_group ? "ARMDOTS8STRD2_LARGE_GROUP" : "ARMDOTS8STRD2_SMALL_GROUP"; } bool usable(FallbackConvBiasImpl*, const NCBKernSizeParam&, AlgoSelectionStrategy algo_selection_strategy) const override; size_t get_workspace(FallbackConvBiasImpl*, const NCBKernSizeParam&) const override; virtual SmallVector dispatch_kerns( fallback::ConvBiasImpl* opr, const NCBKernSizeParam& param) const override; }; class ConvBiasImpl::AlgoDotS8Direct_NCHW44 final : public AlgoBase { public: AlgoDotS8Direct_NCHW44() {} bool is_reproducible() const override { return true; } const char* name() const override { return "ARMDOTS8DIRECT_NCHW44"; } bool usable(FallbackConvBiasImpl*, const NCBKernSizeParam&, AlgoSelectionStrategy algo_selection_strategy) const override; size_t get_workspace(FallbackConvBiasImpl*, const NCBKernSizeParam&) const override; SmallVector dispatch_kerns( fallback::ConvBiasImpl* opr, const NCBKernSizeParam& param) const override; bool is_preferred(megdnn::fallback::ConvBiasImpl*, const NCBKernSizeParam& param) const override; }; #endif class ConvBiasImpl::AlgoS8WinogradF23_8x8 final : public AlgoBase { public: AlgoS8WinogradF23_8x8(fallback::MatrixMulImpl::AlgoBase* matmul_algo, uint32_t tile_size) : m_matmul_algo{matmul_algo}, m_tile_size{tile_size} {} bool is_reproducible() const override { return true; } const char* name() const override { if (m_name.empty()) { m_name = ConvBiasImpl::algo_name( m_matmul_algo->name(), {8, 2, m_tile_size}); } return m_name.c_str(); } bool usable(fallback::ConvBiasImpl* opr, const NCBKernSizeParam& param, AlgoSelectionStrategy algo_selection_strategy) const override; size_t get_workspace(fallback::ConvBiasImpl*, const NCBKernSizeParam& param) const override; virtual SmallVector dispatch_kerns( fallback::ConvBiasImpl* opr, const NCBKernSizeParam& param) const override; static std::vector get_avaiable_matmul_algos(const NCBKernSizeParam& param); private: fallback::MatrixMulImpl::AlgoBase* m_matmul_algo; mutable std::string m_name; uint32_t m_tile_size; }; //=======================input int8 compute fp32 output int8============ class ConvBiasImpl::AlgoS8CF32WinogradF23_4x4_NCHW44 final : public AlgoBase { public: AlgoS8CF32WinogradF23_4x4_NCHW44(fallback::MatrixMulImpl::AlgoBase* matmul_algo, uint32_t tile_size) : m_matmul_algo{matmul_algo}, m_tile_size{tile_size} {} bool is_reproducible() const override { return true; } const char* name() const override { if (m_name.empty()) { m_name = ConvBiasImpl::algo_name( m_matmul_algo->name(), {4, 2, m_tile_size}, param::ConvBias::Format::NCHW44); } return m_name.c_str(); } bool usable(fallback::ConvBiasImpl* opr, const NCBKernSizeParam& param, AlgoSelectionStrategy algo_selection_strategy) const override; size_t get_workspace(fallback::ConvBiasImpl*, const NCBKernSizeParam& param) const override; virtual SmallVector dispatch_kerns( fallback::ConvBiasImpl* opr, const NCBKernSizeParam& param) const override; static std::vector get_avaiable_matmul_algos(const NCBKernSizeParam& param); private: fallback::MatrixMulImpl::AlgoBase* m_matmul_algo; mutable std::string m_name; uint32_t m_tile_size; }; //=======================input int8 compute int16 output int8============ class ConvBiasImpl::AlgoS8WinogradF23_8x8_NCHW44 final : public AlgoBase { public: AlgoS8WinogradF23_8x8_NCHW44(fallback::MatrixMulImpl::AlgoBase* matmul_algo, uint32_t tile_size) : m_matmul_algo{matmul_algo}, m_tile_size{tile_size} {} bool is_reproducible() const override { return true; } const char* name() const override { if (m_name.empty()) { m_name = ConvBiasImpl::algo_name( m_matmul_algo->name(), {8, 2, m_tile_size}, param::ConvBias::Format::NCHW44); } return m_name.c_str(); } bool usable(fallback::ConvBiasImpl* opr, const NCBKernSizeParam& param, AlgoSelectionStrategy algo_selection_strategy) const override; size_t get_workspace(fallback::ConvBiasImpl*, const NCBKernSizeParam& param) const override; virtual SmallVector dispatch_kerns( fallback::ConvBiasImpl* opr, const NCBKernSizeParam& param) const override; static std::vector get_avaiable_matmul_algos(const NCBKernSizeParam& param); private: fallback::MatrixMulImpl::AlgoBase* m_matmul_algo; mutable std::string m_name; uint32_t m_tile_size; }; } // namespace arm_common } // namespace megdnn // vim: syntax=cpp.doxygen