opr_impl.h 2.7 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42
/**
 * \file dnn/src/arm_common/conv_bias/opr_impl.h
 * MegEngine is Licensed under the Apache License, Version 2.0 (the "License")
 *
 * Copyright (c) 2014-2020 Megvii Inc. All rights reserved.
 *
 * Unless required by applicable law or agreed to in writing,
 * software distributed under the License is distributed on an
 * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
 * implied.
 */
#pragma once
#include "src/common/utils.h"
#include "src/fallback/conv_bias/opr_impl.h"

namespace megdnn {
namespace arm_common {

/**
 * \brief ConvBias operator implementation for the arm_common backend.
 *
 * Derives from fallback::ConvBiasImpl and overrides a handful of its virtual
 * hooks. The nested Algo* classes are only forward-declared in this header;
 * their definitions are not visible here.
 */
class ConvBiasImpl : public fallback::ConvBiasImpl {
public:
    //! Inherit every constructor of the fallback implementation.
    using fallback::ConvBiasImpl::ConvBiasImpl;
    //! Shorthand for the base class.
    using FallbackConvBiasImpl = fallback::ConvBiasImpl;
    //! Re-export of the base class kernel index type.
    using NCBKernIndex = fallback::ConvBiasImpl::NCBKernIndex;

    //! Always reports true.
    bool is_thread_safe() const override { return true; }

    //! Returns a vector of algorithm pointers; the contents are decided by
    //! the out-of-line definition (not visible in this header).
    SmallVector<AlgoBase*> algo_pack() override;

    //! Override of the base-class hook taking the kernel size parameters.
    //! NOTE(review): judging by the name, it decides whether a matmul based
    //! path is preferred for quantized data -- confirm against the definition.
    bool is_matmul_quantized_prefer(
            const ConvBiasImpl::NCBKernSizeParam& ncb_param) override;

    //! Forward declaration only.
    //! NOTE(review): presumably the container holding the algorithm
    //! instances -- confirm against the definition.
    class AlgoPack;

protected:
    //! Declared here, defined elsewhere.
    //! NOTE(review): presumably an opaque tag identifying arm_common
    //! algorithms -- confirm against its users.
    static void* const sm_arm_common_algo_type;

    //! Override returning a C string; the value is set by the out-of-line
    //! definition (not visible in this header).
    const char* get_algorithm_set_name() const override;

private:
    // Forward declarations of the nested algorithm classes. Declaration order
    // and preprocessor guards are kept exactly as in the original header.
    class AlgoS8DirectStride1;
    class AlgoS8DirectStride1NCHW44;
    class AlgoS8DirectStride2;
    class AlgoS8DirectStride2NCHW44;
    class AlgoS8DirectNCHWNCHW44;
    class AlgoQU8DirectStride1;
    class AlgoQU8DirectStride2;
    class AlgoFP32WinogradF23_4x4;
    class AlgoFP32WinogradF63;
    class AlgoFP32WinogradF63_4x4;
    class AlgoFP32WinogradF54;
    class AlgoFP32WinogradF45;

    class AlgoFP32WinogradF23_4x4_NCHW44;
    class AlgoFP32WinogradF63_4x4_NCHW44;

    class AlgoS8ChanWiseStride1NCHW44;
    class AlgoS8ChanWiseStride2NCHW44;

    // Declared only when the compiler defines
    // __ARM_FEATURE_FP16_VECTOR_ARITHMETIC to a non-zero value.
#if __ARM_FEATURE_FP16_VECTOR_ARITHMETIC
    class AlgoFP16WinogradF23;
    class AlgoFP16WinogradF45;
    class AlgoFP16WinogradF63;
    class AlgoFP16WinogradF23_8x8;
#endif
    // Declared only when the compiler defines __ARM_FEATURE_DOTPROD to a
    // non-zero value.
#if __ARM_FEATURE_DOTPROD
    class AlgoDotS8DirectNCHWNCHW44;
    class AlgoDotS8DirectStride1;
    class AlgoDotS8DirectStride2;
    class AlgoDotU8DirectStride1;
    class AlgoDotU8DirectStride2;

    class AlgoDotS8Direct_NCHW44;
#endif
    class AlgoF32Direct;
    class AlgoF32DirectStride1;
    class AlgoF32DirectStride2;
    class AlgoF32DirectNCHWNCHW44;
    class AlgoF32ChannelWiseNCHW44;
    class AlgoF32DirectNCHW44;

    class AlgoI8x8x16Direct;
    class AlgoI8x8x16Stride2;
    class AlgoI8x8x16Stride2Filter2;
    class AlgoS8WinogradF23_8x8;
    class AlgoS8CF32WinogradF23_4x4_NCHW44;
    class AlgoS8WinogradF23_8x8_NCHW44;
    // Same FP16 guard as above; kept as a separate region to preserve the
    // original declaration order.
#if __ARM_FEATURE_FP16_VECTOR_ARITHMETIC
    class AlgoF16Direct;
    class AlgoF16DirectStride1;
#endif
};

}  // namespace arm_common
}  // namespace megdnn

// vim: syntax=cpp.doxygen