algos.h 8.6 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28
/**
 * \file dnn/src/arm_common/conv_bias/int8/algos.h
 * MegEngine is Licensed under the Apache License, Version 2.0 (the "License")
 *
 * Copyright (c) 2014-2020 Megvii Inc. All rights reserved.
 *
 * Unless required by applicable law or agreed to in writing,
 * software distributed under the License is distributed on an
 * "AS IS" BASIS, WITHOUT ARRANTIES OR CONDITIONS OF ANY KIND, either express or
 * implied.
 */

#pragma once

#include "src/arm_common/conv_bias/opr_impl.h"

namespace megdnn {
namespace arm_common {

class ConvBiasImpl::AlgoS8DirectStride1 final : public AlgoBase {
    bool m_large_group;

public:
    AlgoS8DirectStride1(bool large_group) : m_large_group(large_group) {}
    bool is_reproducible() const override { return true; }
    const char* name() const override {
        return m_large_group ? "S8STRD1_LARGE_GROUP" : "S8STRD1_SMALL_GROUP";
    }
29
    bool usable(const NCBKernSizeParam& param,
30
                AlgoSelectionStrategy algo_selection_strategy) const override;
31
    size_t get_workspace(const NCBKernSizeParam& param) const override;
32 33 34
    virtual SmallVector<NCBKern> dispatch_kerns(
            const NCBKernSizeParam& param) const override;

35
    bool is_preferred(const NCBKernSizeParam& param) const override;
36 37 38 39 40 41 42 43 44 45 46
};

class ConvBiasImpl::AlgoS8DirectStride2 final : public AlgoBase {
    bool m_large_group;

public:
    AlgoS8DirectStride2(bool large_group) : m_large_group(large_group) {}
    bool is_reproducible() const override { return true; }
    const char* name() const override {
        return m_large_group ? "S8STRD2_LARGE_GROUP" : "S8STRD2_SMALL_GROUP";
    }
47
    bool usable(const NCBKernSizeParam& param,
48 49
                AlgoSelectionStrategy algo_selection_strategy) const override;

50
    size_t get_workspace(const NCBKernSizeParam& param) const override;
51 52 53 54
    virtual SmallVector<NCBKern> dispatch_kerns(
            const NCBKernSizeParam& param) const override;
};

55
class ConvBiasImpl::AlgoS8DirectNCHW44 final : public AlgoBase {
56
public:
57
    AlgoS8DirectNCHW44() {}
58
    bool is_reproducible() const override { return true; }
59
    const char* name() const override { return "S8_NCHW44_DIRECT"; }
60
    bool usable(const NCBKernSizeParam& param,
61
                AlgoSelectionStrategy algo_selection_strategy) const override;
62
    size_t get_workspace(const NCBKernSizeParam& param) const override;
63 64
    virtual SmallVector<NCBKern> dispatch_kerns(
            const NCBKernSizeParam& param) const override;
65
    bool is_preferred(const NCBKernSizeParam& param) const override;
66 67
};

68
class ConvBiasImpl::AlgoS8DirectNCHWNCHW44 final : public AlgoBase {
69
public:
70
    AlgoS8DirectNCHWNCHW44() {}
71 72
    bool is_reproducible() const override { return true; }
    const char* name() const override { return "S8_CONV_NCHW_NCHW44"; }
73
    bool usable(const NCBKernSizeParam& param,
74
                AlgoSelectionStrategy algo_selection_strategy) const override;
75
    size_t get_workspace(const NCBKernSizeParam& param) const override;
76 77
    virtual SmallVector<NCBKern> dispatch_kerns(
            const NCBKernSizeParam& param) const override;
78
    bool is_preferred(const NCBKernSizeParam& param) const override;
79 80 81 82 83 84
};

class ConvBiasImpl::AlgoS8ChanWiseStride1NCHW44 final : public AlgoBase {
public:
    bool is_reproducible() const override { return true; }
    const char* name() const override { return "S8_CHAN_WISE_STRD1_NCHW44"; }
85
    bool usable(const NCBKernSizeParam& param,
86
                AlgoSelectionStrategy algo_selection_strategy) const override;
87
    size_t get_workspace(const NCBKernSizeParam& param) const override;
88 89 90 91 92 93 94 95
    virtual SmallVector<NCBKern> dispatch_kerns(
            const NCBKernSizeParam& param) const override;
};

class ConvBiasImpl::AlgoS8ChanWiseStride2NCHW44 final : public AlgoBase {
public:
    bool is_reproducible() const override { return true; }
    const char* name() const override { return "S8_CHAN_WISE_STRD2_NCHW44"; }
96
    bool usable(const NCBKernSizeParam& param,
97
                AlgoSelectionStrategy algo_selection_strategy) const override;
98
    size_t get_workspace(const NCBKernSizeParam& param) const override;
99 100 101 102 103
    virtual SmallVector<NCBKern> dispatch_kerns(
            const NCBKernSizeParam& param) const override;
};

#if __ARM_FEATURE_DOTPROD
104 105 106 107 108

class ConvBiasImpl::AlgoDotS8DirectNCHWNCHW44 final : public AlgoBase {
public:
    bool is_reproducible() const override { return true; }
    const char* name() const override { return "ARMDOTS8_NCHW_NCHW44"; }
109
    bool usable(const NCBKernSizeParam&,
110 111
                AlgoSelectionStrategy algo_selection_strategy) const override;

112
    size_t get_workspace(const NCBKernSizeParam&) const override;
113 114 115 116
    virtual SmallVector<NCBKern> dispatch_kerns(
            const NCBKernSizeParam& param) const override;
};

117 118 119 120 121 122 123 124 125 126 127
class ConvBiasImpl::AlgoDotS8DirectStride1 final : public AlgoBase {
    bool m_large_group;

public:
    AlgoDotS8DirectStride1(bool large_group) : m_large_group(large_group) {}

    bool is_reproducible() const override { return true; }
    const char* name() const override {
        return m_large_group ? "ARMDOTS8STRD1_LARGE_GROUP"
                             : "ARMDOTS8STRD1_SMALL_GROUP";
    }
128
    bool usable(const NCBKernSizeParam&,
129 130
                AlgoSelectionStrategy algo_selection_strategy) const override;

131
    size_t get_workspace(const NCBKernSizeParam&) const override;
132 133 134 135 136 137 138 139 140 141 142 143 144 145 146
    virtual SmallVector<NCBKern> dispatch_kerns(
            const NCBKernSizeParam& param) const override;
};

class ConvBiasImpl::AlgoDotS8DirectStride2 final : public AlgoBase {
    bool m_large_group;

public:
    AlgoDotS8DirectStride2(bool large_group) : m_large_group(large_group) {}
    bool is_reproducible() const override { return true; }
    const char* name() const override {
        return m_large_group ? "ARMDOTS8STRD2_LARGE_GROUP"
                             : "ARMDOTS8STRD2_SMALL_GROUP";
    }

147
    bool usable(const NCBKernSizeParam&,
148 149
                AlgoSelectionStrategy algo_selection_strategy) const override;

150
    size_t get_workspace(const NCBKernSizeParam&) const override;
151 152 153
    virtual SmallVector<NCBKern> dispatch_kerns(
            const NCBKernSizeParam& param) const override;
};
154 155 156 157 158 159

class ConvBiasImpl::AlgoDotS8Direct_NCHW44 final : public AlgoBase {
public:
    AlgoDotS8Direct_NCHW44() {}

    bool is_reproducible() const override { return true; }
160 161
    const char* name() const override { return "ARMDOTS8DIRECT_NCHW44"; }
    bool usable(const NCBKernSizeParam&,
162 163
                AlgoSelectionStrategy algo_selection_strategy) const override;

164
    size_t get_workspace(const NCBKernSizeParam&) const override;
165 166 167 168

    SmallVector<NCBKern> dispatch_kerns(
            const NCBKernSizeParam& param) const override;

169
    bool is_preferred(const NCBKernSizeParam& param) const override;
170
};
171 172 173 174 175 176 177 178 179 180 181 182 183 184
#endif

class ConvBiasImpl::AlgoS8WinogradF23_8x8 final : public AlgoBase {
public:
    AlgoS8WinogradF23_8x8(fallback::MatrixMulImpl::AlgoBase* matmul_algo,
                          uint32_t tile_size)
            : m_matmul_algo{matmul_algo}, m_tile_size{tile_size} {}
    const char* name() const override {
        if (m_name.empty()) {
            m_name = ConvBiasImpl::algo_name<ConvBias::WinogradParam>(
                    m_matmul_algo->name(), {8, 2, m_tile_size});
        }
        return m_name.c_str();
    }
185
    MEGDNN_WINOGRAD_ALGO_FUN_DECLARE();
186 187
};

188 189 190
//=======================input int8 compute fp32 output int8============
class ConvBiasImpl::AlgoS8CF32WinogradF23_4x4_NCHW44 final : public AlgoBase {
public:
191 192
    AlgoS8CF32WinogradF23_4x4_NCHW44(
            fallback::MatrixMulImpl::AlgoBase* matmul_algo, uint32_t tile_size)
193 194 195 196 197 198 199 200 201
            : m_matmul_algo{matmul_algo}, m_tile_size{tile_size} {}
    const char* name() const override {
        if (m_name.empty()) {
            m_name = ConvBiasImpl::algo_name<ConvBias::WinogradParam>(
                    m_matmul_algo->name(), {4, 2, m_tile_size},
                    param::ConvBias::Format::NCHW44);
        }
        return m_name.c_str();
    }
202
    MEGDNN_WINOGRAD_ALGO_FUN_DECLARE();
203 204 205 206 207 208
};

//=======================input int8 compute int16 output int8============
class ConvBiasImpl::AlgoS8WinogradF23_8x8_NCHW44 final : public AlgoBase {
public:
    AlgoS8WinogradF23_8x8_NCHW44(fallback::MatrixMulImpl::AlgoBase* matmul_algo,
209
                                 uint32_t tile_size)
210 211 212 213 214 215 216 217 218 219
            : m_matmul_algo{matmul_algo}, m_tile_size{tile_size} {}
    const char* name() const override {
        if (m_name.empty()) {
            m_name = ConvBiasImpl::algo_name<ConvBias::WinogradParam>(
                    m_matmul_algo->name(), {8, 2, m_tile_size},
                    param::ConvBias::Format::NCHW44);
        }
        return m_name.c_str();
    }

220
    MEGDNN_WINOGRAD_ALGO_FUN_DECLARE();
221 222
};

223 224 225 226
}  // namespace arm_common
}  // namespace megdnn

// vim: syntax=cpp.doxygen