/**
 * \file dnn/src/cuda/conv_bias/opr_impl.h
 * MegEngine is Licensed under the Apache License, Version 2.0 (the "License")
 *
 * Copyright (c) 2014-2021 Megvii Inc. All rights reserved.
 *
 * Unless required by applicable law or agreed to in writing,
 * software distributed under the License is distributed on an
 * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
 * implied.
 */
#pragma once
#include "../elemwise/opr_impl.h"
#include "megdnn/oprs.h"

namespace megdnn {
namespace cuda {

class ConvBiasForwardImpl : public ConvBiasForward {
public:
    using ConvBiasForward::ConvBiasForward;
    void exec(_megdnn_tensor_in src, _megdnn_tensor_in filter,
              _megdnn_tensor_in bias, _megdnn_tensor_in z,
24 25 26
              _megdnn_tensor_out dst,
              const PreprocessedFilter* preprocessed_filter,
              _megdnn_workspace workspace) override;
27 28
    size_t get_workspace_in_bytes(const TensorLayout&, const TensorLayout&,
                                  const TensorLayout&, const TensorLayout&,
29 30 31 32 33 34 35
                                  const TensorLayout&,
                                  const PreprocessedFilter*) override;

    size_t get_preprocess_workspace_in_bytes(const TensorLayout&,
                                             const TensorLayout&,
                                             const TensorLayout&,
                                             const TensorLayout&,
M
Megvii Engine Team 已提交
36
                                             const TensorLayout&) override;
37 38
    SmallVector<TensorLayout> deduce_preprocessed_filter_layout(
            const TensorLayout&, const TensorLayout&, const TensorLayout&,
M
Megvii Engine Team 已提交
39
            const TensorLayout&, const TensorLayout&) override;
40
    void exec_preprocess(const TensorLayout&, _megdnn_tensor_in,
41
                         _megdnn_tensor_in, const TensorLayout&,
42
                         const TensorLayout&, PreprocessedFilter*,
M
Megvii Engine Team 已提交
43
                         _megdnn_workspace) override;
44 45 46 47 48 49 50 51
    const char* get_algorithm_set_name() const override;

    class AlgoBase;
    class AlgoCUDNNConvBiasActivation;
    class AlgoChanwise;
    class AlgoChanwiseSmall;
    class AlgoChanwise8x8x32;
    class AlgoCUDNNConv;
52
    class AlgoFallbackNCHWQS8;
53 54 55 56 57 58 59
    class AlgoInplaceMatmul;
    class AlgoMatmul;
    class AlgoMatmul8x8x32;
    class Algo1x1;
    class AlgoBatchedMatmul;
    class AlgoGroupConvGeneral;
    class AlgoQUInt4x4x32WMMA;
60
    class AlgoCutlassConvolutionBase;
61 62 63 64 65 66
    class AlgoInt8CHWN4DotProdImplicitGemm;
    class AlgoInt8NCHW4DotProdImplicitGemm;
    class AlgoInt8CHWN4IMMAImplicitGemm;
    class AlgoInt8NCHW4IMMAImplicitGemm;
    class AlgoInt8CHWN4IMMAImplicitGemmReorderFilter;
    class AlgoInt8CHWN4IMMAImplicitGemmUnrollWidth;
67
    class AlgoInt8NCHW32IMMAImplicitGemm;
68
    class AlgoInt8NHWCIMMAImplicitGemm;
69
    class AlgoInt4NCHW64IMMAImplicitGemmBase;
70
    class AlgoInt4Int4NCHW64IMMAImplicitGemm;
71
    class AlgoUInt4Int4NCHW64IMMAImplicitGemm;
72 73 74
    class AlgoInt4NHWCIMMAImplicitGemmBase;
    class AlgoInt4Int4NHWCIMMAImplicitGemm;
    class AlgoUInt4Int4NHWCIMMAImplicitGemm;
75
    class AlgoBFloat16;
76 77 78 79 80

    class AlgoPack;

    static const AlgoPack& algo_pack() { return sm_algo_pack; }

81
    Algorithm* get_algorithm_from_desc(const AlgorithmDesc& desc) override;
82 83 84 85 86

    std::vector<Algorithm*> get_all_algorithms(
            const TensorLayout& src, const TensorLayout& filter,
            const TensorLayout& bias, const TensorLayout& z,
            const TensorLayout& dst) override;
87 88 89 90
    std::vector<Algorithm*> get_all_algorithms_safe(
            const TensorLayout& src, const TensorLayout& filter,
            const TensorLayout& bias, const TensorLayout& z,
            const TensorLayout& dst) override;
91 92 93 94 95 96
    Algorithm* get_algorithm_heuristic(
            const TensorLayout& src, const TensorLayout& filter,
            const TensorLayout& bias, const TensorLayout& z,
            const TensorLayout& dst, size_t workspace_limit_in_bytes,
            const AlgoAttribute& positive_attr,
            const AlgoAttribute& negative_attr) override;
97

98
private:
99

100 101 102 103 104
    static AlgoPack sm_algo_pack;
};

}  // namespace cuda
}  // namespace megdnn
// vim: syntax=cpp.doxygen