op_teller.h 2.8 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15
// Copyright (c) 2019 PaddlePaddle Authors. All Rights Reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

#pragma once
16
#include <map>
#include <memory>
#include <string>
#include <unordered_set>
#include <utility>
#include <vector>

#include "paddle/fluid/framework/ir/node.h"
#include "paddle/fluid/framework/op_desc.h"
#include "paddle/fluid/inference/tensorrt/engine.h"
24

W
wanghuancoder 已提交
25 26 27 28 29 30
// Forward declaration of paddle::framework::OpDesc so the declarations below
// can refer to it by reference without needing its full definition.
namespace paddle {
namespace framework {

class OpDesc;

}  // namespace framework
}  // namespace paddle

31 32 33 34 35 36 37 38 39 40
namespace paddle {
namespace inference {
namespace tensorrt {

/*
 * Single Op teller definition.
 * One can override this and define a more complex tell logic, considerring more
 * issues such as op_desc.
 */
struct Teller {
41 42 43
  virtual bool operator()(const framework::OpDesc& desc,
                          bool use_no_calib_int8 = false,
                          bool with_dynamic_shape = false) = 0;
44 45 46 47 48 49 50 51 52 53 54 55 56 57

  virtual ~Teller() = default;
};
/*
 * A real example:
 *
 * struct SomeTeller : public Teller {
 *   bool operator()(const framework::OpDesc& desc,
 *                   bool use_no_calib_int8 = false,
 *                   bool with_dynamic_shape = false) override {
 *     return desc.Type() == "fc" && desc.Inputs().size() == 2;
 *   }
 * };
 */

58 59 60 61 62
/*
 * Kind of OpConverter associated with an op.
 * The numeric values are spelled out so they stay stable if enumerators are
 * ever reordered.
 * NOTE(review): 0/1/2 look like they line up with the slot indices used by
 * OpTeller's teller getters -- confirm before relying on that.
 */
enum class OpConverterType {
  Default = 0,
  GenericPluginCreater = 1,
  CustomPluginCreater = 2,
};
63 64
/*
 * class OpTeller helps to tell whether a fluid
65 66
 * operator can be transformed to a TensorRT layer
 * and use which kind of OpConverter
67 68 69 70 71 72 73 74
 */
class OpTeller {
 public:
  static OpTeller& Global() {
    static std::unique_ptr<OpTeller> x(new OpTeller);
    return *x;
  }

75 76
  bool Tell(const framework::ir::Node* node,
            bool use_no_calib_int8 = false,
77
            bool with_dynamic_shape = false);
78

79 80 81 82 83 84 85 86 87 88 89 90 91 92
  std::unique_ptr<Teller>& GetDefaultTeller() { return tellers_.at(0); }

  std::unique_ptr<Teller>& GetGenericPluginTeller() { return tellers_.at(1); }

  std::unique_ptr<Teller>& GetCustomPluginTeller() { return tellers_.at(2); }

  void SetOpConverterType(std::string name, OpConverterType type) {
    op_converter_type_map_[name] = type;
  }

  const std::map<std::string, OpConverterType>& GetOpConverterTypeMap() const {
    return op_converter_type_map_;
  }

93 94 95 96 97
 private:
  OpTeller();

 private:
  std::vector<std::unique_ptr<Teller>> tellers_;
98
  std::map<std::string, OpConverterType> op_converter_type_map_;
99 100 101 102 103
};

}  // namespace tensorrt
}  // namespace inference
}  // namespace paddle