trt_graph_split_pass.h 1.9 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15
// Copyright (c) 2021 PaddlePaddle Authors. All Rights Reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

#pragma once
16
#include <mlir/Pass/Pass.h>
17 18
#include "paddle/infrt/dialect/infrt_base.h"
#include "paddle/infrt/dialect/tensorrt/trt_ops.h"
19 20 21 22 23 24 25 26 27 28 29 30 31

namespace infrt {
namespace trt {
/*
 * trtGraphSplitPass.
 *
 * Split a graph op back into its individual operations when the number of
 * operations it contains is too small.
 * The feature is the opposite of 'trtOpTellerPass'.
 *
 * source func:
 *
 * func @main() -> tensor<?xf32> {
 *  %a = "pd.feed"()...
32
 *  %d, %f = "trt.create_engine"(%a) {
33 34 35
 *     %m = "pd.conv2d"(%a)...
 *     %n = "pd.conv3d"(%m)...
 *     %s = "pd.conv2d"(%a)...
36
 *     "Infrt.return" (%n, %s)
37
 *  } ...
38
 *  "pd.fetch" (%d, %f)
39 40 41 42 43 44 45 46
 * }
 *
 * destination func:
 * func @main() -> tensor<?xf32> {
 *  %a = "pd.feed"()...
 *  %c = "pd.conv2d"(%a) ...
 *  %d = "pd.conv3d"(%c) ...
 *  %f = "pd.conv2d"(%a) ...
47
 *  "pd.fetch" (%d, %f)
48 49
 * }
 */
50 51
// MLIR function pass whose getName() returns "trtGraphSplitPass".
// Only the declaration is given here; runOnFunction() is defined elsewhere.
class TRTGraphSplitPass
    : public mlir::PassWrapper<TRTGraphSplitPass, mlir::FunctionPass> {
 public:
  // Records the subgraph-size threshold (3 when the caller passes nothing).
  // NOTE(review): presumably graph ops holding fewer operations than this are
  // the ones that get split -- confirm against the runOnFunction() definition.
  explicit TRTGraphSplitPass(size_t min_subgraph_size = 3)
      : min_subgraph_size_{min_subgraph_size} {}

  // Returns the fixed name string of this pass.
  ::llvm::StringRef getName() const override {
    return "trtGraphSplitPass";
  }

  // Registers the two dialects this pass depends on: TensorRT and INFRT.
  void getDependentDialects(mlir::DialectRegistry &registry) const override {
    registry.insert<TensorRTDialect>();
    registry.insert<::infrt::dialect::INFRTDialect>();
  }

  // Pass entry point; declared here, defined out of line.
  void runOnFunction() override;

 private:
  // Threshold captured by the constructor.
  size_t min_subgraph_size_;
};
}  // namespace trt
}  // namespace infrt