// Copyright (c) 2021 PaddlePaddle Authors. All Rights Reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

#pragma once

#include <cstddef>

#include <mlir/Pass/Pass.h>

namespace infrt {
namespace trt {
/*
 * trtGraphSplitPass.
 *
 * Split the graph op back into its individual operations when the number of
 * operations it contains is too small.
 * This is the opposite of 'trtOpTellerPass'.
 *
 * source func:
 *
 * func @main(%a : tensor<?xf32>) -> tensor<?xf32> {
 *  %d, %f = "infrt.graph"(%a) {
 *     %m = "pd.conv2d"(%a)...
 *     %n = "pd.conv3d"(%m)...
 *     %s = "pd.conv2d"(%a)...
 *     infrt.return %n, %s : ...
 *  } ...
 *  infrt.return %d, %f : ...
 * }
 *
 * destination func:
 *
 * func @main(%a : tensor<?xf32>) -> tensor<?xf32> {
 *  %c = "pd.conv2d"(%a) ...
 *  %d = "pd.conv3d"(%c) ...
 *  %f = "pd.conv2d"(%a) ...
 *  infrt.return %d, %f : ...
 * }
 */
// MLIR function pass declared in infrt::trt. Only the declaration lives in
// this header; runOnFunction() is defined elsewhere.
class TRTGraphSplitPass
    : public mlir::PassWrapper<TRTGraphSplitPass, mlir::FunctionPass> {
 public:
  // Stores the size threshold used by the pass (3 when the argument is
  // omitted).
  // NOTE(review): presumably graph ops holding fewer operations than this
  // value are the ones split apart -- confirm against runOnFunction().
  explicit TRTGraphSplitPass(size_t min_subgraph_size = 3)
      : min_subgraph_size_(min_subgraph_size) {}

  // Returns the fixed name of this pass.
  ::llvm::StringRef getName() const override { return "trtGraphSplitPass"; }

  // Empty body: this pass adds nothing to the dialect registry.
  void getDependentDialects(mlir::DialectRegistry &registry) const override {}

  // Pass entry point; declared here, definition not in this header.
  void runOnFunction() override;

 private:
  // Threshold supplied at construction time.
  size_t min_subgraph_size_;
};
}  // namespace trt
}  // namespace infrt