// Copyright (c) 2021 PaddlePaddle Authors. All Rights Reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

#pragma once

#include <cstddef>

#include <mlir/Pass/Pass.h>

#include "paddle/infrt/dialect/infrt_base.h"

namespace infrt {
namespace trt {
/*
 * trtGraphSplitPass.
 *
 * Split the graph op when the number of operations is too small.
 * This pass does the opposite of 'trtOpTellerPass'.
 *
 * source func:
 *
 * func @main(%a : tensor<?xf32>) -> tensor<?xf32> {
 *  %d, %f = "pd.graph"(%a) {
 *     %m = "pd.conv2d"(%a)...
 *     %n = "pd.conv3d"(%m)...
 *     %s = "pd.conv2d"(%a)...
 *     "infrt.return" (%n, %s)...
 *  } ...
 *  "infrt.return" (%d, %f)...
 * }
 *
 * destination func:
 * func @main(%a : tensor<?xf32>) -> tensor<?xf32> {
 *  %c = "pd.conv2d"(%a) ...
 *  %d = "pd.conv3d"(%c) ...
 *  %f = "pd.conv2d"(%a) ...
 *  "infrt.return" (%d, %f)...
 * }
 */
// MLIR function pass that splits "pd.graph" ops, as illustrated by the
// source/destination example in the comment preceding this class.
class TRTGraphSplitPass
    : public mlir::PassWrapper<TRTGraphSplitPass, mlir::FunctionPass> {
 public:
  // Stores the size threshold used by the pass; defaults to 3 when omitted.
  // NOTE(review): presumably graph ops holding fewer operations than this
  // value are the ones that get split -- confirm against the out-of-line
  // definition of runOnFunction().
  explicit TRTGraphSplitPass(size_t min_subgraph_size = 3)
      : min_subgraph_size_(min_subgraph_size) {}

  // Name reported for this pass.
  ::llvm::StringRef getName() const override { return "trtGraphSplitPass"; }

  // Intentionally empty: this pass registers no dependent dialects.
  void getDependentDialects(mlir::DialectRegistry &registry) const override {}

  // Pass entry point; declared here and defined out of line.
  void runOnFunction() override;

 private:
  // Threshold supplied at construction time.
  size_t min_subgraph_size_;
};
}  // namespace trt
}  // namespace infrt