// Copyright (c) 2021 PaddlePaddle Authors. All Rights Reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

#pragma once

#include <mlir/Pass/Pass.h>

namespace infrt {
namespace trt {
/*
 * trtGraphSplitPass.
 *
 * Split the graph op when the number of operations it contains is too small.
 * This pass does the opposite of 'trtOpTellerPass'.
 *
 * source func:
 *
 * func @main() -> tensor<?xf32> {
 *  %a = "pd.feed"()...
 *  %d, %f = "pd.graph"(%a) {
 *     %m = "pd.conv2d"(%a)...
 *     %n = "pd.conv3d"(%m)...
 *     %s = "pd.conv2d"(%a)...
 *     "pd.return" (%n, %s)
 *  } ...
 *  "pd.fetch" (%d, %f)
 * }
 *
 * destination func:
 * func @main() -> tensor<?xf32> {
 *  %a = "pd.feed"()...
 *  %c = "pd.conv2d"(%a) ...
 *  %d = "pd.conv3d"(%c) ...
 *  %f = "pd.conv2d"(%a) ...
 *  "pd.fetch" (%d, %f)
 * }
 */
// MLIR function pass registered under the name "trtGraphSplitPass".
// The transformation itself lives in runOnFunction(), which is defined out of
// line; this header only declares the pass and its single tuning knob.
class TRTGraphSplitPass
    : public mlir::PassWrapper<TRTGraphSplitPass, mlir::FunctionPass> {
 public:
  // Builds the pass and records `min_subgraph_size` (3 when omitted).
  // NOTE(review): presumably graph ops containing fewer operations than this
  // value are the ones that get split -- confirm against runOnFunction().
  explicit TRTGraphSplitPass(size_t min_subgraph_size = 3)
      : min_subgraph_size_(min_subgraph_size) {}

  // Returns the fixed, human-readable name of this pass.
  ::llvm::StringRef getName() const override { return "trtGraphSplitPass"; }

  // Pass entry point invoked by the MLIR pass infrastructure; implemented in
  // the corresponding source file.
  void runOnFunction() override;

 private:
  // Size threshold captured at construction time.
  size_t min_subgraph_size_;
};
}  // namespace trt
}  // namespace infrt