pass.cc 8.4 KB
Newer Older
X
Xin Pan 已提交
1
/* Copyright (c) 2018 PaddlePaddle Authors. All Rights Reserved.

Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

    http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License. */

#include "paddle/fluid/framework/ir/pass.h"
Q
Qiao Longfei 已提交
16

17
#include <algorithm>
18

X
Xin Pan 已提交
19
#include "paddle/fluid/framework/ir/graph_helper.h"
20
#include "paddle/fluid/framework/op_proto_maker.h"
21
#include "paddle/fluid/framework/program_utils.h"
W
wanghuancoder 已提交
22 23 24

// Forward declarations of framework::Scope and framework::ir::Graph.
namespace paddle {
namespace framework {

class Scope;

namespace ir {

class Graph;

}  // namespace ir
}  // namespace framework
}  // namespace paddle
31 32 33
#ifdef PADDLE_WITH_MKLDNN
#include "paddle/fluid/platform/mkldnn_helper.h"
#endif
X
start  
Xin Pan 已提交
34 35

namespace paddle {
X
Xin Pan 已提交
36 37
namespace framework {
namespace ir {
38

39 40 41
// Name of the graph attribute that holds the parameter Scope.
static const char kParamScopeAttr[] = "__param_scope__";

// Pass types that Pass::Apply also runs on the sub-graphs of a main graph,
// not only on the main graph itself.
static const std::vector<std::string> support_subgraph_passes = {
    // Basic simplification.
    "simplify_with_basic_ops_pass",
    // Fused multi-transformer encoder / decoder fusions.
    "fused_multi_transformer_encoder_pass",
    "fused_multi_transformer_decoder_pass",
    "fused_multi_transformer_encoder_fuse_qkv_pass",
    "fused_multi_transformer_decoder_fuse_qkv_pass",
    "multi_devices_fused_multi_transformer_encoder_fuse_qkv_pass",
    "multi_devices_fused_multi_transformer_decoder_fuse_qkv_pass",
    // Layer-level fusion.
    "fuse_multi_transformer_layer_pass",
};
50

51 52
/// Applies this pass to `graph` in place.
///
/// Sequence:
///   1. CheckPrevPass() is called.
///   2. `graph` is enforced to be non-null, every name in
///      required_pass_attrs_ must be present in attrs_, and every name in
///      required_graph_attrs_ must be an attribute of `graph`.
///   3. ApplyImpl() runs on `graph`; the result must contain no cycle and
///      pass VarDescIsConsistency(); the pass type is inserted into the
///      graph's PassRecorder attribute (created when absent).
///   4. When `graph` is a main graph and this pass type is listed in
///      support_subgraph_passes, step 3 is repeated for every sub-graph with
///      index >= 1.
///   5. applied_ is set, and the MKL-DNN cache is cleared when built with
///      PADDLE_WITH_MKLDNN.
///
/// @param graph  Graph to transform.
/// @return The same pointer that was passed in.
Graph *Pass::Apply(Graph *graph) const {
  VLOG(10) << "start to apply pass " << Type() << " to graph";
  CheckPrevPass();
  PADDLE_ENFORCE_NOT_NULL(
      graph, platform::errors::InvalidArgument("Graph cannot be nullptr."));

  // NOTE(review): the message texts below are intentionally left exactly as
  // they were (spelling included); code outside this file may match on them,
  // so verify before rewording.
  for (const std::string &attr : required_pass_attrs_) {
    PADDLE_ENFORCE_NE(
        attrs_.find(attr),
        attrs_.end(),
        platform::errors::InvalidArgument(
            "Required atrribute %s for pass < %s > is not set.", attr, Type()));
  }
  for (const std::string &attr : required_graph_attrs_) {
    PADDLE_ENFORCE_EQ(graph->Has(attr),
                      true,
                      platform::errors::InvalidArgument(
                          "Required atrribute %s for graph is not set.", attr));
  }

  // Runs the pass on one graph, verifies the result and records the pass
  // type on that graph. Shared by the main graph and its sub-graphs so both
  // always receive the same checks.
  const auto apply_and_verify = [this](Graph *target_graph) {
    ApplyImpl(target_graph);
    // TODO(panyx0718): Add more verifications.
    PADDLE_ENFORCE_EQ(
        HasCircle(*target_graph),
        false,
        platform::errors::InvalidArgument(
            "Illegal pass %s. Generated graph shouldn't contain cycle.",
            Type()));
    PADDLE_ENFORCE_EQ(
        VarDescIsConsistency(*target_graph),
        true,
        platform::errors::InvalidArgument(
            "The VarDescs of persistable variable are not consistency."));
    if (!target_graph->Has(kPassRecorder)) {
      target_graph->Set<PassRecorder>(kPassRecorder, new PassRecorder);
    }
    target_graph->Get<PassRecorder>(kPassRecorder).insert(Type());
  };

  apply_and_verify(graph);

  const bool also_apply_to_sub_graphs =
      graph->IsMainGraph() &&
      std::find(support_subgraph_passes.begin(),
                support_subgraph_passes.end(),
                Type()) != support_subgraph_passes.end();
  if (also_apply_to_sub_graphs) {
    // Starts at index 1; presumably sub-graph 0 is the main graph that was
    // already processed above -- TODO confirm against Graph.
    for (size_t i = 1; i < graph->SubGraphsSize(); i++) {
      auto *sub_graph = graph->GetSubGraph(i);
      // A sub-graph without its own parameter scope borrows (does not own)
      // the scope of the main graph.
      if (!sub_graph->Has(framework::ir::kParamScopeAttr)) {
        sub_graph->SetNotOwned<Scope>(
            framework::ir::kParamScopeAttr,
            &graph->Get<Scope>(framework::ir::kParamScopeAttr));
      }
      apply_and_verify(sub_graph);
    }
  }
  applied_ = true;
#ifdef PADDLE_WITH_MKLDNN
  // Clear mkl-dnn cache,
  // Passes can change params, tensors, so caching need to be discarded
  platform::ClearMKLDNNCache(paddle::platform::CPUPlace());
#endif
  VLOG(10) << "finish to apply pass " << Type() << " to graph";
  return graph;
}

125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170
static void FillNotSpecifiedOpRole(const ProgramDesc &main_program) {
  for (size_t block_idx = 0; block_idx < main_program.Size(); ++block_idx) {
    auto ops = main_program.Block(block_idx).AllOps();
    size_t n = ops.size();
    std::vector<OpRole> roles;
    roles.reserve(n);
    auto op_role_attr = OpProtoAndCheckerMaker::OpRoleAttrName();
    for (auto *op : ops) {
      OpRole role;
      if (op->HasAttr(op_role_attr)) {
        role = static_cast<OpRole>(op->GetAttrIfExists<int>(op_role_attr));
      } else {
        role = OpRole::kNotSpecified;
      }
      roles.emplace_back(role);
    }

    // NOTE: The following codes may be wrong in some cases.
    // But how can we get the right OpRole? The right way
    // is that all passes should deal with unspecified OpRole.
    auto prev_role = OpRole::kForward;
    for (size_t i = 0; i < n; ++i) {
      if (roles[i] == OpRole::kNotSpecified) {
        VLOG(10) << "Fill op role of " << ops[i]->Type() << " as "
                 << static_cast<int>(prev_role);
        ops[i]->SetAttr(op_role_attr, static_cast<int>(prev_role));
      } else {
        prev_role = roles[i];
      }
    }
  }
}

/// Applies `passes`, in order, to a program pair.
///
/// A single pass that does not support application via Graph is run directly
/// on the ProgramDescs. Otherwise a Graph is built from `main_program`, every
/// pass is applied to it, and the graph is converted back into the two
/// programs. In both cases unspecified op roles of `main_program` are filled
/// in afterwards.
///
/// @param passes           Passes to apply; none may be nullptr. When more
///                         than one pass is given, each must support being
///                         applied via Graph.
/// @param main_program     Main program, updated in place; must not be null.
/// @param startup_program  Startup program, updated in place; must not be
///                         null.
void Pass::ApplyPassesToProgram(const std::vector<const Pass *> &passes,
                                ProgramDesc *main_program,
                                ProgramDesc *startup_program) {
  VLOG(10) << "ApplyPassesToProgram is called";
  PADDLE_ENFORCE_NOT_NULL(
      main_program,
      platform::errors::InvalidArgument("The main program must be provided."));

  PADDLE_ENFORCE_NOT_NULL(startup_program,
                          platform::errors::InvalidArgument(
                              "The startup program must be provided."));

  // Validate every pass up front, before anything is modified.
  const bool has_multiple_passes = passes.size() > 1;
  for (auto *p : passes) {
    PADDLE_ENFORCE_NOT_NULL(p,
                            platform::errors::InvalidArgument(
                                "The provided pass cannot be nullptr."));
    VLOG(10) << "Pass " << p->Type();
    if (!has_multiple_passes) {
      continue;
    }
    PADDLE_ENFORCE_EQ(p->SupportApplyProgramViaGraph(),
                      true,
                      platform::errors::PermissionDenied(
                          "Each pass must support to be applied via Graph if "
                          "multi-passes are applied."));
  }

  // Direct path: exactly one pass, and it cannot go through a Graph.
  if (passes.size() == 1) {
    const Pass *single_pass = passes.front();
    if (!single_pass->SupportApplyProgramViaGraph()) {
      VLOG(10) << "apply pass " << single_pass->Type() << " to program";
      single_pass->ApplyImpl(main_program, startup_program);
      FillNotSpecifiedOpRole(*main_program);
      VLOG(10) << "finish to apply pass " << single_pass->Type()
               << " to program";
      return;
    }
  }

  // Graph path: program -> graph -> (all passes) -> programs.
  Graph graph(*main_program);
  for (const Pass *pass : passes) {
    pass->Apply(&graph);
  }
  ConvertToPrograms(&graph, main_program, startup_program);
  FillNotSpecifiedOpRole(*main_program);
}

200 201
/// ProgramDesc overload of ApplyImpl as implemented by the Pass base class:
/// it always raises an Unimplemented error that names the pass type. Neither
/// argument is used.
void Pass::ApplyImpl(ProgramDesc *main_program,
                     ProgramDesc *startup_program) const {
  PADDLE_THROW(platform::errors::Unimplemented(
      "The pass %s does not support to apply ProgramDesc directly", Type()));
}
205

206 207
void Pass::ConvertToPrograms(Graph *graph,
                             ProgramDesc *main_program,
208
                             ProgramDesc *startup_program) {
209
  ProgramDesc new_main_program;
210
  GraphToProgram(*graph, &new_main_program);
211 212
  main_program->CopyFrom(*new_main_program.Proto());

213
  if (graph->Has(details::kStartupProgramDescs)) {
214
    const auto &startups =
215
        graph->Get<details::ProgramDescs>(details::kStartupProgramDescs);
216 217
    VLOG(10) << "Merge startup programs";
    MergePrograms(startup_program, startups, /*append=*/true);
218
    graph->Erase(details::kStartupProgramDescs);
219 220
  }

221
  if (graph->Has(details::kProgramDescs)) {
222
    const auto &mains =
223
        graph->Get<details::ProgramDescs>(details::kProgramDescs);
224 225
    VLOG(10) << "Merge main programs";
    MergePrograms(main_program, mains, /*append=*/false);
226
    graph->Erase(details::kProgramDescs);
227 228
  }

229 230 231 232
  startup_program->Flush();
  main_program->Flush();
}

233
/// Returns the single PassRegistry object, which is a function-local static
/// created the first time this function is called.
PassRegistry &PassRegistry::Instance() {
  static PassRegistry registry;
  return registry;
}
}  // namespace ir
}  // namespace framework
X
start  
Xin Pan 已提交
239
}  // namespace paddle