tracer.cc 6.3 KB
Newer Older
J
Jiabin Yang 已提交
1
// Copyright (c) 2019 PaddlePaddle Authors. All Rights Reserved.
2 3 4 5 6 7 8 9 10 11 12 13 14
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
#include "paddle/fluid/imperative/tracer.h"
H
hong 已提交
15
#include <set>
M
minqiyang 已提交
16
#include <unordered_set>
17
#include <utility>
C
chengduo 已提交
18
#include "paddle/fluid/platform/profiler.h"
M
minqiyang 已提交
19

20
namespace paddle {
M
minqiyang 已提交
21 22
namespace imperative {

23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52
// Replaces the inputs of `op` that its NoNeedBufferVarsInferer reports as not
// needing a data buffer with freshly created VarBase objects.
//
// Each replacement is constructed as VarBase(false, <original name>) and its
// LoDTensor is resized to the dims of the original tensor; no other state of
// the original variable is carried over here.
//
// The function is a no-op when the op has no inferer or when the inferer
// returns no slots. Slots missing from the op's input map and null entries
// inside a slot are skipped. Every non-null entry must hold a
// framework::LoDTensor, otherwise PADDLE_ENFORCE_EQ fails.
static void ClearNoNeedBufferInputs(OpBase* op) {
  auto& inferer = op->Info().NoNeedBufferVarsInferer();
  if (!inferer) return;
  auto* ins = op->GetMutableInsMap();
  const auto& no_need_buffer_slots =
      inferer(*ins, op->GetOutsMap(), op->Attrs());
  if (no_need_buffer_slots.empty()) return;

  for (auto& slot : no_need_buffer_slots) {
    auto iter = ins->find(slot);
    if (iter == ins->end()) continue;
    VLOG(2) << "Clear data buffer of " << slot << " in " << op->Type();

    for (auto& each_var : iter->second) {
      if (!each_var) continue;

      auto& var = each_var->Var();
      PADDLE_ENFORCE_EQ(var.IsType<framework::LoDTensor>(), true,
                        "Only support LoDTensor");
      // TODO(zjl): support higher order derivatives
      // Own the replacement through a unique_ptr until it is handed over to
      // each_var, so it is not leaked if any call below throws.
      std::unique_ptr<VarBase> new_var(new VarBase(false, each_var->Name()));
      auto* new_tensor =
          new_var->MutableVar()->GetMutable<framework::LoDTensor>();
      auto& old_tensor = var.Get<framework::LoDTensor>();
      new_tensor->Resize(old_tensor.dims());
      // `var` and `old_tensor` were obtained through the old each_var and
      // must not be used after this reset.
      each_var.reset(new_var.release());
    }
  }
}

H
hong 已提交
53 54 55 56 57
// Creates the grad ops for the forward op `fw_op_base` by invoking the
// dygraph_grad_op_maker_ reachable through fw_op_base->Info(), passing along
// the forward inputs `in` and outputs `out`.
// Returns an empty vector when no such maker is set.
static std::vector<std::unique_ptr<OpBase>> CreateGradOpBases(
    const OpBase* fw_op_base, const NameVarBaseMap& in,
    const NameVarBaseMap& out) {
  const auto& grad_op_maker = fw_op_base->Info().dygraph_grad_op_maker_;
  if (!grad_op_maker) {
    return {};
  }
  return grad_op_maker(fw_op_base, in, out);
}

63 64 65 66 67 68 69 70 71 72
// Calls InnerSetOverridedStopGradient(generate_grad) on every variable in
// every slot of `outs`, logging each assignment at VLOG level 6.
static void PassStopGradient(const NameVarBaseMap& outs, bool generate_grad) {
  for (const auto& slot : outs) {
    const auto& slot_vars = slot.second;
    for (const auto& out_var : slot_vars) {
      VLOG(6) << "Set output: " << out_var->Name()
              << "'s OverridedStopGradient as " << generate_grad;
      out_var->InnerSetOverridedStopGradient(generate_grad);
    }
  }
}

J
Jiabin Yang 已提交
73 74 75 76 77 78 79 80 81
void Tracer::TraceOp(const std::string& type, const NameVarBaseMap& ins,
                     const NameVarBaseMap& outs, framework::AttributeMap attrs,
                     const platform::Place& place, bool trace_backward) {
  platform::RecordEvent event(type);
  VLOG(1) << "Trace Op: " << type;
  size_t op_id = GenerateUniqueId();
  auto op = OpBase::Create(op_id, type, ins, outs, std::move(attrs), place);
  op->Run(ins, outs);

82 83 84 85 86
  if (enable_program_desc_tracing_) {
    VLOG(5) << "Trace op " << type << " into ProgramDesc";
    program_desc_tracer_->InsertOp(type, ins, outs, op->Attrs());
  }

J
Jiabin Yang 已提交
87
  if (ComputeRequiredGrad(ins, outs, trace_backward)) {
H
hong 已提交
88
    TraceBackward(op, ins, outs);
89 90
  } else {
    VLOG(3) << "No Grad to track for Op: " << type;
91
  }
M
minqiyang 已提交
92 93
}

J
Jiabin Yang 已提交
94
// Decides whether the backward pass must be traced for an op.
//
// Returns false immediately when `trace_backward` is false. Otherwise scans
// `ins` for the first variable whose OverridedStopGradient() is false; when
// one is found, its OverridedStopGradient() value is passed on to every
// variable in `outs` via PassStopGradient() and true is returned. Returns
// false when no such input exists.
bool Tracer::ComputeRequiredGrad(const NameVarBaseMap& ins,
                                 const NameVarBaseMap& outs,
                                 bool trace_backward) {
  if (trace_backward) {
    for (const auto& slot : ins) {
      for (const auto& in_var : slot.second) {
        if (in_var->OverridedStopGradient()) continue;

        VLOG(6) << "Find out input: " << in_var->Name()
                << "'s GeneratedGrad is True";
        PassStopGradient(outs, in_var->OverridedStopGradient());
        return true;
      }
    }
  }
  return false;
}

J
Jiabin Yang 已提交
112 113 114 115 116 117
void Tracer::TraceBackward(const std::shared_ptr<OpBase>& fwd_op,
                           const NameVarBaseMap& ins,
                           const NameVarBaseMap& outs) {
  // grad_to_var is a map of framework::GradVarName(in_var_name/out_var_name) ->
  // in_var_name/out_var_name
  std::unordered_map<std::string, std::string> grad_to_var;
118

J
Jiabin Yang 已提交
119
  // Get grad_op_desc using fwd_op_desc
H
hong 已提交
120 121
  std::vector<std::unique_ptr<OpBase>> grad_op_bases_ =
      CreateGradOpBases(fwd_op.get(), ins, outs);
122

H
hong 已提交
123
  size_t grad_op_num = grad_op_bases_.size();
124

H
hong 已提交
125 126 127 128
  std::set<VarBase*> set_input_vars;
  for (auto& fwd_in_it : ins) {
    for (auto& var_base_it : fwd_in_it.second) {
      set_input_vars.insert(var_base_it.get());
M
minqiyang 已提交
129 130 131
    }
  }

H
hong 已提交
132 133 134
  for (auto& fwd_out_it : outs) {
    for (auto& var_base_it : fwd_out_it.second) {
      set_input_vars.insert(var_base_it.get());
M
minqiyang 已提交
135 136 137
    }
  }

H
hong 已提交
138
  for (size_t i = 0; i < grad_op_num; ++i) {
J
Jiabin Yang 已提交
139 140
    size_t trace_id = fwd_op->id();

H
hong 已提交
141 142 143 144 145 146 147 148 149 150 151 152
    std::shared_ptr<OpBase> grad_op = std::move(grad_op_bases_[i]);
    grad_op->SetId(trace_id);
    grad_op->SetPlace(fwd_op->place());
    grad_op->CreateOperatorBase();

    auto& grad_in = *(grad_op->GetMutableInsMap());
    auto& grad_out = *(grad_op->GetMutableOutsMap());
    for (auto& grad_in_it : grad_in) {
      for (auto& var_base_it : grad_in_it.second) {
        if (set_input_vars.count(var_base_it.get()) == 0) {
          var_base_it->AddGradOps(grad_op);
          engine_->InsertGradVar(var_base_it.get());
J
Jiabin Yang 已提交
153 154 155
        }
      }
    }
156

157
    std::set<OpBase*> visited_preceding_ops;
H
hong 已提交
158 159 160 161 162 163 164 165 166
    for (auto& grad_out_it : grad_out) {
      bool flag_clear_list = false;
      for (auto& var_base_it : grad_out_it.second) {
        if ((!var_base_it->OverridedStopGradient()) ||
            (grad_out_it.second.size() > 1)) {
          auto preceding_ops = var_base_it->GradOps();
          if (!preceding_ops.empty()) {
            for (const auto& op : preceding_ops) {
              visited_preceding_ops.insert(op);
J
Jiabin Yang 已提交
167 168 169
            }
          }
        } else {
H
hong 已提交
170
          flag_clear_list = true;
M
minqiyang 已提交
171 172
        }
      }
H
hong 已提交
173 174 175
      if (flag_clear_list) {
        grad_out_it.second.clear();
      }
M
minqiyang 已提交
176
    }
H
hong 已提交
177 178 179 180 181 182 183
    std::vector<OpBase*> vec_preceding_ops(visited_preceding_ops.begin(),
                                           visited_preceding_ops.end());

    grad_op->SetGradPendingOps(std::move(vec_preceding_ops));

    // this OpBase* is just used to manage op's life time
    engine_->InsertOp(grad_op.get(), grad_op);
184
    ClearNoNeedBufferInputs(grad_op.get());
M
minqiyang 已提交
185 186
  }
}
J
Jiabin Yang 已提交
187

M
minqiyang 已提交
188
}  // namespace imperative
189
}  // namespace paddle