layer.cc 8.6 KB
Newer Older
J
Jiabin Yang 已提交
1
// Copyright (c) 2019 PaddlePaddle Authors. All Rights Reserved.
2 3 4 5 6 7 8 9 10 11 12 13 14 15
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

#include "paddle/fluid/imperative/layer.h"
16
#include <algorithm>
J
Jiabin Yang 已提交
17
#include <queue>
18 19
#include <utility>
#include "paddle/fluid/framework/op_registry.h"
J
Jiabin Yang 已提交
20 21 22
#include "paddle/fluid/framework/variable_helper.h"
#include "paddle/fluid/imperative/prepared_operator.h"
#include "paddle/fluid/operators/math/math_function.h"
M
minqiyang 已提交
23
#include "paddle/fluid/platform/device_context.h"
J
Jiabin Yang 已提交
24
#include "paddle/fluid/platform/enforce.h"
C
chengduo 已提交
25
#include "paddle/fluid/platform/profiler.h"
26 27 28 29

namespace paddle {
namespace imperative {

J
Jiabin Yang 已提交
30
using framework::Variable;
Z
Zeng Jinle 已提交
31 32 33 34 35 36 37 38
void ThreadSafeNameSet::Insert(const std::string& name) {
  std::lock_guard<std::mutex> guard(mtx_);
  set_.insert(name);
}

void ThreadSafeNameSet::Remove(const std::string& name) {
  std::lock_guard<std::mutex> guard(mtx_);
  auto iter = set_.find(name);
J
Jiabin Yang 已提交
39
  PADDLE_ENFORCE_EQ(iter != set_.end(), true, "%s does not exist", name);
Z
Zeng Jinle 已提交
40 41 42 43 44 45 46 47 48 49 50 51
  set_.erase(iter);
}

std::vector<std::string> ThreadSafeNameSet::Names() const {
  std::lock_guard<std::mutex> guard(mtx_);
  return std::vector<std::string>(set_.begin(), set_.end());
}

ThreadSafeNameSet VarBase::name_set_;

std::vector<std::string> VarBase::AliveVarNames() { return name_set_.Names(); }

J
Jiabin Yang 已提交
52 53 54 55 56
static framework::VariableNameMap CreateVarNameMap(
    const framework::OpInfo& op_info, const std::string& op_type,
    const NameVarBaseMap& varbase_map, bool is_input) {
  if (op_info.proto_ == nullptr) {
    return {};
M
minqiyang 已提交
57 58
  }

J
Jiabin Yang 已提交
59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78
  framework::VariableNameMap result;

  for (auto& var :
       is_input ? op_info.Proto().inputs() : op_info.Proto().outputs()) {
    auto it = varbase_map.find(var.name());
    if (it == varbase_map.end()) {
      PADDLE_ENFORCE_EQ(
          var.dispensable(), true,
          "Var: %s not dispensable and there are no such var in inputs",
          var.name());
      result[var.name()] = {};
    } else {
      auto& var_vector = it->second;
      std::vector<std::string> args;
      args.reserve(var_vector.size());
      for (auto& var_base : var_vector) {
        args.emplace_back(var_base->Name());
      }
      result[var.name()] = std::move(args);
    }
M
minqiyang 已提交
79
  }
J
Jiabin Yang 已提交
80 81
  return result;
}
M
minqiyang 已提交
82

J
Jiabin Yang 已提交
83 84 85 86 87 88 89 90 91
static framework::RuntimeContext PrepareRuntimeContext(
    const NameVarBaseMap& ins, const NameVarBaseMap& outs) {
  framework::VariableValueMap inputs, outputs;
  for (auto& in_pair : ins) {
    auto& in_ctx = inputs[in_pair.first];
    in_ctx.reserve(in_pair.second.size());
    for (auto& in_var : in_pair.second) {
      in_ctx.emplace_back(in_var->MutableVar());
    }
M
minqiyang 已提交
92 93
  }

J
Jiabin Yang 已提交
94 95 96 97 98
  for (auto& out_pair : outs) {
    auto& out_ctx = outputs[out_pair.first];
    out_ctx.reserve(out_pair.second.size());
    for (auto& out_var : out_pair.second) {
      out_ctx.emplace_back(out_var->MutableVar());
99
    }
J
Jiabin Yang 已提交
100 101 102 103 104 105 106 107 108
  }
  return framework::RuntimeContext(std::move(inputs), std::move(outputs));
}

static std::string DebugString(
    const std::string& name,
    const std::vector<std::shared_ptr<VarBase>>& vars) {
  std::stringstream ss;
  ss << name << "{";
M
minqiyang 已提交
109

J
Jiabin Yang 已提交
110 111
  for (size_t i = 0; i < vars.size(); ++i) {
    if (i > 0) ss << ", ";
M
minqiyang 已提交
112

J
Jiabin Yang 已提交
113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135
    if (vars[i] == nullptr) {
      ss << "NULL";
      continue;
    }
    ss << vars[i]->Name() << "[";
    auto& var = vars[i]->Var();
    if (!var.IsInitialized()) {
      ss << "NOT_INITED_VAR";
    } else if (var.IsType<framework::LoDTensor>()) {
      auto& tensor = var.Get<framework::LoDTensor>();
      ss << "LoDTensor<";
      if (tensor.IsInitialized()) {
        ss << framework::DataTypeToString(tensor.type()) << ", ";
        ss << tensor.place() << ", ";
        ss << "(" << tensor.dims() << ")";
      } else {
        ss << "NOT_INITED";
      }
      ss << ">";
    } else {
      ss << "UNRESOLVED_TYPE";
    }
    ss << "]";
136
  }
137

J
Jiabin Yang 已提交
138 139
  ss << "}";
  return ss.str();
140 141
}

J
Jiabin Yang 已提交
142 143 144 145 146 147 148 149 150 151 152 153 154
std::string LayerDebugString(const std::string& op_type,
                             const NameVarBaseMap& ins,
                             const NameVarBaseMap& outs) {
  std::stringstream ss;
  ss << "Op(" << op_type << "): ";

  ss << "Inputs: ";

  size_t i = 0;
  for (auto& pair : ins) {
    if (i > 0) ss << ", ";
    ss << DebugString(pair.first, pair.second);
    ++i;
155 156
  }

J
Jiabin Yang 已提交
157 158 159 160 161 162 163 164 165
  ss << ",   Outputs: ";
  i = 0;
  for (auto& pair : outs) {
    if (i > 0) ss << ", ";
    ss << DebugString(pair.first, pair.second);
    ++i;
  }
  return ss.str();
}
166

J
Jiabin Yang 已提交
167 168 169 170 171 172
void VarBase::AddGradOps(const std::weak_ptr<OpBase>& op) {
  if (op.lock() == nullptr) {
    return;
  }
  for (const auto& cur_op : grad_ops_) {
    if (cur_op.lock() == op.lock()) {
173 174
      return;
    }
175
  }
J
Jiabin Yang 已提交
176 177
  grad_ops_.emplace_back(op);
}
178

J
Jiabin Yang 已提交
179 180 181 182 183 184 185
void VarBase::ClearGradient() {
  if (grad_var_) {
    auto* grad_t = grad_var_->var_.GetMutable<framework::LoDTensor>();
    if (grad_t->IsInitialized()) {
      auto* dev_ctx =
          platform::DeviceContextPool::Instance().Get(grad_t->place());
      operators::math::set_constant(*dev_ctx, grad_t, 0.0);
186 187
    }
  }
J
Jiabin Yang 已提交
188
}
189

J
Jiabin Yang 已提交
190
std::shared_ptr<VarBase> VarBase::NewVarBase(const platform::Place& dst_place,
M
minqiyang 已提交
191
                                             const bool blocking) const {
J
Jiabin Yang 已提交
192 193 194 195 196 197 198 199 200 201 202 203 204 205 206
  PADDLE_ENFORCE_EQ(var_.IsInitialized() && var_.IsType<framework::LoDTensor>(),
                    true,
                    "Variable must be initialized and type of LoDTensor when "
                    "getting numpy tensor");

  auto& src_tensor = var_.Get<framework::LoDTensor>();

  // TODO(Jiabin): change this after move unique_name generator to CXX
  auto new_var = std::make_shared<VarBase>(
      false, "Itmp" + std::to_string(copied_counter_++));

  auto* dst_tensor = new_var->var_.GetMutable<framework::LoDTensor>();
  dst_tensor->set_lod(src_tensor.lod());

  framework::TensorCopy(src_tensor, dst_place, dst_tensor);
P
Paddle CI 已提交
207
  if (blocking) {
208 209 210 211 212
    platform::DeviceContextPool::Instance().Get(dst_place)->Wait();
    auto src_place = src_tensor.place();
    if (!(src_place == dst_place)) {
      platform::DeviceContextPool::Instance().Get(src_place)->Wait();
    }
P
Paddle CI 已提交
213 214 215
  }

  if (platform::is_gpu_place(dst_place)) {
216
    VLOG(3) << "copy tensor " << Name() << " from gpu";
M
minqiyang 已提交
217 218
  }

P
Paddle CI 已提交
219
  return new_var;
M
minqiyang 已提交
220
}
J
Jiabin Yang 已提交
221 222 223 224 225 226 227 228 229 230 231
// create OpBase from optype
OpBase::OpBase(size_t id, const std::string& type, const NameVarBaseMap& ins,
               const NameVarBaseMap& outs, framework::AttributeMap attrs,
               const platform::Place& place)
    : id_(id), place_(place) {
  const auto& info = framework::OpInfoMap::Instance().Get(type);

  // Step 1: Run forward
  if (info.Checker() != nullptr) {
    info.Checker()->Check(&attrs);
  }
M
minqiyang 已提交
232

J
Jiabin Yang 已提交
233 234 235 236 237 238
  auto input_name_map = CreateVarNameMap(info, type, ins, true);
  auto output_name_map = CreateVarNameMap(info, type, outs, false);
  op_ = framework::OpRegistry::CreateOp(type, std::move(input_name_map),
                                        std::move(output_name_map),
                                        std::move(attrs));
  VLOG(3) << "Construct Op: " << type << std::endl;
239 240
}

J
Jiabin Yang 已提交
241 242 243 244 245 246
// create OpBase from opdesc
OpBase::OpBase(size_t id, const framework::OpDesc& op_desc,
               const platform::Place& place)
    : id_(id), op_(framework::OpRegistry::CreateOp(op_desc)), place_(place) {
  VLOG(3) << "Construct Op: " << op_desc.Type() << std::endl;
}
247

J
Jiabin Yang 已提交
248 249 250 251 252 253 254
void OpBase::Run(const NameVarBaseMap& ins, const NameVarBaseMap& outs) {
  auto* op_kernel = dynamic_cast<framework::OperatorWithKernel*>(op_.get());
  PADDLE_ENFORCE_NOT_NULL(op_kernel, "only support op with kernel");
  auto& info = op_->Info();
  if (info.infer_var_type_) {
    RuntimeInferVarTypeContext infer_var_type_ctx(ins, &outs, op_->Attrs());
    info.infer_var_type_(&infer_var_type_ctx);
X
Xin Pan 已提交
255
  }
X
Xin Pan 已提交
256

J
Jiabin Yang 已提交
257 258 259 260
  // Initialize output var type
  for (auto& var_pair : outs) {
    for (auto& var : var_pair.second) {
      InitializeVariable(var->MutableVar(), var->Type());
261 262
    }
  }
X
Xin Pan 已提交
263

J
Jiabin Yang 已提交
264 265 266 267
  VLOG(3) << "Running Op " << Type();
  VLOG(5) << LayerDebugString(Type(), ins, outs);
  auto runtime_ctx = PrepareRuntimeContext(ins, outs);
  auto runtime_place = PreparedOp::GetExpectedPlace(place(), ins);
268

J
Jiabin Yang 已提交
269 270
  auto prepared_op =
      PreparedOp::Prepare(runtime_ctx, *op_kernel, runtime_place);
271

J
Jiabin Yang 已提交
272
  prepared_op.Run();
273

J
Jiabin Yang 已提交
274
  VLOG(4) << LayerDebugString(Type(), ins, outs);
275 276
}

J
Jiabin Yang 已提交
277 278 279 280
void OpBase::ClearBackwardTrace() {
  grad_pending_ops_.clear();
  ins_.clear();
  outs_.clear();
281 282 283 284
}

}  // namespace imperative
}  // namespace paddle