// Copyright (c) 2019 PaddlePaddle Authors. All Rights Reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

#pragma once

J
Jiabin Yang 已提交
17 18
#include <atomic>
#include <future>  // NOLINT
#include <map>
#include <memory>
#include <string>
#include <unordered_map>
#include <utility>
#include <vector>

#include "ThreadPool.h"
#include "paddle/fluid/framework/garbage_collector.h"
#include "paddle/fluid/imperative/amp_auto_cast.h"
#include "paddle/fluid/imperative/basic_engine.h"
#include "paddle/fluid/imperative/jit/program_desc_tracer.h"
#include "paddle/fluid/imperative/layer.h"
#include "paddle/fluid/platform/macros.h"
#include "paddle/phi/core/compat/arg_map_context.h"
32 33 34 35

namespace paddle {
namespace imperative {

L
Leo Chen 已提交
36 37
// Opaque declaration of the AmpLevel scoped enum; its enumerators are not
// listed in this header. Tracer keeps the per-thread value in `amp_level_`
// and exposes it through SetAmpLevel()/GetAmpLevel().
enum class AmpLevel;

38 39
// Opaque declaration of the AmpDtype scoped enum. Nothing else in this header
// refers to it (Tracer keeps its AMP dtype as a phi::DataType).
// NOTE(review): confirm whether other files still rely on this declaration.
enum class AmpDtype;

40 41 42 43
// Ordered map from a platform::Place to the GarbageCollector owned (through a
// unique_ptr) for that place. Tracer holds one such map in its `gcs_` member.
using GarbageCollectorMap =
    std::map<platform::Place,
             std::unique_ptr<paddle::framework::GarbageCollector>>;

44 45 46
// Produces names of the form "<prefix><key>_<id>", where <id> is a counter
// owned by the generator that starts at 0 and advances by one on every call
// to Generate(), regardless of which key is passed.
class UniqueNameGenerator {
 public:
  // `prefix` is prepended to every generated name and defaults to empty.
  // The by-value argument is moved into the member so that the string is not
  // copied a second time.
  explicit UniqueNameGenerator(std::string prefix = "")
      : prefix_(std::move(prefix)) {}

  // Returns prefix + key + "_" + <current id>, then advances the id.
  // The id is a std::atomic<int>, so the post-increment itself is atomic.
  std::string Generate(std::string key = "dygraph_tmp") {
    return prefix_ + key + "_" + std::to_string(id_++);
  }

 private:
  std::atomic<int> id_{0};  // Next id to hand out.
  std::string prefix_;      // Set once at construction.
};

56
class Tracer {
J
Jiabin Yang 已提交
57 58
  DISABLE_COPY_AND_ASSIGN(Tracer);

59
 public:
60
  Tracer()
61
      : basic_engine_(new BasicEngine()),
62
        program_desc_tracer_(new jit::ProgramDescTracer()),
63 64 65
        generator_(new UniqueNameGenerator()) {
    expected_place_ = platform::CPUPlace();
  }
66

J
Jiabin Yang 已提交
67
  ~Tracer() = default;
68

J
Jiabin Yang 已提交
69 70 71 72 73 74
  template <typename VarType>
  void TraceOp(const std::string& type, const NameVarMap<VarType>& ins,
               const NameVarMap<VarType>& outs, framework::AttributeMap attrs,
               const platform::Place& place, bool trace_backward,
               const std::map<std::string, std::string>& inplace_map = {},
               paddle::framework::AttributeMap* passed_default_attrs_ = nullptr,
75
               bool use_default_attr_map = true);
J
Jiabin Yang 已提交
76

W
wanghuancoder 已提交
77 78 79 80 81 82 83 84 85 86
  template <typename VarType>
  void TraceOpImpl(
      const std::string& type, const NameVarMap<VarType>& ins,
      const NameVarMap<VarType>& outs,
      framework::AttributeMap& attrs,  // NOLINT
      const platform::Place& place, bool trace_backward,
      const std::map<std::string, std::string>& inplace_map = {},
      paddle::framework::AttributeMap* passed_default_attrs_ = nullptr,
      bool use_default_attr_map = true);

J
Jiabin Yang 已提交
87 88
  void TraceOp(const std::string& type, const NameVarBaseMap& ins,
               const NameVarBaseMap& outs, framework::AttributeMap attrs,
89
               const std::map<std::string, std::string>& inplace_map = {});
J
Jiabin Yang 已提交
90

J
Jiabin Yang 已提交
91
  void TraceOp(const std::string& type, const NameTensorMap& ins,
W
wanghuancoder 已提交
92 93
               const NameTensorMap& outs,
               paddle::framework::AttributeMap& attrs,  // NOLINT
J
Jiabin Yang 已提交
94 95 96
               const std::map<std::string, std::string>& inplace_map = {});

  void TraceOp(const std::string& type, const NameTensorMap& ins,
W
wanghuancoder 已提交
97 98 99 100 101 102
               const NameTensorMap& outs,
               paddle::framework::AttributeMap attrs);

  void TraceOp(const std::string& type, const NameTensorMap& ins,
               const NameTensorMap& outs,
               paddle::framework::AttributeMap& attrs,  // NOLINT
J
Jiabin Yang 已提交
103 104
               const paddle::platform::Place& place,
               paddle::framework::AttributeMap* default_attrs,
105
               bool use_default_attr_map,
106
               const std::map<std::string, std::string>& inplace_map = {});
107

108 109
  bool ComputeRequiredGrad(const NameVarBaseMap& ins,
                           const NameVarBaseMap& outs, bool trace_backward);
J
Jiabin Yang 已提交
110 111
  bool ComputeRequiredGrad(const NameTensorMap& ins, const NameTensorMap& outs,
                           bool trace_backward);
J
Jiabin Yang 已提交
112

113 114 115 116 117 118 119 120 121 122 123 124
  void SetEnableProgramDescTracing(bool enabled) {
    enable_program_desc_tracing_ = enabled;
  }

  bool IsProgramDescTracingEnabled() const {
    return enable_program_desc_tracing_;
  }

  jit::ProgramDescTracer* GetProgramDescTracer() {
    return program_desc_tracer_.get();
  }

125 126 127 128 129 130 131
  // Note(Aurelius84): The `tmp` is used as prefix key while naming a temporary
  // intermediate var both in imperative and static mode. But the
  // `UniqueNameGenerator` in C++ and `unique_name.py` in Python doesn't share
  // the same auto-increment id. It will create a variable repeatedly with same
  // name like `tmp_0` in some cases when transform dygraph into static layers.
  // So we modify the default prefix key into `eager_tmp` to distinguish with
  // static graph.
132
  std::string GenerateUniqueName(std::string key = "dygraph_tmp") {
133 134 135
    return generator_->Generate(key);
  }

136 137
  BasicEngine* GetEngine() const { return basic_engine_.get(); }

138 139
  platform::Place ExpectedPlace() const { return expected_place_; }

W
WangXi 已提交
140
  void SetExpectedPlace(platform::Place place);
141

142
  bool HasGrad() const { return has_grad_; }
143

144
  void SetHasGrad(bool has_grad) { has_grad_ = has_grad; }
145

L
Leo Chen 已提交
146 147 148 149
  void SetAmpLevel(AmpLevel level) {
    VLOG(4) << "set amp_level to " << static_cast<unsigned int>(level);
    amp_level_ = level;
  }
150

L
Leo Chen 已提交
151
  AmpLevel GetAmpLevel() const { return amp_level_; }
152

153 154 155
  void SetAmpDtype(std::string amp_dtype) {
    VLOG(4) << "set amp_dtype to " << amp_dtype;
    if (amp_dtype == "float16") {
156
      amp_dtype_ = phi::DataType::FLOAT16;
157
    } else if (amp_dtype == "bfloat16") {
158
      amp_dtype_ = phi::DataType::BFLOAT16;
159
    } else {
160
      amp_dtype_ = phi::DataType::FLOAT32;
161 162 163 164
    }
  }

  std::string GetAmpDtype() const {
165
    if (amp_dtype_ == phi::DataType::FLOAT16) {
166
      return std::string("float16");
167
    } else if (amp_dtype_ == phi::DataType::BFLOAT16) {
168 169 170 171 172 173
      return std::string("bfloat16");
    } else {
      return std::string("float32");
    }
  }

174
  phi::KernelSignature GetExpectedKernelSignature(
175 176
      const std::string& type, const NameTensorMap& ins,
      const NameTensorMap& outs, framework::AttributeMap attrs) const;
177

178 179 180
  paddle::framework::GarbageCollector* MutableGarbageCollectorIfNotExists(
      const platform::Place& place);

181
 private:
182
  std::unique_ptr<BasicEngine> basic_engine_;
183
  std::unique_ptr<jit::ProgramDescTracer> program_desc_tracer_;
184
  std::unique_ptr<UniqueNameGenerator> generator_;
185
  platform::Place expected_place_;
186
  GarbageCollectorMap gcs_;
187 188

  static thread_local bool enable_program_desc_tracing_;
Z
Zeng Jinle 已提交
189
  static thread_local bool has_grad_;
190
  static thread_local AmpLevel amp_level_;
191
  static thread_local phi::DataType amp_dtype_;
192 193
};

194 195 196
// To access static variable current_tracer
// GetCurrentTracer returns a const reference to a shared_ptr<Tracer>;
// SetCurrentTracer takes the shared_ptr to use from then on. Both are only
// declared here.
// NOTE(review): whether the current tracer is process-wide or per-thread is
// not visible in this header — confirm in the implementation file.
const std::shared_ptr<Tracer>& GetCurrentTracer();
void SetCurrentTracer(const std::shared_ptr<Tracer>& tracer_);
197 198 199
// Declared here, defined elsewhere. Takes a shared VarBase and a place.
// NOTE(review): judging by the name, this keeps `var` referenced until a copy
// associated with `place` has completed — confirm against the definition.
void IncreaseVarbaseReferenceCountUntilCopyComplete(
    const std::shared_ptr<imperative::VarBase>& var,
    const platform::Place& place);
200

201 202
// Declared here, defined elsewhere.
// NOTE(review): presumably applies a stop-gradient setting to the variables
// in `outs` depending on `generate_grad` — confirm against the definition.
void PassStopGradient(const NameVarBaseMap& outs, bool generate_grad);

203 204
}  // namespace imperative
}  // namespace paddle