// File: accumulation_node.h
// Copyright (c) 2021 PaddlePaddle Authors. All Rights Reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

#pragma once

#include <functional>
#include <memory>
#include <string>
#include <vector>

#include "paddle/fluid/eager/autograd_meta.h"
#include "paddle/fluid/eager/grad_node_info.h"
#include "paddle/fluid/eager/hooks.h"

namespace egr {

class GradNodeAccumulation : public GradNodeBase {
 public:
  // Constructor: configure fwd input tensors to grad node
26
  explicit GradNodeAccumulation(AutogradMeta* meta) : GradNodeBase(1, 1) {
J
Jiabin Yang 已提交
27
    VLOG(6) << "Construct GradNodeAccumulation";
28 29 30 31
    if (meta) {
      weak_grad_ = meta->WeakGrad();
    }

32 33
    SetDefaultGradInOutMeta();
  }
34

J
Jiabin Yang 已提交
35 36 37
  ~GradNodeAccumulation() override {
    VLOG(6) << "Destruct GradNodeAccumulation";
  }
38 39

  // Functor: perform backward computations
40 41 42 43
  virtual paddle::small_vector<std::vector<paddle::experimental::Tensor>,
                               kSlotSmallVectorSize>
  operator()(paddle::small_vector<std::vector<paddle::experimental::Tensor>,
                                  kSlotSmallVectorSize>& grads,  // NOLINT
44 45
             bool create_graph = false,
             bool is_new_grad = false) override;
46 47 48

  void ClearTensorWrappers() override { VLOG(6) << "Do nothing here now"; }

49 50
  std::string name() { return "GradNodeAccumulation"; }

51 52 53
  /**
   * Register ReduceHook
   * **/
54
  void RegisterReduceHook(std::shared_ptr<TensorVoidHook>&& hook);
55 56 57 58 59 60 61

  /**
   * Apply ReduceHook here
   * **/
  inline bool ReduceHooksRegistered() { return reduce_hooks_.size() != 0; }
  void ApplyReduceHooks();

62 63 64 65 66
  std::shared_ptr<GradNodeBase> Copy() const override {
    return std::shared_ptr<GradNodeAccumulation>(
        new GradNodeAccumulation(nullptr));
  }

J
Jiabin Yang 已提交
67 68
  void SetFakeEmpty(bool is_fake_empty) { is_fake_empty_ = is_fake_empty; }

69
 private:
J
Jiabin Yang 已提交
70 71
  // TODO(Jiabin): remove this when we make our clear gradient really cleared;
  bool is_fake_empty_ = {false};
72
  std::weak_ptr<paddle::experimental::Tensor> weak_grad_;
J
Jiabin Yang 已提交
73
  std::vector<std::shared_ptr<TensorVoidHook>> reduce_hooks_;
74 75 76
  std::function<paddle::experimental::Tensor(
      const paddle::experimental::Tensor&)>
      retain_grad_hook_;
77 78 79
};

}  // namespace egr