// backward_test.cc
// Copyright (c) 2021 PaddlePaddle Authors. All Rights Reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

#include <sstream>

#include "glog/logging.h"
#include "gtest/gtest.h"

#include "paddle/fluid/eager/accumulation/accumulation_node.h"
#include "paddle/fluid/eager/api/generated/eager_generated/backwards/scale_node.h"
#include "paddle/fluid/eager/api/utils/tensor_utils.h"
#include "paddle/fluid/eager/autograd_meta.h"
#include "paddle/fluid/eager/backward.h"
#include "paddle/fluid/eager/grad_node_info.h"
#include "paddle/fluid/eager/tests/test_utils.h"

#include "paddle/fluid/eager/api/all.h"

#include "paddle/pten/core/dense_tensor.h"
#include "paddle/pten/core/tensor_meta.h"

namespace egr {

// Backward pass through a single scale node with no user-supplied gradient.
//
// Graph built by this test (arrows follow the backward direction):
//
//   target_tensor -> GradNodeScale(scale = 5.0) -> GradNodeAccumulation
//                                                     (attached to leaf_tensor)
//
// RunBackward is called with an empty grad-tensor list and the test expects
// every element of leaf_tensor's gradient to be 5.0. That is consistent with
// an implicit seed gradient of 1.0 being scaled by 5.0 (seed behaviour is
// implemented in RunBackward, not visible here).
TEST(Backward, SingleNodeEmptyGrad) {
  // Prepare Device Contexts
  eager_test::InitEnv(paddle::platform::CPUPlace());

  // Prepare Inputs
  paddle::framework::DDim ddim = paddle::framework::make_ddim({4, 16, 16, 32});

  // Create Target Tensor (filled with 1.0, not a leaf)
  paddle::experimental::Tensor target_tensor =
      egr_utils_api::CreateTensorWithValue(
          ddim, paddle::platform::CPUPlace(), pten::DataType::FLOAT32,
          pten::DataLayout::NCHW, 1.0 /*value*/, false /*is_leaf*/);

  paddle::experimental::Tensor leaf_tensor;
  {
    // Create Scale Node
    auto node0_ptr = std::make_shared<GradNodeScale>(1, 1);
    node0_ptr->SetAttributes_scale(5.0 /*scale*/);

    // Set grad in/out meta
    node0_ptr->SetDefaultGradInOutMeta();

    // Connect Tensor and Node via AutoGradMeta.
    // The derived shared_ptr converts implicitly to the base node pointer,
    // so no explicit pointer cast is needed.
    AutogradMeta* auto_grad_meta = EagerUtils::autograd_meta(&target_tensor);
    auto_grad_meta->SetGradNode(node0_ptr);
    auto_grad_meta->SetSingleOutRankWithSlot(0, 0);
    auto_grad_meta->SetStopGradient(false);

    // Connect Tensor and AccumulationNode via AutoGradMeta
    auto acc_node_ptr = std::make_shared<egr::GradNodeAccumulation>();

    AutogradMeta* auto_grad_meta1 = EagerUtils::autograd_meta(&leaf_tensor);
    auto_grad_meta1->SetGradNode(acc_node_ptr);
    auto_grad_meta1->SetSingleOutRankWithSlot(0, 0);

    egr_utils_api::RetainGradForTensor(leaf_tensor);

    // Connect Node0 -> AccumulationNode via Edge
    auto meta = egr::AutogradMeta();
    meta.SetStopGradient(false);
    meta.SetSingleOutRankWithSlot(0, 0);
    meta.SetGradNode(acc_node_ptr);
    std::vector<egr::AutogradMeta*> res = {&meta};
    node0_ptr->AddEdges(&res, 0);
  }
  std::vector<paddle::experimental::Tensor> outs = {target_tensor};

  // Run Backward (no explicit grad tensors)
  RunBackward(outs, {});

  // Check Output Value
  eager_test::CompareGradTensorWithValue<float>(leaf_tensor, 5.0);
}

// Backward pass through a single scale node with a user-supplied gradient.
//
// Graph built by this test (arrows follow the backward direction):
//
//   target_tensors[0] -> GradNodeScale(scale = 5.0) -> GradNodeAccumulation
//                                                     (attached to leaf_tensor)
//
// A grad tensor filled with 10.0 is passed to RunBackward and the test
// expects every element of leaf_tensor's gradient to be 50.0 (10.0 * 5.0).
TEST(Backward, SingleNodeCustomGrad) {
  // Prepare Device Contexts
  eager_test::InitEnv(paddle::platform::CPUPlace());

  // Prepare Inputs
  std::vector<paddle::experimental::Tensor> target_tensors;
  paddle::framework::DDim ddim = paddle::framework::make_ddim({4, 16, 16, 32});

  // Create Target Tensor (filled with 1.0, not a leaf)
  paddle::experimental::Tensor tensor = egr_utils_api::CreateTensorWithValue(
      ddim, paddle::platform::CPUPlace(), pten::DataType::FLOAT32,
      pten::DataLayout::NCHW, 1.0 /*value*/, false /*is_leaf*/);
  target_tensors.emplace_back(std::move(tensor));

  // Create Grad Tensor (filled with 10.0)
  std::vector<paddle::experimental::Tensor> grad_tensors;
  paddle::experimental::Tensor grad_tensor =
      egr_utils_api::CreateTensorWithValue(
          ddim, paddle::platform::CPUPlace(), pten::DataType::FLOAT32,
          pten::DataLayout::NCHW, 10.0 /*value*/, false /*is_leaf*/);
  grad_tensors.emplace_back(std::move(grad_tensor));

  paddle::experimental::Tensor leaf_tensor;
  {
    // Create Scale Node
    auto node0_ptr = std::make_shared<GradNodeScale>(1, 1);
    node0_ptr->SetAttributes_scale(5.0 /*scale*/);

    // Set grad in/out meta
    node0_ptr->SetDefaultGradInOutMeta();

    // Connect Tensor and Node via AutoGradMeta.
    // The derived shared_ptr converts implicitly to the base node pointer,
    // so no explicit pointer cast is needed.
    AutogradMeta* auto_grad_meta =
        EagerUtils::autograd_meta(&(target_tensors[0]));
    auto_grad_meta->SetGradNode(node0_ptr);
    auto_grad_meta->SetSingleOutRankWithSlot(0, 0);
    auto_grad_meta->SetStopGradient(false);

    // Connect Tensor and AccumulationNode via AutoGradMeta
    auto acc_node_ptr = std::make_shared<egr::GradNodeAccumulation>();

    AutogradMeta* auto_grad_meta1 = EagerUtils::autograd_meta(&leaf_tensor);
    auto_grad_meta1->SetGradNode(acc_node_ptr);
    auto_grad_meta1->SetSingleOutRankWithSlot(0, 0);

    egr_utils_api::RetainGradForTensor(leaf_tensor);

    // Connect Node0 -> AccumulationNode via Edge
    auto meta = egr::AutogradMeta();
    meta.SetStopGradient(false);
    meta.SetSingleOutRankWithSlot(0, 0);
    meta.SetGradNode(acc_node_ptr);
    std::vector<egr::AutogradMeta*> res = {&meta};
    node0_ptr->AddEdges(&res, 0);
  }

  // Run Backward
  RunBackward(target_tensors, grad_tensors);

  // Check Output Value
  eager_test::CompareGradTensorWithValue<float>(leaf_tensor, 50.0);
}

/*
Backward pass through two chained scale nodes with no user-supplied gradient.

Graph built by this test (edges are followed top to bottom during backward):

 target_tensors[0]
        |
 Node0 (scale = 5.0)
        |
 Node1 (scale = 10.0)
        |
 GradNodeAccumulation (attached to leaf_tensor)

The test expects every element of leaf_tensor's gradient to be 50.0, which is
consistent with an implicit seed gradient of 1.0 scaled by 5.0 and then 10.0
(seed behaviour is implemented in RunBackward, not visible here).
*/
TEST(Backward, LinearNodes) {
  // Prepare Device Contexts
  eager_test::InitEnv(paddle::platform::CPUPlace());

  // Prepare Inputs
  std::vector<paddle::experimental::Tensor> target_tensors;
  paddle::framework::DDim ddim = paddle::framework::make_ddim({4, 16, 16, 32});

  // Create Target Tensor (filled with 1.0, not a leaf)
  paddle::experimental::Tensor tensor = egr_utils_api::CreateTensorWithValue(
      ddim, paddle::platform::CPUPlace(), pten::DataType::FLOAT32,
      pten::DataLayout::NCHW, 1.0 /*value*/, false /*is_leaf*/);
  target_tensors.emplace_back(std::move(tensor));

  paddle::experimental::Tensor leaf_tensor;
  {
    // Create Node0
    auto node0_ptr = std::make_shared<GradNodeScale>(1, 1);
    node0_ptr->SetAttributes_scale(5.0 /*scale*/);

    // Set grad in/out meta for node0
    node0_ptr->SetDefaultGradInOutMeta();

    // Create Node1
    auto node1_ptr = std::make_shared<GradNodeScale>(1, 1);
    node1_ptr->SetAttributes_scale(10.0 /*scale*/);

    // Set grad in/out meta for node1
    node1_ptr->SetDefaultGradInOutMeta();

    // Connect Input Tensor and Node0 via AutoGradMeta.
    // The derived shared_ptr converts implicitly to the base node pointer,
    // so no explicit pointer cast is needed.
    AutogradMeta* auto_grad_meta =
        EagerUtils::autograd_meta(&(target_tensors[0]));
    auto_grad_meta->SetGradNode(node0_ptr);
    auto_grad_meta->SetSingleOutRankWithSlot(0, 0);
    auto_grad_meta->SetStopGradient(false);

    // Connect Node0 -> Node1 via Edge
    auto meta0 = egr::AutogradMeta();
    meta0.SetStopGradient(false);
    meta0.SetSingleOutRankWithSlot(0, 0);
    meta0.SetGradNode(node1_ptr);
    std::vector<egr::AutogradMeta*> res0 = {&meta0};
    node0_ptr->AddEdges(&res0, 0);

    // Connect Tensor and AccumulationNode via AutoGradMeta
    auto acc_node_ptr = std::make_shared<egr::GradNodeAccumulation>();

    AutogradMeta* auto_grad_meta1 = EagerUtils::autograd_meta(&leaf_tensor);
    auto_grad_meta1->SetGradNode(acc_node_ptr);
    auto_grad_meta1->SetSingleOutRankWithSlot(0, 0);

    egr_utils_api::RetainGradForTensor(leaf_tensor);

    // Connect Node1 -> AccumulationNode via Edge
    auto meta1 = egr::AutogradMeta();
    meta1.SetStopGradient(false);
    meta1.SetSingleOutRankWithSlot(0, 0);
    meta1.SetGradNode(acc_node_ptr);
    std::vector<egr::AutogradMeta*> res1 = {&meta1};
    node1_ptr->AddEdges(&res1, 0);
  }

  // Use Empty Grad Tensor
  RunBackward(target_tensors, {});

  // Check Output Value
  eager_test::CompareGradTensorWithValue<float>(leaf_tensor, 50.0);
}

/*
Backward pass where two branches feed the same downstream node.

Graph built by this test (edges are followed top to bottom during backward):

 target_tensors[0]        target_tensors[1]
        |                        |
 Node0 (scale = 5.0)      Node1 (scale = 10.0)
          \                    /
           Node2 (scale = 20.0)
                    |
 GradNodeAccumulation (attached to leaf_tensor)

Grad tensors filled with 5.0 and 10.0 are supplied for the two targets. The
test expects every element of leaf_tensor's gradient to be 2500.0, which is
consistent with Node2 receiving the sum of both branches:
(5.0 * 5.0 + 10.0 * 10.0) * 20.0 = 2500.0.
*/
TEST(Backward, WithAccumulation) {
  // Prepare Device Contexts
  eager_test::InitEnv(paddle::platform::CPUPlace());

  // Prepare Inputs
  paddle::framework::DDim ddim = paddle::framework::make_ddim({4, 16, 16, 32});

  // Create Target Tensors (both filled with 1.0, not leaves)
  std::vector<paddle::experimental::Tensor> target_tensors;
  paddle::experimental::Tensor tensor0 = egr_utils_api::CreateTensorWithValue(
      ddim, paddle::platform::CPUPlace(), pten::DataType::FLOAT32,
      pten::DataLayout::NCHW, 1.0 /*value*/, false /*is_leaf*/);
  paddle::experimental::Tensor tensor1 = egr_utils_api::CreateTensorWithValue(
      ddim, paddle::platform::CPUPlace(), pten::DataType::FLOAT32,
      pten::DataLayout::NCHW, 1.0 /*value*/, false /*is_leaf*/);
  target_tensors.emplace_back(std::move(tensor0));
  target_tensors.emplace_back(std::move(tensor1));

  // Create Grad Tensors (filled with 5.0 and 10.0 respectively)
  std::vector<paddle::experimental::Tensor> grad_tensors;
  paddle::experimental::Tensor grad_tensor0 =
      egr_utils_api::CreateTensorWithValue(
          ddim, paddle::platform::CPUPlace(), pten::DataType::FLOAT32,
          pten::DataLayout::NCHW, 5.0 /*value*/, false /*is_leaf*/);
  paddle::experimental::Tensor grad_tensor1 =
      egr_utils_api::CreateTensorWithValue(
          ddim, paddle::platform::CPUPlace(), pten::DataType::FLOAT32,
          pten::DataLayout::NCHW, 10.0 /*value*/, false /*is_leaf*/);
  grad_tensors.emplace_back(std::move(grad_tensor0));
  grad_tensors.emplace_back(std::move(grad_tensor1));

  paddle::experimental::Tensor leaf_tensor;
  {
    // Create Node0
    auto node0_ptr = std::make_shared<GradNodeScale>(1, 1);
    node0_ptr->SetAttributes_scale(5.0 /*scale*/);
    node0_ptr->SetDefaultGradInOutMeta();

    // Create Node1
    auto node1_ptr = std::make_shared<GradNodeScale>(1, 1);
    node1_ptr->SetAttributes_scale(10.0 /*scale*/);
    node1_ptr->SetDefaultGradInOutMeta();

    // Create Node2
    auto node2_ptr = std::make_shared<GradNodeScale>(1, 1);
    node2_ptr->SetAttributes_scale(20.0 /*scale*/);
    node2_ptr->SetDefaultGradInOutMeta();

    // Connect Inp0 and Node0 via AutoGradMeta.
    // The derived shared_ptr converts implicitly to the base node pointer,
    // so no explicit pointer cast is needed.
    AutogradMeta* auto_grad_meta0 =
        EagerUtils::autograd_meta(&(target_tensors[0]));
    auto_grad_meta0->SetGradNode(node0_ptr);
    auto_grad_meta0->SetSingleOutRankWithSlot(0, 0);
    auto_grad_meta0->SetStopGradient(false);

    // Connect Inp1 and Node1 via AutoGradMeta
    AutogradMeta* auto_grad_meta1 =
        EagerUtils::autograd_meta(&(target_tensors[1]));
    auto_grad_meta1->SetGradNode(node1_ptr);
    auto_grad_meta1->SetSingleOutRankWithSlot(0, 0);
    auto_grad_meta1->SetStopGradient(false);

    // Connect Node0 -> Node2 via Edge
    auto meta0 = egr::AutogradMeta();
    meta0.SetStopGradient(false);
    meta0.SetSingleOutRankWithSlot(0, 0);
    meta0.SetGradNode(node2_ptr);
    std::vector<egr::AutogradMeta*> res0 = {&meta0};
    node0_ptr->AddEdges(&res0, 0);

    // Connect Node1 -> Node2 via Edge
    auto meta1 = egr::AutogradMeta();
    meta1.SetStopGradient(false);
    meta1.SetSingleOutRankWithSlot(0, 0);
    meta1.SetGradNode(node2_ptr);
    std::vector<egr::AutogradMeta*> res1 = {&meta1};
    node1_ptr->AddEdges(&res1, 0);

    // Connect Tensor and AccumulationNode via AutoGradMeta
    auto acc_node_ptr = std::make_shared<egr::GradNodeAccumulation>();

    AutogradMeta* auto_grad_meta2 = EagerUtils::autograd_meta(&leaf_tensor);
    auto_grad_meta2->SetGradNode(acc_node_ptr);
    auto_grad_meta2->SetSingleOutRankWithSlot(0, 0);

    egr_utils_api::RetainGradForTensor(leaf_tensor);

    // Connect Node2 -> AccumulationNode via Edge
    auto meta2 = egr::AutogradMeta();
    meta2.SetStopGradient(false);
    meta2.SetSingleOutRankWithSlot(0, 0);
    meta2.SetGradNode(acc_node_ptr);
    std::vector<egr::AutogradMeta*> res2 = {&meta2};
    node2_ptr->AddEdges(&res2, 0);
  }

  // Run Backward
  RunBackward(target_tensors, grad_tensors);

  // Check Output Value
  eager_test::CompareGradTensorWithValue<float>(leaf_tensor, 2500.0);
}

}  // namespace egr