// Copyright (c) 2022 PaddlePaddle Authors. All Rights Reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

#include <sstream>

#include "gtest/gtest.h"

#include "paddle/fluid/eager/api/all.h"
#include "paddle/fluid/eager/backward.h"
#include "paddle/fluid/eager/grad_node_info.h"
#include "paddle/fluid/eager/tests/test_utils.h"
#include "paddle/fluid/imperative/tracer.h"
#include "paddle/phi/core/dense_tensor.h"

#include "paddle/fluid/eager/api/generated/fluid_generated/dygraph_forward_api.h"
#include "paddle/fluid/eager/hooks.h"
#include "paddle/phi/core/kernel_registry.h"

namespace egr {

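// Gradient hook shared by the tests below: it copies the incoming gradient
// into a fresh DenseTensor and adds 3.0 to every element, so every expected
// gradient value is shifted by 3.0 whenever the hook is left in place.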
paddle::experimental::Tensor hook_function(
    const paddle::experimental::Tensor& t) {
  auto t_dense = std::dynamic_pointer_cast<phi::DenseTensor>(t.impl());

  auto ret_meta = phi::DenseTensorMeta(t_dense->dtype(), t_dense->dims(),
                                       t_dense->layout());
  auto place = t_dense->place();
  size_t bytes_size = phi::product(t_dense->dims()) * SizeOf(t_dense->dtype());
  auto ret_dense = std::make_shared<phi::DenseTensor>(
      phi::make_intrusive<paddle::experimental::SharedStorage>(
          paddle::memory::Alloc(place, bytes_size)),
      std::move(ret_meta));

  float* t_ptr = t_dense->mutable_data<float>(place);
  float* ret_ptr = ret_dense->mutable_data<float>(place);
  for (int i = 0; i < ret_dense->numel(); i++) {
    ret_ptr[i] = t_ptr[i] + 3.0;
  }

  auto ret_impl = std::dynamic_pointer_cast<phi::TensorBase>(ret_dense);
  paddle::experimental::Tensor ret;
  ret.set_impl(ret_impl);

  return ret;
}

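// Forward: sigmoid(0) = 0.5 on a 2x4x4x4 tensor of zeros. Backward:
// sigmoid'(0) = 0.25, plus 3.0 from hook_function unless the hook is removed;
// afterwards the reduce hook must have overwritten the input with 100.0.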
void test_sigmoid(bool is_remove_gradient_hook) {
  // Prepare Device Contexts
  VLOG(6) << "Init Env";
  eager_test::InitEnv(paddle::platform::CPUPlace());

  VLOG(6) << "Make Dim";
  paddle::framework::DDim ddim = phi::make_ddim({2, 4, 4, 4});

  VLOG(6) << "Make paddle::experimental::Tensor";
  paddle::experimental::Tensor tensor = egr_utils_api::CreateTensorWithValue(
      ddim, paddle::platform::CPUPlace(), phi::DataType::FLOAT32,
      phi::DataLayout::NCHW, 0.0, true);

  VLOG(6) << "Make ReduceHook function";
  auto reduce_hook = [&](void) -> void {
    auto* t_ptr = std::dynamic_pointer_cast<phi::DenseTensor>(tensor.impl())
                      ->data<float>();
    for (int i = 0; i < tensor.numel(); i++) {
      t_ptr[i] = 100.0;  // set to 100.0
    }
  };

  VLOG(6) << "Retain Grad for Tensor";
  egr_utils_api::RetainGradForTensor(tensor);

  VLOG(6) << "Register GradientHook for Tensor";
  int64_t hook_id = egr_utils_api::RegisterGradientHookForTensor(
      tensor, std::make_shared<CppTensorHook>(hook_function));

  VLOG(6) << "Register ReduceHook for Tensor";
  egr_utils_api::RegisterReduceHookForTensor(
      tensor, std::make_shared<CppTensorVoidHook>(reduce_hook));

  VLOG(6) << "Runing Forward";
  auto output_tensor = sigmoid_dygraph_function(tensor, {});
  VLOG(6) << "Finish Forward";

  eager_test::CompareTensorWithValue<float>(output_tensor, 0.5);

  std::vector<paddle::experimental::Tensor> target_tensors = {output_tensor};

  if (is_remove_gradient_hook) {
    std::shared_ptr<GradNodeBase> grad_node_tmp = EagerUtils::grad_node(tensor);
    grad_node_tmp->RemoveGradientHook(hook_id);
  }

  VLOG(6) << "Runing Backward";
  RunBackward(target_tensors, {});
  VLOG(6) << "Finish Backward";

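  // sigmoid'(0) = 0.5 * (1 - 0.5) = 0.25; hook_function adds another 3.0
  // unless the hook was removed.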
  eager_test::CompareGradTensorWithValue<float>(
      tensor, is_remove_gradient_hook ? 0.25 : 0.25 + 3.0);

  VLOG(6) << "Checking ReduceHook results";
  for (int i = 0; i < tensor.numel(); i++) {
    CHECK_EQ(std::dynamic_pointer_cast<phi::DenseTensor>(tensor.impl())
                 ->data<float>()[i],
             static_cast<float>(100.0f));
  }
  VLOG(6) << "After Tests";
}

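// Forward: 3.0 + 2.0 = 5.0 on two 4x16 tensors. Backward: both addends get a
// gradient of 1.0; Y additionally carries the gradient and reduce hooks.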
void test_elementwise_add(bool is_remove_gradient_hook) {
  // Prepare Device Contexts
  eager_test::InitEnv(paddle::platform::CPUPlace());

  auto tracer = std::make_shared<paddle::imperative::Tracer>();
  paddle::imperative::SetCurrentTracer(tracer);

  // 1. Prepare Input
  paddle::framework::DDim ddimX = phi::make_ddim({4, 16});
  paddle::experimental::Tensor X = egr_utils_api::CreateTensorWithValue(
      ddimX, paddle::platform::CPUPlace(), phi::DataType::FLOAT32,
      phi::DataLayout::NCHW, 3.0, true);
  egr_utils_api::RetainGradForTensor(X);

  paddle::framework::DDim ddimY = phi::make_ddim({4, 16});
  paddle::experimental::Tensor Y = egr_utils_api::CreateTensorWithValue(
      ddimY, paddle::platform::CPUPlace(), phi::DataType::FLOAT32,
      phi::DataLayout::NCHW, 2.0, true);

  auto reduce_hook = [&]() -> void {
    auto* t_ptr =
        std::dynamic_pointer_cast<phi::DenseTensor>(Y.impl())->data<float>();
    for (int i = 0; i < Y.numel(); i++) {
      t_ptr[i] = 100.0;  // set to 100.0
    }
  };

  egr_utils_api::RetainGradForTensor(Y);
  int64_t hook_id = egr_utils_api::RegisterGradientHookForTensor(
      Y, std::make_shared<CppTensorHook>(hook_function));
  egr_utils_api::RegisterReduceHookForTensor(
      Y, std::make_shared<CppTensorVoidHook>(reduce_hook));

  auto output_tensor = elementwise_add_dygraph_function(X, Y, {});

  eager_test::CompareTensorWithValue<float>(output_tensor, 5);
  std::vector<paddle::experimental::Tensor> target_tensors = {output_tensor};

  if (is_remove_gradient_hook) {
    std::shared_ptr<GradNodeBase> grad_node_tmp = EagerUtils::grad_node(Y);
    grad_node_tmp->RemoveGradientHook(hook_id);
  }

  RunBackward(target_tensors, {});

  eager_test::CompareGradTensorWithValue<float>(X, 1.0);
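  // d(X + Y)/dY is 1.0 everywhere; hook_function shifts it by 3.0 unless
  // the hook was removed.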
  eager_test::CompareGradTensorWithValue<float>(
      Y, is_remove_gradient_hook ? 1.0 : 1.0 + 3.0);

  // Checking ReduceHook results
  for (int i = 0; i < Y.numel(); i++) {
    CHECK_EQ(
        std::dynamic_pointer_cast<phi::DenseTensor>(Y.impl())->data<float>()[i],
        static_cast<float>(100.0f));
  }
}

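// Forward: each output element sums 16 products of 3.0 * 2.0, i.e. 96.
// Backward expectations are derived in the comment before RunBackward below.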
void test_matmul(bool is_remove_gradient_hook) {
  // Prepare Device Contexts
  eager_test::InitEnv(paddle::platform::CPUPlace());

  auto tracer = std::make_shared<paddle::imperative::Tracer>();
  paddle::imperative::SetCurrentTracer(tracer);

  // 1. Prepare Input
  paddle::framework::DDim ddimX = phi::make_ddim({4, 16});
  paddle::experimental::Tensor X = egr_utils_api::CreateTensorWithValue(
      ddimX, paddle::platform::CPUPlace(), phi::DataType::FLOAT32,
      phi::DataLayout::NCHW, 3.0, true);
  egr_utils_api::RetainGradForTensor(X);

  paddle::framework::DDim ddimY = phi::make_ddim({16, 20});
  paddle::experimental::Tensor Y = egr_utils_api::CreateTensorWithValue(
      ddimY, paddle::platform::CPUPlace(), phi::DataType::FLOAT32,
      phi::DataLayout::NCHW, 2.0, true);

  auto reduce_hook = [&](void) -> void {
    auto* t_ptr =
        std::dynamic_pointer_cast<phi::DenseTensor>(Y.impl())->data<float>();
    for (int i = 0; i < Y.numel(); i++) {
      t_ptr[i] = 100.0;  // set to 100.0
    }
  };

  egr_utils_api::RetainGradForTensor(Y);
  int64_t hook_id = egr_utils_api::RegisterGradientHookForTensor(
      Y, std::make_shared<CppTensorHook>(hook_function));
  egr_utils_api::RegisterReduceHookForTensor(
      Y, std::make_shared<CppTensorVoidHook>(reduce_hook));

  auto output_tensor = matmul_v2_dygraph_function(
      X, Y, {{"trans_x", false}, {"trans_y", false}});

  eager_test::CompareTensorWithValue<float>(output_tensor, 96);
  std::vector<paddle::experimental::Tensor> target_tensors = {output_tensor};

  if (is_remove_gradient_hook) {
    std::shared_ptr<GradNodeBase> grad_node_tmp = EagerUtils::grad_node(Y);
    grad_node_tmp->RemoveGradientHook(hook_id);
  }

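  // With the output gradient seeded with ones, dX[i][k] = sum_j Y[k][j] =
  // 2.0 * 20 and dY[k][j] = sum_i X[i][k] = 3.0 * 4; Y's gradient gains an
  // extra 3.0 from hook_function unless the hook was removed.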
  RunBackward(target_tensors, {});

  eager_test::CompareGradTensorWithValue<float>(X, 2.0 * 20);
  eager_test::CompareGradTensorWithValue<float>(
      Y, is_remove_gradient_hook ? 3.0 * 4 : 3.0 * 4 + 3);

  // Checking ReduceHook results
  for (int i = 0; i < Y.numel(); i++) {
    CHECK_EQ(
        std::dynamic_pointer_cast<phi::DenseTensor>(Y.impl())->data<float>()[i],
        static_cast<float>(100.0f));
  }
}

TEST(Hook_intermidiate, Sigmoid) {
  // Each test runs twice: once removing the gradient hook, once keeping it.
  test_sigmoid(true);
  test_sigmoid(false);
}

TEST(Hook_intermidiate, ElementwiseAdd) {
  test_elementwise_add(true);
  test_elementwise_add(false);
}

TEST(Hook_intermidiate, Matmul_v2) {
  test_matmul(true);
  test_matmul(false);
}
}  // namespace egr

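// Make sure the operators exercised above are linked into the test binary.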
USE_OP(sigmoid);
USE_OP_ITSELF(elementwise_add);
USE_OP_ITSELF(matmul_v2);