[CustomOP Unittest] XPU unittest only keep forward test (#53021)

89d1dd2e · HongyuJia · GitHub · e8d296ef · 89d1dd2e · 89d1dd2e
隐藏空白更改
内联 | 并排

Showing 2 changed files with 3 additions and 280 deletions

test/custom_op/custom_relu_op_xpu.cc +0 -127

test/custom_op/test_custom_relu_op_xpu_setup.py +3 -153

未找到文件。
--- a/test/custom_op/custom_relu_op_xpu.cc
+++ b/test/custom_op/custom_relu_op_xpu.cc
@@ -31,28 +31,6 @@ void relu_cpu_forward_kernel(const data_t* x_data,
  }
 }
-template <typename data_t>
-void relu_cpu_backward_kernel(const data_t* grad_out_data,
-                              const data_t* out_data,
-                              data_t* grad_x_data,
-                              int64_t out_numel) {
-  for (int64_t i = 0; i < out_numel; ++i) {
-    grad_x_data[i] =
-        grad_out_data[i] * (out_data[i] > static_cast<data_t>(0) ? 1. : 0.);
-  }
-}
-template <typename data_t>
-void relu_cpu_double_backward_kernel(const data_t* out_data,
-                                     const data_t* ddx_data,
-                                     data_t* ddout_data,
-                                     int64_t ddout_numel) {
-  for (int64_t i = 0; i < ddout_numel; ++i) {
-    ddout_data[i] =
-        ddx_data[i] * (out_data[i] > static_cast<data_t>(0) ? 1. : 0.);
-  }
-}
 std::vector<paddle::Tensor> relu_cpu_forward(const paddle::Tensor& x) {
  CHECK_CPU_INPUT(x);
  auto out = paddle::empty_like(x);
@@ -66,77 +44,12 @@ std::vector<paddle::Tensor> relu_cpu_forward(const paddle::Tensor& x) {
  return {out};
 }
-std::vector<paddle::Tensor> relu_cpu_backward(const paddle::Tensor& x,
-                                              const paddle::Tensor& out,
-                                              const paddle::Tensor& grad_out) {
-  auto grad_x = paddle::empty_like(x);
-  PD_DISPATCH_FLOATING_TYPES(out.type(), "relu_cpu_backward", ([&] {
-                               relu_cpu_backward_kernel<data_t>(
-                                   grad_out.data<data_t>(),
-                                   out.data<data_t>(),
-                                   grad_x.data<data_t>(),
-                                   out.size());
-                             }));
-  return {grad_x};
-}
-std::vector<paddle::Tensor> relu_cpu_double_backward(
-    const paddle::Tensor& out, const paddle::Tensor& ddx) {
-  CHECK_CPU_INPUT(out);
-  CHECK_CPU_INPUT(ddx);
-  auto ddout = paddle::empty(out.shape(), out.dtype(), out.place());
-  PD_DISPATCH_FLOATING_TYPES(out.type(), "relu_cpu_double_backward", ([&] {
-                               relu_cpu_double_backward_kernel<data_t>(
-                                   out.data<data_t>(),
-                                   ddx.data<data_t>(),
-                                   ddout.mutable_data<data_t>(out.place()),
-                                   ddout.size());
-                             }));
-  return {ddout};
-}
 std::vector<paddle::Tensor> relu_xpu_forward(const paddle::Tensor& x) {
  CHECK_XPU_INPUT(x);
  auto out = paddle::relu(x);
  return {out};
 }
-std::vector<paddle::Tensor> relu_xpu_backward(const paddle::Tensor& x,
-                                              const paddle::Tensor& out,
-                                              const paddle::Tensor& grad_out) {
-  CHECK_XPU_INPUT(x);
-  CHECK_XPU_INPUT(out);
-  CHECK_XPU_INPUT(grad_out);
-  auto grad_x = paddle::empty_like(x, x.dtype(), x.place());
-  auto ones = paddle::experimental::full_like(x, 1.0, x.dtype(), x.place());
-  auto zeros = paddle::experimental::full_like(x, 0.0, x.dtype(), x.place());
-  auto condition = paddle::experimental::greater_than(x, zeros);
-  grad_x = grad_out * paddle::where(condition, ones, zeros);
-  return {grad_x};
-}
-std::vector<paddle::Tensor> relu_xpu_double_backward(
-    const paddle::Tensor& out, const paddle::Tensor& ddx) {
-  CHECK_XPU_INPUT(out);
-  CHECK_XPU_INPUT(ddx);
-  auto ddout = paddle::empty(out.shape(), out.dtype(), out.place());
-  auto ones =
-      paddle::experimental::full_like(out, 1.0, out.dtype(), out.place());
-  auto zeros =
-      paddle::experimental::full_like(out, 0.0, out.dtype(), out.place());
-  auto condition = paddle::experimental::greater_than(out, zeros);
-  ddout = paddle::multiply(ddx, paddle::where(condition, ones, zeros));
-  return {ddout};
-}
 std::vector<paddle::Tensor> ReluForward(const paddle::Tensor& x) {
  if (x.is_cpu()) {
    return relu_cpu_forward(x);
@@ -147,47 +60,7 @@ std::vector<paddle::Tensor> ReluForward(const paddle::Tensor& x) {
  }
 }
-std::vector<paddle::Tensor> ReluBackward(const paddle::Tensor& x,
-                                         const paddle::Tensor& out,
-                                         const paddle::Tensor& grad_out) {
-  if (x.is_cpu()) {
-    return relu_cpu_backward(x, out, grad_out);
-  } else if (x.is_xpu()) {
-    return relu_xpu_backward(x, out, grad_out);
-  } else {
-    PD_THROW("Not implemented.");
-  }
-}
-std::vector<paddle::Tensor> ReluDoubleBackward(const paddle::Tensor& out,
-                                               const paddle::Tensor& ddx) {
-  if (out.is_cpu()) {
-    return relu_cpu_double_backward(out, ddx);
-  } else if (out.place().GetType() == phi::AllocationType::XPU) {
-    return relu_xpu_double_backward(out, ddx);
-  } else {
-    PD_THROW("Not implemented.");
-  }
-}
-std::vector<std::vector<int64_t>> ReluDoubleBackwardInferShape(
-    const std::vector<int64_t>& out_shape,
-    const std::vector<int64_t>& ddx_shape) {
-  return {out_shape};
-}
 PD_BUILD_OP(custom_relu)
    .Inputs({"X"})
    .Outputs({"Out"})
    .SetKernelFn(PD_KERNEL(ReluForward));
-PD_BUILD_GRAD_OP(custom_relu)
-    .Inputs({"X", "Out", paddle::Grad("Out")})
-    .Outputs({paddle::Grad("X")})
-    .SetKernelFn(PD_KERNEL(ReluBackward));
-PD_BUILD_DOUBLE_GRAD_OP(custom_relu)
-    .Inputs({"Out", paddle::Grad(paddle::Grad("X"))})
-    .Outputs({paddle::Grad(paddle::Grad("Out"))})
-    .SetKernelFn(PD_KERNEL(ReluDoubleBackward))
-    .SetInferShapeFn(PD_INFER_SHAPE(ReluDoubleBackwardInferShape));
--- a/test/custom_op/test_custom_relu_op_xpu_setup.py
+++ b/test/custom_op/test_custom_relu_op_xpu_setup.py
@@ -34,15 +34,7 @@ def custom_relu_dynamic(func, device, dtype, np_x, use_func=True):
    t.retain_grads()
    out = func(t) if use_func else paddle.nn.functional.relu(t)
-    out.retain_grads()
+    return out.numpy()
-    out.stop_gradient = False
-    out.backward()
-    if t.grad is None:
-        return out.numpy(), t.grad
-    else:
-        return out.numpy(), t.grad.numpy()
 def custom_relu_static(
@@ -71,80 +63,6 @@ def custom_relu_static(
    return out_v
-def custom_relu_static_inference(func, device, np_data, np_label, path_prefix):
-    paddle.set_device(device)
-    with static.scope_guard(static.Scope()):
-        with static.program_guard(static.Program()):
-            # simple module
-            data = static.data(
-                name='data', shape=[None, 1, 28, 28], dtype='float32'
-            )
-            label = static.data(name='label', shape=[None, 1], dtype='int64')
-            hidden = static.nn.fc(data, size=128)
-            hidden = func(hidden)
-            hidden = static.nn.fc(hidden, size=128)
-            predict = static.nn.fc(hidden, size=10, activation='softmax')
-            loss = paddle.nn.functional.cross_entropy(input=hidden, label=label)
-            avg_loss = paddle.mean(loss)
-            opt = paddle.optimizer.SGD(learning_rate=0.1)
-            opt.minimize(avg_loss)
-            # run start up model
-            exe = static.Executor()
-            exe.run(static.default_startup_program())
-            # train
-            for _ in range(4):
-                exe.run(
-                    static.default_main_program(),
-                    feed={'data': np_data, 'label': np_label},
-                    fetch_list=[avg_loss],
-                )
-            # save inference model
-            static.save_inference_model(path_prefix, [data], [predict], exe)
-            # get train predict value
-            predict_v = exe.run(
-                static.default_main_program(),
-                feed={'data': np_data, 'label': np_label},
-                fetch_list=[predict],
-            )
-    return predict_v
-def custom_relu_double_grad_dynamic(func, device, dtype, np_x, use_func=True):
-    paddle.set_device(device)
-    t = paddle.to_tensor(np_x, dtype=dtype, stop_gradient=False)
-    t.retain_grads()
-    out = func(t) if use_func else paddle.nn.functional.relu(t)
-    out.retain_grads()
-    dx = paddle.grad(
-        outputs=out,
-        inputs=t,
-        grad_outputs=paddle.ones_like(t),
-        create_graph=True,
-        retain_graph=True,
-    )
-    ddout = paddle.grad(
-        outputs=dx[0],
-        inputs=out.grad,
-        grad_outputs=paddle.ones_like(t),
-        create_graph=False,
-    )
-    assert ddout[0].numpy() is not None
-    return dx[0].numpy(), ddout[0].numpy()
 class TestNewCustomOpXpuSetUpInstall(unittest.TestCase):
    def setUp(self):
        cur_dir = os.path.dirname(os.path.abspath(__file__))
@@ -189,79 +107,11 @@ class TestNewCustomOpXpuSetUpInstall(unittest.TestCase):
    def test_dynamic(self):
        for dtype in self.dtypes:
            x = np.random.uniform(-1, 1, [4, 8]).astype(dtype)
-            out, x_grad = custom_relu_dynamic(
+            out = custom_relu_dynamic(self.custom_op, self.device, dtype, x)
-                self.custom_op, self.device, dtype, x
+            pd_out = custom_relu_dynamic(
-            )
-            pd_out, pd_x_grad = custom_relu_dynamic(
-                self.custom_op, self.device, dtype, x, False
-            )
-            check_output(out, pd_out, "out")
-            check_output(x_grad, pd_x_grad, "x_grad")
-    def test_static_save_and_load_inference_model(self):
-        paddle.enable_static()
-        np_data = np.random.random((1, 1, 28, 28)).astype("float32")
-        np_label = np.random.random((1, 1)).astype("int64")
-        path_prefix = "self.custom_op_inference/custom_relu"
-        predict = custom_relu_static_inference(
-            self.custom_op, self.device, np_data, np_label, path_prefix
-        )
-        # load inference model
-        with static.scope_guard(static.Scope()):
-            exe = static.Executor()
-            [
-                inference_program,
-                feed_target_names,
-                fetch_targets,
-            ] = static.load_inference_model(path_prefix, exe)
-            predict_infer = exe.run(
-                inference_program,
-                feed={feed_target_names[0]: np_data},
-                fetch_list=fetch_targets,
-            )
-            check_output(predict, predict_infer, "predict")
-        paddle.disable_static()
-    def test_static_save_and_run_inference_predictor(self):
-        paddle.enable_static()
-        np_data = np.random.random((1, 1, 28, 28)).astype("float32")
-        np_label = np.random.random((1, 1)).astype("int64")
-        path_prefix = "self.custom_op_inference/custom_relu"
-        from paddle.inference import Config, create_predictor
-        predict = custom_relu_static_inference(
-            self.custom_op, self.device, np_data, np_label, path_prefix
-        )
-        # load inference model
-        config = Config(path_prefix + ".pdmodel", path_prefix + ".pdiparams")
-        predictor = create_predictor(config)
-        input_tensor = predictor.get_input_handle(
-            predictor.get_input_names()[0]
-        )
-        input_tensor.reshape(np_data.shape)
-        input_tensor.copy_from_cpu(np_data.copy())
-        predictor.run()
-        output_tensor = predictor.get_output_handle(
-            predictor.get_output_names()[0]
-        )
-        predict_infer = output_tensor.copy_to_cpu()
-        predict = np.array(predict).flatten()
-        predict_infer = np.array(predict_infer).flatten()
-        check_output_allclose(predict, predict_infer, "predict")
-        paddle.disable_static()
-    def test_func_double_grad_dynamic(self):
-        for dtype in self.dtypes:
-            x = np.random.uniform(-1, 1, [4, 8]).astype(dtype)
-            out, dx_grad = custom_relu_double_grad_dynamic(
-                self.custom_op, self.device, dtype, x
-            )
-            pd_out, pd_dx_grad = custom_relu_double_grad_dynamic(
                self.custom_op, self.device, dtype, x, False
            )
            check_output(out, pd_out, "out")
-            check_output(dx_grad, pd_dx_grad, "dx_grad")
    def test_with_dataloader(self):
        paddle.disable_static()