diff --git a/paddle/phi/api/yaml/legacy_backward.yaml b/paddle/phi/api/yaml/legacy_backward.yaml index 76d60522d863314defaf2f3c23d4f37f1097042a..2f4eff98356044343bee115cf169a050be117417 100755 --- a/paddle/phi/api/yaml/legacy_backward.yaml +++ b/paddle/phi/api/yaml/legacy_backward.yaml @@ -326,12 +326,7 @@ forward : cast (Tensor x, DataType out_dtype) -> Tensor(out) args : (Tensor x, Tensor out_grad) output : Tensor(x_grad) - infer_meta : - func : UnchangedInferMeta - param : [x] - kernel : - func : cast_grad - data_type : out_grad + invoke : cast (out_grad, x.dtype()) no_need_buffer : x - backward_op : ceil_grad @@ -2101,6 +2096,12 @@ optional : grad_grad_out_grad inplace : (grad_grad_x -> fwd_grad_out_grad) +- backward_op : sign_grad + forward : sign (Tensor x) -> Tensor(out) + args : (Tensor out_grad) + output : Tensor(x_grad) + invoke : scale(out_grad, 0.0, 0.0, true) + - backward_op : silu_grad forward : silu (Tensor x) -> Tensor(out) args : (Tensor x, Tensor out_grad) diff --git a/paddle/phi/api/yaml/legacy_ops.yaml b/paddle/phi/api/yaml/legacy_ops.yaml index e69d54eb1e238db0787b4b9f4e1e096d572c3fa5..cd531142e233fd23686f218d7fd1a907dab6a6b9 100755 --- a/paddle/phi/api/yaml/legacy_ops.yaml +++ b/paddle/phi/api/yaml/legacy_ops.yaml @@ -2377,6 +2377,7 @@ func : UnchangedInferMeta kernel : func : sign + backward : sign_grad - op : silu args : (Tensor x) diff --git a/python/paddle/fluid/tests/unittests/gradient_checker.py b/python/paddle/fluid/tests/unittests/gradient_checker.py index e261fd8165d8627dbe5fe420e25ad502d2225375..15320c395e2db9920e49e5b04d32975c4b717da2 100644 --- a/python/paddle/fluid/tests/unittests/gradient_checker.py +++ b/python/paddle/fluid/tests/unittests/gradient_checker.py @@ -268,6 +268,9 @@ def grad_check(x, for v in x: v.stop_gradient = False v.persistable = True + for u in y: + u.stop_gradient = False + u.persistable = True if place is None: place = fluid.CPUPlace() if program is None: @@ -364,6 +367,9 @@ def double_grad_check(x, v.stop_gradient = False v.persistable = True y = _as_list(y) + for u in y: + u.stop_gradient = False + u.persistable = True if program is None: program = fluid.default_main_program() @@ -445,6 +451,9 @@ def triple_grad_check(x, v.stop_gradient = False v.persistable = True y = _as_list(y) + for u in y: + u.stop_gradient = False + u.persistable = True if program is None: program = fluid.default_main_program() @@ -578,6 +587,9 @@ def get_static_double_grad(x, for v in x: v.stop_gradient = False v.persistable = True + for u in y: + u.stop_gradient = False + u.persistable = True if place is None: place = fluid.CPUPlace() if program is None: @@ -736,7 +748,9 @@ def double_grad_check_for_dygraph(func, v.stop_gradient = False v.persistable = True y = _as_list(y) - + for u in y: + u.stop_gradient = False + u.persistable = True y_grads_init = [] for yi in y: np_type = dtype_to_np_dtype(yi.dtype) @@ -903,7 +917,9 @@ def triple_grad_check_for_dygraph(func, v.stop_gradient = False v.persistable = True y = _as_list(y) - + for u in y: + u.stop_gradient = False + u.persistable = True y_grads_init = [] for yi in y: np_type = dtype_to_np_dtype(yi.dtype) diff --git a/python/paddle/fluid/tests/unittests/test_cast_op.py b/python/paddle/fluid/tests/unittests/test_cast_op.py index cd67440990cb852a13eb9bfdab121f8a5df4db05..a3a6805a868ee5d4b4312899c347e29238d91f2d 100644 --- a/python/paddle/fluid/tests/unittests/test_cast_op.py +++ b/python/paddle/fluid/tests/unittests/test_cast_op.py @@ -23,6 +23,9 @@ import paddle.fluid as fluid from paddle.fluid import compiler, Program, program_guard from op_test import OpTest, convert_uint16_to_float, convert_float_to_uint16 from paddle.fluid.framework import _test_eager_guard +import gradient_checker +from decorator_helper import prog_scope +import paddle.fluid.layers as layers class TestCastOpFp32ToFp64(OpTest): @@ -137,6 +140,80 @@ class TestCastOpEager(unittest.TestCase): self.assertTrue(x.gradient().dtype == np.float16) +class TestCastDoubleGradCheck(unittest.TestCase): + + def cast_wrapper(self, x): + return paddle.cast(x[0], 'float64') + + @prog_scope() + def func(self, place): + # the shape of input variable should be clearly specified, not inlcude -1. + eps = 0.005 + dtype = np.float32 + + data = layers.data('data', [2, 3, 4], False, dtype) + data.persistable = True + out = paddle.cast(data, 'float64') + data_arr = np.random.uniform(-1, 1, data.shape).astype(dtype) + + gradient_checker.double_grad_check([data], + out, + x_init=[data_arr], + place=place, + eps=eps) + fluid.set_flags({"FLAGS_retain_grad_for_all_tensor": True}) + gradient_checker.double_grad_check_for_dygraph(self.cast_wrapper, + [data], + out, + x_init=[data_arr], + place=place) + + def test_grad(self): + paddle.enable_static() + places = [fluid.CPUPlace()] + if core.is_compiled_with_cuda(): + places.append(fluid.CUDAPlace(0)) + for p in places: + self.func(p) + + +class TestCastTripleGradCheck(unittest.TestCase): + + def cast_wrapper(self, x): + return paddle.cast(x[0], 'float64') + + @prog_scope() + def func(self, place): + # the shape of input variable should be clearly specified, not inlcude -1. + eps = 0.005 + dtype = np.float32 + + data = layers.data('data', [2, 3, 4], False, dtype) + data.persistable = True + out = paddle.cast(data, 'float64') + data_arr = np.random.uniform(-1, 1, data.shape).astype(dtype) + + gradient_checker.triple_grad_check([data], + out, + x_init=[data_arr], + place=place, + eps=eps) + fluid.set_flags({"FLAGS_retain_grad_for_all_tensor": True}) + gradient_checker.triple_grad_check_for_dygraph(self.cast_wrapper, + [data], + out, + x_init=[data_arr], + place=place) + + def test_grad(self): + paddle.enable_static() + places = [fluid.CPUPlace()] + if core.is_compiled_with_cuda(): + places.append(fluid.CUDAPlace(0)) + for p in places: + self.func(p) + + if __name__ == '__main__': paddle.enable_static() unittest.main() diff --git a/python/paddle/fluid/tests/unittests/test_sign_op.py b/python/paddle/fluid/tests/unittests/test_sign_op.py index 444675a4bb5c22c701177f052751e5efb7753e38..3eda8b286c84021a84ffb9d6d6d434337f36ad42 100644 --- a/python/paddle/fluid/tests/unittests/test_sign_op.py +++ b/python/paddle/fluid/tests/unittests/test_sign_op.py @@ -19,7 +19,11 @@ import numpy as np from op_test import OpTest import paddle import paddle.fluid as fluid +import paddle.fluid.core as core from paddle.fluid import Program, program_guard +import gradient_checker +from decorator_helper import prog_scope +import paddle.fluid.layers as layers class TestSignOp(OpTest): @@ -91,6 +95,80 @@ class TestSignAPI(unittest.TestCase): paddle.sign(input4) +class TestSignDoubleGradCheck(unittest.TestCase): + + def sign_wrapper(self, x): + return paddle.sign(x[0]) + + @prog_scope() + def func(self, place): + # the shape of input variable should be clearly specified, not inlcude -1. + eps = 0.005 + dtype = np.float32 + + data = layers.data('data', [1, 4], False, dtype) + data.persistable = True + out = paddle.sign(data) + data_arr = np.random.uniform(-1, 1, data.shape).astype(dtype) + + gradient_checker.double_grad_check([data], + out, + x_init=[data_arr], + place=place, + eps=eps) + fluid.set_flags({"FLAGS_retain_grad_for_all_tensor": True}) + gradient_checker.double_grad_check_for_dygraph(self.sign_wrapper, + [data], + out, + x_init=[data_arr], + place=place) + + def test_grad(self): + paddle.enable_static() + places = [fluid.CPUPlace()] + if core.is_compiled_with_cuda(): + places.append(fluid.CUDAPlace(0)) + for p in places: + self.func(p) + + +class TestSignTripleGradCheck(unittest.TestCase): + + def sign_wrapper(self, x): + return paddle.sign(x[0]) + + @prog_scope() + def func(self, place): + # the shape of input variable should be clearly specified, not inlcude -1. + eps = 0.005 + dtype = np.float32 + + data = layers.data('data', [1, 4], False, dtype) + data.persistable = True + out = paddle.sign(data) + data_arr = np.random.uniform(-1, 1, data.shape).astype(dtype) + + gradient_checker.triple_grad_check([data], + out, + x_init=[data_arr], + place=place, + eps=eps) + fluid.set_flags({"FLAGS_retain_grad_for_all_tensor": True}) + gradient_checker.triple_grad_check_for_dygraph(self.sign_wrapper, + [data], + out, + x_init=[data_arr], + place=place) + + def test_grad(self): + paddle.enable_static() + places = [fluid.CPUPlace()] + if core.is_compiled_with_cuda(): + places.append(fluid.CUDAPlace(0)) + for p in places: + self.func(p) + + if __name__ == "__main__": paddle.enable_static() unittest.main()