未验证 提交 55c4eb8a 编写于 作者: M mhy-666 提交者: GitHub

【prim】scatter_nd_add_grad (#52469)

* add scatter_nd_add comp

* add scatter_nd_add prim

* fix

* fix

* add public_python_api in TestScatterNdAddSimpleOp setup function

* fix composite_backward_api.h

* fix composite_backward

* add test cases

* fix composite_backward_api.h, unittest
上级 1164626c
...@@ -1805,5 +1805,21 @@ void roll_grad(const Tensor& x, ...@@ -1805,5 +1805,21 @@ void roll_grad(const Tensor& x,
set_output<T>(x_grad_output, x_grad); set_output<T>(x_grad_output, x_grad);
} }
} }
template <typename T>
void scatter_nd_add_grad(const Tensor& index,
                         const Tensor& updates,
                         const Tensor& out_grad,
                         Tensor* x_grad,
                         Tensor* updates_grad) {
  // Composite backward for scatter_nd_add.
  // Since out = x + scatter(updates, index), the gradient w.r.t. x is the
  // output gradient passed through unchanged: dX = dOut.
  if (x_grad != nullptr) {
    by_pass<T>(out_grad, x_grad);
  }
  // Gradient w.r.t. updates is gathered from dOut at the scattered
  // positions: dUpdates = gather_nd(dOut, index).
  if (updates_grad != nullptr) {
    set_output<T>(gather_nd<T>(out_grad, index), updates_grad);
  }
}
} // namespace prim } // namespace prim
} // namespace paddle } // namespace paddle
...@@ -1454,6 +1454,7 @@ ...@@ -1454,6 +1454,7 @@
kernel : kernel :
func : scatter_nd_add_grad func : scatter_nd_add_grad
no_need_buffer : updates no_need_buffer : updates
composite: scatter_nd_add_grad(index, updates, out_grad, x_grad, updates_grad)
- backward_op : segment_pool_grad - backward_op : segment_pool_grad
forward : segment_pool (Tensor x, Tensor segment_ids, str pooltype="SUM") -> Tensor(out), Tensor(summed_ids) forward : segment_pool (Tensor x, Tensor segment_ids, str pooltype="SUM") -> Tensor(out), Tensor(summed_ids)
......
...@@ -69,6 +69,8 @@ class TestScatterNdAddSimpleOp(OpTest): ...@@ -69,6 +69,8 @@ class TestScatterNdAddSimpleOp(OpTest):
def setUp(self): def setUp(self):
self.op_type = "scatter_nd_add" self.op_type = "scatter_nd_add"
self.python_api = paddle.scatter_nd_add self.python_api = paddle.scatter_nd_add
self.public_python_api = paddle.scatter_nd_add
self.prim_op_type = "prim"
self._set_dtype() self._set_dtype()
if self.dtype == np.float64: if self.dtype == np.float64:
target_dtype = "float64" target_dtype = "float64"
...@@ -94,7 +96,7 @@ class TestScatterNdAddSimpleOp(OpTest): ...@@ -94,7 +96,7 @@ class TestScatterNdAddSimpleOp(OpTest):
self.check_output() self.check_output()
def test_check_grad(self): def test_check_grad(self):
self.check_grad(['X', 'Updates'], 'Out') self.check_grad(['X', 'Updates'], 'Out', check_prim=True)
class TestScatterNdAddSimpleFP16Op(TestScatterNdAddSimpleOp): class TestScatterNdAddSimpleFP16Op(TestScatterNdAddSimpleOp):
...@@ -127,7 +129,9 @@ class TestScatterNdAddSimpleBF16Op(TestScatterNdAddSimpleOp): ...@@ -127,7 +129,9 @@ class TestScatterNdAddSimpleBF16Op(TestScatterNdAddSimpleOp):
def test_check_grad(self): def test_check_grad(self):
if core.is_compiled_with_cuda(): if core.is_compiled_with_cuda():
place = core.CUDAPlace(0) place = core.CUDAPlace(0)
self.check_grad_with_place(place, ['X', 'Updates'], 'Out') self.check_grad_with_place(
place, ['X', 'Updates'], 'Out', check_prim=True
)
class TestScatterNdAddWithEmptyIndex(OpTest): class TestScatterNdAddWithEmptyIndex(OpTest):
...@@ -138,6 +142,8 @@ class TestScatterNdAddWithEmptyIndex(OpTest): ...@@ -138,6 +142,8 @@ class TestScatterNdAddWithEmptyIndex(OpTest):
def setUp(self): def setUp(self):
self.op_type = "scatter_nd_add" self.op_type = "scatter_nd_add"
self.python_api = paddle.scatter_nd_add self.python_api = paddle.scatter_nd_add
self.public_python_api = paddle.scatter_nd_add
self.prim_op_type = "prim"
self._set_dtype() self._set_dtype()
if self.dtype == np.float64: if self.dtype == np.float64:
target_dtype = "float64" target_dtype = "float64"
...@@ -166,7 +172,7 @@ class TestScatterNdAddWithEmptyIndex(OpTest): ...@@ -166,7 +172,7 @@ class TestScatterNdAddWithEmptyIndex(OpTest):
self.check_output() self.check_output()
def test_check_grad(self): def test_check_grad(self):
self.check_grad(['X', 'Updates'], 'Out') self.check_grad(['X', 'Updates'], 'Out', check_prim=True)
class TestScatterNdAddWithEmptyIndexFP16(TestScatterNdAddWithEmptyIndex): class TestScatterNdAddWithEmptyIndexFP16(TestScatterNdAddWithEmptyIndex):
...@@ -199,7 +205,9 @@ class TestScatterNdAddWithEmptyIndexBF16(TestScatterNdAddWithEmptyIndex): ...@@ -199,7 +205,9 @@ class TestScatterNdAddWithEmptyIndexBF16(TestScatterNdAddWithEmptyIndex):
def test_check_grad(self): def test_check_grad(self):
if core.is_compiled_with_cuda(): if core.is_compiled_with_cuda():
place = core.CUDAPlace(0) place = core.CUDAPlace(0)
self.check_grad_with_place(place, ['X', 'Updates'], 'Out') self.check_grad_with_place(
place, ['X', 'Updates'], 'Out', check_prim=True
)
class TestScatterNdAddWithHighRankSame(OpTest): class TestScatterNdAddWithHighRankSame(OpTest):
...@@ -210,6 +218,8 @@ class TestScatterNdAddWithHighRankSame(OpTest): ...@@ -210,6 +218,8 @@ class TestScatterNdAddWithHighRankSame(OpTest):
def setUp(self): def setUp(self):
self.op_type = "scatter_nd_add" self.op_type = "scatter_nd_add"
self.python_api = paddle.scatter_nd_add self.python_api = paddle.scatter_nd_add
self.public_python_api = paddle.scatter_nd_add
self.prim_op_type = "prim"
self._set_dtype() self._set_dtype()
if self.dtype == np.float64: if self.dtype == np.float64:
target_dtype = "float64" target_dtype = "float64"
...@@ -241,7 +251,7 @@ class TestScatterNdAddWithHighRankSame(OpTest): ...@@ -241,7 +251,7 @@ class TestScatterNdAddWithHighRankSame(OpTest):
self.check_output() self.check_output()
def test_check_grad(self): def test_check_grad(self):
self.check_grad(['X', 'Updates'], 'Out') self.check_grad(['X', 'Updates'], 'Out', check_prim=True)
class TestScatterNdAddWithHighRankSameFP16(TestScatterNdAddWithHighRankSame): class TestScatterNdAddWithHighRankSameFP16(TestScatterNdAddWithHighRankSame):
...@@ -274,7 +284,9 @@ class TestScatterNdAddWithHighRankSameBF16(TestScatterNdAddWithHighRankSame): ...@@ -274,7 +284,9 @@ class TestScatterNdAddWithHighRankSameBF16(TestScatterNdAddWithHighRankSame):
def test_check_grad(self): def test_check_grad(self):
if core.is_compiled_with_cuda(): if core.is_compiled_with_cuda():
place = core.CUDAPlace(0) place = core.CUDAPlace(0)
self.check_grad_with_place(place, ['X', 'Updates'], 'Out') self.check_grad_with_place(
place, ['X', 'Updates'], 'Out', check_prim=True
)
class TestScatterNdAddWithHighRankDiff(OpTest): class TestScatterNdAddWithHighRankDiff(OpTest):
...@@ -285,6 +297,8 @@ class TestScatterNdAddWithHighRankDiff(OpTest): ...@@ -285,6 +297,8 @@ class TestScatterNdAddWithHighRankDiff(OpTest):
def setUp(self): def setUp(self):
self.op_type = "scatter_nd_add" self.op_type = "scatter_nd_add"
self.python_api = paddle.scatter_nd_add self.python_api = paddle.scatter_nd_add
self.public_python_api = paddle.scatter_nd_add
self.prim_op_type = "prim"
shape = (8, 2, 2, 1, 10) shape = (8, 2, 2, 1, 10)
ref_np = np.random.rand(*shape).astype("double") ref_np = np.random.rand(*shape).astype("double")
index = np.vstack([np.random.randint(0, s, size=500) for s in shape]).T index = np.vstack([np.random.randint(0, s, size=500) for s in shape]).T
...@@ -300,7 +314,7 @@ class TestScatterNdAddWithHighRankDiff(OpTest): ...@@ -300,7 +314,7 @@ class TestScatterNdAddWithHighRankDiff(OpTest):
self.check_output() self.check_output()
def test_check_grad(self): def test_check_grad(self):
self.check_grad(['X', 'Updates'], 'Out') self.check_grad(['X', 'Updates'], 'Out', check_prim=True)
# Test Python API # Test Python API
...@@ -310,6 +324,7 @@ class TestScatterNdOpAPI(unittest.TestCase): ...@@ -310,6 +324,7 @@ class TestScatterNdOpAPI(unittest.TestCase):
""" """
def testcase1(self): def testcase1(self):
with paddle.fluid.framework._static_guard():
ref1 = paddle.static.data( ref1 = paddle.static.data(
name='ref1', name='ref1',
shape=[10, 9, 8, 1, 3], shape=[10, 9, 8, 1, 3],
...@@ -328,6 +343,7 @@ class TestScatterNdOpAPI(unittest.TestCase): ...@@ -328,6 +343,7 @@ class TestScatterNdOpAPI(unittest.TestCase):
output1 = paddle.scatter_nd_add(ref1, index1, updates1) output1 = paddle.scatter_nd_add(ref1, index1, updates1)
def testcase2(self): def testcase2(self):
with paddle.fluid.framework._static_guard():
ref2 = paddle.static.data( ref2 = paddle.static.data(
name='ref2', name='ref2',
shape=[10, 9, 8, 1, 3], shape=[10, 9, 8, 1, 3],
...@@ -348,6 +364,7 @@ class TestScatterNdOpAPI(unittest.TestCase): ...@@ -348,6 +364,7 @@ class TestScatterNdOpAPI(unittest.TestCase):
) )
def testcase3(self): def testcase3(self):
with paddle.fluid.framework._static_guard():
shape3 = [10, 9, 8, 1, 3] shape3 = [10, 9, 8, 1, 3]
index3 = paddle.static.data( index3 = paddle.static.data(
name='index3', name='index3',
...@@ -362,6 +379,7 @@ class TestScatterNdOpAPI(unittest.TestCase): ...@@ -362,6 +379,7 @@ class TestScatterNdOpAPI(unittest.TestCase):
output3 = paddle.scatter_nd(index3, updates3, shape3) output3 = paddle.scatter_nd(index3, updates3, shape3)
def testcase4(self): def testcase4(self):
with paddle.fluid.framework._static_guard():
shape4 = [10, 9, 8, 1, 3] shape4 = [10, 9, 8, 1, 3]
index4 = paddle.static.data( index4 = paddle.static.data(
name='index4', name='index4',
...@@ -373,7 +391,9 @@ class TestScatterNdOpAPI(unittest.TestCase): ...@@ -373,7 +391,9 @@ class TestScatterNdOpAPI(unittest.TestCase):
shape=[5, 5, 8], shape=[5, 5, 8],
dtype='double', dtype='double',
) )
output4 = paddle.scatter_nd(index4, updates4, shape4, name='scatter_nd') output4 = paddle.scatter_nd(
index4, updates4, shape4, name='scatter_nd'
)
def testcase5(self): def testcase5(self):
if not fluid.core.is_compiled_with_cuda(): if not fluid.core.is_compiled_with_cuda():
...@@ -430,6 +450,7 @@ class TestScatterNdOpAPI(unittest.TestCase): ...@@ -430,6 +450,7 @@ class TestScatterNdOpAPI(unittest.TestCase):
class TestScatterNdOpRaise(unittest.TestCase): class TestScatterNdOpRaise(unittest.TestCase):
def test_check_raise(self): def test_check_raise(self):
def check_raise_is_test(): def check_raise_is_test():
with paddle.fluid.framework._static_guard():
try: try:
ref5 = paddle.static.data( ref5 = paddle.static.data(
name='ref5', shape=[-1, 3, 4, 5], dtype='float32' name='ref5', shape=[-1, 3, 4, 5], dtype='float32'
...@@ -450,6 +471,7 @@ class TestScatterNdOpRaise(unittest.TestCase): ...@@ -450,6 +471,7 @@ class TestScatterNdOpRaise(unittest.TestCase):
def test_check_raise2(self): def test_check_raise2(self):
with self.assertRaises(ValueError): with self.assertRaises(ValueError):
with paddle.fluid.framework._static_guard():
ref6 = paddle.static.data( ref6 = paddle.static.data(
name='ref6', name='ref6',
shape=[10, 9, 8, 1, 3], shape=[10, 9, 8, 1, 3],
...@@ -469,13 +491,16 @@ class TestScatterNdOpRaise(unittest.TestCase): ...@@ -469,13 +491,16 @@ class TestScatterNdOpRaise(unittest.TestCase):
def test_check_raise3(self): def test_check_raise3(self):
def check_raise_is_test(): def check_raise_is_test():
with paddle.fluid.framework._static_guard():
try: try:
shape = [3, 4, 5] shape = [3, 4, 5]
index7 = paddle.static.data( index7 = paddle.static.data(
name='index7', shape=[-1, 2, 1], dtype='int32' name='index7', shape=[-1, 2, 1], dtype='int32'
) )
updates7 = paddle.static.data( updates7 = paddle.static.data(
name='updates7', shape=[-1, 2, 4, 5, 20], dtype='float32' name='updates7',
shape=[-1, 2, 4, 5, 20],
dtype='float32',
) )
output7 = paddle.scatter_nd(index7, updates7, shape) output7 = paddle.scatter_nd(index7, updates7, shape)
except Exception as e: except Exception as e:
......
Markdown is supported
0% .
You are about to add 0 people to the discussion. Proceed with caution.
先完成此消息的编辑!
想要评论请 注册