Unverified commit 201480d5, authored by ShenLiang, committed by GitHub

fix bug in c_split (#56917)

Parent: 79bfb184
@@ -48,6 +48,38 @@ class c_identity_eager(PyLayer):
         return dy
 
 
+class c_split_eager(PyLayer):
+    @staticmethod
+    def forward(ctx, tensor, group, rank, nranks):
+        ctx.group = group
+        ctx.nranks = nranks
+        return _legacy_C_ops.c_split(
+            tensor,
+            'use_calc_stream',
+            True,
+            'ring_id',
+            group.id,
+            'rank',
+            rank,
+            'nranks',
+            nranks,
+            'use_model_parallel',
+            True,
+        )
+
+    @staticmethod
+    def backward(ctx, dy):
+        group = ctx.group
+        out_shape = dy.shape
+        out_shape[0] = out_shape[0] * ctx.nranks
+        out = paddle.empty(out_shape, dtype=dy.dtype)
+        group.process_group.all_gather_into_tensor_on_calc_stream(
+            out,
+            dy,
+        )
+        return out
+
+
 def _c_identity(tensor, group=None, skip_c_identity_dynamic=False):
     """
     Return a copy of the tensor, mainly used with model parallel.
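The new c_split_eager class above follows Paddle's PyLayer protocol: forward stashes whatever backward will need on ctx, and backward receives the upstream gradient and returns the gradient for the tensor input. Below is a minimal single-process sketch of the same pattern, using a toy scaling op in place of the collective call; the class and variable names are illustrative, not part of this commit.

import paddle
from paddle.autograd import PyLayer

class scale_eager(PyLayer):  # hypothetical toy layer mirroring the structure above
    @staticmethod
    def forward(ctx, tensor, nranks):
        # Stash non-tensor state for backward, as c_split_eager does with group/nranks.
        ctx.nranks = nranks
        return tensor * nranks

    @staticmethod
    def backward(ctx, dy):
        # Gradient of (x * nranks) w.r.t. x is nranks, so scale the upstream gradient.
        return dy * ctx.nranks

x = paddle.ones([2, 2])
x.stop_gradient = False
y = scale_eager.apply(x, 4)  # PyLayer subclasses are invoked via .apply(...)
y.sum().backward()
print(x.grad)                # every entry is 4.0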
@@ -179,19 +211,7 @@ def _c_split(tensor, group=None):
     )
 
     if in_dynamic_mode():
-        return _legacy_C_ops.c_split(
-            tensor,
-            'use_calc_stream',
-            True,
-            'ring_id',
-            ring_id,
-            'rank',
-            rank,
-            'nranks',
-            nranks,
-            'use_model_parallel',
-            True,
-        )
+        return c_split_eager.apply(tensor, group, rank, nranks)
     else:
         op_type = 'c_split'
         helper = LayerHelper(op_type, **locals())
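The rewritten backward gathers the per-rank gradient shards back into a full tensor: all_gather_into_tensor stacks one shard per rank along dimension 0, which is why the output buffer is allocated with out_shape[0] multiplied by ctx.nranks. A single-process numpy emulation of that shape arithmetic (the concatenation stands in for the collective; the shard shape is made up for illustration):

import numpy as np

nranks = 4
dy = np.ones((3, 8), dtype=np.float32)    # per-rank gradient shard
out_shape = list(dy.shape)
out_shape[0] *= nranks                    # same shape math as c_split_eager.backward
# all_gather_into_tensor places rank i's shard at rows [i*3, (i+1)*3);
# with identical shards this reduces to a repeat along axis 0.
gathered = np.concatenate([dy] * nranks, axis=0)
assert gathered.shape == tuple(out_shape)  # (12, 8)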