Unverified · Commit 3b5064d6 authored by caozhou, committed by GitHub

update instantiate for auto parallel (#46883)
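Summary of the change, as read from the diff below: `ProcessGroup.instantiate()` no longer depends on `_enable_legacy_dygraph()`. Instead of issuing its warm-up collective through `paddle.distributed.all_reduce` and `paddle.distributed.wait`, it now calls the legacy C operators `_legacy_C_ops.c_allreduce_sum_` and `_legacy_C_ops.c_sync_calc_stream` directly, and the import is updated accordingly.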

Parent: 0773639a
```diff
@@ -21,7 +21,7 @@ from ..collective import _get_global_env
 from ..collective import _new_ring_id
 from ...fluid.framework import _non_static_mode
 from ...fluid.layers.tensor import fill_constant
-from paddle.fluid.framework import _enable_legacy_dygraph
+from paddle import _legacy_C_ops


 def get_all_process_groups():
@@ -145,14 +145,15 @@ class ProcessGroup:
             # TODO(shenliang03): This is a temporary solution to solve the problem of
             # hang caused by cross-creation of new_group
             paddle.disable_static()
-            _enable_legacy_dygraph()
             paddle.set_device('gpu:%d' %
                               paddle.distributed.ParallelEnv().dev_id)
             tmp = paddle.to_tensor(
                 [1], dtype="int32") if _non_static_mode() else fill_constant(
                     [0], dtype="int32", value="1")
-            paddle.distributed.all_reduce(tmp, sync_op=True, group=self)
-            paddle.distributed.wait(tmp, group=self)
+            # use legacy ops
+            _legacy_C_ops.c_allreduce_sum_(tmp, 'use_calc_stream', True,
+                                           'ring_id', self.id)
+            _legacy_C_ops.c_sync_calc_stream(tmp, tmp)
             paddle.enable_static()

         self._is_instantiate = True
```
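For readers outside the Paddle tree, here is a minimal sketch of the new barrier logic pulled out of `ProcessGroup.instantiate()`. The standalone wrapper `_warmup_allreduce` is hypothetical, introduced only for illustration; the communicator setup that precedes this code in the real method is collapsed in the diff above and is omitted here as well. The sketch assumes a GPU build of Paddle from this era that still ships `paddle._legacy_C_ops`, and it only does anything meaningful inside a multi-process distributed launch.

```python
import paddle
from paddle import _legacy_C_ops
from paddle.fluid.framework import _non_static_mode
from paddle.fluid.layers.tensor import fill_constant


def _warmup_allreduce(ring_id):
    """Hypothetical extraction of the barrier at the end of instantiate()."""
    paddle.disable_static()
    paddle.set_device('gpu:%d' % paddle.distributed.ParallelEnv().dev_id)
    # A one-element tensor is enough; its value is irrelevant, since the
    # point is to run one synchronous collective on this ring as a warm-up.
    tmp = paddle.to_tensor(
        [1], dtype="int32") if _non_static_mode() else fill_constant(
            [0], dtype="int32", value="1")
    # Run the sum all-reduce on the calculation stream via the legacy C op,
    # then synchronize that stream so the call behaves like a barrier.
    _legacy_C_ops.c_allreduce_sum_(tmp, 'use_calc_stream', True,
                                   'ring_id', ring_id)
    _legacy_C_ops.c_sync_calc_stream(tmp, tmp)
    paddle.enable_static()
```

As the TODO in the hunk says, this eager warm-up collective is a temporary workaround for a hang caused by cross-creation of `new_group`; routing it through `_legacy_C_ops` lets the code drop the global `_enable_legacy_dygraph()` switch while keeping the same barrier semantics.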