From 9388a6381c51733dd5b23aac9c07b0ef0fcb4667 Mon Sep 17 00:00:00 2001 From: mapingshuo Date: Thu, 28 May 2020 17:43:18 +0800 Subject: [PATCH] fix popen error (#24767) replace join to terminate --- python/paddle/distributed/utils.py | 9 +++------ 1 file changed, 3 insertions(+), 6 deletions(-) diff --git a/python/paddle/distributed/utils.py b/python/paddle/distributed/utils.py index 3b55ec7ffce..511d501a220 100644 --- a/python/paddle/distributed/utils.py +++ b/python/paddle/distributed/utils.py @@ -252,15 +252,12 @@ def get_cluster(node_ips, node_ip, paddle_ports, selected_gpus): def terminate_local_procs(procs): for p in procs: if p.proc.poll() is None: - # subprocess need to release resource(e.g. shared memory) - # use join to wait subprocess releasing - p.proc.join(timeout=1) + p.proc.terminate() p.log_fn.close() logger.debug("terminate process id:{}".format(p.proc.pid)) - # wait all process terminiated - # time.sleep(3) - + # wait for all processes to terminate + time.sleep(3) for step in range(0, 50): alive = False for p in procs: -- GitLab