diff --git a/python/paddle/distributed/fleet/utils/fs.py b/python/paddle/distributed/fleet/utils/fs.py index 7e0456f2793731b3a4acc3e00675a60886fb4f64..af38d9f513810b0044c35b9b63f7493b38a3e27f 100644 --- a/python/paddle/distributed/fleet/utils/fs.py +++ b/python/paddle/distributed/fleet/utils/fs.py @@ -847,8 +847,9 @@ class HDFSClient(FS): if self.is_file(fs_path): return self._try_download(fs_path, local_path) # download dir - _, all_filenames = self.ls_dir(fs_path) - all_files = [fs_path + i for i in all_filenames] + dirs, all_filenames = self.ls_dir(fs_path) + all_files = [fs_path + "/" + i for i in all_filenames] + all_files.extend([fs_path + "/" + i for i in dirs]) procs = [] for i in range(multi_processes): process_datas = self._split_files(all_files, i, multi_processes)