Clean code

a7b0d5bd · Yu Yang · e3144393 · a7b0d5bd · a7b0d5bd
隐藏空白更改
内联 / 并排

Showing 2 changed files with 10 additions and 13 deletions

paddle/fluid/framework/parallel_executor.cc paddle/fluid/framework/parallel_executor.cc +8 -11

paddle/fluid/framework/parallel_executor.h paddle/fluid/framework/parallel_executor.h +2 -2

未找到文件。
--- a/paddle/fluid/framework/parallel_executor.cc
+++ b/paddle/fluid/framework/parallel_executor.cc
@@ -27,15 +27,16 @@ namespace framework {
 class ParallelExecutorPrivate {
 public:
  explicit ParallelExecutorPrivate(const std::vector<platform::Place> &places)
-      : places_(places), fetch_dev_ctxs_(places) {}
+      : places_(places) {}
  std::vector<platform::Place> places_;
-  platform::DeviceContextPool fetch_dev_ctxs_;
  std::vector<Scope *> local_scopes_;
  Scope *global_scope_;
+  std::unique_ptr<details::SSAGraphExecutor> executor_;
+#ifdef PADDLE_WITH_CUDA
  std::unique_ptr<platform::NCCLContextMap> nccl_ctxs_;
-  std::unique_ptr<details::SSAGraphExecutor> executor_;
+#endif
 };
 ParallelExecutor::ParallelExecutor(
@@ -54,8 +55,10 @@ ParallelExecutor::ParallelExecutor(
    member_->local_scopes_.push_back(&scope->NewScope());
  }
-  // Bcast Parameters to all GPUs
+// Bcast Parameters to all GPUs
-  BuildNCCLCommunicator();
+#ifdef PADDLE_WITH_CUDA
+  member_->nccl_ctxs_.reset(new platform::NCCLContextMap(member_->places_));
+#endif
  if (platform::is_gpu_place(places[0]) &&
      member_->local_scopes_.size() != 1) {  // Is CUDA
    BCastParamsToGPUs(startup_program);
@@ -123,12 +126,6 @@ void ParallelExecutor::BCastParamsToGPUs(
 #endif
 }
-void ParallelExecutor::BuildNCCLCommunicator() const {
-#ifdef PADDLE_WITH_CUDA
-  member_->nccl_ctxs_.reset(new platform::NCCLContextMap(member_->places_));
-#endif
-}
 void ParallelExecutor::Run(const std::vector<std::string> &fetch_tensors,
                           const std::string &fetched_var_name) {
  auto fetch_data = member_->executor_->Run(fetch_tensors);

--- a/paddle/fluid/framework/parallel_executor.h
+++ b/paddle/fluid/framework/parallel_executor.h
@@ -31,6 +31,8 @@ namespace framework {
 class ParallelExecutorPrivate;
 class ParallelExecutor {
+  DISABLE_COPY_AND_ASSIGN(ParallelExecutor);
 public:
  explicit ParallelExecutor(size_t num_threads,
                            const std::vector<platform::Place>& places,
@@ -46,8 +48,6 @@ class ParallelExecutor {
  ParallelExecutorPrivate* member_;
  void BCastParamsToGPUs(const ProgramDesc& startup_program) const;
-  void BuildNCCLCommunicator() const;
 };
 }  // namespace framework