Polish NCCLHelper

c64190ec · Yu Yang · 7483555a · c64190ec
显示空白变更内容
内联并排

Showing 1 changed file with 11 additions and 8 deletions

paddle/fluid/platform/nccl_helper.h +11 -8

未找到文件。
--- a/paddle/fluid/platform/nccl_helper.h
+++ b/paddle/fluid/platform/nccl_helper.h
@@ -61,7 +61,7 @@ struct NCCLContext {
  ncclComm_t comm_;

  explicit NCCLContext(int dev_id)
-      : ctx_(new CUDADeviceContext(CUDAPlace(dev_id))) {}
+      : ctx_(new CUDADeviceContext(CUDAPlace(dev_id))), comm_{nullptr} {}

  cudaStream_t stream() const { return ctx_->stream(); }

@@ -95,6 +95,7 @@ struct NCCLContextMap {
  std::vector<int> order_;

  explicit NCCLContextMap(const std::vector<platform::Place> &places) {
+    PADDLE_ENFORCE(!places.empty());
    order_.reserve(places.size());
    for (auto &p : places) {
      int dev_id = boost::get<CUDAPlace>(p).device;
@@ -105,6 +106,7 @@ struct NCCLContextMap {
        order_.size(), contexts_.size(),
        "NCCL Context Map does not support contain two or more same device");

+    if (places.size() > 1) {
      std::vector<ncclComm_t> comms;
      comms.resize(order_.size());

@@ -116,6 +118,7 @@ struct NCCLContextMap {
        contexts_.at(dev_id).comm_ = comms[i++];
      }
    }
+  }

  CUDADeviceContext *DevCtx(int dev_id) const { return at(dev_id).ctx_.get(); }