Unverified commit 12ac0730 authored by Xin Pan, committed by GitHub

Merge pull request #13080 from reyoung/fix_scale_grad_bug

Fix bug when loss@GRAD is reused. (Release Branch)
...
@@ -625,19 +625,11 @@ int MultiDevSSAGraphBuilder::GetVarDeviceID(const ir::Graph &graph,
 void MultiDevSSAGraphBuilder::CreateScaleLossGradOp(
     ir::Graph *result, const std::string &loss_grad_name) const {
   for (size_t i = 0; i < places_.size(); ++i) {
     // Insert ScaleCost OpHandle
-#ifdef PADDLE_WITH_CUDA
-    auto *communication_dev_ctx =
-        nccl_ctxs_ ? nccl_ctxs_->DevCtx(places_[i])
-                   : platform::DeviceContextPool::Instance().Get(places_[i]);
-#else
-    auto *communication_dev_ctx =
-        platform::DeviceContextPool::Instance().Get(platform::CPUPlace());
-#endif
+    auto *dev_ctx = platform::DeviceContextPool::Instance().Get(places_[i]);
     auto *op_handle = new ScaleLossGradOpHandle(
         result->CreateEmptyNode("scale_loss_grad", ir::Node::Type::kOperation),
-        local_scopes_.size(), local_scopes_[i], places_[i],
-        communication_dev_ctx);
+        local_scopes_.size(), local_scopes_[i], places_[i], dev_ctx);
     result->Get<GraphOps>(kGraphOps).emplace_back(op_handle);
     // FIXME: Currently ScaleLossGradOp only use device_count as scale
...
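In effect, the diff removes the PADDLE_WITH_CUDA branch that selected the NCCL communication device context and instead always builds the scale_loss_grad op handle with the default device context of each place. The toy program below is only a minimal sketch of that pattern; the DeviceContext struct, GetDefaultContext helper, and place ids are hypothetical stand-ins and are not Paddle's real platform::DeviceContextPool API.

```cpp
#include <cstddef>
#include <iostream>
#include <string>
#include <vector>

// Hypothetical stand-in for a per-place device context; in the real code the
// equivalent object comes from platform::DeviceContextPool::Instance().Get(...).
struct DeviceContext {
  std::string name;
};

// Hypothetical pool lookup returning the default compute context for a place.
DeviceContext* GetDefaultContext(std::size_t place_id,
                                 std::vector<DeviceContext>& pool) {
  return &pool[place_id];
}

int main() {
  std::vector<DeviceContext> default_ctxs = {{"dev_ctx(place 0)"},
                                             {"dev_ctx(place 1)"}};

  // After the patch, every place's scale_loss_grad op is created with that
  // place's default context, regardless of whether NCCL is available.
  for (std::size_t i = 0; i < default_ctxs.size(); ++i) {
    DeviceContext* dev_ctx = GetDefaultContext(i, default_ctxs);
    std::cout << "scale_loss_grad on place " << i << " uses " << dev_ctx->name
              << "\n";
  }
  return 0;
}
```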