Wait fetch op

76570c2e · Yu Yang · b6ca3711 · 76570c2e · 76570c2e
Showing 2 changed files with 1 addition and 3 deletions

paddle/fluid/framework/details/fetch_op_handle.cc +1 -0

paddle/fluid/framework/details/op_handle_base.cc +0 -3

未找到文件。
--- a/paddle/fluid/framework/details/fetch_op_handle.cc
+++ b/paddle/fluid/framework/details/fetch_op_handle.cc
@@ -66,6 +66,7 @@ void FetchOpHandle::RunImpl() {
    if (platform::is_gpu_place(var->place_)) {
 #ifdef PADDLE_WITH_CUDA
      TensorCopy(t, cpu, *dev_ctx_[t.place()], &tensors_[i]);
+      dev_ctx_[t.place()]->Wait();
 #endif
    } else {
      tensors_[i].ShareDataWith(t);

--- a/paddle/fluid/framework/details/op_handle_base.cc
+++ b/paddle/fluid/framework/details/op_handle_base.cc
@@ -33,9 +33,6 @@ std::string OpHandleBase::DebugString() const {

 OpHandleBase::~OpHandleBase() {
 #ifdef PADDLE_WITH_CUDA
-  for (auto &ctx : dev_ctx_) {
-    ctx.second->Wait();
-  }
  for (auto &ev : events_) {
    PADDLE_ENFORCE(cudaEventDestroy(ev.second));
  }