提交 f5521cf2 编写于 作者: D duanyanhui

Fix custom_device copy synchronization in Tensor::CopyToCpuImpl

上级 0f99debd
...@@ -457,13 +457,13 @@ void Tensor::CopyToCpuImpl(T *data, ...@@ -457,13 +457,13 @@ void Tensor::CopyToCpuImpl(T *data,
auto custom_place = t_place; auto custom_place = t_place;
auto *dev_ctx = static_cast<const paddle::platform::CustomDeviceContext *>( auto *dev_ctx = static_cast<const paddle::platform::CustomDeviceContext *>(
pool.Get(custom_place)); pool.Get(custom_place));
dev_ctx->Wait();
paddle::memory::Copy(paddle::platform::CPUPlace(), paddle::memory::Copy(paddle::platform::CPUPlace(),
static_cast<void *>(data), static_cast<void *>(data),
custom_place, custom_place,
t_data, t_data,
ele_num * sizeof(T), ele_num * sizeof(T),
dev_ctx->stream()); dev_ctx->stream());
// TODO(wangran16): sync_stream
#else #else
PADDLE_THROW(paddle::platform::errors::InvalidArgument( PADDLE_THROW(paddle::platform::errors::InvalidArgument(
"The analysis predictor supports CPU, GPU, NPU and XPU now.")); "The analysis predictor supports CPU, GPU, NPU and XPU now."));
......
Markdown is supported
0% .
You are about to add 0 people to the discussion. Proceed with caution.
先完成此消息的编辑!
想要评论请 注册