diff --git a/cmake/external/xpu.cmake b/cmake/external/xpu.cmake index bb2e864f5cda254400e3ca3ae4846bfc581c84b0..08f6be6de11e0e9efa49757af7024b388dd522c2 100644 --- a/cmake/external/xpu.cmake +++ b/cmake/external/xpu.cmake @@ -25,7 +25,7 @@ else() endif() set(XPU_XCCL_BASE_URL - "https://klx-sdk-release-public.su.bcebos.com/xccl/release/1.0.4") + "https://klx-sdk-release-public.su.bcebos.com/xccl/release/1.0.5") if(WITH_AARCH64) set(XPU_XRE_DIR_NAME "xre-kylin_aarch64") diff --git a/paddle/fluid/operators/collective/c_allreduce_sum_op_xpu.cc b/paddle/fluid/operators/collective/c_allreduce_sum_op_xpu.cc index 16b3ff335b65493204d14540adf5fee68d82c9ae..a4d1c62e821ecc9925bd9eeb4d2b06003265a246 100644 --- a/paddle/fluid/operators/collective/c_allreduce_sum_op_xpu.cc +++ b/paddle/fluid/operators/collective/c_allreduce_sum_op_xpu.cc @@ -19,4 +19,5 @@ namespace plat = paddle::platform; REGISTER_OP_XPU_KERNEL(c_allreduce_sum, ops::CAllReduceOpXPUKernel, - ops::CAllReduceOpXPUKernel) + ops::CAllReduceOpXPUKernel, + ops::CAllReduceOpXPUKernel) diff --git a/paddle/fluid/platform/device/xpu/xpu2_op_list.h b/paddle/fluid/platform/device/xpu/xpu2_op_list.h index c246924e14b69ace3d824c557cc5df6dcf967b88..83f0c21315be2a74e478469bdef0c97353a2ecda 100644 --- a/paddle/fluid/platform/device/xpu/xpu2_op_list.h +++ b/paddle/fluid/platform/device/xpu/xpu2_op_list.h @@ -80,13 +80,16 @@ XPUOpMap& get_kl2_ops() { pOpKernelType(vartype::INT64, XPUPlace())})}, {"c_allreduce_sum", XPUKernelSet({pOpKernelType(vartype::FP16, XPUPlace()), - pOpKernelType(vartype::FP32, XPUPlace())})}, + pOpKernelType(vartype::FP32, XPUPlace()), + pOpKernelType(vartype::INT32, XPUPlace())})}, {"c_identity", XPUKernelSet({pOpKernelType(vartype::FP16, XPUPlace()), pOpKernelType(vartype::FP32, XPUPlace()), pOpKernelType(vartype::FP64, XPUPlace()), pOpKernelType(vartype::INT32, XPUPlace()), pOpKernelType(vartype::INT64, XPUPlace())})}, + {"c_sync_calc_stream", + XPUKernelSet({pOpKernelType(vartype::FP32, XPUPlace())})}, {"c_sync_comm_stream", XPUKernelSet({pOpKernelType(vartype::FP32, XPUPlace())})}, {"cast",