未验证 提交 9f1f1b0a 编写于 作者: H houj04 提交者: GitHub

[XPU] c_allreduce support int. update bkcl to 1.0.5. test=kunlun (#45248)

上级 3deab77f
@@ -25,7 +25,7 @@ else()
 endif()
 set(XPU_XCCL_BASE_URL
-"https://klx-sdk-release-public.su.bcebos.com/xccl/release/1.0.4")
+"https://klx-sdk-release-public.su.bcebos.com/xccl/release/1.0.5")
 if(WITH_AARCH64)
 set(XPU_XRE_DIR_NAME "xre-kylin_aarch64")
......
@@ -19,4 +19,5 @@ namespace plat = paddle::platform;
 REGISTER_OP_XPU_KERNEL(c_allreduce_sum,
 ops::CAllReduceOpXPUKernel<ops::kRedSum, float>,
-ops::CAllReduceOpXPUKernel<ops::kRedSum, plat::float16>)
+ops::CAllReduceOpXPUKernel<ops::kRedSum, plat::float16>,
+ops::CAllReduceOpXPUKernel<ops::kRedSum, int>)
@@ -80,13 +80,16 @@ XPUOpMap& get_kl2_ops() {
 pOpKernelType(vartype::INT64, XPUPlace())})},
 {"c_allreduce_sum",
 XPUKernelSet({pOpKernelType(vartype::FP16, XPUPlace()),
-pOpKernelType(vartype::FP32, XPUPlace())})},
+pOpKernelType(vartype::FP32, XPUPlace()),
+pOpKernelType(vartype::INT32, XPUPlace())})},
 {"c_identity",
 XPUKernelSet({pOpKernelType(vartype::FP16, XPUPlace()),
 pOpKernelType(vartype::FP32, XPUPlace()),
 pOpKernelType(vartype::FP64, XPUPlace()),
 pOpKernelType(vartype::INT32, XPUPlace()),
 pOpKernelType(vartype::INT64, XPUPlace())})},
+{"c_sync_calc_stream",
+XPUKernelSet({pOpKernelType(vartype::FP32, XPUPlace())})},
 {"c_sync_comm_stream",
 XPUKernelSet({pOpKernelType(vartype::FP32, XPUPlace())})},
 {"cast",
......
Markdown is supported
0% .
You are about to add 0 people to the discussion. Proceed with caution.
先完成此消息的编辑!
想要评论请 注册