diff --git a/paddle/fluid/operators/collective/c_allreduce_max_op.cu.cc b/paddle/fluid/operators/collective/c_allreduce_max_op.cu.cc index 6ac228ca53dd5183c8a7f24d3aaf7b2ac04bb1fb..9be9674bb082bd1b5f6890f422521626d6da232b 100644 --- a/paddle/fluid/operators/collective/c_allreduce_max_op.cu.cc +++ b/paddle/fluid/operators/collective/c_allreduce_max_op.cu.cc @@ -28,7 +28,11 @@ PD_REGISTER_STRUCT_KERNEL(c_allreduce_max, ALL_LAYOUT, ops::CAllReduceMaxCUDAKernel, float, +#if NCCL_VERSION_CODE >= 21000 + plat::bfloat16, +#endif double, int, int64_t, - plat::float16) {} + plat::float16) { +} diff --git a/paddle/fluid/operators/collective/c_split_op.cu b/paddle/fluid/operators/collective/c_split_op.cu index c128a212739b6a33f14ea87d6759d33fc8f381a7..b01ed790e851715063312336b3eeae18b0382a26 100644 --- a/paddle/fluid/operators/collective/c_split_op.cu +++ b/paddle/fluid/operators/collective/c_split_op.cu @@ -123,4 +123,8 @@ PD_REGISTER_STRUCT_KERNEL(c_split, double, int, int64_t, - plat::float16) {} +#if NCCL_VERSION_CODE >= 21000 + plat::bfloat16, +#endif + plat::float16) { +} diff --git a/paddle/fluid/operators/collective/partial_allgather_op.cu.cc b/paddle/fluid/operators/collective/partial_allgather_op.cu.cc index 94ad2432e46ff8d928a5959347d6b11ff13c0127..ce5a5438eff55515a28dec9d7f633d27df5e390f 100644 --- a/paddle/fluid/operators/collective/partial_allgather_op.cu.cc +++ b/paddle/fluid/operators/collective/partial_allgather_op.cu.cc @@ -104,6 +104,9 @@ namespace plat = paddle::platform; REGISTER_OP_CUDA_KERNEL(partial_allgather, ops::PartialAllGatherOpCUDAKernel, +#if NCCL_VERSION_CODE >= 21000 + ops::PartialAllGatherOpCUDAKernel, +#endif ops::PartialAllGatherOpCUDAKernel, ops::PartialAllGatherOpCUDAKernel, ops::PartialAllGatherOpCUDAKernel, diff --git a/paddle/fluid/operators/collective/partial_recv_op.cu.cc b/paddle/fluid/operators/collective/partial_recv_op.cu.cc index f9fb0ce1862324617d1b3474f070fcdfd5009a0f..306175d1ca7af8d5e4768b488bfa0c7a417ed344 100644 --- a/paddle/fluid/operators/collective/partial_recv_op.cu.cc +++ b/paddle/fluid/operators/collective/partial_recv_op.cu.cc @@ -120,6 +120,9 @@ namespace plat = paddle::platform; REGISTER_OP_CUDA_KERNEL(partial_recv, ops::PartialRecvOpCUDAKernel, +#if NCCL_VERSION_CODE >= 21000 + ops::PartialRecvOpCUDAKernel, +#endif ops::PartialRecvOpCUDAKernel, ops::PartialRecvOpCUDAKernel, ops::PartialRecvOpCUDAKernel, diff --git a/paddle/fluid/operators/collective/partial_send_op.cu.cc b/paddle/fluid/operators/collective/partial_send_op.cu.cc index c73fa779c506930876794773e8abd4a7d81dfdf9..afac7f963fa0dc6107938db7b67c5164e512039e 100644 --- a/paddle/fluid/operators/collective/partial_send_op.cu.cc +++ b/paddle/fluid/operators/collective/partial_send_op.cu.cc @@ -120,6 +120,9 @@ namespace plat = paddle::platform; REGISTER_OP_CUDA_KERNEL(partial_send, ops::PartialSendCUDAKernel, ops::PartialSendCUDAKernel, +#if NCCL_VERSION_CODE >= 21000 + ops::PartialSendCUDAKernel, +#endif ops::PartialSendCUDAKernel, ops::PartialSendCUDAKernel, ops::PartialSendCUDAKernel);