[kunlun] bugfix for collective softmax_with_ce (#52565)

075d6b14 · jameszhang · GitHub · d947b20a · 075d6b14
隐藏空白更改
内联并排

Showing 1 changed file with 6 additions and 0 deletions

paddle/fluid/operators/collective/c_softmax_with_cross_entropy_op_xpu.cc +6 -0

未找到文件。
--- a/paddle/fluid/operators/collective/c_softmax_with_cross_entropy_op_xpu.cc
+++ b/paddle/fluid/operators/collective/c_softmax_with_cross_entropy_op_xpu.cc
@@ -144,6 +144,12 @@ struct CSoftmaxWithCrossEntropyProcessGroupFunctor<phi::XPUContext, T> {
    phi::DenseTensor predicted_logits;
    predicted_logits =
        ctx.AllocateTmpTensor<T, phi::XPUContext>({N, 1}, dev_ctx);
+    ret = xpu::constant<XPUType>(
+        dev_ctx.x_context(),
+        reinterpret_cast<XPUType*>(predicted_logits.data<T>()),
+        N,
+        0.0);
+    PADDLE_ENFORCE_XDNN_SUCCESS(ret, "constant");
    const int start_index = rank * D;
    const int end_index = start_index + D;
    const auto& label_type = framework::TransToProtoVarType(labels->dtype());