Fix bug in the fp32 batch_norm op when using the NHWC data_layout (#37020)

0666b858 · Guoxia Wang · GitHub · cde335a1 · 0666b858
显示空白变更内容
内联并排

Showing 1 changed file with 1 addition and 1 deletion

paddle/fluid/operators/batch_norm_op.cu +1 -1

未找到文件。
--- a/paddle/fluid/operators/batch_norm_op.cu
+++ b/paddle/fluid/operators/batch_norm_op.cu
@@ -916,7 +916,7 @@ class BatchNormGradKernel<platform::CUDADeviceContext, T>
    Tensor transformed_d_y(d_y->type());
    Tensor transformed_d_x;
    if (data_layout == DataLayout::kNHWC &&
-        compute_format == DataLayout::kNCHW) {
+        compute_format == DataLayout::kNCHW && x_dims.size() > 2) {
      VLOG(3) << "Transform input tensor from NHWC to NCHW.";
      ResizeToChannelFirst<platform::CUDADeviceContext, T>(ctx, x,
                                                           &transformed_x);