fix a bug in nlp: text_matching/sentence_transformers when last dim is 1 and reduce mid dim (#34941)

fix a bug in nlp: text_matching/sentence_transformers when last dim is 1 and reduce mid dim (#34941)

fix a bug in nlp: text_matching/sentence_transformers when last dim is 1 and reduce mid dim (#34941)
fix a bug in nlp: text_matching/sentence_transformers when last dim is 1 and reduce mid dim (#34941)
181f7cec · niuliling123 · GitHub · ed6624ab · 181f7cec
隐藏空白更改
内联并排

Showing 1 changed file with 2 additions and 2 deletions

paddle/fluid/operators/reduce_ops/reduce_op.cu.h paddle/fluid/operators/reduce_ops/reduce_op.cu.h +2 -2

未找到文件。
--- a/paddle/fluid/operators/reduce_ops/reduce_op.cu.h
+++ b/paddle/fluid/operators/reduce_ops/reduce_op.cu.h
@@ -770,7 +770,7 @@ void TensorReduceFunctorImpl(const framework::Tensor& x, framework::Tensor* y,
  auto x_dim = framework::vectorize<int>(x.dims());
  auto config = ReduceConfig<Ty>(origin_reduce_dims, x_dim);
  config.Run();  // get the parameters of LaunchReduceKernel
+  int numel = x.numel();
  // after config.run()
  // SetOutputData for ReduceHigherDim when should_reduce_again is true,
  // temp_output should be stored temp_data in output_data space or stored in
@@ -787,7 +787,7 @@ void TensorReduceFunctorImpl(const framework::Tensor& x, framework::Tensor* y,
  }
  config.SetOutputData(y_data, x.place(), &tmp);
-  bool use_cub_reduce = (config.left_num == 1) &&
+  bool use_cub_reduce = (config.reduce_num == numel) &&
                        (!std::is_same<Tx, paddle::platform::float16>::value);
  if (use_cub_reduce) {
    // launch CUB::Reduce