diff --git a/paddle/fluid/operators/elementwise/elementwise_add_op.h b/paddle/fluid/operators/elementwise/elementwise_add_op.h index 91b6750c5972f5918689edcae70b206a68ca85f7..db5c6eca6e5068648e51052be2916553bcf57328 100644 --- a/paddle/fluid/operators/elementwise/elementwise_add_op.h +++ b/paddle/fluid/operators/elementwise/elementwise_add_op.h @@ -348,7 +348,7 @@ class ElementwiseAddGradKernel : public ElemwiseGradKernel { } else { size_t thread_nums = 1024; size_t block_nums = (width + thread_nums - 1) / thread_nums; - int vec_size = VectorizedSize(dx_data); + int vec_size = VectorizedSize(dout_data); if (vec_size == 4 && width % 4 == 0) { block_nums = (width / vec_size + thread_nums - 1) / thread_nums; VecMatrixReduceLongWidth