diff --git a/paddle/phi/kernels/gpu/cumsum_kernel.cu b/paddle/phi/kernels/gpu/cumsum_kernel.cu index ed131e0ff541303a88524cece1bc1658ea28263d..460aa37f8f9952f3288df9882b593fca171b4ce1 100644 --- a/paddle/phi/kernels/gpu/cumsum_kernel.cu +++ b/paddle/phi/kernels/gpu/cumsum_kernel.cu @@ -263,8 +263,9 @@ void CumsumKernel(const Context& dev_ctx, dim3 blocks(32, 8); dim3 transpose_grids((width + tile_size - 1) / tile_size, (height + tile_size - 1) / tile_size); - out->Resize(out_dims); - auto* tmp_data = out->data(); + DenseTensor tmp_tensor; + tmp_tensor.Resize(out_dims); + auto* tmp_data = dev_ctx.template Alloc(&tmp_tensor); T* next_in_data = out_data; T* next_out_data = tmp_data;