Avoid using dynamically allocated arrays in the CUDA kernel

92cfa2be · Yibing Liu · 28a0ac53 · 92cfa2be · 92cfa2be
Show whitespace changes
Inline | Side-by-side

Showing 2 changed files with 5 additions and 6 deletions

paddle/fluid/operators/argsort_op.cc paddle/fluid/operators/argsort_op.cc +2 -2

paddle/fluid/operators/argsort_op.cu paddle/fluid/operators/argsort_op.cu +3 -4

No files found.
--- a/paddle/fluid/operators/argsort_op.cc
+++ b/paddle/fluid/operators/argsort_op.cc
@@ -38,8 +38,8 @@ class ArgsortOp : public framework::OperatorWithKernel {
                   "dimension %d.",
                   axis, num_dims);
    PADDLE_ENFORCE(in_dims.size() + axis >= 0,
-                   "Attr(axis) %d of ArgsortOp plus the number of Input(X)'s "
+                   "Attr(axis) %d of ArgsortOp plus the rank %d of Input(X) "
-                   "dimensions %d must be nonnegative.",
+                   "must be nonnegative.",
                   axis, in_dims.size());
    ctx->SetOutputDim("Out", in_dims);

--- a/paddle/fluid/operators/argsort_op.cu
+++ b/paddle/fluid/operators/argsort_op.cu
@@ -31,8 +31,9 @@ __global__ void ComputeTargetIdx(const int64_t* in_dims, int dims_size,
                                 int64_t* med_ids) {
  int64_t index = threadIdx.x + blockDim.x * blockIdx.x;
  if (index < n) {
-    int64_t* shape_out_axis = new int64_t[dims_size - 1];
+    const int max_rank = 9;  // Max rank of a tensor allow in Fluid
-    int64_t* dims_out_axis = new int64_t[dims_size - 1];
+    int64_t shape_out_axis[max_rank - 1] = {0};
+    int64_t dims_out_axis[max_rank - 1] = {0};
    int64_t tmp = index;
    int64_t pos_in_axis = 0;
    int64_t i = dims_size - 2;
@@ -57,8 +58,6 @@ __global__ void ComputeTargetIdx(const int64_t* in_dims, int dims_size,
    int64_t traget_idx = group * dim_axis + pos_in_axis;
    trg_idx[index] = traget_idx;
    med_ids[traget_idx] = pos_in_axis;
-    delete[] shape_out_axis;
-    delete[] dims_out_axis;
  }
 }