Commit 42dd5da0 authored by Markus Kliegl

conv shift: fix return before syncthreads

Parent 3dc88342
@@ -62,19 +62,19 @@ __global__ void ConvShiftForward(const T *x, const T *y, T *out, int x_width,
   if (tx < num_x) {
     int load_i = (i - y_half_width + x_width) % x_width;
     sx[tx] = x[k * x_width + load_i];
-  } else {
-    return;
   }
   __syncthreads();
-  // Compute dot product of sx[tx:tx + y_width] and sy.
-  T sum = 0;
-  for (int j = 0; j < y_width; ++j) {
-    sum += sx[tx + j] * sy[j];
-  }
-  // Save to out[k, i].
-  out[k * x_width + i] = sum;
+  if (tx < num_x) {
+    // Compute dot product of sx[tx:tx + y_width] and sy.
+    T sum = 0;
+    for (int j = 0; j < y_width; ++j) {
+      sum += sx[tx + j] * sy[j];
+    }
+    // Save to out[k, i].
+    out[k * x_width + i] = sum;
+  }
 }
 // Compute x gradient - initial naive implementation with atomic add.
...
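Why the change matters: __syncthreads() is a block-wide barrier, so letting some threads return from the kernel before it while the remaining threads wait at the barrier is undefined behavior. The fix keeps every thread alive through the barrier and instead guards both the shared-memory load and the subsequent compute with the same bounds check. The following is a minimal standalone sketch of that guard-both-sides pattern, not the actual conv_shift kernel; the kernel name, buffer name, and sizes are illustrative only.

#include <cstdio>
#include <cuda_runtime.h>

// Illustrative kernel (not the PaddlePaddle conv_shift kernel): every thread
// in the block must reach __syncthreads(), so out-of-range threads skip the
// load and the compute via two guarded blocks instead of returning early.
__global__ void GuardedPrefixSum(const float *in, float *out, int n) {
  extern __shared__ float buf[];
  int tx = threadIdx.x;

  if (tx < n) {
    buf[tx] = in[tx];  // in-range threads stage their element in shared memory
  }
  __syncthreads();  // barrier reached by ALL threads, in-range or not

  if (tx < n) {
    float sum = 0.0f;
    for (int j = 0; j <= tx; ++j) {
      sum += buf[j];  // inclusive prefix sum over the staged values
    }
    out[tx] = sum;
  }
}

int main() {
  const int n = 8;
  float h_in[n], h_out[n];
  for (int i = 0; i < n; ++i) h_in[i] = 1.0f;

  float *d_in = nullptr, *d_out = nullptr;
  cudaMalloc(&d_in, n * sizeof(float));
  cudaMalloc(&d_out, n * sizeof(float));
  cudaMemcpy(d_in, h_in, n * sizeof(float), cudaMemcpyHostToDevice);

  // Launch more threads than elements so the guard is actually exercised.
  GuardedPrefixSum<<<1, 32, n * sizeof(float)>>>(d_in, d_out, n);
  cudaMemcpy(h_out, d_out, n * sizeof(float), cudaMemcpyDeviceToHost);

  for (int i = 0; i < n; ++i) printf("%g ", h_out[i]);  // prints 1 2 ... 8
  printf("\n");

  cudaFree(d_in);
  cudaFree(d_out);
  return 0;
}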