Fix remove check kernel (#2553)

* op_conf
* op
* of_format
* kernel util
* empty kernel
* unique_with_counts
* py
* gpu pass
* refine
* iter
* fix type seq
* fix
* cpu pass
* remove check kernel

Fix remove check kernel (#2553)
* op_conf * op * of_format * kernel util * empty kernel * unique_with_counts * py * gpu pass * refine * iter * fix type seq * fix * cpu pass * remove check kernel
4b9e15bd · Juncheng · Li Xinqi · 2454b240 · 4b9e15bd
隐藏空白更改
内联并排

Showing 1 changed file with 0 additions and 13 deletions

oneflow/core/kernel/unique_kernel_util.cu +0 -13

未找到文件。
--- a/oneflow/core/kernel/unique_kernel_util.cu
+++ b/oneflow/core/kernel/unique_kernel_util.cu
@@ -166,16 +166,6 @@ __global__ void IotaKernel(int64_t n, IDX* out) {
  CUDA_1D_KERNEL_LOOP_T(IDX, i, n) { out[i] = static_cast<IDX>(i); }
 }

-template<typename KEY, typename IDX>
-__global__ void CheckKernel(const int64_t n, const KEY* in, const IDX* num_unique,
-                            const KEY* unique_out, const IDX* idx_out) {
-  CUDA_1D_KERNEL_LOOP(i, n) {
-    IDX idx = idx_out[i];
-    assert(idx < *num_unique);
-    assert(unique_out[idx] == in[i]);
-  }
-}
-
 }  // namespace

 template<typename KEY, typename IDX>
@@ -229,9 +219,6 @@ void UniqueKernelUtil<DeviceType::kGPU, KEY, IDX>::UniqueWithCounts(
                                          PermutationIterator<IDX, IDX*, IDX*>>(
      cub_temp_storage.ptr, cub_temp_storage.size_in_bytes, unique_counting_iter, remapping_iter, n,
      ctx->cuda_stream()));
-  CheckKernel<KEY, IDX>
-      <<<BlocksNum4ThreadsNum(n), kCudaThreadsNumPerBlock, 0, ctx->cuda_stream()>>>(
-          n, in, num_unique, unique_out, idx_out);
 }

 template<typename KEY, typename IDX>