提交 4b9e15bd 编写于 作者: J Juncheng 提交者: Li Xinqi

Fix remove check kernel (#2553)

* op_conf

* op

* of_format

* kernel util

* empty kernel

* unique_with_counts

* py

* gpu pass

* refine

* iter

* fix type seq

* fix

* cpu pass

* remove check kernel
上级 2454b240
......@@ -166,16 +166,6 @@ __global__ void IotaKernel(int64_t n, IDX* out) {
CUDA_1D_KERNEL_LOOP_T(IDX, i, n) { out[i] = static_cast<IDX>(i); }
}
// Validation kernel: performs device-side asserts only and writes to none of
// its arguments. Elsewhere in this file it is launched from UniqueWithCounts
// right after the CUB call, on the same stream.
//
// Parameters:
//   n          - number of elements the loop macro iterates over.
//   in         - input keys; in[i] is compared against the key it maps to.
//   num_unique - pointer to a single IDX value; dereferenced inside the kernel
//                as the exclusive upper bound for entries of idx_out.
//   unique_out - key array indexed by entries of idx_out.
//   idx_out    - for each i, the position in unique_out expected to hold in[i].
//
// NOTE(review): the asserts are presumably compiled out when NDEBUG is
// defined, leaving an empty loop body - confirm against the build flags.
template<typename KEY, typename IDX>
__global__ void CheckKernel(const int64_t n, const KEY* in, const IDX* num_unique,
const KEY* unique_out, const IDX* idx_out) {
// CUDA_1D_KERNEL_LOOP is defined outside this view; it supplies the element
// index i bounded by n.
CUDA_1D_KERNEL_LOOP(i, n) {
IDX idx = idx_out[i];
// The mapped index must be below the unique count. Only the upper bound is
// checked here; a negative idx would pass and then index unique_out below.
assert(idx < *num_unique);
// The unique entry selected by idx must equal the original input key.
assert(unique_out[idx] == in[i]);
}
}
} // namespace
template<typename KEY, typename IDX>
......@@ -229,9 +219,6 @@ void UniqueKernelUtil<DeviceType::kGPU, KEY, IDX>::UniqueWithCounts(
PermutationIterator<IDX, IDX*, IDX*>>(
cub_temp_storage.ptr, cub_temp_storage.size_in_bytes, unique_counting_iter, remapping_iter, n,
ctx->cuda_stream()));
CheckKernel<KEY, IDX>
<<<BlocksNum4ThreadsNum(n), kCudaThreadsNumPerBlock, 0, ctx->cuda_stream()>>>(
n, in, num_unique, unique_out, idx_out);
}
template<typename KEY, typename IDX>
......
Markdown is supported
0% .
You are about to add 0 people to the discussion. Proceed with caution.
先完成此消息的编辑!
想要评论请 注册