fix c_embedding bug (#52742)

4a790cba · Chitsing KUI · GitHub · 94a8177f · 4a790cba
隐藏空白更改
内联并排

Showing 1 changed file with 6 additions and 0 deletions

paddle/fluid/operators/collective/c_embedding_op.cu +6 -0

未找到文件。
--- a/paddle/fluid/operators/collective/c_embedding_op.cu
+++ b/paddle/fluid/operators/collective/c_embedding_op.cu
@@ -19,6 +19,8 @@ limitations under the License. */
 #include "paddle/fluid/platform/float16.h"
 #include "paddle/phi/backends/gpu/gpu_primitives.h"

+DECLARE_bool(cudnn_deterministic);
+
 namespace paddle {
 namespace operators {

@@ -164,6 +166,10 @@ class CEmbeddingGradCUDAKernel : public framework::OpKernel<T> {
    t.device(*dev_ctx.eigen_device()) = t.constant(static_cast<T>(0));

    const auto &index_type = framework::TransToProtoVarType(ids_t->dtype());
+    if (FLAGS_cudnn_deterministic) {
+      VLOG(2) << "Run grad kernel of embedding with single thread.";
+      blocks = 1;
+    }
    if (index_type == framework::proto::VarType::INT32) {
      CEmbeddingGrad<T, int32_t>
          <<<blocks, threads, 0, dev_ctx.stream()>>>(d_table,