Fix submanifold conv (#45060)

* fix submanifold conv

Fix submanifold conv (#45060)
* fix submanifold conv
27e3b06f · zhangkaihuo · GitHub · 26c573de · 27e3b06f
显示空白变更内容
内联并排

Showing 1 changed file with 4 additions and 4 deletions

paddle/phi/kernels/sparse/gpu/conv.cu.h +4 -4

未找到文件。
--- a/paddle/phi/kernels/sparse/gpu/conv.cu.h
+++ b/paddle/phi/kernels/sparse/gpu/conv.cu.h
@@ -662,9 +662,9 @@ int ProductRuleBook(const Context& dev_ctx,
                                       dev_ctx.stream());
    dev_ctx.Wait();
-    size_t cache_size = kernel_size * 2 + kernel_size *
+    size_t cache_size =
-                                              config.thread_per_block.x * 2 *
+        kernel_size * 2 * sizeof(int) +
-                                              sizeof(int);
+        kernel_size * config.thread_per_block.x * 2 * sizeof(int);
    const int MAX_CACHE_SIZE = 48 * 1024;
    while (cache_size >= MAX_CACHE_SIZE) {
      config.thread_per_block.x /= 2;
@@ -672,7 +672,7 @@ int ProductRuleBook(const Context& dev_ctx,
      PADDLE_ENFORCE_GE(config.thread_per_block.x,
                        32,
                        phi::errors::Fatal("the shared memory is not enough"));
-      cache_size = kernel_size * 2 +
+      cache_size = kernel_size * 2 * sizeof(int) +
                   kernel_size * config.thread_per_block.x * 2 * sizeof(int);
    }
    ProductSubmRuleBookKernel<IntT><<<config.block_per_grid.x,