Unverified commit ccab0e2a, authored by 傅剑寒, committed by GitHub

fix uniform_rand_kernel FP16 support in dygraph mode (#46212)

Parent: 596d8209
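A minimal sketch of the call this commit enables, mirroring the new unit test added below (assumes a CUDA-enabled build of Paddle):

```python
# Repro sketch for the fixed path; before this commit the GPU uniform
# kernels were not registered for float16, so this call failed in
# dygraph mode.
import paddle

if paddle.is_compiled_with_cuda():
    paddle.set_device('gpu')
    out = paddle.uniform([2, 3], dtype=paddle.float16)
    print(out.dtype)  # paddle.float16
```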
In the GPU raw kernel (file name not shown in this excerpt), the `UniformGenerator<T>` functor's floating-point arguments are now wrapped in `static_cast<T>(...)`, so FP16 instantiations receive bounds converted to the element type `T` rather than raw `float` values, and `phi::dtype::float16` joins the `uniform_random_raw` registration:

```diff
@@ -74,8 +74,12 @@ void UniformRandomRawKernel(const Context& dev_ctx,
     funcs::distribution_and_transform<T>(dev_ctx, out, dist, trans);
   } else {
     // Use OP seed
-    auto func = UniformGenerator<T>(
-        min.to<float>(), max.to<float>(), seed, diag_num, diag_step, diag_val);
+    auto func = UniformGenerator<T>(static_cast<T>(min.to<float>()),
+                                    static_cast<T>(max.to<float>()),
+                                    seed,
+                                    diag_num,
+                                    diag_step,
+                                    static_cast<T>(diag_val));
     IndexKernel<T, UniformGenerator<T>>(dev_ctx, out, func);
   }
 }
@@ -87,4 +91,5 @@ PD_REGISTER_KERNEL(uniform_random_raw,
                    ALL_LAYOUT,
                    phi::UniformRandomRawKernel,
                    float,
-                   double) {}
+                   double,
+                   phi::dtype::float16) {}
```
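The casts matter because `min`, `max`, and `diag_val` arrive as `float` while the generator produces values of type `T`. A hedged sketch of the user-visible behavior follows; the `min`/`max` keyword arguments come from `paddle.uniform`'s public API rather than from this diff, so treat the exact signature as an assumption:

```python
# Sketch: with float16 registered, the float bounds are cast to the
# output dtype on the GPU. The min/max keyword names are assumed from
# paddle.uniform's public API, not taken from this diff.
import paddle

if paddle.is_compiled_with_cuda():
    paddle.set_device('gpu')
    out = paddle.uniform([2, 3], min=-1.0, max=1.0, dtype=paddle.float16)
    assert out.dtype == paddle.float16
    vals = out.astype('float32')  # cast up before reducing, for the check
    assert float(vals.min()) >= -1.0 and float(vals.max()) <= 1.0
```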
In the kernel registration source (file name not shown in this excerpt), the GPU registration of `uniform_random` likewise gains `phi::dtype::float16`:

```diff
@@ -51,8 +51,13 @@ PD_REGISTER_KERNEL(uniform_random,
                    phi::dtype::bfloat16) {}
 
 #if defined(PADDLE_WITH_CUDA) || defined(PADDLE_WITH_HIP)
-PD_REGISTER_KERNEL(
-    uniform_random, GPU, ALL_LAYOUT, phi::UniformRandomKernel, float, double) {}
+PD_REGISTER_KERNEL(uniform_random,
+                   GPU,
+                   ALL_LAYOUT,
+                   phi::UniformRandomKernel,
+                   float,
+                   double,
+                   phi::dtype::float16) {}
 #endif
 
 #ifdef PADDLE_WITH_XPU
```
In the Python unit test (file name not shown in this excerpt), `TestUniformDtype` gains a dygraph FP16 case that runs only on CUDA builds:

```diff
@@ -585,8 +585,17 @@ class TestUniformDtype(unittest.TestCase):
             out = paddle.tensor.random.uniform([2, 3])
             self.assertEqual(out.dtype, fluid.core.VarDesc.VarType.FP64)
 
+        def test_dygraph_fp16():
+            if not paddle.is_compiled_with_cuda():
+                paddle.enable_static()
+                return
+            paddle.set_device('gpu')
+            out = paddle.uniform([2, 3], dtype=paddle.float16)
+            self.assertEqual(out.dtype, fluid.core.VarDesc.VarType.FP16)
+
         test_default_fp64()
         test_default_fp32()
+        test_dygraph_fp16()
 
         paddle.enable_static()
```
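One way to exercise the updated checks locally; the test module's path is truncated in this excerpt, so the module name below is a placeholder:

```python
# Sketch: load and run the dtype tests by name. "test_uniform_random_op"
# is an assumed module name -- the actual file path is not shown above.
import unittest

if __name__ == "__main__":
    suite = unittest.defaultTestLoader.loadTestsFromName(
        "test_uniform_random_op.TestUniformDtype")
    unittest.TextTestRunner(verbosity=2).run(suite)
```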