[cherry-pick]layer.to api support numpy.dtype and paddle.dtype (#38108)

Issue #37932 反馈 layer.to 不支持 paddle.dtype 类型的问题，本次新增了对该类型的支持，详情见 #38018。同时，也一并 cherry-pick 了遗漏的 PR #36779 的 commit。修改内容：cherry-pick #36779、cherry-pick #38018。

[cherry-pick]layer.to api support numpy.dtype and paddle.dtype (#38108)
Issue #37932 反馈 layer.to 不支持 paddle.dtype 类型的问题，本次新增了对该类型的支持，详情见 #38018。同时，也一并 cherry-pick 了遗漏的 PR #36779 的 commit。修改内容：cherry-pick #36779、cherry-pick #38018。
8100c16a · chentianyu03 · GitHub · 81469615 · 8100c16a · 8100c16a
Showing 2 changed files with 81 additions and 32 deletions

python/paddle/fluid/dygraph/layers.py python/paddle/fluid/dygraph/layers.py +35 -32

python/paddle/fluid/tests/unittests/test_base_layer.py python/paddle/fluid/tests/unittests/test_base_layer.py +46 -0

未找到文件。
--- a/python/paddle/fluid/dygraph/layers.py
+++ b/python/paddle/fluid/dygraph/layers.py
@@ -37,6 +37,7 @@ from ..param_attr import ParamAttr
 from paddle.fluid.executor import Executor, global_scope
 from paddle.fluid.framework import in_dygraph_mode, convert_np_dtype_to_dtype_
 from paddle.fluid.framework import _current_expected_place as _get_device
+from paddle.fluid.core import VarDesc
 from paddle.fluid.dygraph import no_grad
 import paddle.utils.deprecated as deprecated

@@ -1488,17 +1489,18 @@ class Layer(core.Layer):
            If None, the device is the same with the original Tensor. If device is string, it can be ``cpu``, ``gpu:x`` and ``xpu:x``, where ``x`` is the
            index of the GPUs or XPUs. Default: None.

-            dtype(str|core.VarDesc.VarType|None, optional): The type of the data. If None, the dtype is the same with the original Tensor. Default: None.
+            dtype(str|numpy.dtype|paddle.dtype|None, optional): The type of the data. If None, the dtype is the same with the original Tensor. Default: None.

            blocking(bool|None, optional): If False and the source is in pinned memory, the copy will be
              asynchronous with respect to the host. Otherwise, the argument has no effect. If None, the blocking is set True. Default: None.

        Returns:
-            None
+            self

        Examples:
            .. code-block:: python

+                # required: skip
                import paddle

                linear=paddle.nn.Linear(2, 2)
@@ -1529,7 +1531,7 @@ class Layer(core.Layer):
        '''

        if device is None and dtype is None and blocking is None:
-            return
+            return self

        if device is not None:
            if isinstance(device, str):
@@ -1555,7 +1557,7 @@ class Layer(core.Layer):
            if dtype is None:
                dtype = t.dtype

-            if type(dtype) is str:
+            if type(dtype) is not VarDesc.VarType:
                dtype = convert_np_dtype_to_dtype_(dtype)

            # 1. gpu place need to determine whether the memory is sufficient for allocation:
@@ -1604,6 +1606,7 @@ class Layer(core.Layer):
            self._apply(transform, device, dtype, blocking)

        self._dtype = dtype
+        return self

    # [aliases] Compatible with old method names
    set_dict = set_state_dict

--- a/python/paddle/fluid/tests/unittests/test_base_layer.py
+++ b/python/paddle/fluid/tests/unittests/test_base_layer.py
@@ -403,6 +403,52 @@ class TestLayerTo(unittest.TestCase):

        self.assertRaises(AssertionError, self.linear.to, blocking=1)

+    def test_to_api_paddle_dtype(self):
+        self.linear.to(dtype=paddle.float64)
+        self.assertEqual(self.linear.weight.dtype,
+                         paddle.fluid.core.VarDesc.VarType.FP64)
+        self.assertEqual(self.linear.buf_name.dtype,
+                         paddle.fluid.core.VarDesc.VarType.FP64)
+        self.assertTrue(
+            np.allclose(self.linear.weight.grad.numpy(), self.new_grad))
+        self.assertEqual(self.linear.weight._grad_ivar().dtype,
+                         paddle.fluid.core.VarDesc.VarType.FP64)
+
+        self.linear.to()
+        self.assertEqual(self.linear.weight.dtype,
+                         paddle.fluid.core.VarDesc.VarType.FP64)
+        self.assertEqual(self.linear.buf_name.dtype,
+                         paddle.fluid.core.VarDesc.VarType.FP64)
+        self.assertTrue(
+            np.allclose(self.linear.weight.grad.numpy(), self.new_grad))
+        self.assertEqual(self.linear.weight._grad_ivar().dtype,
+                         paddle.fluid.core.VarDesc.VarType.FP64)
+        for p in self.linear.parameters():
+            self.assertTrue(isinstance(p, paddle.fluid.framework.ParamBase))
+
+    def test_to_api_numpy_dtype(self):
+        self.linear.to(dtype=np.float64)
+        self.assertEqual(self.linear.weight.dtype,
+                         paddle.fluid.core.VarDesc.VarType.FP64)
+        self.assertEqual(self.linear.buf_name.dtype,
+                         paddle.fluid.core.VarDesc.VarType.FP64)
+        self.assertTrue(
+            np.allclose(self.linear.weight.grad.numpy(), self.new_grad))
+        self.assertEqual(self.linear.weight._grad_ivar().dtype,
+                         paddle.fluid.core.VarDesc.VarType.FP64)
+
+        self.linear.to()
+        self.assertEqual(self.linear.weight.dtype,
+                         paddle.fluid.core.VarDesc.VarType.FP64)
+        self.assertEqual(self.linear.buf_name.dtype,
+                         paddle.fluid.core.VarDesc.VarType.FP64)
+        self.assertTrue(
+            np.allclose(self.linear.weight.grad.numpy(), self.new_grad))
+        self.assertEqual(self.linear.weight._grad_ivar().dtype,
+                         paddle.fluid.core.VarDesc.VarType.FP64)
+        for p in self.linear.parameters():
+            self.assertTrue(isinstance(p, paddle.fluid.framework.ParamBase))
+

 if __name__ == '__main__':
    unittest.main()