# test_imperative_data_parallel.py
# Copyright (c) 2020 PaddlePaddle Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

import unittest
import numpy as np

import paddle.fluid as fluid
import paddle.fluid.core as core
import paddle.fluid.dygraph as dygraph
from paddle.distributed import init_parallel_env
from paddle.nn import Linear


class MLP(fluid.Layer):
    """Small two-layer model used as the network under test.

    The model chains ``Linear(784, 10)`` and ``Linear(10, 10)``.
    """

    def __init__(self, param_attr=None, bias_attr=None):
        """Build the two linear sub-layers.

        Args:
            param_attr: Accepted for signature compatibility; not used by
                this model.
            bias_attr: Accepted for signature compatibility; not used by
                this model.
        """
        super().__init__()

        self._linear1 = Linear(784, 10)
        self._linear2 = Linear(10, 10)

    def forward(self, inputs):
        """Apply ``_linear1`` then ``_linear2`` to ``inputs`` and return the result."""
        y = self._linear1(inputs)
        y = self._linear2(y)
        return y


class TestDataParallelStateDict(unittest.TestCase):
    """Checks state-dict access and restoration through a DataParallel wrapper."""

    def test_data_parallel_state_dict(self):
        """Compare, zero out, and restore parameters via the parallel wrapper.

        Steps:
            1. Every entry of the plain model's state dict must appear in the
               wrapper's state dict with equal values.
            2. Each tensor reachable from the wrapper's state dict is
               overwritten with zeros and verified to be all-zero.
            3. ``set_dict`` with the saved values must bring the wrapper's
               state dict back to the original values.
            4. ``load_dict`` is called with the same values to check that it
               runs without raising.
        """
        with fluid.dygraph.guard():
            init_parallel_env()
            mlp = MLP()
            parallel_mlp = dygraph.parallel.DataParallel(mlp)

            single_state = mlp.state_dict()
            parallel_state = parallel_mlp.state_dict()

            # Snapshot of the original parameter values, keyed like the
            # state dict. NOTE(review): this relies on ``numpy()`` returning
            # data that is not affected by the zeroing below -- confirm.
            base_para = {}
            place = (
                fluid.CUDAPlace(0)
                if core.is_compiled_with_cuda()
                else fluid.CPUPlace()
            )
            for k, v in single_state.items():
                self.assertIn(k, parallel_state)

                np.testing.assert_array_equal(
                    v.numpy(), parallel_state[k].numpy()
                )

                base_para[k] = v.numpy()

            # Overwrite every parameter with zeros through its underlying
            # tensor, then confirm the change is visible via ``numpy()``.
            for v in parallel_state.values():
                np_t = v.numpy()
                var = v.value().get_tensor()
                var.set(np.zeros_like(np_t), place)

                self.assertEqual(np.sum(np.abs(v.numpy())), 0)

            parallel_mlp.set_dict(base_para)

            # Re-read the state dict after restoring and compare against
            # the snapshot taken before zeroing.
            parallel_state = parallel_mlp.state_dict()

            for k, v in parallel_state.items():
                np.testing.assert_array_equal(v.numpy(), base_para[k])

            # No assertion follows; this only exercises ``load_dict``.
            parallel_mlp.load_dict(base_para)


# Run the test cases defined in this module when the file is executed as a
# script (not when it is imported).
if __name__ == '__main__':
    unittest.main()