# test_fleet_base_2.py
# Copyright (c) 2020 PaddlePaddle Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

import os
import shutil
import tempfile
import unittest

import paddle
import paddle.fluid as fluid

paddle.enable_static()


class TestFleetBase(unittest.TestCase):
    """Fleet test in non-collective mode, run from the point of view of a trainer.

    The test builds a small static network, minimizes it through
    ``fleet.distributed_optimizer`` and then exercises the fleet save/load
    entry points, including several calls that are expected to raise.
    """

    def setUp(self):
        """Publish the cluster layout through environment variables.

        The process environment is snapshotted first and restored when the
        test finishes, so the variables set here (and later in the test
        body) do not leak into other tests. A private scratch directory is
        created for model artifacts and removed on cleanup.
        """
        # Register the restore before mutating anything so that a failure
        # part-way through setUp still puts the environment back.
        self.addCleanup(self._restore_env, dict(os.environ))

        os.environ["POD_IP"] = "127.0.0.1"
        os.environ["PADDLE_PORT"] = "36000"
        os.environ["PADDLE_TRAINERS_NUM"] = "2"
        os.environ["PADDLE_PSERVERS_IP_PORT_LIST"] = \
            "127.0.0.1:36001,127.0.0.2:36001"

        # Per-test directory instead of a shared, hard-coded "/tmp".
        self.model_dir = tempfile.mkdtemp()
        self.addCleanup(shutil.rmtree, self.model_dir, ignore_errors=True)

    @staticmethod
    def _restore_env(saved_env):
        """Reset ``os.environ`` to the mapping captured in ``saved_env``."""
        os.environ.clear()
        os.environ.update(saved_env)

    def test_ps_minimize(self):
        """Minimize a small network via fleet, then exercise save/load paths."""
        import paddle.distributed.fleet as fleet

        # Role information consumed by PaddleCloudRoleMaker below.
        os.environ["TRAINING_ROLE"] = "TRAINER"
        os.environ["PADDLE_TRAINER_ID"] = "1"

        # Network inputs: a dense feature, a sparse slot id and the label.
        input_x = fluid.layers.data(name="x", shape=[32], dtype='float32')
        input_slot = fluid.layers.data(name="slot", shape=[1], dtype='int64')
        input_y = fluid.layers.data(name="y", shape=[1], dtype='int64')

        # Sparse embedding of the slot, concatenated onto the dense input.
        emb = fluid.layers.embedding(
            input=input_slot, size=[10, 9], is_sparse=True)
        input_x = paddle.concat(x=[input_x, emb], axis=1)

        # Two tanh hidden layers followed by a 2-way softmax classifier.
        fc_1 = fluid.layers.fc(input=input_x, size=64, act='tanh')
        fc_2 = fluid.layers.fc(input=fc_1, size=64, act='tanh')
        prediction = fluid.layers.fc(input=[fc_2], size=2, act='softmax')
        cost = fluid.layers.cross_entropy(input=prediction, label=input_y)
        avg_cost = fluid.layers.mean(x=cost)

        role = fleet.PaddleCloudRoleMaker(is_collective=False)
        fleet.init(role)

        strategy = fleet.DistributedStrategy()
        strategy.a_sync = False
        strategy.a_sync_configs = {"launch_barrier": False}

        optimizer = paddle.optimizer.SGD(learning_rate=0.001)
        optimizer = fleet.distributed_optimizer(optimizer, strategy=strategy)
        optimizer.minimize(avg_cost)

        place = fluid.CPUPlace()
        exe = fluid.Executor(place)
        exe.run(paddle.static.default_startup_program())

        # These two objects are only used as deliberately unsupported
        # arguments in the assertRaises checks further down.
        pe = fluid.ParallelExecutor(use_cuda=False, loss_name=avg_cost.name)
        compiled_prog = fluid.compiler.CompiledProgram(
            fluid.default_main_program())

        fleet.init_worker()

        model_dir = self.model_dir

        # Save with feeds given by name, by variable, and with no feed/fetch.
        fleet.fleet.save(dirname=model_dir, feed=['x', 'y'], fetch=[avg_cost])
        # NOTE(review): input_x was rebound to the concat output above, so
        # this passes the concatenated tensor rather than the raw "x"
        # placeholder - confirm that this is intended.
        fleet.fleet.save(
            dirname=model_dir, feed=[input_x, input_y], fetch=[avg_cost])
        fleet.fleet.save(dirname=model_dir)

        fleet.load_model(path=model_dir, mode=0)

        # Each call below is expected to raise: a string in place of an
        # executor, a ParallelExecutor, or a CompiledProgram as main_program.
        self.assertRaises(
            Exception,
            fleet.save_inference_model,
            dirname=model_dir,
            feeded_var_names=['x', 'y'],
            target_vars=[avg_cost],
            executor="exe")

        self.assertRaises(
            Exception,
            fleet.save_inference_model,
            dirname=model_dir,
            feeded_var_names=['x', 'y'],
            target_vars=[avg_cost],
            executor=exe,
            main_program=compiled_prog)

        self.assertRaises(
            Exception, fleet.save_persistables, executor=pe, dirname=model_dir)

        self.assertRaises(
            Exception,
            fleet.save_persistables,
            executor="exe",
            dirname=model_dir)

        self.assertRaises(
            Exception,
            fleet.save_persistables,
            executor=exe,
            dirname=model_dir,
            main_program=compiled_prog)


if __name__ == "__main__":
    # Run this module's test cases when it is executed directly as a script.
    unittest.main()