# Copyright (c) 2022 PaddlePaddle Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

import unittest

import paddle
from paddle.distributed.fleet import auto

# Switch Paddle to static-graph mode at import time; make_program() below
# builds its graph through the paddle.static APIs.
paddle.enable_static()


def make_program():
    """Build a static program that applies ``paddle.shape`` to a sharded input.

    The input ``x`` is declared with shape ``[4, 4, 8]`` and annotated with the
    shard spec ``["x", None, None]`` on a two-process mesh whose only dimension
    is named ``"x"``.

    Returns:
        tuple: ``(main_program, start_program)``, the two programs that were
        active under ``program_guard`` while the graph was built.
    """
    # paddle.static.Program is the public spelling of the Program class and
    # matches the paddle.static.program_guard / paddle.static.data calls below.
    main_program = paddle.static.Program()
    start_program = paddle.static.Program()
    with paddle.static.program_guard(main_program, start_program):
        x = paddle.static.data(name='x', shape=[4, 4, 8], dtype='float32')
        x.stop_gradient = False
        auto.shard_tensor(
            x, auto.ProcessMesh([0, 1], dim_names=["x"]), ["x", None, None]
        )
        # Called for the op it records in the program (the test later looks it
        # up as the first op); the returned variable itself is not needed.
        paddle.shape(x)
    return main_program, start_program


def parallelizer(program_func, rank):
    """Annotate and partition the program produced by ``program_func``.

    Args:
        program_func: Zero-argument callable returning a
            ``(main_program, start_program)`` pair.
        rank: Rank handed to the ``Partitioner``.

    Returns:
        tuple: ``(dist_main_prog, dist_context)`` where ``dist_main_prog`` is
        the first element returned by ``Partitioner.partition`` and
        ``dist_context`` is the ``DistributedContext`` used for completion and
        partitioning.
    """
    from paddle.distributed.auto_parallel.static.completion import Completer
    from paddle.distributed.auto_parallel.static.dist_context import (
        DistributedContext,
    )
    from paddle.distributed.auto_parallel.static.partitioner import Partitioner

    main_program, start_program = program_func()

    # Complete the forward annotations, then let the context parse the
    # forward blocks before partitioning.
    dist_context = DistributedContext()
    completer = Completer(dist_context)
    completer.complete_forward_annotation(main_program)
    dist_context.block_state.parse_forward_blocks(main_program)

    partitioner = Partitioner(dist_context, rank)
    # Only the partitioned main program is needed; the empty list is the
    # third positional argument expected by partition().
    dist_main_prog, _, _ = partitioner.partition(
        main_program, start_program, []
    )

    return dist_main_prog, dist_context


class TestDistShape(unittest.TestCase):
    """Checks the distributed attributes of the op produced by ``paddle.shape``."""

    def test_dist_shape(self):
        """Partition the program for rank 0 and inspect its first op.

        Uses ``self.assertEqual`` rather than bare ``assert`` so the checks
        still run under ``python -O`` and report both values on failure.
        """
        dist_main_prog, dist_context = parallelizer(make_program, 0)
        ops = dist_main_prog.global_block().ops
        shape_op = ops[0]
        dist_op = dist_context.get_dist_op_for_program(shape_op)
        self.assertEqual(dist_op.dist_attr.impl_type, "shape")
        self.assertEqual(dist_op.dist_attr.impl_idx, 0)

        in_name = shape_op.input_arg_names[0]
        out_name = shape_op.output_arg_names[0]
        in_dims_mapping = dist_op.dist_attr.get_input_dims_mapping(in_name)
        out_dims_mapping = dist_op.dist_attr.get_output_dims_mapping(out_name)

        # Expected mappings: the input keeps the first-axis sharding requested
        # in make_program; the 1-D output carries -1.
        self.assertEqual(in_dims_mapping, [0, -1, -1])
        self.assertEqual(out_dims_mapping, [-1])

# Run the test case when this file is executed directly as a script.
if __name__ == "__main__":
    unittest.main()