#   Copyright (c) 2018 PaddlePaddle Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

import paddle.fluid as fluid
K
Kexin Zhao 已提交
16
import unittest
P
pangyoki 已提交
17 18 19
import paddle

# Runs once at import time, before any test in this module executes.
# NOTE(review): presumably required because the fluid.layers.data and
# fluid.DataFeeder calls below are static-graph APIs -- confirm against the
# Paddle version in use.
paddle.enable_static()
Y
Yu Yang 已提交
20 21


K
Kexin Zhao 已提交
22 23 24 25 26 27 28 29 30
class TestDataFeeder(unittest.TestCase):
    def test_lod_level_0_converter(self):
        img = fluid.layers.data(name='image', shape=[1, 28, 28])
        label = fluid.layers.data(name='label', shape=[1], dtype='int64')
        feeder = fluid.DataFeeder([img, label], fluid.CPUPlace())
        result = feeder.feed([([0] * 784, [9]), ([1] * 784, [1])])

        self.assertEqual(result['image'].shape(), [2, 1, 28, 28])
        self.assertEqual(result['label'].shape(), [2, 1])
31 32
        self.assertEqual(result['image'].recursive_sequence_lengths(), [])
        self.assertEqual(result['label'].recursive_sequence_lengths(), [])
K
Kexin Zhao 已提交
33

S
sneaxiy 已提交
34 35 36 37 38 39
        try:
            result = feeder.feed([([0] * 783, [9]), ([1] * 783, [1])])
            self.assertTrue(False)
        except ValueError:
            self.assertTrue(True)

K
Kexin Zhao 已提交
40 41 42
    def test_lod_level_1_converter(self):
        # lod_level = 1
        # each sentence has a different number of words
43 44 45
        sentences = fluid.layers.data(
            name='sentences', shape=[1], dtype='int64', lod_level=1
        )
K
Kexin Zhao 已提交
46 47 48 49 50 51
        label = fluid.layers.data(name='label', shape=[1], dtype='int64')
        feeder = fluid.DataFeeder([sentences, label], fluid.CPUPlace())

        # lod = [[0, 3, 5, 9]]
        # data = [[1, 2, 3], [4, 5], [6, 7, 8, 9]]
        # label = [1] * len(data)
52 53 54
        result = feeder.feed(
            [([1, 2, 3], [1]), ([4, 5], [1]), ([6, 7, 8, 9], [1])]
        )
K
Kexin Zhao 已提交
55 56 57

        self.assertEqual(result['sentences'].shape(), [9, 1])
        self.assertEqual(result['label'].shape(), [3, 1])
58 59 60
        self.assertEqual(
            result['sentences'].recursive_sequence_lengths(), [[3, 2, 4]]
        )
61
        self.assertEqual(result['label'].recursive_sequence_lengths(), [])
K
Kexin Zhao 已提交
62 63 64 65

    def test_lod_level_2_converter(self):
        # lod_level = 2
        # paragraphs -> sentences -> words
66 67 68
        paragraphs = fluid.layers.data(
            name='paragraphs', shape=[1], dtype='int64', lod_level=2
        )
K
Kexin Zhao 已提交
69 70 71 72 73 74
        label = fluid.layers.data(name='label', shape=[1], dtype='int64')
        feeder = fluid.DataFeeder([paragraphs, label], fluid.CPUPlace())

        # lod = [[0, 2, 3], [0, 3, 5, 9]]
        # data = [[[1, 2, 3], [4, 5]], [[6, 7, 8, 9]]]
        # label = [1] * len(data)
75 76 77
        result = feeder.feed(
            [([[1, 2, 3], [4, 5]], [1]), ([[6, 7, 8, 9]], [1])]
        )
K
Kexin Zhao 已提交
78 79 80

        self.assertEqual(result['paragraphs'].shape(), [9, 1])
        self.assertEqual(result['label'].shape(), [2, 1])
81 82 83 84
        self.assertEqual(
            result['paragraphs'].recursive_sequence_lengths(),
            [[2, 1], [3, 2, 4]],
        )
85
        self.assertEqual(result['label'].recursive_sequence_lengths(), [])
Y
Yu Yang 已提交
86 87 88


if __name__ == '__main__':
    # Run every test case in this module when the file is executed directly.
    unittest.main()