# test_imperative_checkpoint.py
# Copyright (c) 2018 PaddlePaddle Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

import shutil
import tempfile
import unittest

import numpy as np

import paddle
import paddle.fluid as fluid
from paddle.fluid import Conv2D, Pool2D, FC, core
from paddle.fluid.dygraph.base import to_variable
from paddle.fluid.optimizer import SGDOptimizer


class SimpleImgConvPool(fluid.Layer):
    """A ``Conv2D`` layer immediately followed by a ``Pool2D`` layer.

    Args:
        name_scope: scope name handed to the ``fluid.Layer`` base class.
        num_filters: forwarded to ``Conv2D`` as ``num_filters``.
        filter_size: forwarded to ``Conv2D`` as ``filter_size``.
        pool_size: forwarded to ``Pool2D`` as ``pool_size``.
        pool_stride: forwarded to ``Pool2D`` as ``pool_stride``.
        pool_padding: forwarded to ``Pool2D`` as ``pool_padding``.
        pool_type: forwarded to ``Pool2D`` as ``pool_type``.
        global_pooling: forwarded to ``Pool2D`` as ``global_pooling``.
        conv_stride: forwarded to ``Conv2D`` as ``stride``.
        conv_padding: forwarded to ``Conv2D`` as ``padding``.
        conv_dilation: forwarded to ``Conv2D`` as ``dilation``.
        conv_groups: forwarded to ``Conv2D`` as ``groups``.
        act: activation forwarded to ``Conv2D`` as ``act``.
        use_cudnn: forwarded to both ``Conv2D`` and ``Pool2D``.
        param_attr: forwarded to ``Conv2D`` as ``param_attr``.
        bias_attr: forwarded to ``Conv2D`` as ``bias_attr``.
    """

    def __init__(self,
                 name_scope,
                 num_filters,
                 filter_size,
                 pool_size,
                 pool_stride,
                 pool_padding=0,
                 pool_type='max',
                 global_pooling=False,
                 conv_stride=1,
                 conv_padding=0,
                 conv_dilation=1,
                 conv_groups=1,
                 act=None,
                 use_cudnn=False,
                 param_attr=None,
                 bias_attr=None):
        super(SimpleImgConvPool, self).__init__(name_scope)

        # Forward ``act``, ``param_attr`` and ``bias_attr`` to the convolution.
        # They used to be accepted by this constructor and then silently
        # dropped, so a caller's ``act="relu"`` had no effect.
        self._conv2d = Conv2D(
            self.full_name(),
            num_filters=num_filters,
            filter_size=filter_size,
            stride=conv_stride,
            padding=conv_padding,
            dilation=conv_dilation,
            groups=conv_groups,
            param_attr=param_attr,
            bias_attr=bias_attr,
            act=act,
            use_cudnn=use_cudnn)

        self._pool2d = Pool2D(
            self.full_name(),
            pool_size=pool_size,
            pool_type=pool_type,
            pool_stride=pool_stride,
            pool_padding=pool_padding,
            global_pooling=global_pooling,
            use_cudnn=use_cudnn)

    def forward(self, inputs):
        """Apply the convolution, then the pooling, and return the result."""
        x = self._conv2d(inputs)
        x = self._pool2d(x)
        return x


class MNIST(fluid.Layer):
    """Two ``SimpleImgConvPool`` stages followed by a softmax ``FC`` layer."""

    def __init__(self, name_scope):
        super(MNIST, self).__init__(name_scope)

        # Sub-layers are created in the same order as they are applied.
        self._simple_img_conv_pool_1 = SimpleImgConvPool(
            self.full_name(),
            num_filters=20,
            filter_size=5,
            pool_size=2,
            pool_stride=2,
            act="relu")

        self._simple_img_conv_pool_2 = SimpleImgConvPool(
            self.full_name(),
            num_filters=50,
            filter_size=5,
            pool_size=2,
            pool_stride=2,
            act="relu")

        # Standard deviation of the normal initializer used for the FC
        # weights, derived from the two constants below.
        # NOTE(review): 50 * 4 * 4 is presumably the flattened size of the
        # second pooling output for 28x28 inputs -- confirm.
        num_classes = 10
        flattened_size = 50 * 4 * 4
        init_std = (2.0 / (flattened_size**2 * num_classes))**0.5

        fc_weight_attr = fluid.param_attr.ParamAttr(
            initializer=fluid.initializer.NormalInitializer(
                loc=0.0, scale=init_std))
        self._fc = FC(self.full_name(),
                      num_classes,
                      param_attr=fc_weight_attr,
                      act="softmax")

    def forward(self, inputs):
        """Run ``inputs`` through both conv/pool stages and the FC layer."""
        stage_1 = self._simple_img_conv_pool_1(inputs)
        stage_2 = self._simple_img_conv_pool_2(stage_1)
        return self._fc(stage_2)


class TestDygraphCheckpoint(unittest.TestCase):
    """Checks that dygraph parameters survive a save/load round trip."""

    def reader_decorator(self, reader):
        """Wrap ``reader`` so every sample becomes an ``(image, label)`` pair.

        Args:
            reader: zero-argument callable returning an iterable of items;
                ``item[0]`` is used as the image and ``item[1]`` as the label.

        Returns:
            A zero-argument generator function. Each yielded image is an
            ndarray reshaped to ``(1, 28, 28)`` and each label is an int64
            ndarray of shape ``(1,)``.
        """

        def _reader_imple():
            for item in reader():
                image = np.array(item[0]).reshape(1, 28, 28)
                label = np.array(item[1]).astype('int64').reshape(1)
                yield image, label

        return _reader_imple

    def test_save_load_persistables(self):
        """Train a few batches, checkpointing and reloading after each one.

        After every optimizer step the model's state dict is saved, loaded
        back and compared against the live parameter values. Loading from a
        missing directory must raise ``IOError``.
        """
        seed = 90
        epoch_num = 1
        batch_size = 128

        # Write checkpoints to a throwaway directory so the test leaves
        # nothing behind in the working directory.
        save_dir = tempfile.mkdtemp()
        self.addCleanup(shutil.rmtree, save_dir, ignore_errors=True)

        with fluid.dygraph.guard():
            fluid.default_startup_program().random_seed = seed
            fluid.default_main_program().random_seed = seed

            mnist = MNIST("mnist")
            sgd = SGDOptimizer(learning_rate=1e-3)

            batch_py_reader = fluid.io.PyReader(capacity=1)
            batch_py_reader.decorate_sample_list_generator(
                paddle.batch(
                    self.reader_decorator(paddle.dataset.mnist.train()),
                    batch_size=batch_size,
                    drop_last=True),
                places=fluid.CPUPlace())

            dy_param_init_value = {}

            for _ in range(epoch_num):
                for batch_id, data in enumerate(batch_py_reader()):
                    img = data[0]
                    label = data[1]
                    label.stop_gradient = True

                    cost = mnist(img)
                    loss = fluid.layers.cross_entropy(cost, label)
                    avg_loss = fluid.layers.mean(loss)

                    avg_loss.backward()
                    sgd.minimize(avg_loss)
                    fluid.dygraph.save_persistables(mnist.state_dict(),
                                                    save_dir)
                    mnist.clear_gradients()

                    # Snapshot the live parameters to compare against the
                    # values read back from disk.
                    for param in mnist.parameters():
                        dy_param_init_value[param.name] = param.numpy()

                    restore, _ = fluid.dygraph.load_persistables(save_dir)

                    self.assertRaises(IOError, fluid.dygraph.load_persistables,
                                      "not_exist_dir")

                    mnist.load_dict(restore)

                    self.assertEqual(len(dy_param_init_value), len(restore))
                    for value in restore.values():
                        restored = value.numpy()
                        self.assertTrue(
                            np.allclose(restored, dy_param_init_value[
                                value.name]))
                        # Test element-wise first and reduce afterwards.
                        # Reducing the array to one bool before calling
                        # isfinite/isnan made these checks unable to fail.
                        self.assertTrue(np.isfinite(restored).all())
                        self.assertFalse(np.isnan(restored).any())

                    # A handful of batches is enough for this check.
                    if batch_id > 10:
                        break


# Run the test cases when this file is executed directly as a script.
if __name__ == '__main__':
    unittest.main()