#   Copyright (c) 2018 PaddlePaddle Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

15 16
from __future__ import print_function

Q
qijun 已提交
17 18
import unittest
import numpy as np
Q
qijun 已提交
19
from op_test import OpTest
20
import paddle.fluid.core as core
21 22
import paddle.fluid as fluid
from paddle.fluid import compiler, Program, program_guard
Q
qijun 已提交
23 24 25 26


def stable_softmax(x):
    """Compute the softmax of vector x in a numerically stable way.

    The maximum of ``x`` is subtracted before exponentiation so the largest
    exponent is 0, and the shifted values are clipped from below at -64.

    Args:
        x: numpy array of scores. ``np.max`` / ``np.sum`` are taken over the
            whole array, so callers pass one 1-D slice at a time.

    Returns:
        numpy array with the same shape as ``x`` whose entries sum to 1.
    """
    # Clip the shifted values: without the lower bound exp(shiftx) can
    # underflow to 0, and a later log(exp(shiftx)) in a loss would hit log(0).
    shiftx = (x - np.max(x)).clip(-64.)
    exps = np.exp(shiftx)
    return exps / np.sum(exps)


Q
qijun 已提交
34
class TestSoftmaxOp(OpTest):
    """Base test case for the ``softmax`` operator.

    Subclasses customise a case by overriding ``get_x_shape``, ``get_axis``
    and ``init_kernel_type``; ``setUp`` reads all three.
    """

    def get_x_shape(self):
        """Return the shape of the random input ``X``."""
        return [10, 10]

    def get_axis(self):
        """Return the axis along which softmax is computed."""
        return -1

    def setUp(self):
        """Build the operator inputs, attributes and reference output."""
        self.op_type = "softmax"
        self.use_cudnn = False
        self.use_mkldnn = False
        self.dtype = np.float64
        # Hook for subclasses: runs after the defaults above are set and
        # before the input is generated, so it can override the kernel flags
        # and the dtype.
        self.init_kernel_type()
        self.shape = self.get_x_shape()
        self.axis = self.get_axis()

        # Fixed seed keeps the generated input reproducible between runs.
        np.random.seed(0)
        x = np.random.uniform(0.1, 1, self.shape).astype(self.dtype)
        # Reference result: stable_softmax applied to every 1-D slice of x
        # along self.axis.
        out = np.apply_along_axis(stable_softmax, self.axis, x)

        self.inputs = {'X': OpTest.np_dtype_to_fluid_dtype(x)}
        self.outputs = {'Out': out}
        self.attrs = {
            'axis': self.axis,
            'use_cudnn': self.use_cudnn,
            'use_mkldnn': self.use_mkldnn
        }

    def init_kernel_type(self):
        """Override in subclasses to select the kernel flags or dtype."""
        pass

    def test_check_output(self):
        # TODO(wangzhongpu): support mkldnn op in dygraph mode
        check_dygraph = not self.use_mkldnn
        if self.use_cudnn:
            place = core.CUDAPlace(0)
            self.check_output_with_place(
                place, atol=1e-5, check_dygraph=check_dygraph)
        else:
            self.check_output(check_dygraph=check_dygraph)

    def test_check_grad(self):
        # TODO(wangzhongpu): support mkldnn op in dygraph mode
        check_dygraph = not self.use_mkldnn
        if self.use_cudnn or self.dtype == np.float16:
            place = core.CUDAPlace(0)
            # NOTE(review): this float16 capability gate also guards the
            # cuDNN case with a non-float16 dtype, so when
            # is_float16_supported() is false the gradient check is skipped
            # silently -- confirm this is intended.
            if core.is_float16_supported(place):
                self.check_grad_with_place(
                    place, ["X"],
                    "Out",
                    max_relative_error=0.01,
                    check_dygraph=check_dygraph)
        else:
            self.check_grad(
                ["X"],
                "Out",
                max_relative_error=0.01,
                check_dygraph=check_dygraph)
90 91


92
class TestSoftmaxOpError(unittest.TestCase):
    """Checks the input validation of ``fluid.layers.softmax``."""

    def test_errors(self):
        with program_guard(Program(), Program()):
            # The input type of softmax_op must be Variable.
            x1 = fluid.create_lod_tensor(
                np.array([[-1]]), [[1]], fluid.CPUPlace())
            self.assertRaises(TypeError, fluid.layers.softmax, x1)
            # The input dtype of softmax_op must be float16, float32 or float64.
            x2 = fluid.layers.data(name='x2', shape=[4], dtype="int32")
            self.assertRaises(TypeError, fluid.layers.softmax, x2)
            # float16 is one of the accepted dtypes, so this call is made
            # outside assertRaises and is expected not to raise.
            x3 = fluid.layers.data(name='x3', shape=[4], dtype="float16")
            fluid.layers.softmax(x3)
104 105


F
fengjiayi 已提交
106 107 108 109 110
class TestSoftmaxOp2(TestSoftmaxOp):
    """Base softmax case on a rank-4 input; the axis is inherited."""

    def get_x_shape(self):
        """Return the rank-4 input shape used by this case."""
        x_shape = [2, 3, 4, 5]
        return x_shape


D
dengkaipeng 已提交
111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134
class TestSoftmaxOp3(TestSoftmaxOp):
    """Softmax along axis 0 of a rank-4 input."""

    def get_x_shape(self):
        """Return the rank-4 input shape used by this case."""
        x_shape = [2, 3, 4, 5]
        return x_shape

    def get_axis(self):
        """Return the softmax axis: the first dimension."""
        axis = 0
        return axis


class TestSoftmaxOp4(TestSoftmaxOp):
    """Softmax along axis 1 of a rank-4 input."""

    def get_x_shape(self):
        """Return the rank-4 input shape used by this case."""
        x_shape = [2, 3, 4, 5]
        return x_shape

    def get_axis(self):
        """Return the softmax axis: the second dimension."""
        axis = 1
        return axis


class TestSoftmaxOp5(TestSoftmaxOp):
    """Softmax along axis 2 of a rank-4 input."""

    def get_x_shape(self):
        """Return the rank-4 input shape used by this case."""
        x_shape = [2, 3, 4, 5]
        return x_shape

    def get_axis(self):
        """Return the softmax axis: the third dimension."""
        axis = 2
        return axis


135
class TestSoftmaxOp6(TestSoftmaxOp):
    """Softmax along axis 3 (given as a non-negative index) of a rank-4 input."""

    def get_x_shape(self):
        """Return the rank-4 input shape used by this case."""
        return [2, 3, 4, 5]

    def get_axis(self):
        """Return the softmax axis: the fourth dimension."""
        return 3


143 144
@unittest.skipIf(not core.is_compiled_with_cuda(),
                 "core is not compiled with CUDA")
class TestSoftmaxCUDNNOp(TestSoftmaxOp):
    """Base softmax case with ``use_cudnn`` enabled.

    Skipped when ``core`` is not compiled with CUDA.
    """

    def init_kernel_type(self):
        """Turn on the ``use_cudnn`` attribute for this case."""
        self.use_cudnn = True


F
fengjiayi 已提交
150 151 152 153 154 155 156
@unittest.skipIf(not core.is_compiled_with_cuda(),
                 "core is not compiled with CUDA")
class TestSoftmaxCUDNNOp2(TestSoftmaxCUDNNOp):
    """cuDNN softmax case on a rank-4 input; the axis is inherited."""

    def get_x_shape(self):
        """Return the rank-4 input shape used by this case."""
        x_shape = [2, 3, 4, 5]
        return x_shape


D
dengkaipeng 已提交
157 158
@unittest.skipIf(not core.is_compiled_with_cuda(),
                 "core is not compiled with CUDA")
class TestSoftmaxCUDNNOp5(TestSoftmaxCUDNNOp):
    """cuDNN softmax case along axis 3 of a rank-4 input."""

    def get_x_shape(self):
        """Return the rank-4 input shape used by this case."""
        return [2, 3, 4, 5]

    def get_axis(self):
        """Return the softmax axis: the fourth dimension."""
        return 3
D
dengkaipeng 已提交
165 166


167 168
@unittest.skipIf(not core.is_compiled_with_cuda(),
                 "core is not compiled with CUDA")
class TestSoftmaxFP16Op(TestSoftmaxOp):
    """Base softmax case with a float16 input.

    Skipped when ``core`` is not compiled with CUDA.
    """

    def init_kernel_type(self):
        """Switch the input dtype to float16."""
        self.dtype = np.float16

    def test_check_output(self):
        # The output check runs on CUDAPlace(0) only, and only when that
        # place reports float16 support; otherwise nothing is checked.
        if core.is_compiled_with_cuda():
            place = core.CUDAPlace(0)
            if core.is_float16_supported(place):
                self.check_output_with_place(place, atol=1e-3)

    # FIXME: If the x_shape is [10, 10], gradient failed.
    def test_check_grad(self):
        # Deliberately a no-op: overrides the inherited gradient check.
        pass

183

184
@unittest.skip('disable TestSoftmaxFP16Op2')
class TestSoftmaxFP16Op2(TestSoftmaxOp):
    """float16 softmax case on a rank-4 input (currently skipped)."""

    def init_kernel_type(self):
        """Switch the input dtype to float16."""
        self.dtype = np.float16

    def test_check_output(self):
        # The output check runs on CUDAPlace(0) only, and only when that
        # place reports float16 support; otherwise nothing is checked.
        if core.is_compiled_with_cuda():
            place = core.CUDAPlace(0)
            if core.is_float16_supported(place):
                self.check_output_with_place(place, atol=1e-3)

    def get_x_shape(self):
        """Return the rank-4 input shape used by this case."""
        return [2, 3, 4, 5]

    def test_check_grad(self):
        # Deliberately a no-op: overrides the inherited gradient check.
        pass

F
fengjiayi 已提交
201

202 203
@unittest.skipIf(not core.is_compiled_with_cuda(),
                 "core is not compiled with CUDA")
class TestSoftmaxFP16CUDNNOp(TestSoftmaxOp):
    """Base softmax case with ``use_cudnn`` enabled and a float16 input.

    Skipped when ``core`` is not compiled with CUDA. The gradient check is
    inherited from ``TestSoftmaxOp``.
    """

    def init_kernel_type(self):
        """Turn on ``use_cudnn`` and switch the input dtype to float16."""
        self.use_cudnn = True
        self.dtype = np.float16

    def test_check_output(self):
        # The output check runs on CUDAPlace(0) only, and only when that
        # place reports float16 support; otherwise nothing is checked.
        if core.is_compiled_with_cuda():
            place = core.CUDAPlace(0)
            if core.is_float16_supported(place):
                self.check_output_with_place(place, atol=1e-3)
Q
Qiao Longfei 已提交
214 215


F
fengjiayi 已提交
216 217 218 219 220 221 222
@unittest.skipIf(not core.is_compiled_with_cuda(),
                 "core is not compiled with CUDA")
class TestSoftmaxFP16CUDNNOp2(TestSoftmaxFP16CUDNNOp):
    """float16 cuDNN softmax case on a rank-4 input; the axis is inherited."""

    def get_x_shape(self):
        """Return the rank-4 input shape used by this case."""
        x_shape = [2, 3, 4, 5]
        return x_shape


C
caoying03 已提交
223
# Run every test case in this module when the file is executed as a script.
if __name__ == "__main__":
    unittest.main()