test_npair_loss_op.py 6.5 KB
Newer Older
C
ceci3 已提交
1
#   Copyright (c) 2019 PaddlePaddle Authors. All Rights Reserved.
C
ceci3 已提交
2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

from __future__ import print_function

import unittest
import paddle.fluid as fluid
import paddle.fluid.core as core
import numpy as np
21
from paddle.fluid import Program, program_guard
C
ceci3 已提交
22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55


def npairloss(anchor, positive, labels, l2_reg=0.002):
    def softmax_cross_entropy_with_logits(logits, labels):
        logits = np.exp(logits)
        logits = logits / np.sum(logits, axis=1).reshape(-1, 1)

        return np.mean(
            -np.sum(labels * np.log(logits), axis=1), dtype=np.float32)

    batch_size = labels.shape[0]

    labels = np.reshape(labels, (batch_size, 1))
    labels = np.equal(labels, labels.transpose()).astype(float)
    labels = labels / np.sum(labels, axis=1, keepdims=True)

    l2loss = np.mean(np.sum(np.power(anchor, 2), 1)) + np.mean(
        np.sum(np.power(positive, 2), 1))
    l2loss = (l2loss * 0.25 * l2_reg).astype(np.float32)

    similarity_matrix = np.matmul(anchor, positive.transpose())
    celoss = np.mean(
        softmax_cross_entropy_with_logits(similarity_matrix, labels))

    return l2loss + celoss


class TestNpairLossOp(unittest.TestCase):
    def setUp(self):
        self.dtype = np.float32

    def __assert_close(self, tensor, np_array, msg, atol=1e-4):
        self.assertTrue(np.allclose(np.array(tensor), np_array, atol=atol), msg)

C
ceci3 已提交
56
    def test_npair_loss(self):
C
ceci3 已提交
57
        reg_lambda = 0.002
C
ceci3 已提交
58
        num_data, feat_dim, num_classes = 18, 6, 3
C
ceci3 已提交
59

C
ceci3 已提交
60
        place = core.CPUPlace()
C
ceci3 已提交
61 62
        exe = fluid.Executor(place)
        exe.run(fluid.default_startup_program())
63

C
ceci3 已提交
64 65 66 67
        embeddings_anchor = np.random.rand(num_data,
                                           feat_dim).astype(np.float32)
        embeddings_positive = np.random.rand(num_data,
                                             feat_dim).astype(np.float32)
C
ceci3 已提交
68
        row_labels = np.random.randint(
C
ceci3 已提交
69 70
            0, num_classes, size=(num_data)).astype(np.float32)
        out_loss = npairloss(
C
ceci3 已提交
71 72 73 74
            embeddings_anchor,
            embeddings_positive,
            row_labels,
            l2_reg=reg_lambda)
C
ceci3 已提交
75

76 77 78 79 80 81 82 83 84 85 86 87 88 89 90
        anc = fluid.layers.data(
            dtype='float32',
            name='anc',
            shape=embeddings_anchor.shape,
            append_batch_size=False)
        pos = fluid.layers.data(
            dtype='float32',
            name='pos',
            shape=embeddings_positive.shape,
            append_batch_size=False)
        lab = fluid.layers.data(
            dtype='float32',
            name='lab',
            shape=row_labels.shape,
            append_batch_size=False)
C
ceci3 已提交
91 92

        npair_loss_op = fluid.layers.npair_loss(
C
ceci3 已提交
93
            anchor=anc, positive=pos, labels=lab, l2_reg=reg_lambda)
94 95 96 97 98
        out_tensor = exe.run(feed={
            'anc': embeddings_anchor,
            'pos': embeddings_positive,
            'lab': row_labels
        },
C
ceci3 已提交
99 100 101 102 103 104
                             fetch_list=[npair_loss_op.name])

        self.__assert_close(
            out_tensor,
            out_loss,
            "inference output are different at " + str(place) + ", " +
C
ceci3 已提交
105 106
            str(np.dtype('float32')) + str(np.array(out_tensor)) +
            str(out_loss),
C
ceci3 已提交
107 108 109
            atol=1e-3)


110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178
class TestNpairLossOpError(unittest.TestCase):
    def test_errors(self):
        with program_guard(Program(), Program()):
            anchor_np = np.random.random((2, 4)).astype("float32")
            positive_np = np.random.random((2, 4)).astype("float32")
            labels_np = np.random.random((2)).astype("float32")
            anchor_data = fluid.data(
                name='anchor', shape=[2, 4], dtype='float32')
            positive_data = fluid.data(
                name='positive', shape=[2, 4], dtype='float32')
            labels_data = fluid.data(name='labels', shape=[2], dtype='float32')

            def test_anchor_Variable():
                # the anchor type must be Variable
                fluid.layers.npair_loss(
                    anchor=anchor_np,
                    positive=positive_data,
                    labels=labels_data)

            def test_positive_Variable():
                # the positive type must be Variable
                fluid.layers.npair_loss(
                    anchor=anchor_data,
                    positive=positive_np,
                    labels=labels_data)

            def test_labels_Variable():
                # the labels type must be Variable
                fluid.layers.npair_loss(
                    anchor=anchor_data,
                    positive=positive_data,
                    labels=labels_np)

            self.assertRaises(TypeError, test_anchor_Variable)
            self.assertRaises(TypeError, test_positive_Variable)
            self.assertRaises(TypeError, test_labels_Variable)

            def test_anchor_type():
                # dtype must be float32 or float64
                anchor_data1 = fluid.data(
                    name='anchor1', shape=[2, 4], dtype='int32')
                fluid.layers.npair_loss(
                    anchor=anchor_data,
                    positive=positive_data,
                    labels=labels_np)

            def test_positive_type():
                # dtype must be float32 or float64
                positive_data1 = fluid.data(
                    name='positive1', shape=[2, 4], dtype='int32')
                fluid.layers.npair_loss(
                    anchor=anchor_data,
                    positive=positive_data1,
                    labels=labels_np)

            def test_labels_type():
                # dtype must be float32 or float64
                labels_data1 = fluid.data(
                    name='labels1', shape=[2], dtype='int32')
                fluid.layers.npair_loss(
                    anchor=anchor_data,
                    positive=positive_data,
                    labels=labels_data1)

            self.assertRaises(TypeError, test_anchor_type)
            self.assertRaises(TypeError, test_positive_type)
            self.assertRaises(TypeError, test_labels_type)


C
ceci3 已提交
179 180
if __name__ == '__main__':
    unittest.main()