celoss.py 2.4 KB
Newer Older
1
# Copyright (c) 2021 PaddlePaddle Authors. All Rights Reserved.
B
Bin Lu 已提交
2 3 4 5 6 7 8 9 10 11 12 13 14 15
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#    http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

import paddle
16
import paddle.nn as nn
B
Bin Lu 已提交
17 18 19
import paddle.nn.functional as F


20
class CELoss(nn.Layer):
    """Cross entropy loss with optional label smoothing.

    Args:
        epsilon: Label-smoothing factor. ``None`` disables smoothing. A value
            outside the open interval (0, 1) is silently replaced by ``None``.
    """

    def __init__(self, epsilon=None):
        super().__init__()
        # Out-of-range factors disable smoothing instead of raising.
        if epsilon is not None and (epsilon <= 0 or epsilon >= 1):
            epsilon = None
        self.epsilon = epsilon

    def _labelsmoothing(self, target, class_num):
        """Return label-smoothed targets reshaped to ``[-1, class_num]``.

        ``target`` is one-hot encoded first when it is 1-D or when its last
        dimension differs from ``class_num``; otherwise it is used as-is.
        """
        if target.ndim == 1 or target.shape[-1] != class_num:
            one_hot_target = F.one_hot(target, class_num)
        else:
            one_hot_target = target
        soft_target = F.label_smooth(one_hot_target, epsilon=self.epsilon)
        soft_target = paddle.reshape(soft_target, shape=[-1, class_num])
        return soft_target

    def forward(self, x, label):
        """Compute the mean cross entropy between ``x`` and ``label``.

        Args:
            x: Logits, or a dict holding them under the ``"logits"`` key.
                The last dimension is taken as the number of classes.
            label: Targets. With smoothing enabled they are routed through
                ``_labelsmoothing``. Otherwise a multi-dimensional label
                whose last dimension equals the class count is treated as
                soft labels (and passed through softmax first); anything
                else is handed to ``F.cross_entropy`` as hard labels.

        Returns:
            A dict ``{"CELoss": loss}`` where ``loss`` is the mean loss.
        """
        if isinstance(x, dict):
            x = x["logits"]
        if self.epsilon is not None:
            class_num = x.shape[-1]
            label = self._labelsmoothing(label, class_num)
            x = -F.log_softmax(x, axis=-1)
            loss = paddle.sum(x * label, axis=-1)
        else:
            # A 1-D label is always hard labels, even when its length (the
            # batch size) happens to equal the class count. This mirrors the
            # ndim check in _labelsmoothing.
            soft_label = label.ndim > 1 and label.shape[-1] == x.shape[-1]
            if soft_label:
                label = F.softmax(label, axis=-1)
            loss = F.cross_entropy(x, label=label, soft_label=soft_label)
        loss = loss.mean()
        return {"CELoss": loss}
C
cuicheng01 已提交
57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74


class MixCELoss(CELoss):
    """Cross entropy loss for mix-style augmentation (mixup, cutmix, ...).

    The loss is computed once per target and the two results are blended
    with the mixing weight supplied in the batch.

    Args:
        epsilon: Label-smoothing factor, handled exactly as in ``CELoss``
            (``None`` or an out-of-range value disables smoothing).
    """

    def __init__(self, epsilon=None):
        # Hand epsilon to the parent so its range check is applied here too,
        # rather than assigning self.epsilon directly and bypassing it.
        super().__init__(epsilon=epsilon)

    # NOTE(review): this overrides __call__ rather than forward, so the base
    # layer's own __call__ is not used for this class — confirm that is
    # intended.
    def __call__(self, input, batch):
        """Return the blended loss for a mixed batch.

        Args:
            input: Logits (or a dict with a ``"logits"`` entry), passed
                straight to ``CELoss.forward``.
            batch: A 3-item sequence ``(target0, target1, lam)``, where
                ``lam`` weights the loss of ``target0`` and ``1 - lam``
                weights the loss of ``target1``.

        Returns:
            A dict ``{"MixCELoss": loss}``.
        """
        target0, target1, lam = batch
        loss0 = super().forward(input, target0)["CELoss"]
        loss1 = super().forward(input, target1)["CELoss"]
        loss = lam * loss0 + (1.0 - lam) * loss1
        # Both partial losses are already means; this final reduction
        # presumably only matters when lam is not a scalar — TODO confirm.
        loss = paddle.mean(loss)
        return {"MixCELoss": loss}