#   Copyright (c) 2020 PaddlePaddle Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

import paddle.fluid as fluid
import paddle.fluid.layers.nn as nn
import paddle.fluid.layers.tensor as tensor
import paddle.fluid.layers.control_flow as cf

from paddlerec.core.model import ModelBase
from paddlerec.core.utils import envs


class Model(ModelBase):
    """Text/tag matching network trained with a max-margin (hinge) loss.

    A text sequence is embedded, passed through a sequence convolution with
    max pooling and a fully connected layer, and then compared by cosine
    similarity with one positive tag and a group of negative tags. The loss
    is ``max(0, margin - cos_pos + max(cos_neg))`` averaged over the batch.
    """

    def __init__(self, config):
        """Initialise the base model and read the hyper-parameters.

        Args:
            config: forwarded unchanged to ``ModelBase.__init__``.
        """
        ModelBase.__init__(self, config)
        # NOTE(review): net() stores its results in self._cost /
        # self._metrics / self._infer_results (presumably created by
        # ModelBase -- confirm). The two un-prefixed attributes below are
        # not read anywhere in this class; kept for compatibility.
        self.cost = None
        self.metrics = {}

        # All sizes come from the "hyper_parameters" section of the global
        # environment.
        self.vocab_text_size = envs.get_global_env(
            "hyper_parameters.vocab_text_size")
        self.vocab_tag_size = envs.get_global_env(
            "hyper_parameters.vocab_tag_size")
        self.emb_dim = envs.get_global_env("hyper_parameters.emb_dim")
        self.hid_dim = envs.get_global_env("hyper_parameters.hid_dim")
        self.win_size = envs.get_global_env("hyper_parameters.win_size")
        self.margin = envs.get_global_env("hyper_parameters.margin")
        self.neg_size = envs.get_global_env("hyper_parameters.neg_size")

    def input_data(self, is_infer=False, **kwargs):
        """Declare the network inputs.

        All three inputs are int64 LoD tensors (``lod_level=1``) of shape
        ``[None, 1]``.

        Args:
            is_infer: not used here; the same inputs are declared either way.
            **kwargs: accepted and ignored.

        Returns:
            The list ``[text, pos_tag, neg_tag]``.
        """
        text = fluid.data(
            name="text", shape=[None, 1], lod_level=1, dtype='int64')
        pos_tag = fluid.data(
            name="pos_tag", shape=[None, 1], lod_level=1, dtype='int64')
        neg_tag = fluid.data(
            name="neg_tag", shape=[None, 1], lod_level=1, dtype='int64')
        return [text, pos_tag, neg_tag]

    def net(self, input, is_infer=False):
        """Build the network, the hinge loss and the reported metrics.

        Args:
            input: sequence whose first three items are the ``text``,
                ``pos_tag`` and ``neg_tag`` variables, in that order (the
                order returned by ``input_data``).
            is_infer: when true the ``correct`` / ``cos_pos`` variables are
                stored in ``self._infer_results``; otherwise in
                ``self._metrics``.

        Side effects:
            Sets ``self._cost`` to the batch-averaged hinge loss.
        """
        text = input[0]
        pos_tag = input[1]
        neg_tag = input[2]

        # Embedding lookups; the trailing size-1 axis of the ids is squeezed
        # away after each lookup.
        text_emb = fluid.embedding(
            input=text,
            size=[self.vocab_text_size, self.emb_dim],
            param_attr="text_emb")
        text_emb = fluid.layers.squeeze(input=text_emb, axes=[1])

        # Positive and negative tags share one table: both lookups use the
        # parameter name "tag_emb".
        pos_tag_emb = fluid.embedding(
            input=pos_tag,
            size=[self.vocab_tag_size, self.emb_dim],
            param_attr="tag_emb")
        pos_tag_emb = fluid.layers.squeeze(input=pos_tag_emb, axes=[1])
        neg_tag_emb = fluid.embedding(
            input=neg_tag,
            size=[self.vocab_tag_size, self.emb_dim],
            param_attr="tag_emb")
        neg_tag_emb = fluid.layers.squeeze(input=neg_tag_emb, axes=[1])

        # Text encoder: sequence convolution + max pooling, then a fully
        # connected projection to emb_dim so it can be compared with tags.
        conv_1d = fluid.nets.sequence_conv_pool(
            input=text_emb,
            num_filters=self.hid_dim,
            filter_size=self.win_size,
            act="tanh",
            pool_type="max",
            param_attr="cnn")
        text_hid = fluid.layers.fc(input=conv_1d,
                                   size=self.emb_dim,
                                   param_attr="text_hid")

        # Similarity with the positive tag.
        cos_pos = nn.cos_sim(pos_tag_emb, text_hid)

        # Repeat the text vector to line up with the negative-tag sequence,
        # score every negative, then regroup the scores into rows of
        # neg_size entries.
        mul_text_hid = fluid.layers.sequence_expand_as(
            x=text_hid, y=neg_tag_emb)
        mul_cos_neg = nn.cos_sim(neg_tag_emb, mul_text_hid)
        cos_neg_all = fluid.layers.sequence_reshape(
            input=mul_cos_neg, new_dim=self.neg_size)
        # choose max negative cosine
        cos_neg = nn.reduce_max(cos_neg_all, dim=1, keep_dim=True)

        # calculate hinge loss: max(0, margin - cos_pos + cos_neg)
        loss_part1 = nn.elementwise_sub(
            tensor.fill_constant_batch_size_like(
                input=cos_pos,
                shape=[-1, 1],
                value=self.margin,
                dtype='float32'),
            cos_pos)
        loss_part2 = nn.elementwise_add(loss_part1, cos_neg)
        loss_part3 = nn.elementwise_max(
            tensor.fill_constant_batch_size_like(
                input=loss_part2, shape=[-1, 1], value=0.0, dtype='float32'),
            loss_part2)
        avg_cost = nn.mean(loss_part3)

        # Count of rows where the positive tag scores strictly higher than
        # the best negative.
        less = tensor.cast(cf.less_than(cos_neg, cos_pos), dtype='float32')
        correct = nn.reduce_sum(less)

        self._cost = avg_cost

        # The same two variables are reported in either mode; only the
        # destination dict differs.
        outputs = self._infer_results if is_infer else self._metrics
        outputs["correct"] = correct
        outputs["cos_pos"] = cos_pos