diff --git a/PaddleRec/din/network.py b/PaddleRec/din/network.py index a65e155f22d52680380a46d715ad09f48bf995d6..26b9fbb0a4a03275fc224aa3c2b5b340984c0d85 100644 --- a/PaddleRec/din/network.py +++ b/PaddleRec/din/network.py @@ -14,7 +14,7 @@ import paddle.fluid as fluid -def din_attention(hist, target_expand, max_len, mask): +def din_attention(hist, target_expand, mask): """activation weight""" hidden_size = hist.shape[-1] @@ -45,9 +45,10 @@ def din_attention(hist, target_expand, max_len, mask): return out -def network(item_count, cat_count, max_len): +def network(item_count, cat_count): """network definition""" + seq_len = -1 item_emb_size = 64 cat_emb_size = 64 is_sparse = False @@ -56,60 +57,60 @@ def network(item_count, cat_count, max_len): item_emb_attr = fluid.ParamAttr(name="item_emb") cat_emb_attr = fluid.ParamAttr(name="cat_emb") - hist_item_seq = fluid.layers.data( - name="hist_item_seq", shape=[max_len, 1], dtype="int64") - hist_cat_seq = fluid.layers.data( - name="hist_cat_seq", shape=[max_len, 1], dtype="int64") - target_item = fluid.layers.data( - name="target_item", shape=[1], dtype="int64") - target_cat = fluid.layers.data( - name="target_cat", shape=[1], dtype="int64") - label = fluid.layers.data( - name="label", shape=[1], dtype="float32") - mask = fluid.layers.data( - name="mask", shape=[max_len, 1], dtype="float32") - target_item_seq = fluid.layers.data( - name="target_item_seq", shape=[max_len, 1], dtype="int64") - target_cat_seq = fluid.layers.data( - name="target_cat_seq", shape=[max_len, 1], dtype="int64", lod_level=0) - - hist_item_emb = fluid.layers.embedding( + hist_item_seq = fluid.data( + name="hist_item_seq", shape=[None, seq_len], dtype="int64") + hist_cat_seq = fluid.data( + name="hist_cat_seq", shape=[None, seq_len], dtype="int64") + target_item = fluid.data( + name="target_item", shape=[None], dtype="int64") + target_cat = fluid.data( + name="target_cat", shape=[None], dtype="int64") + label = fluid.data( + name="label", shape=[None, 1], dtype="float32") + mask = fluid.data( + name="mask", shape=[None, seq_len, 1], dtype="float32") + target_item_seq = fluid.data( + name="target_item_seq", shape=[None, seq_len], dtype="int64") + target_cat_seq = fluid.data( + name="target_cat_seq", shape=[None, seq_len], dtype="int64") + + hist_item_emb = fluid.embedding( input=hist_item_seq, size=[item_count, item_emb_size], param_attr=item_emb_attr, is_sparse=is_sparse) - hist_cat_emb = fluid.layers.embedding( + hist_cat_emb = fluid.embedding( input=hist_cat_seq, size=[cat_count, cat_emb_size], param_attr=cat_emb_attr, is_sparse=is_sparse) - target_item_emb = fluid.layers.embedding( + target_item_emb = fluid.embedding( input=target_item, size=[item_count, item_emb_size], param_attr=item_emb_attr, is_sparse=is_sparse) - target_cat_emb = fluid.layers.embedding( + target_cat_emb = fluid.embedding( input=target_cat, size=[cat_count, cat_emb_size], param_attr=cat_emb_attr, is_sparse=is_sparse) - target_item_seq_emb = fluid.layers.embedding( + target_item_seq_emb = fluid.embedding( input=target_item_seq, size=[item_count, item_emb_size], param_attr=item_emb_attr, is_sparse=is_sparse) - target_cat_seq_emb = fluid.layers.embedding( + target_cat_seq_emb = fluid.embedding( input=target_cat_seq, size=[cat_count, cat_emb_size], param_attr=cat_emb_attr, is_sparse=is_sparse) - item_b = fluid.layers.embedding( + item_b = fluid.embedding( input=target_item, size=[item_count, 1], param_attr=fluid.initializer.Constant(value=0.0)) @@ -120,7 +121,7 @@ def network(item_count, cat_count, max_len): target_concat = fluid.layers.concat( [target_item_emb, target_cat_emb], axis=1) - out = din_attention(hist_seq_concat, target_seq_concat, max_len, mask) + out = din_attention(hist_seq_concat, target_seq_concat, mask) out_fc = fluid.layers.fc(name="out_fc", input=out, size=item_emb_size + cat_emb_size, diff --git a/PaddleRec/din/reader.py b/PaddleRec/din/reader.py index a50a90894b3619f8f752c1d18663f1677c0f6154..07d1c33c904517e863967b93cbb0e4fe2001e058 100644 --- a/PaddleRec/din/reader.py +++ b/PaddleRec/din/reader.py @@ -20,7 +20,7 @@ import pickle def pad_batch_data(input, max_len): res = np.array([x + [0] * (max_len - len(x)) for x in input]) - res = res.astype("int64").reshape([-1, max_len, 1]) + res = res.astype("int64").reshape([-1, max_len]) return res @@ -34,10 +34,10 @@ def make_data(b): [-1, max_len, 1]) target_item_seq = np.array( [[x[2]] * max_len for x in b]).astype("int64").reshape( - [-1, max_len, 1]) + [-1, max_len]) target_cat_seq = np.array( [[x[3]] * max_len for x in b]).astype("int64").reshape( - [-1, max_len, 1]) + [-1, max_len]) res = [] for i in range(len(b)): res.append([ diff --git a/PaddleRec/din/train.py b/PaddleRec/din/train.py index 9697961510c786ddd7f9f4fd4560e3f8d62fe4b1..9c6190c3277d213bbd918d3459aa3fb6618d12f3 100644 --- a/PaddleRec/din/train.py +++ b/PaddleRec/din/train.py @@ -78,7 +78,7 @@ def train(): args.num_devices) logger.info("reading data completes") - avg_cost, pred = network.network(item_count, cat_count, max_len) + avg_cost, pred = network.network(item_count, cat_count) fluid.clip.set_gradient_clip(clip=fluid.clip.GradientClipByGlobalNorm( clip_norm=5.0)) base_lr = args.base_lr