提交 02eacafe 作者: Xing Wu 提交者: Guo Sheng

fix_lac_windows_int64_error (#4223)

上级 57ac2201
...@@ -21,7 +21,7 @@ import __future__ ...@@ -21,7 +21,7 @@ import __future__
import io import io
import glob import glob
import paddle.fluid as fluid import paddle.fluid as fluid
+ import numpy as np
def load_kv_dict(dict_path, def load_kv_dict(dict_path,
reverse=False, reverse=False,
...@@ -56,10 +56,10 @@ class Dataset(object): ...@@ -56,10 +56,10 @@ class Dataset(object):
def __init__(self, args, mode="train"): def __init__(self, args, mode="train"):
# read dict # read dict
self.word2id_dict = load_kv_dict( self.word2id_dict = load_kv_dict(
- args.word_dict_path, reverse=True, value_func=int)
+ args.word_dict_path, reverse=True, value_func=np.int64)
self.id2word_dict = load_kv_dict(args.word_dict_path) self.id2word_dict = load_kv_dict(args.word_dict_path)
self.label2id_dict = load_kv_dict( self.label2id_dict = load_kv_dict(
- args.label_dict_path, reverse=True, value_func=int)
+ args.label_dict_path, reverse=True, value_func=np.int64)
self.id2label_dict = load_kv_dict(args.label_dict_path) self.id2label_dict = load_kv_dict(args.label_dict_path)
self.word_replace_dict = load_kv_dict(args.word_rep_dict_path) self.word_replace_dict = load_kv_dict(args.word_rep_dict_path)
...@@ -150,7 +150,7 @@ class Dataset(object): ...@@ -150,7 +150,7 @@ class Dataset(object):
new_batch = [] new_batch = []
for words_len, (word_ids, label_ids) in zip(init_lens, batch): for words_len, (word_ids, label_ids) in zip(init_lens, batch):
word_ids = word_ids[0:max_seq_len] word_ids = word_ids[0:max_seq_len]
- words_len = len(word_ids)
+ words_len = np.int64(len(word_ids))
word_ids += [0 for _ in range(max_seq_len-words_len)] word_ids += [0 for _ in range(max_seq_len-words_len)]
label_ids = label_ids[0:max_seq_len] label_ids = label_ids[0:max_seq_len]
label_ids += [0 for _ in range(max_seq_len-words_len)] label_ids += [0 for _ in range(max_seq_len-words_len)]
...@@ -164,7 +164,7 @@ class Dataset(object): ...@@ -164,7 +164,7 @@ class Dataset(object):
for words_len, (word_ids, label_ids) in zip(init_lens, batch): for words_len, (word_ids, label_ids) in zip(init_lens, batch):
max_seq_len = min(max(init_lens), max_seq_len) max_seq_len = min(max(init_lens), max_seq_len)
word_ids = words[0:max_seq_len] word_ids = words[0:max_seq_len]
- words_len = len(word_ids)
+ words_len = np.int64(len(word_ids))
word_ids += [0 for _ in range(max_seq_len-words_len)] word_ids += [0 for _ in range(max_seq_len-words_len)]
label_ids = label_ids[0:max_seq_len] label_ids = label_ids[0:max_seq_len]
label_ids += [0 for _ in range(max_seq_len-words_len)] label_ids += [0 for _ in range(max_seq_len-words_len)]
......
Markdown is supported
0% .
You are about to add 0 people to the discussion. Proceed with caution.
先完成此消息的编辑!
想要评论请 注册