From 344276cc07570682b32ef92a082577f92c11bcce Mon Sep 17 00:00:00 2001 From: xiegegege Date: Thu, 30 May 2019 06:55:47 +0000 Subject: [PATCH] fix for py3 --- ERNIE/reader/pretraining.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/ERNIE/reader/pretraining.py b/ERNIE/reader/pretraining.py index c1233ad..ced2107 100644 --- a/ERNIE/reader/pretraining.py +++ b/ERNIE/reader/pretraining.py @@ -75,7 +75,7 @@ class ErnieDataReader(object): def parse_line(self, line, max_seq_len=512): """ parse one line to token_ids, sentence_ids, pos_ids, label """ - line = line.strip().split(";") + line = line.strip().decode().split(";") assert len(line) == 5, "One sample must have 5 fields!" (token_ids, sent_ids, pos_ids, seg_labels, label) = line token_ids = [int(token) for token in token_ids.split(" ")] -- GitLab