From e5e887b0816d3bf649cd13b4f6514ff61e4affef Mon Sep 17 00:00:00 2001 From: kinghuin Date: Wed, 20 Nov 2019 17:21:15 +0800 Subject: [PATCH] modify tnews --- paddlehub/dataset/tnews.py | 28 +++++++++++++++++++++++----- 1 file changed, 23 insertions(+), 5 deletions(-) diff --git a/paddlehub/dataset/tnews.py b/paddlehub/dataset/tnews.py index 6a304ae6..1cf08eee 100644 --- a/paddlehub/dataset/tnews.py +++ b/paddlehub/dataset/tnews.py @@ -73,12 +73,30 @@ class TNews(HubDataset): def get_labels(self): return [ - 'news_game', 'news_sports', 'news_finance', 'news_entertainment', - 'news_tech', 'news_house', 'news_car', 'news_culture', 'news_world', - 'news_travel', 'news_agriculture', 'news_military', 'news_edu', - 'news_story', 'stock' + '100', '101', '102', '103', '104', '106', '107', '108', '109', + '110', '112', '113', '114', '115', '116' ] + def get_label_name(self, id): + label_name = { + "100": "news_story", + "101": "news_culture", + "102": "news_entertainment", + "103": "news_sports", + "104": "news_finance", + "106": "news_house", + "107": "news_car", + "108": "news_edu", + "109": "news_tech", + "110": "news_military", + "112": "news_travel", + "113": "news_world", + "114": "stock", + "115": "news_agriculture", + "116": "news_game" + } + return label_name[id] + @property def num_labels(self): """ @@ -93,7 +111,7 @@ class TNews(HubDataset): for line in file: data = line.strip().split("_!_") example = InputExample( - guid=data[0], label=data[2], text_a=data[3]) + guid=data[0], label=data[1], text_a=data[3]) examples.append(example) return examples -- GitLab