# Copyright (c) 2016 Baidu, Inc. All Rights Reserved## Licensed under the Apache License, Version 2.0 (the "License");# you may not use this file except in compliance with the License.# You may obtain a copy of the License at## http://www.apache.org/licenses/LICENSE-2.0## Unless required by applicable law or agreed to in writing, software# distributed under the License is distributed on an "AS IS" BASIS,# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.# See the License for the specific language governing permissions and# limitations under the License.frompaddle.trainer.PyDataProvider2import*defhook(settings,dictionary,**kwargs):settings.word_dict=dictionarysettings.input_types=[integer_value(len(settings.word_dict),seq_type=SequenceType.SEQUENCE),integer_value(2)]settings.logger.info('dict len : %d'%(len(settings.word_dict)))@provider(init_hook=hook)defprocess(settings,file_name):withopen(file_name,'r')asfdata:forline_count,lineinenumerate(fdata):label,comment=line.strip().split('\t\t')label=int(label)words=comment.split()word_slot=[settings.word_dict[w]forwinwordsifwinsettings.word_dict]yieldword_slot,label