# Copyright (c) 2020 PaddlePaddle Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

from __future__ import print_function

from paddlerec.core.reader import ReaderBase


class Reader(ReaderBase):
    """Reader that parses one text line into two lists of integer word ids.

    Each input line is expected to hold at least two tab-separated fields;
    each of the first two fields is a comma-separated list of integers.
    """

    def init(self):
        """Do nothing; this reader needs no setup."""
        pass

    def generate_sample(self, line):
        """Build a generator function that parses ``line`` into one sample.

        Args:
            line: A text line of the form ``"<ids>\\t<ids>"`` where each
                ``<ids>`` is a comma-separated list of integers. Fields
                after the second one are ignored.

        Returns:
            A zero-argument generator function. When called and iterated it
            yields a single sample: a list of ``(name, ids)`` pairs,
            ``[("doc1", [...]), ("doc2", [...])]``.

        Raises:
            IndexError: (on iteration) if ``line`` has fewer than two
                tab-separated fields.
            ValueError: (on iteration) if a token cannot be parsed by
                ``int``.
        """

        def reader():
            """Parse the captured line and yield its single sample."""
            # Only newline characters are stripped from the ends, so tabs
            # at either end still act as field separators.
            features = line.strip("\n").split("\t")
            doc1 = [int(word_id) for word_id in features[0].split(",")]
            doc2 = [int(word_id) for word_id in features[1].split(",")]
            features_name = ["doc1", "doc2"]
            # Materialize the pairs: on Python 3 ``zip`` returns a one-shot
            # iterator, whereas on Python 2 it returned a list. Wrapping it
            # in ``list`` keeps the yielded sample a list on both.
            yield list(zip(features_name, [doc1, doc2]))

        return reader