“86fd748808dee2448bf368f3b1389f91ec6e9d29”上不存在“develop/doc_cn/howto/usage”
未验证 提交 75370f71 编写于 作者: L littletomatodonkey 提交者: GitHub

Merge pull request #112 from littletomatodonkey/fix_deli

add delimiter reader
#copyright (c) 2020 PaddlePaddle Authors. All Rights Reserved. # copyright (c) 2020 PaddlePaddle Authors. All Rights Reserved.
# #
#Licensed under the Apache License, Version 2.0 (the "License"); # Licensed under the Apache License, Version 2.0 (the "License");
#you may not use this file except in compliance with the License. # you may not use this file except in compliance with the License.
#You may obtain a copy of the License at # You may obtain a copy of the License at
# #
# http://www.apache.org/licenses/LICENSE-2.0 # http://www.apache.org/licenses/LICENSE-2.0
# #
#Unless required by applicable law or agreed to in writing, software # Unless required by applicable law or agreed to in writing, software
#distributed under the License is distributed on an "AS IS" BASIS, # distributed under the License is distributed on an "AS IS" BASIS,
#WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
#See the License for the specific language governing permissions and # See the License for the specific language governing permissions and
#limitations under the License. # limitations under the License.
import cv2
import numpy as np import numpy as np
import os import os
import signal import signal
import imghdr
import paddle import paddle
from . import imaug from . import imaug
from .imaug import transform from .imaug import transform
from .imaug import MixupOperator
from ppcls.utils import logger from ppcls.utils import logger
trainers_num = int(os.environ.get('PADDLE_TRAINERS_NUM', 1)) trainers_num = int(os.environ.get('PADDLE_TRAINERS_NUM', 1))
...@@ -176,7 +174,7 @@ def partial_reader(params, full_lines, part_id=0, part_num=1): ...@@ -176,7 +174,7 @@ def partial_reader(params, full_lines, part_id=0, part_num=1):
part_id(int): part index of the current partial data part_id(int): part index of the current partial data
part_num(int): part num of the dataset part_num(int): part num of the dataset
""" """
assert part_id < part_num, ("part_num: {} should be larger " \ assert part_id < part_num, ("part_num: {} should be larger "
"than part_id: {}".format(part_num, part_id)) "than part_id: {}".format(part_num, part_id))
full_lines = full_lines[part_id::part_num] full_lines = full_lines[part_id::part_num]
...@@ -187,8 +185,9 @@ def partial_reader(params, full_lines, part_id=0, part_num=1): ...@@ -187,8 +185,9 @@ def partial_reader(params, full_lines, part_id=0, part_num=1):
def reader(): def reader():
ops = create_operators(params['transforms']) ops = create_operators(params['transforms'])
delimiter = params.get('delimiter', ' ')
for line in full_lines: for line in full_lines:
img_path, label = line.split() img_path, label = line.split(delimiter)
img_path = os.path.join(params['data_dir'], img_path) img_path = os.path.join(params['data_dir'], img_path)
with open(img_path, 'rb') as f: with open(img_path, 'rb') as f:
img = f.read() img = f.read()
......
Markdown is supported
0% .
You are about to add 0 people to the discussion. Proceed with caution.
先完成此消息的编辑!
想要评论请 注册