Skip to content
体验新版
项目
组织
正在加载...
登录
切换导航
打开侧边栏
PaddlePaddle
Paddle
提交
cee0079a
P
Paddle
项目概览
PaddlePaddle
/
Paddle
1 年多 前同步成功
通知
2305
Star
20932
Fork
5423
代码
文件
提交
分支
Tags
贡献者
分支图
Diff
Issue
1423
列表
看板
标记
里程碑
合并请求
543
Wiki
0
Wiki
分析
仓库
DevOps
项目成员
Pages
P
Paddle
项目概览
项目概览
详情
发布
仓库
仓库
文件
提交
分支
标签
贡献者
分支图
比较
Issue
1,423
Issue
1,423
列表
看板
标记
里程碑
合并请求
543
合并请求
543
Pages
分析
分析
仓库分析
DevOps
Wiki
0
Wiki
成员
成员
收起侧边栏
关闭侧边栏
动态
分支图
创建新Issue
提交
Issue看板
未验证
提交
cee0079a
编写于
9月 20, 2019
作者:
Z
Zeng Jinle
提交者:
GitHub
9月 20, 2019
浏览文件
操作
浏览文件
下载
电子邮件补丁
差异文件
fix readers bug, test=develop (#19868)
上级
747d4498
变更
5
隐藏空白更改
内联
并排
Showing
5 changed file
with
199 addition
and
17 deletion
+199
-17
python/paddle/dataset/cifar.py
python/paddle/dataset/cifar.py
+7
-6
python/paddle/fluid/tests/unittests/CMakeLists.txt
python/paddle/fluid/tests/unittests/CMakeLists.txt
+1
-0
python/paddle/fluid/tests/unittests/test_cyclic_cifar_dataset.py
...paddle/fluid/tests/unittests/test_cyclic_cifar_dataset.py
+38
-0
python/paddle/fluid/tests/unittests/test_multiprocess_reader_exception.py
...uid/tests/unittests/test_multiprocess_reader_exception.py
+126
-0
python/paddle/reader/decorator.py
python/paddle/reader/decorator.py
+27
-11
未找到文件。
python/paddle/dataset/cifar.py
浏览文件 @
cee0079a
...
...
@@ -55,11 +55,11 @@ def reader_creator(filename, sub_name, cycle=False):
yield
(
sample
/
255.0
).
astype
(
numpy
.
float32
),
int
(
label
)
def
reader
():
with
tarfile
.
open
(
filename
,
mode
=
'r'
)
as
f
:
names
=
(
each_item
.
name
for
each_item
in
f
if
sub_name
in
each_item
.
name
)
while
True
:
with
tarfile
.
open
(
filename
,
mode
=
'r'
)
as
f
:
names
=
(
each_item
.
name
for
each_item
in
f
if
sub_name
in
each_item
.
name
)
while
True
:
for
name
in
names
:
if
six
.
PY2
:
batch
=
pickle
.
load
(
f
.
extractfile
(
name
))
...
...
@@ -68,8 +68,9 @@ def reader_creator(filename, sub_name, cycle=False):
f
.
extractfile
(
name
),
encoding
=
'bytes'
)
for
item
in
read_batch
(
batch
):
yield
item
if
not
cycle
:
break
if
not
cycle
:
break
return
reader
...
...
python/paddle/fluid/tests/unittests/CMakeLists.txt
浏览文件 @
cee0079a
...
...
@@ -38,6 +38,7 @@ endif()
if
(
WIN32
)
LIST
(
REMOVE_ITEM TEST_OPS test_boxps
)
LIST
(
REMOVE_ITEM TEST_OPS test_trainer_desc
)
LIST
(
REMOVE_ITEM TEST_OPS test_multiprocess_reader_exception
)
endif
()
LIST
(
REMOVE_ITEM TEST_OPS test_launch
)
...
...
python/paddle/fluid/tests/unittests/test_cyclic_cifar_dataset.py
0 → 100644
浏览文件 @
cee0079a
# Copyright (c) 2019 PaddlePaddle Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
import
paddle
import
unittest
class TestCifar10(unittest.TestCase):
    """Checks that the cyclic CIFAR-10 training reader keeps yielding samples."""

    def test_main(self):
        """Read twice the epoch size from a reader created with ``cycle=True``.

        One pass over the non-cyclic reader (``cycle=False``) is counted
        first. The cyclic reader must then be able to yield twice that many
        items, each of which is expected to have length 2.
        """
        # Count how many samples a single, non-cyclic pass produces.
        reader = paddle.dataset.cifar.train10(cycle=False)
        sample_num = 0
        for _ in reader():
            sample_num += 1

        cyclic_reader = paddle.dataset.cifar.train10(cycle=True)
        read_num = 0
        for data in cyclic_reader():
            read_num += 1
            # ``assertEqual`` replaces the deprecated ``assertEquals`` alias,
            # which no longer exists in Python 3.12+.
            self.assertEqual(len(data), 2)
            # Stop explicitly once two passes' worth of samples were read.
            if read_num == sample_num * 2:
                break

        self.assertEqual(read_num, sample_num * 2)
# Run the unittest runner when this file is executed directly as a script.
if __name__ == '__main__':
    unittest.main()
python/paddle/fluid/tests/unittests/test_multiprocess_reader_exception.py
0 → 100644
浏览文件 @
cee0079a
# Copyright (c) 2019 PaddlePaddle Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
import
paddle.fluid
as
fluid
from
paddle.fluid.io
import
multiprocess_reader
import
unittest
import
numpy
as
np
import
six
import
sys
class TestMultiprocessReaderException(unittest.TestCase):
    """Checks how ``multiprocess_reader`` behaves when a wrapped reader raises.

    Subclasses override ``setUp`` to choose the ``use_pipe`` argument passed
    to ``multiprocess_reader`` and whether the fake sample reader raises.
    """

    def setUp(self):
        """Default configuration: ``use_pipe=False`` and no exception."""
        self.use_pipe = False
        self.raise_exception = False

    def places(self):
        """Return the places to test: CPU, plus CUDA device 0 if compiled in."""
        if fluid.is_compiled_with_cuda():
            return [fluid.CPUPlace(), fluid.CUDAPlace(0)]
        return [fluid.CPUPlace()]

    def _check_batch_count(self, num):
        """Validate the number of batches consumed in one pass.

        Without an injected exception, 20 batches are expected. With one, no
        batch may have been consumed, and a ``ValueError`` is raised so that
        ``test_main`` can observe the failure.

        Raises:
            ValueError: if ``self.raise_exception`` is set.
        """
        if not self.raise_exception:
            # ``assertEqual`` replaces the deprecated ``assertEquals`` alias,
            # which no longer exists in Python 3.12+.
            self.assertEqual(num, 20)
        else:
            self.assertEqual(num, 0)
            raise ValueError('Reader raises exception')

    def main_impl(self, place, iterable):
        """Build a small program fed through a ``PyReader`` and run 3 passes.

        Args:
            place: the place handed to ``fluid.Executor``; a ``CUDAPlace``
                selects ``fluid.cuda_places()`` for the reader, anything else
                selects ``fluid.cpu_places()``.
            iterable: forwarded to ``fluid.io.PyReader``; also selects whether
                batches are pulled by iterating the reader or via
                ``start()`` / ``reset()``.

        Raises:
            ValueError: if ``self.raise_exception`` is set (see
                ``_check_batch_count``).
        """

        def fake_reader():
            def __impl__():
                for _ in range(40):
                    if not self.raise_exception:
                        # The trailing comma is intentional: each sample is a
                        # 1-tuple holding a list of 10 random values.
                        yield list(
                            np.random.uniform(low=-1, high=1, size=[10])),
                    else:
                        raise ValueError()

            return __impl__

        with fluid.program_guard(fluid.Program(), fluid.Program()):
            image = fluid.layers.data(
                name='image', dtype='float32', shape=[10])
            reader = fluid.io.PyReader(
                feed_list=[image], capacity=2, iterable=iterable)

            image_p_1 = image + 1

            decorated_reader = multiprocess_reader(
                [fake_reader(), fake_reader()], use_pipe=self.use_pipe)

            if isinstance(place, fluid.CUDAPlace):
                reader.decorate_sample_generator(
                    decorated_reader,
                    batch_size=4,
                    places=fluid.cuda_places())
            else:
                reader.decorate_sample_generator(
                    decorated_reader,
                    batch_size=4,
                    places=fluid.cpu_places())

            exe = fluid.Executor(place)
            exe.run(fluid.default_startup_program())

            if iterable:
                for _ in range(3):
                    num = 0
                    for data in reader():
                        exe.run(feed=data, fetch_list=[image_p_1])
                        num += 1
                    self._check_batch_count(num)
            else:
                for _ in range(3):
                    num = 0
                    reader.start()
                    try:
                        while True:
                            exe.run(fetch_list=[image_p_1])
                            num += 1
                    except fluid.core.EOFException:
                        # End of one pass: reset the reader, then validate.
                        reader.reset()
                        self._check_batch_count(num)

    def test_main(self):
        """Run ``main_impl`` for every place in both reader modes.

        A ``ValueError`` must surface exactly when ``self.raise_exception``
        is set.
        """
        for p in self.places():
            for iterable in [False, True]:
                try:
                    with fluid.scope_guard(fluid.Scope()):
                        self.main_impl(p, iterable)

                    # Reaching this point means no ValueError was raised.
                    self.assertFalse(self.raise_exception)
                except ValueError:
                    self.assertTrue(self.raise_exception)
class TestCase1(TestMultiprocessReaderException):
    """Variant with ``use_pipe=False`` and a fake reader that raises."""

    def setUp(self):
        """Configure the base test: no pipe, exception injected."""
        self.use_pipe, self.raise_exception = False, True
class TestCase2(TestMultiprocessReaderException):
    """Variant with ``use_pipe=True`` and a fake reader that does not raise."""

    def setUp(self):
        """Configure the base test: pipe enabled, no exception injected."""
        self.use_pipe, self.raise_exception = True, False
class TestCase3(TestMultiprocessReaderException):
    """Variant with ``use_pipe=True`` and a fake reader that raises."""

    def setUp(self):
        """Configure the base test: pipe enabled, exception injected."""
        self.use_pipe, self.raise_exception = True, True
# Run the unittest runner when this file is executed directly as a script.
if __name__ == '__main__':
    unittest.main()
python/paddle/reader/decorator.py
浏览文件 @
cee0079a
...
...
@@ -21,6 +21,7 @@ __all__ = [
from
threading
import
Thread
import
subprocess
import
multiprocessing
import
six
import
sys
from
six.moves.queue
import
Queue
...
...
@@ -390,11 +391,15 @@ def multiprocess_reader(readers, use_pipe=True, queue_size=1000):
assert
type
(
readers
)
is
list
and
len
(
readers
)
>
0
def
_read_into_queue
(
reader
,
queue
):
for
sample
in
reader
():
if
sample
is
None
:
raise
ValueError
(
"sample has None"
)
queue
.
put
(
sample
)
queue
.
put
(
None
)
try
:
for
sample
in
reader
():
if
sample
is
None
:
raise
ValueError
(
"sample has None"
)
queue
.
put
(
sample
)
queue
.
put
(
None
)
except
:
queue
.
put
(
""
)
six
.
reraise
(
*
sys
.
exc_info
())
def
queue_reader
():
queue
=
multiprocessing
.
Queue
(
queue_size
)
...
...
@@ -409,16 +414,23 @@ def multiprocess_reader(readers, use_pipe=True, queue_size=1000):
sample
=
queue
.
get
()
if
sample
is
None
:
finish_num
+=
1
elif
sample
==
""
:
raise
ValueError
(
"multiprocess reader raises an exception"
)
else
:
yield
sample
def
_read_into_pipe
(
reader
,
conn
):
for
sample
in
reader
():
if
sample
is
None
:
raise
ValueError
(
"sample has None!"
)
conn
.
send
(
json
.
dumps
(
sample
))
conn
.
send
(
json
.
dumps
(
None
))
conn
.
close
()
try
:
for
sample
in
reader
():
if
sample
is
None
:
raise
ValueError
(
"sample has None!"
)
conn
.
send
(
json
.
dumps
(
sample
))
conn
.
send
(
json
.
dumps
(
None
))
conn
.
close
()
except
:
conn
.
send
(
json
.
dumps
(
""
))
conn
.
close
()
six
.
reraise
(
*
sys
.
exc_info
())
def
pipe_reader
():
conns
=
[]
...
...
@@ -442,6 +454,10 @@ def multiprocess_reader(readers, use_pipe=True, queue_size=1000):
finish_num
+=
1
conn
.
close
()
conn_to_remove
.
append
(
conn
)
elif
sample
==
""
:
conn
.
close
()
conn_to_remove
.
append
(
conn
)
raise
ValueError
(
"multiprocess reader raises an exception"
)
else
:
yield
sample
...
...
编辑
预览
Markdown
is supported
0%
请重试
或
添加新附件
.
添加附件
取消
You are about to add
0
people
to the discussion. Proceed with caution.
先完成此消息的编辑!
取消
想要评论请
注册
或
登录