Skip to content
体验新版
项目
组织
正在加载...
登录
切换导航
打开侧边栏
Crayon鑫
Paddle
提交
fb2a9cdf
P
Paddle
项目概览
Crayon鑫
/
Paddle
与 Fork 源项目一致
Fork自
PaddlePaddle / Paddle
通知
1
Star
1
Fork
0
代码
文件
提交
分支
Tags
贡献者
分支图
Diff
Issue
1
列表
看板
标记
里程碑
合并请求
0
Wiki
0
Wiki
分析
仓库
DevOps
项目成员
Pages
P
Paddle
项目概览
项目概览
详情
发布
仓库
仓库
文件
提交
分支
标签
贡献者
分支图
比较
Issue
1
Issue
1
列表
看板
标记
里程碑
合并请求
0
合并请求
0
Pages
分析
分析
仓库分析
DevOps
Wiki
0
Wiki
成员
成员
收起侧边栏
关闭侧边栏
动态
分支图
创建新Issue
提交
Issue看板
未验证
提交
fb2a9cdf
编写于
9月 27, 2019
作者:
C
chengduo
提交者:
GitHub
9月 27, 2019
浏览文件
操作
浏览文件
下载
电子邮件补丁
差异文件
Add fp16 support for pad and split (#19881)
* make pad and split support fp16 test=develop
上级
c9ea317b
变更
8
显示空白变更内容
内联
并排
Showing
8 changed file
with
110 addition
and
32 deletion
+110
-32
paddle/fluid/operators/math/padding.h
paddle/fluid/operators/math/padding.h
+1
-1
paddle/fluid/operators/pad_op.cu
paddle/fluid/operators/pad_op.cu
+7
-2
paddle/fluid/operators/pad_op.h
paddle/fluid/operators/pad_op.h
+3
-3
paddle/fluid/operators/split_op.cc
paddle/fluid/operators/split_op.cc
+6
-5
paddle/fluid/operators/split_op.cu.cc
paddle/fluid/operators/split_op.cu.cc
+6
-4
python/paddle/fluid/tests/unittests/test_concat_op.py
python/paddle/fluid/tests/unittests/test_concat_op.py
+38
-15
python/paddle/fluid/tests/unittests/test_pad_op.py
python/paddle/fluid/tests/unittests/test_pad_op.py
+26
-1
python/paddle/fluid/tests/unittests/test_split_op.py
python/paddle/fluid/tests/unittests/test_split_op.py
+23
-1
未找到文件。
paddle/fluid/operators/math/padding.h
浏览文件 @
fb2a9cdf
...
@@ -58,7 +58,7 @@ void PadGradFunction(const framework::ExecutionContext& context,
...
@@ -58,7 +58,7 @@ void PadGradFunction(const framework::ExecutionContext& context,
auto
src_tensor
=
EigenTensor
<
T
,
D
>::
From
(
src
);
auto
src_tensor
=
EigenTensor
<
T
,
D
>::
From
(
src
);
auto
&
place
=
auto
&
place
=
*
context
.
template
device_context
<
DeviceContext
>().
eigen_device
();
*
context
.
template
device_context
<
DeviceContext
>().
eigen_device
();
d_out_tensor
.
device
(
place
)
=
src_tensor
.
pad
(
paddings
,
0
);
d_out_tensor
.
device
(
place
)
=
src_tensor
.
pad
(
paddings
,
static_cast
<
T
>
(
0
)
);
}
}
template
<
typename
DeviceContext
,
typename
T
>
template
<
typename
DeviceContext
,
typename
T
>
...
...
paddle/fluid/operators/pad_op.cu
浏览文件 @
fb2a9cdf
...
@@ -14,7 +14,12 @@ limitations under the License. */
...
@@ -14,7 +14,12 @@ limitations under the License. */
#include "paddle/fluid/operators/pad_op.h"
#include "paddle/fluid/operators/pad_op.h"
namespace
ops
=
paddle
::
operators
;
namespace
ops
=
paddle
::
operators
;
namespace
plat
=
paddle
::
platform
;
REGISTER_OP_CUDA_KERNEL
(
REGISTER_OP_CUDA_KERNEL
(
pad
,
ops
::
PadKernel
<
paddle
::
platform
::
CUDADeviceContext
,
float
>
);
pad
,
ops
::
PadKernel
<
paddle
::
platform
::
CUDADeviceContext
,
double
>
,
ops
::
PadKernel
<
paddle
::
platform
::
CUDADeviceContext
,
float
>
,
ops
::
PadKernel
<
paddle
::
platform
::
CUDADeviceContext
,
plat
::
float16
>
);
REGISTER_OP_CUDA_KERNEL
(
REGISTER_OP_CUDA_KERNEL
(
pad_grad
,
ops
::
PadGradKernel
<
paddle
::
platform
::
CUDADeviceContext
,
float
>
);
pad_grad
,
ops
::
PadGradKernel
<
paddle
::
platform
::
CUDADeviceContext
,
double
>
,
ops
::
PadGradKernel
<
paddle
::
platform
::
CUDADeviceContext
,
float
>
,
ops
::
PadGradKernel
<
paddle
::
platform
::
CUDADeviceContext
,
plat
::
float16
>
);
paddle/fluid/operators/pad_op.h
浏览文件 @
fb2a9cdf
...
@@ -30,14 +30,14 @@ class PadKernel : public framework::OpKernel<T> {
...
@@ -30,14 +30,14 @@ class PadKernel : public framework::OpKernel<T> {
public:
public:
void
Compute
(
const
framework
::
ExecutionContext
&
context
)
const
override
{
void
Compute
(
const
framework
::
ExecutionContext
&
context
)
const
override
{
auto
pads
=
context
.
Attr
<
std
::
vector
<
int
>>
(
"paddings"
);
auto
pads
=
context
.
Attr
<
std
::
vector
<
int
>>
(
"paddings"
);
T
pad_value
=
context
.
Attr
<
T
>
(
"pad_value"
);
float
pad_value
=
context
.
Attr
<
float
>
(
"pad_value"
);
auto
*
x
=
context
.
Input
<
Tensor
>
(
"X"
);
auto
*
x
=
context
.
Input
<
Tensor
>
(
"X"
);
auto
*
out
=
context
.
Output
<
Tensor
>
(
"Out"
);
auto
*
out
=
context
.
Output
<
Tensor
>
(
"Out"
);
out
->
mutable_data
<
T
>
(
context
.
GetPlace
());
out
->
mutable_data
<
T
>
(
context
.
GetPlace
());
int
rank
=
x
->
dims
().
size
();
int
rank
=
x
->
dims
().
size
();
math
::
PaddingFunctor
<
DeviceContext
,
T
>
(
rank
,
context
,
pads
,
pad_value
,
*
x
,
math
::
PaddingFunctor
<
DeviceContext
,
T
>
(
rank
,
context
,
pads
,
out
);
static_cast
<
T
>
(
pad_value
),
*
x
,
out
);
}
}
};
};
...
...
paddle/fluid/operators/split_op.cc
浏览文件 @
fb2a9cdf
...
@@ -119,10 +119,11 @@ Example:
...
@@ -119,10 +119,11 @@ Example:
}
// namespace paddle
}
// namespace paddle
namespace
ops
=
paddle
::
operators
;
namespace
ops
=
paddle
::
operators
;
namespace
plat
=
paddle
::
platform
;
REGISTER_OPERATOR
(
split
,
ops
::
SplitOp
,
ops
::
SplitOpMaker
,
ops
::
SplitGradMaker
);
REGISTER_OPERATOR
(
split
,
ops
::
SplitOp
,
ops
::
SplitOpMaker
,
ops
::
SplitGradMaker
);
REGISTER_OP_CPU_KERNEL
(
REGISTER_OP_CPU_KERNEL
(
split
,
ops
::
SplitOpKernel
<
paddle
::
platform
::
CPUDeviceContext
,
double
>
,
split
,
ops
::
SplitOpKernel
<
plat
::
CPUDeviceContext
,
double
>
,
ops
::
SplitOpKernel
<
paddle
::
platform
::
CPUDeviceContext
,
float
>
,
ops
::
SplitOpKernel
<
plat
::
CPUDeviceContext
,
float
>
,
ops
::
SplitOpKernel
<
paddle
::
platform
::
CPUDeviceContext
,
int64_t
>
,
ops
::
SplitOpKernel
<
plat
::
CPUDeviceContext
,
int64_t
>
,
ops
::
SplitOpKernel
<
paddle
::
platform
::
CPUDeviceContext
,
int
>
);
ops
::
SplitOpKernel
<
plat
::
CPUDeviceContext
,
int
>
,
ops
::
SplitOpKernel
<
plat
::
CPUDeviceContext
,
plat
::
float16
>
);
paddle/fluid/operators/split_op.cu.cc
浏览文件 @
fb2a9cdf
...
@@ -14,8 +14,10 @@ limitations under the License. */
...
@@ -14,8 +14,10 @@ limitations under the License. */
#include "paddle/fluid/operators/split_op.h"
#include "paddle/fluid/operators/split_op.h"
namespace
ops
=
paddle
::
operators
;
namespace
ops
=
paddle
::
operators
;
namespace
plat
=
paddle
::
platform
;
REGISTER_OP_CUDA_KERNEL
(
REGISTER_OP_CUDA_KERNEL
(
split
,
ops
::
SplitOpKernel
<
paddle
::
platform
::
CUDADeviceContext
,
double
>
,
split
,
ops
::
SplitOpKernel
<
plat
::
CUDADeviceContext
,
double
>
,
ops
::
SplitOpKernel
<
paddle
::
platform
::
CUDADeviceContext
,
float
>
,
ops
::
SplitOpKernel
<
plat
::
CUDADeviceContext
,
float
>
,
ops
::
SplitOpKernel
<
paddle
::
platform
::
CUDADeviceContext
,
int64_t
>
,
ops
::
SplitOpKernel
<
plat
::
CUDADeviceContext
,
int64_t
>
,
ops
::
SplitOpKernel
<
paddle
::
platform
::
CUDADeviceContext
,
int
>
);
ops
::
SplitOpKernel
<
plat
::
CUDADeviceContext
,
int
>
,
ops
::
SplitOpKernel
<
plat
::
CUDADeviceContext
,
plat
::
float16
>
);
python/paddle/fluid/tests/unittests/test_concat_op.py
浏览文件 @
fb2a9cdf
...
@@ -22,6 +22,7 @@ from op_test import OpTest
...
@@ -22,6 +22,7 @@ from op_test import OpTest
class
TestConcatOp
(
OpTest
):
class
TestConcatOp
(
OpTest
):
def
setUp
(
self
):
def
setUp
(
self
):
self
.
op_type
=
"concat"
self
.
op_type
=
"concat"
self
.
dtype
=
self
.
get_dtype
()
self
.
init_test_data
()
self
.
init_test_data
()
self
.
inputs
=
{
'X'
:
[(
'x0'
,
self
.
x0
),
(
'x1'
,
self
.
x1
),
(
'x2'
,
self
.
x2
)]}
self
.
inputs
=
{
'X'
:
[(
'x0'
,
self
.
x0
),
(
'x1'
,
self
.
x1
),
(
'x2'
,
self
.
x2
)]}
self
.
attrs
=
{
'axis'
:
self
.
axis
}
self
.
attrs
=
{
'axis'
:
self
.
axis
}
...
@@ -36,6 +37,9 @@ class TestConcatOp(OpTest):
...
@@ -36,6 +37,9 @@ class TestConcatOp(OpTest):
(
self
.
x0
,
self
.
x1
,
self
.
x2
),
axis
=
self
.
actual_axis
)
(
self
.
x0
,
self
.
x1
,
self
.
x2
),
axis
=
self
.
actual_axis
)
}
}
def
get_dtype
(
self
):
return
"float32"
def
test_check_output
(
self
):
def
test_check_output
(
self
):
self
.
check_output
()
self
.
check_output
()
...
@@ -45,25 +49,25 @@ class TestConcatOp(OpTest):
...
@@ -45,25 +49,25 @@ class TestConcatOp(OpTest):
self
.
check_grad
([
'x2'
],
'Out'
)
self
.
check_grad
([
'x2'
],
'Out'
)
def
init_test_data
(
self
):
def
init_test_data
(
self
):
self
.
x0
=
np
.
random
.
random
((
2
,
1
,
4
,
5
)).
astype
(
'float32'
)
self
.
x0
=
np
.
random
.
random
((
2
,
1
,
4
,
5
)).
astype
(
self
.
dtype
)
self
.
x1
=
np
.
random
.
random
((
2
,
2
,
4
,
5
)).
astype
(
'float32'
)
self
.
x1
=
np
.
random
.
random
((
2
,
2
,
4
,
5
)).
astype
(
self
.
dtype
)
self
.
x2
=
np
.
random
.
random
((
2
,
3
,
4
,
5
)).
astype
(
'float32'
)
self
.
x2
=
np
.
random
.
random
((
2
,
3
,
4
,
5
)).
astype
(
self
.
dtype
)
self
.
axis
=
1
self
.
axis
=
1
class
TestConcatOp2
(
TestConcatOp
):
class
TestConcatOp2
(
TestConcatOp
):
def
init_test_data
(
self
):
def
init_test_data
(
self
):
self
.
x0
=
np
.
random
.
random
((
2
,
3
,
4
,
5
)).
astype
(
'float32'
)
self
.
x0
=
np
.
random
.
random
((
2
,
3
,
4
,
5
)).
astype
(
self
.
dtype
)
self
.
x1
=
np
.
random
.
random
((
2
,
3
,
4
,
5
)).
astype
(
'float32'
)
self
.
x1
=
np
.
random
.
random
((
2
,
3
,
4
,
5
)).
astype
(
self
.
dtype
)
self
.
x2
=
np
.
random
.
random
((
2
,
3
,
4
,
5
)).
astype
(
'float32'
)
self
.
x2
=
np
.
random
.
random
((
2
,
3
,
4
,
5
)).
astype
(
self
.
dtype
)
self
.
axis
=
1
self
.
axis
=
1
class
TestConcatOp3
(
TestConcatOp
):
class
TestConcatOp3
(
TestConcatOp
):
def
init_test_data
(
self
):
def
init_test_data
(
self
):
self
.
x0
=
np
.
random
.
random
((
1
,
256
,
170
,
256
)).
astype
(
'float32'
)
self
.
x0
=
np
.
random
.
random
((
1
,
256
,
170
,
256
)).
astype
(
self
.
dtype
)
self
.
x1
=
np
.
random
.
random
((
1
,
128
,
170
,
256
)).
astype
(
'float32'
)
self
.
x1
=
np
.
random
.
random
((
1
,
128
,
170
,
256
)).
astype
(
self
.
dtype
)
self
.
x2
=
np
.
random
.
random
((
1
,
128
,
170
,
256
)).
astype
(
'float32'
)
self
.
x2
=
np
.
random
.
random
((
1
,
128
,
170
,
256
)).
astype
(
self
.
dtype
)
self
.
axis
=
1
self
.
axis
=
1
def
test_check_grad
(
self
):
def
test_check_grad
(
self
):
...
@@ -72,9 +76,9 @@ class TestConcatOp3(TestConcatOp):
...
@@ -72,9 +76,9 @@ class TestConcatOp3(TestConcatOp):
class
TestConcatOp4
(
TestConcatOp
):
class
TestConcatOp4
(
TestConcatOp
):
def
init_test_data
(
self
):
def
init_test_data
(
self
):
self
.
x0
=
np
.
random
.
random
((
2
,
3
,
4
,
5
)).
astype
(
'float32'
)
self
.
x0
=
np
.
random
.
random
((
2
,
3
,
4
,
5
)).
astype
(
self
.
dtype
)
self
.
x1
=
np
.
random
.
random
((
2
,
3
,
4
,
5
)).
astype
(
'float32'
)
self
.
x1
=
np
.
random
.
random
((
2
,
3
,
4
,
5
)).
astype
(
self
.
dtype
)
self
.
x2
=
np
.
random
.
random
((
0
,
3
,
4
,
5
)).
astype
(
'float32'
)
self
.
x2
=
np
.
random
.
random
((
0
,
3
,
4
,
5
)).
astype
(
self
.
dtype
)
self
.
axis
=
0
self
.
axis
=
0
def
test_check_grad
(
self
):
def
test_check_grad
(
self
):
...
@@ -83,11 +87,30 @@ class TestConcatOp4(TestConcatOp):
...
@@ -83,11 +87,30 @@ class TestConcatOp4(TestConcatOp):
class
TestConcatOp5
(
TestConcatOp
):
class
TestConcatOp5
(
TestConcatOp
):
def
init_test_data
(
self
):
def
init_test_data
(
self
):
self
.
x0
=
np
.
random
.
random
((
2
,
1
,
4
,
5
)).
astype
(
'float32'
)
self
.
x0
=
np
.
random
.
random
((
2
,
1
,
4
,
5
)).
astype
(
self
.
dtype
)
self
.
x1
=
np
.
random
.
random
((
2
,
2
,
4
,
5
)).
astype
(
'float32'
)
self
.
x1
=
np
.
random
.
random
((
2
,
2
,
4
,
5
)).
astype
(
self
.
dtype
)
self
.
x2
=
np
.
random
.
random
((
2
,
3
,
4
,
5
)).
astype
(
'float32'
)
self
.
x2
=
np
.
random
.
random
((
2
,
3
,
4
,
5
)).
astype
(
self
.
dtype
)
self
.
axis
=
-
3
self
.
axis
=
-
3
#----------------Concat Fp16----------------
def
create_test_fp16
(
parent
):
class
TestConcatFp16
(
parent
):
def
get_dtype
(
self
):
return
np
.
float16
cls_name
=
"{0}_{1}"
.
format
(
parent
.
__name__
,
"Fp16"
)
TestConcatFp16
.
__name__
=
cls_name
globals
()[
cls_name
]
=
TestConcatFp16
create_test_fp16
(
TestConcatOp
)
create_test_fp16
(
TestConcatOp2
)
create_test_fp16
(
TestConcatOp3
)
create_test_fp16
(
TestConcatOp4
)
create_test_fp16
(
TestConcatOp5
)
if
__name__
==
'__main__'
:
if
__name__
==
'__main__'
:
unittest
.
main
()
unittest
.
main
()
python/paddle/fluid/tests/unittests/test_pad_op.py
浏览文件 @
fb2a9cdf
...
@@ -22,8 +22,9 @@ from op_test import OpTest
...
@@ -22,8 +22,9 @@ from op_test import OpTest
class
TestPadOp
(
OpTest
):
class
TestPadOp
(
OpTest
):
def
setUp
(
self
):
def
setUp
(
self
):
self
.
initTestCase
()
self
.
initTestCase
()
self
.
dtype
=
self
.
get_dtype
()
self
.
op_type
=
"pad"
self
.
op_type
=
"pad"
self
.
inputs
=
{
'X'
:
np
.
random
.
random
(
self
.
shape
).
astype
(
"float32"
),
}
self
.
inputs
=
{
'X'
:
np
.
random
.
random
(
self
.
shape
).
astype
(
self
.
dtype
),
}
self
.
attrs
=
{}
self
.
attrs
=
{}
self
.
attrs
[
'paddings'
]
=
np
.
array
(
self
.
paddings
).
flatten
()
self
.
attrs
[
'paddings'
]
=
np
.
array
(
self
.
paddings
).
flatten
()
self
.
attrs
[
'pad_value'
]
=
self
.
pad_value
self
.
attrs
[
'pad_value'
]
=
self
.
pad_value
...
@@ -34,6 +35,9 @@ class TestPadOp(OpTest):
...
@@ -34,6 +35,9 @@ class TestPadOp(OpTest):
constant_values
=
self
.
pad_value
)
constant_values
=
self
.
pad_value
)
}
}
def
get_dtype
(
self
):
return
np
.
float32
def
test_check_output
(
self
):
def
test_check_output
(
self
):
self
.
check_output
()
self
.
check_output
()
...
@@ -67,5 +71,26 @@ class TestCase3(TestPadOp):
...
@@ -67,5 +71,26 @@ class TestCase3(TestPadOp):
self
.
pad_value
=
0.9
self
.
pad_value
=
0.9
#----------------Pad Fp16----------------
def
create_test_fp16
(
parent
):
class
TestPadFp16
(
parent
):
def
get_dtype
(
self
):
return
np
.
float16
def
test_check_grad_normal
(
self
):
self
.
check_grad
([
'X'
],
'Out'
,
max_relative_error
=
0.3
)
cls_name
=
"{0}_{1}"
.
format
(
parent
.
__name__
,
"Fp16"
)
TestPadFp16
.
__name__
=
cls_name
globals
()[
cls_name
]
=
TestPadFp16
create_test_fp16
(
TestPadOp
)
create_test_fp16
(
TestCase1
)
create_test_fp16
(
TestCase2
)
create_test_fp16
(
TestCase3
)
if
__name__
==
'__main__'
:
if
__name__
==
'__main__'
:
unittest
.
main
()
unittest
.
main
()
python/paddle/fluid/tests/unittests/test_split_op.py
浏览文件 @
fb2a9cdf
...
@@ -22,14 +22,18 @@ from op_test import OpTest
...
@@ -22,14 +22,18 @@ from op_test import OpTest
class
TestSplitOp
(
OpTest
):
class
TestSplitOp
(
OpTest
):
def
setUp
(
self
):
def
setUp
(
self
):
self
.
_set_op_type
()
self
.
_set_op_type
()
self
.
dtype
=
self
.
get_dtype
()
axis
=
1
axis
=
1
x
=
np
.
random
.
random
((
4
,
5
,
6
)).
astype
(
'float32'
)
x
=
np
.
random
.
random
((
4
,
5
,
6
)).
astype
(
self
.
dtype
)
out
=
np
.
split
(
x
,
[
2
,
3
],
axis
)
out
=
np
.
split
(
x
,
[
2
,
3
],
axis
)
self
.
inputs
=
{
'X'
:
x
}
self
.
inputs
=
{
'X'
:
x
}
self
.
attrs
=
{
'axis'
:
axis
,
'sections'
:
[
2
,
1
,
2
]}
self
.
attrs
=
{
'axis'
:
axis
,
'sections'
:
[
2
,
1
,
2
]}
self
.
outputs
=
{
'Out'
:
[(
'out%d'
%
i
,
out
[
i
])
\
self
.
outputs
=
{
'Out'
:
[(
'out%d'
%
i
,
out
[
i
])
\
for
i
in
range
(
len
(
out
))]}
for
i
in
range
(
len
(
out
))]}
def
get_dtype
(
self
):
return
"float32"
def
_set_op_type
(
self
):
def
_set_op_type
(
self
):
self
.
op_type
=
"split"
self
.
op_type
=
"split"
...
@@ -45,5 +49,23 @@ class TestSplitByrefOp(OpTest):
...
@@ -45,5 +49,23 @@ class TestSplitByrefOp(OpTest):
self
.
op_type
=
"split_byref"
self
.
op_type
=
"split_byref"
#----------------Split Fp16----------------
def
create_test_fp16
(
parent
):
class
TestSplitFp16
(
parent
):
def
get_dtype
(
self
):
return
np
.
float16
def
test_check_grad
(
self
):
pass
cls_name
=
"{0}_{1}"
.
format
(
parent
.
__name__
,
"Fp16"
)
TestSplitFp16
.
__name__
=
cls_name
globals
()[
cls_name
]
=
TestSplitFp16
create_test_fp16
(
TestSplitOp
)
if
__name__
==
'__main__'
:
if
__name__
==
'__main__'
:
unittest
.
main
()
unittest
.
main
()
编辑
预览
Markdown
is supported
0%
请重试
或
添加新附件
.
添加附件
取消
You are about to add
0
people
to the discussion. Proceed with caution.
先完成此消息的编辑!
取消
想要评论请
注册
或
登录