Skip to content
体验新版
项目
组织
正在加载...
登录
切换导航
打开侧边栏
PaddlePaddle
Paddle
提交
cbeff5fc
P
Paddle
项目概览
PaddlePaddle
/
Paddle
1 年多 前同步成功
通知
2302
Star
20931
Fork
5422
代码
文件
提交
分支
Tags
贡献者
分支图
Diff
Issue
1423
列表
看板
标记
里程碑
合并请求
543
Wiki
0
Wiki
分析
仓库
DevOps
项目成员
Pages
P
Paddle
项目概览
项目概览
详情
发布
仓库
仓库
文件
提交
分支
标签
贡献者
分支图
比较
Issue
1,423
Issue
1,423
列表
看板
标记
里程碑
合并请求
543
合并请求
543
Pages
分析
分析
仓库分析
DevOps
Wiki
0
Wiki
成员
成员
收起侧边栏
关闭侧边栏
动态
分支图
创建新Issue
提交
Issue看板
未验证
提交
cbeff5fc
编写于
5月 31, 2023
作者:
C
Charles-hit
提交者:
GitHub
5月 31, 2023
浏览文件
操作
浏览文件
下载
电子邮件补丁
差异文件
support activation prim op bf16 dtype (#54193)
* support activation prim op bf16 dtype * remove useless code
上级
2db64d08
变更
4
展开全部
隐藏空白更改
内联
并排
Showing
4 changed file
with
317 addition
and
309 deletion
+317
-309
paddle/phi/kernels/funcs/activation_functor.h
paddle/phi/kernels/funcs/activation_functor.h
+7
-3
python/paddle/fluid/tests/unittests/prim_op_test.py
python/paddle/fluid/tests/unittests/prim_op_test.py
+101
-99
python/paddle/fluid/tests/unittests/test_activation_op.py
python/paddle/fluid/tests/unittests/test_activation_op.py
+206
-205
python/paddle/incubate/autograd/composite_rules.py
python/paddle/incubate/autograd/composite_rules.py
+3
-2
未找到文件。
paddle/phi/kernels/funcs/activation_functor.h
浏览文件 @
cbeff5fc
...
...
@@ -3083,11 +3083,15 @@ struct CudaRsqrtFunctor : public BaseActivationFunctor<T> {
template
<
typename
T
>
struct
CudaRsqrtGradFunctor
:
public
BaseActivationFunctor
<
T
>
{
T
minus_one_half
=
static_cast
<
T
>
(
-
0.5
f
);
using
MPType
=
typename
phi
::
dtype
::
MPTypeTrait
<
T
>::
Type
;
MPType
minus_one_half
=
static_cast
<
MPType
>
(
-
0.5
f
);
// dx = -0.5 * dout * out^3
__device__
__forceinline__
T
operator
()(
const
T
dout
,
const
T
out
)
const
{
return
minus_one_half
*
dout
*
out
*
out
*
out
;
__device__
__forceinline__
T
operator
()(
const
T
arg_dout
,
const
T
arg_out
)
const
{
MPType
dout
=
static_cast
<
MPType
>
(
arg_dout
);
MPType
out
=
static_cast
<
MPType
>
(
arg_out
);
return
static_cast
<
T
>
(
minus_one_half
*
dout
*
out
*
out
*
out
);
}
static
constexpr
ActBwdOpFwdDeps
FwdDeps
()
{
...
...
python/paddle/fluid/tests/unittests/prim_op_test.py
浏览文件 @
cbeff5fc
...
...
@@ -578,45 +578,45 @@ class PrimForwardChecker:
# forward comp only for comp op
if
self
.
prim_op_type
==
"prim"
:
return
paddle
.
enable_static
()
core
.
_set_prim_forward_enabled
(
self
.
enable_fw_comp
)
startup_program
,
main_program
=
(
paddle
.
static
.
Program
(),
paddle
.
static
.
Program
(),
)
with
paddle
.
static
.
program_guard
(
main_program
,
startup_program
):
(
static_inputs
,
attrs
,
input_dict
,
feed
,
)
=
self
.
get_static_input_attr_inputdict_and_feed
(
stop_gradient
=
True
)
args
=
OpTestUtils
.
prepare_python_api_arguments
(
self
.
public_python_api
,
static_inputs
,
attrs
,
self
.
kernel_sig
,
)
inputs_sig
,
_
,
_
=
self
.
kernel_sig
args
=
OpTestUtils
.
assumption_assert_and_transform
(
args
,
len
(
inputs_sig
)
)
ret
=
flatten
(
_as_list
(
self
.
public_python_api
(
*
args
)))
primapi
.
to_prim
(
main_program
.
blocks
)
# ensure the operator not in program if check_prim is True
forward_ops
=
[
op
.
type
for
op
in
main_program
.
blocks
[
0
].
ops
]
assert
self
.
op_type
not
in
forward_ops
,
(
"%s shouldn't appear in program when check_prim is True"
)
%
(
self
.
op_type
)
exe
=
paddle
.
static
.
Executor
(
self
.
place
)
exe
.
run
(
startup_program
)
ret
=
exe
.
run
(
main_program
,
feed
=
feed
,
fetch_list
=
ret
)
if
OpTestUtils
.
is_bfloat16_type
(
self
.
dtype
):
ret
=
paddle
.
utils
.
map_structure
(
lambda
x
:
convert_uint16_to_float
(
x
),
ret
with
paddle
.
fluid
.
framework
.
_static_guard
():
core
.
_set_prim_forward_enabled
(
self
.
enable_fw_comp
)
startup_program
,
main_program
=
(
paddle
.
static
.
Program
(),
paddle
.
static
.
Program
(),
)
with
paddle
.
static
.
program_guard
(
main_program
,
startup_program
):
(
static_inputs
,
attrs
,
input_dict
,
feed
,
)
=
self
.
get_static_input_attr_inputdict_and_feed
(
stop_gradient
=
True
)
args
=
OpTestUtils
.
prepare_python_api_arguments
(
self
.
public_python_api
,
static_inputs
,
attrs
,
self
.
kernel_sig
,
)
inputs_sig
,
_
,
_
=
self
.
kernel_sig
args
=
OpTestUtils
.
assumption_assert_and_transform
(
args
,
len
(
inputs_sig
)
)
ret
=
flatten
(
_as_list
(
self
.
public_python_api
(
*
args
)))
primapi
.
to_prim
(
main_program
.
blocks
)
# ensure the operator not in program if check_prim is True
forward_ops
=
[
op
.
type
for
op
in
main_program
.
blocks
[
0
].
ops
]
assert
self
.
op_type
not
in
forward_ops
,
(
"%s shouldn't appear in program when check_prim is True"
)
%
(
self
.
op_type
)
exe
=
paddle
.
static
.
Executor
(
self
.
place
)
exe
.
run
(
startup_program
)
ret
=
exe
.
run
(
main_program
,
feed
=
feed
,
fetch_list
=
ret
)
if
OpTestUtils
.
is_bfloat16_type
(
self
.
dtype
):
ret
=
paddle
.
utils
.
map_structure
(
lambda
x
:
convert_uint16_to_float
(
x
),
ret
)
# check static forward
if
len
(
ret
)
!=
len
(
self
.
eager_desire
):
msg
=
(
...
...
@@ -1024,7 +1024,6 @@ class PrimGradChecker(PrimForwardChecker):
core
.
set_prim_eager_enabled
(
False
)
def
check_static_comp
(
self
):
paddle
.
enable_static
()
if
self
.
prim_op_type
==
"prim"
:
core
.
_set_prim_backward_enabled
(
self
.
enable_rev_comp
)
else
:
...
...
@@ -1032,67 +1031,70 @@ class PrimGradChecker(PrimForwardChecker):
core
.
_set_prim_backward_enabled
(
self
.
enable_rev_comp
)
atol
=
self
.
rev_comp_atol
if
self
.
enable_rev_comp
else
self
.
fw_comp_atol
rtol
=
self
.
rev_comp_rtol
if
self
.
enable_rev_comp
else
self
.
fw_comp_rtol
startup_program
,
main_program
=
(
paddle
.
static
.
Program
(),
paddle
.
static
.
Program
(),
)
with
paddle
.
static
.
program_guard
(
main_program
,
startup_program
):
(
static_inputs
,
attrs
,
inputs_dict
,
feed
,
)
=
self
.
get_static_input_attr_inputdict_and_feed
(
stop_gradient
=
False
)
args
=
OpTestUtils
.
prepare_python_api_arguments
(
self
.
public_python_api
,
static_inputs
,
attrs
,
self
.
kernel_sig
,
)
inputs_sig
,
_
,
outputs_sig
=
self
.
kernel_sig
if
hasattr
(
self
.
op_test
,
"python_out_sig"
):
outputs_sig
=
self
.
op_test
.
python_out_sig
args
=
OpTestUtils
.
assumption_assert_and_transform
(
args
,
len
(
inputs_sig
)
)
fw_outs
=
_as_list
(
self
.
public_python_api
(
*
args
))
outputs_dict
=
self
.
get_output_dict
(
self
.
outputs
,
fw_outs
,
outputs_sig
)
primapi
.
to_prim
(
main_program
.
blocks
)
ys
=
[]
if
isinstance
(
self
.
output_names
,
list
):
for
output_name
in
self
.
output_names
:
ys
.
append
(
outputs_dict
[
output_name
])
else
:
ys
.
append
(
outputs_dict
[
self
.
output_names
])
xs
=
[]
if
isinstance
(
self
.
inputs_to_check
,
list
):
for
input_name
in
self
.
inputs_to_check
:
xs
.
append
(
inputs_dict
[
input_name
])
else
:
xs
.
append
(
inputs_dict
[
self
.
inputs_to_check
])
vs
,
vs_feed
=
self
.
gen_static_grad_outputs_and_feed
()
feed
.
update
(
vs_feed
)
no_grad_vars
=
self
.
gen_no_grad_set
(
var_dict
=
{
**
inputs_dict
,
**
outputs_dict
}
)
ret
=
paddle
.
static
.
gradients
(
ys
,
xs
,
vs
,
no_grad_set
=
no_grad_vars
)
# check the backward operator not in program when check_prim is True
ops
=
[
op
.
type
for
op
in
main_program
.
blocks
[
0
].
ops
]
backward_op_type
=
self
.
op_type
+
"_grad"
assert
backward_op_type
not
in
ops
,
(
"%s shouldn't appear in program when check_prim is True"
)
%
(
backward_op_type
)
exe
=
paddle
.
static
.
Executor
(
self
.
place
)
exe
.
run
(
startup_program
)
actual_ret
=
exe
.
run
(
main_program
,
feed
=
feed
,
fetch_list
=
ret
)
if
OpTestUtils
.
is_bfloat16_type
(
self
.
dtype
):
actual_ret
=
paddle
.
utils
.
map_structure
(
lambda
x
:
convert_uint16_to_float
(
x
),
actual_ret
with
paddle
.
fluid
.
framework
.
_static_guard
():
startup_program
,
main_program
=
(
paddle
.
static
.
Program
(),
paddle
.
static
.
Program
(),
)
with
paddle
.
static
.
program_guard
(
main_program
,
startup_program
):
(
static_inputs
,
attrs
,
inputs_dict
,
feed
,
)
=
self
.
get_static_input_attr_inputdict_and_feed
(
stop_gradient
=
False
)
args
=
OpTestUtils
.
prepare_python_api_arguments
(
self
.
public_python_api
,
static_inputs
,
attrs
,
self
.
kernel_sig
,
)
inputs_sig
,
_
,
outputs_sig
=
self
.
kernel_sig
if
hasattr
(
self
.
op_test
,
"python_out_sig"
):
outputs_sig
=
self
.
op_test
.
python_out_sig
args
=
OpTestUtils
.
assumption_assert_and_transform
(
args
,
len
(
inputs_sig
)
)
fw_outs
=
_as_list
(
self
.
public_python_api
(
*
args
))
outputs_dict
=
self
.
get_output_dict
(
self
.
outputs
,
fw_outs
,
outputs_sig
)
primapi
.
to_prim
(
main_program
.
blocks
)
ys
=
[]
if
isinstance
(
self
.
output_names
,
list
):
for
output_name
in
self
.
output_names
:
ys
.
append
(
outputs_dict
[
output_name
])
else
:
ys
.
append
(
outputs_dict
[
self
.
output_names
])
xs
=
[]
if
isinstance
(
self
.
inputs_to_check
,
list
):
for
input_name
in
self
.
inputs_to_check
:
xs
.
append
(
inputs_dict
[
input_name
])
else
:
xs
.
append
(
inputs_dict
[
self
.
inputs_to_check
])
vs
,
vs_feed
=
self
.
gen_static_grad_outputs_and_feed
()
feed
.
update
(
vs_feed
)
no_grad_vars
=
self
.
gen_no_grad_set
(
var_dict
=
{
**
inputs_dict
,
**
outputs_dict
}
)
ret
=
paddle
.
static
.
gradients
(
ys
,
xs
,
vs
,
no_grad_set
=
no_grad_vars
)
# check the backward operator not in program when check_prim is True
ops
=
[
op
.
type
for
op
in
main_program
.
blocks
[
0
].
ops
]
backward_op_type
=
self
.
op_type
+
"_grad"
assert
backward_op_type
not
in
ops
,
(
"%s shouldn't appear in program when check_prim is True"
)
%
(
backward_op_type
)
exe
=
paddle
.
static
.
Executor
(
self
.
place
)
exe
.
run
(
startup_program
)
actual_ret
=
exe
.
run
(
main_program
,
feed
=
feed
,
fetch_list
=
ret
)
if
OpTestUtils
.
is_bfloat16_type
(
self
.
dtype
):
actual_ret
=
paddle
.
utils
.
map_structure
(
lambda
x
:
convert_uint16_to_float
(
x
),
actual_ret
)
# check static grad out
if
len
(
actual_ret
)
!=
len
(
self
.
eager_desire
):
msg
=
(
...
...
python/paddle/fluid/tests/unittests/test_activation_op.py
浏览文件 @
cbeff5fc
此差异已折叠。
点击以展开。
python/paddle/incubate/autograd/composite_rules.py
浏览文件 @
cbeff5fc
...
...
@@ -631,12 +631,13 @@ def rsqrt_composite(x):
is_amp
=
False
from
paddle.fluid.data_feeder
import
convert_dtype
if
convert_dtype
(
x
.
dtype
)
==
"float16"
:
dtype
=
convert_dtype
(
x
.
dtype
)
if
dtype
==
"float16"
or
dtype
==
"uint16"
:
is_amp
=
True
x
=
cast
(
x
,
"float32"
)
y
=
full
(
x
.
shape
if
len
(
x
.
shape
)
==
0
else
[
1
],
-
0.5
,
x
.
dtype
)
res
=
pow
(
x
,
y
)
return
res
if
not
is_amp
else
cast
(
res
,
"float16"
)
return
res
if
not
is_amp
else
cast
(
res
,
dtype
)
@
REGISTER_COMPOSITE
(
'group_norm'
)
...
...
编辑
预览
Markdown
is supported
0%
请重试
或
添加新附件
.
添加附件
取消
You are about to add
0
people
to the discussion. Proceed with caution.
先完成此消息的编辑!
取消
想要评论请
注册
或
登录