未验证 提交 33ce249f 编写于 作者: L Li Min 提交者: GitHub

Fix scatter_op fp16 perf problem. (#38499)

* Fix scatter_op fp16 perf problem.

* Add scatter into black list.

* Add scatter into black list for dygraph.
上级 f9e8a775
@@ -18,7 +18,9 @@ from ... import core
 __all__ = ["CustomOpLists", "AutoMixedPrecisionLists"]
 # lookup_table fp16 is slower than fp32, though fp16 is supported.
-_extra_unsupported_fp16_list = {'lookup_table', 'lookup_table_v2'}
+_extra_unsupported_fp16_list = {
+    'lookup_table', 'lookup_table_v2', 'scatter', 'scatter_grad'
+}
 class AutoMixedPrecisionLists(object):
......
@@ -71,7 +71,9 @@ AMP_RELATED_FLAGS_SETTING = {
 }
 PURE_FP16_WHITE_LIST = {' '}
-PURE_FP16_BLACK_LIST = {'lookup_table', 'lookup_table_v2'}
+PURE_FP16_BLACK_LIST = {
+    'lookup_table', 'lookup_table_v2', 'scatter', 'scatter_grad'
+}
 #NOTE(zhiqiu): similar as paddle.fluid.contrib.mixed_precision.fp16_lists.AutoMixedPrecisionLists._update_list
......
Markdown is supported
0% .
You are about to add 0 people to the discussion. Proceed with caution.
先完成此消息的编辑!
想要评论请 注册