From 33ce249f82a2a1a4af4b305c254a63c0a010f43f Mon Sep 17 00:00:00 2001 From: Li Min <11663212+limin2021@users.noreply.github.com> Date: Tue, 28 Dec 2021 09:46:50 +0800 Subject: [PATCH] Fix scatter_op fp16 perf problem. (#38499) * Fix scatter_op fp16 perf problem. * Add scatter into black list. * Add scatter into black list for dygraph. --- python/paddle/fluid/contrib/mixed_precision/fp16_lists.py | 4 +++- python/paddle/fluid/dygraph/amp/auto_cast.py | 4 +++- 2 files changed, 6 insertions(+), 2 deletions(-) diff --git a/python/paddle/fluid/contrib/mixed_precision/fp16_lists.py b/python/paddle/fluid/contrib/mixed_precision/fp16_lists.py index c466cafe1f..80d2ccb0d5 100644 --- a/python/paddle/fluid/contrib/mixed_precision/fp16_lists.py +++ b/python/paddle/fluid/contrib/mixed_precision/fp16_lists.py @@ -18,7 +18,9 @@ from ... import core __all__ = ["CustomOpLists", "AutoMixedPrecisionLists"] # lookup_table fp16 is slower than fp32, though fp16 is supported. -_extra_unsupported_fp16_list = {'lookup_table', 'lookup_table_v2'} +_extra_unsupported_fp16_list = { + 'lookup_table', 'lookup_table_v2', 'scatter', 'scatter_grad' +} class AutoMixedPrecisionLists(object): diff --git a/python/paddle/fluid/dygraph/amp/auto_cast.py b/python/paddle/fluid/dygraph/amp/auto_cast.py index 14a2bce63f..8f0e0dff2f 100644 --- a/python/paddle/fluid/dygraph/amp/auto_cast.py +++ b/python/paddle/fluid/dygraph/amp/auto_cast.py @@ -71,7 +71,9 @@ AMP_RELATED_FLAGS_SETTING = { } PURE_FP16_WHITE_LIST = {' '} -PURE_FP16_BLACK_LIST = {'lookup_table', 'lookup_table_v2'} +PURE_FP16_BLACK_LIST = { + 'lookup_table', 'lookup_table_v2', 'scatter', 'scatter_grad' +} #NOTE(zhiqiu): similar as paddle.fluid.contrib.mixed_precision.fp16_lists.AutoMixedPrecisionLists._update_list -- GitLab