#   Copyright (c) 2021 PaddlePaddle Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

import copy
from paddle.fluid import core

from ..fp16_lists import black_list as black_list_fp16
from ..fp16_lists import gray_list as gray_list_fp16
from ..fp16_lists import white_list as white_list_fp16

__all__ = ["AutoMixedPrecisionListsBF16"]


class AutoMixedPrecisionListsBF16:
    """
    Hold the fp32/bf16 op type lists used by bf16 auto mixed precision.

    The lists are used for an algorithm which determines an op's execution
    mode (fp32 or bf16). Every instance starts from copies of the module-level
    default lists and then applies the users' custom fp32 and bf16 lists.

    Args:
        custom_bf16_list (set, optional): Users' custom bf16 list. Default None.
        custom_fp32_list (set, optional): Users' custom fp32 list. Default None.
        custom_fp32_varnames (set, optional): Users' custom fp32 variables'
            names. Default None.

    Raises:
        ValueError: If an op type appears in both ``custom_bf16_list`` and
            ``custom_fp32_list``.

    Examples:
        .. code-block:: python

            import paddle
            paddle.enable_static()
            with paddle.static.amp.bf16_guard():
                paddle.static.amp.bf16.AutoMixedPrecisionListsBF16(custom_fp32_list={'lstm'})
    """

    def __init__(
        self,
        custom_bf16_list=None,
        custom_fp32_list=None,
        custom_fp32_varnames=None,
    ):
        self._custom_bf16_list = custom_bf16_list
        self._custom_fp32_list = custom_fp32_list
        # Shallow-copy the module-level defaults so per-instance customisation
        # never leaks into other instances.
        self.bf16_list = copy.copy(bf16_list)
        self.fp32_list = copy.copy(fp32_list)
        self.gray_list = copy.copy(gray_list)
        self.bf16_initializer_list = copy.copy(bf16_initializer_list)
        self.unsupported_list = copy.copy(unsupported_list)
        self.fp32_varnames = copy.copy(custom_fp32_varnames)
        self._update_list()

    def _update_list(self):
        """
        Update fp32 and bf16 list according to users' custom list.

        Custom bf16 ops are moved out of the fp32 or gray list into the bf16
        list. Custom fp32 ops are moved out of the bf16 or gray list into the
        fp32 list and are additionally recorded in the unsupported list.

        Raises:
            ValueError: If the two custom lists share an op type.
        """
        custom_bf16 = self._custom_bf16_list
        custom_fp32 = self._custom_fp32_list

        # An op cannot be forced to both precisions at once.
        if custom_bf16 and custom_fp32:
            if any(op_name in custom_fp32 for op_name in custom_bf16):
                raise ValueError("Custom bf16 list overlap custom fp32 list")

        if custom_bf16:
            # NOTE(review): custom bf16 ops are not removed from
            # unsupported_list here, although the module-level defaults do
            # subtract bf16_list from unsupported_list -- confirm intended.
            for op_name in custom_bf16:
                if op_name in self.fp32_list:
                    self.fp32_list.remove(op_name)
                elif op_name in self.gray_list:
                    self.gray_list.remove(op_name)
                self.bf16_list.add(op_name)

        if custom_fp32:
            for op_name in custom_fp32:
                if op_name in self.bf16_list:
                    self.bf16_list.remove(op_name)
                elif op_name in self.gray_list:
                    self.gray_list.remove(op_name)
                self.fp32_list.add(op_name)
                self.unsupported_list.add(op_name)


# Default contents of the bf16 initializer list; each
# AutoMixedPrecisionListsBF16 instance takes its own copy of this set.
bf16_initializer_list = {
    "fill_constant",
    "uniform_random",
}

# always bf16
# Default contents of the bf16 list; instances copy it and may extend or
# shrink their copy through the users' custom lists.
bf16_list = {"conv2d", "matmul", "matmul_v2", "mul"}

# Gray ops: whether they run in bf16 or fp32 depends on the prev_op type.
# Instances copy this set and may remove entries via the custom lists.
gray_list = {
    'elementwise_add',
    'elementwise_sub',
    'elementwise_mul',
    'elementwise_div',
    'relu',
    'layer_norm',
    'slice',
    'concat',
    'uniform_random',
    'reshape2',
    'transpose2',
    'pool2d',
    'sigmoid',
    'cast',
    'scale',
    'fill_constant',
    'split',
}

# Query the framework core for its op support info for BF16 on 'CPU'; only the
# third element of the returned triple is kept.
# NOTE(review): presumably this is the set of op types without a CPU bf16
# kernel -- confirm against core.op_supported_infos.
_, _, _sys_unsupported_bf16_list = core.op_supported_infos(
    'CPU', core.VarDesc.VarType.BF16
)
# Alias, not a copy: later in-place updates of unsupported_list act on the
# same object as _sys_unsupported_bf16_list.
unsupported_list = _sys_unsupported_bf16_list

# Default fp32 list: start from the union of the fp16 black, white and gray
# lists. A single copy is enough to keep black_list_fp16 itself untouched.
fp32_list = black_list_fp16.copy()
fp32_list |= white_list_fp16
fp32_list |= gray_list_fp16

# Ops already classified as bf16 or gray must not also be listed as fp32.
fp32_list -= bf16_list
fp32_list -= gray_list
# Likewise drop bf16 and gray ops from the unsupported list. unsupported_list
# is an alias of _sys_unsupported_bf16_list, so if that object is a mutable
# set these in-place differences change it as well.
unsupported_list -= bf16_list
unsupported_list -= gray_list