# Copyright (c) 2022 PaddlePaddle Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

import logging
import typing

import paddle
from paddle.fluid import backward, core, framework
from paddle.fluid.core import prim_config
from paddle.incubate.autograd import primx, utils


@framework.static_only
def forward_grad(outputs, inputs, grad_inputs=None):
    """Forward mode of automatic differentiation.

    Note:
        **ONLY available in the static graph mode and primitive operators.**

    Args:
        outputs(Tensor|Sequence[Tensor]): The output Tensor or Tensors.
        inputs(Tensor|Sequence[Tensor]): The input Tensor or Tensors.
        grad_inputs(Tensor|Sequence[Tensor]): Optional, the gradient Tensor or
            Tensors of inputs which have the same shape as inputs. Defaults to
            None, which is equivalent to all ones.

    Returns:
        grad_outputs(Tensor|Sequence[Tensor]): The gradients for outputs.

    Examples:

        .. code-block:: python

            import numpy as np
            import paddle

            paddle.enable_static()
            paddle.incubate.autograd.enable_prim()

            startup_program = paddle.static.Program()
            main_program = paddle.static.Program()

            with paddle.static.program_guard(main_program, startup_program):
                x = paddle.static.data('x', shape=[1], dtype='float32')
                y = x * x
                y_grad = paddle.incubate.autograd.forward_grad(y, x)
                paddle.incubate.autograd.prim2orig()

            exe = paddle.static.Executor()
            exe.run(startup_program)
            y_grad = exe.run(main_program, feed={'x': np.array([2.]).astype('float32')}, fetch_list=[y_grad])
            print(y_grad)
            # [array([4.], dtype=float32)]

            paddle.incubate.autograd.disable_prim()
            paddle.disable_static()
    """
    if not utils.prim_enabled():
        raise RuntimeError(
            'forward_grad must be running on primitive '
            'operators, use enable_prim to turn it on.'
        )

    if not isinstance(outputs, (framework.Variable, typing.Sequence)):
        raise TypeError(
            f'Expected outputs is Tensor|Sequence[Tensor], '
            f'but got {type(outputs)}.'
        )

    if not isinstance(inputs, (framework.Variable, typing.Sequence)):
        raise TypeError(
            f'Expected inputs is Tensor|Sequence[Tensor], '
            f'but got {type(inputs)}.'
        )

    ys, xs, xs_dot = (
        utils.as_tensors(outputs),
        utils.as_tensors(inputs),
        utils.as_tensors(grad_inputs),
    )

    block = framework.default_main_program().current_block()
    if any(x.block != block for x in xs + ys):
        raise RuntimeError(
            'Variable in inputs and outputs should exist in current block of '
            'main program.'
        )

    primx.orig2prim(block)
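    # Linearize the primitive program in forward mode: ys_dot holds the
    # directional derivatives of ys along the tangents xs_dot (all ones when
    # grad_inputs is None, as documented above).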
    ad = primx.Transform(ys[0].block)
    _, ys_dot = ad.linearize(xs, ys, xs_dot)

    return ys_dot[0] if isinstance(outputs, framework.Variable) else ys_dot


@framework.static_only
def grad(outputs, inputs, grad_outputs=None):
    """Reverse mode of automatic differentiation.

    Note:
        **ONLY available in the static graph mode and primitive operators.**

    Args:
        outputs(Tensor|Sequence[Tensor]): The output Tensor or Tensors.
        inputs(Tensor|Sequence[Tensor]): The input Tensor or Tensors.
        grad_outputs(Tensor|Sequence[Tensor]): Optional, the gradient Tensor or
            Tensors of outputs which have the same shape as outputs. Defaults
            to None, which is equivalent to all ones.

    Returns:
        grad_inputs(Tensor|Sequence[Tensor]): The gradients for inputs.

    Examples:

        .. code-block:: python

            import numpy as np
            import paddle

            paddle.enable_static()
            paddle.incubate.autograd.enable_prim()

            startup_program = paddle.static.Program()
            main_program = paddle.static.Program()
            with paddle.static.program_guard(main_program, startup_program):
                x = paddle.static.data('x', shape=[1], dtype='float32')
                x.stop_gradient = False
                y = x * x
                x_grad = paddle.incubate.autograd.grad(y, x)
                paddle.incubate.autograd.prim2orig()

            exe = paddle.static.Executor()
            exe.run(startup_program)
            x_grad = exe.run(main_program, feed={'x': np.array([2.]).astype('float32')}, fetch_list=[x_grad])
            print(x_grad)
            # [array([4.], dtype=float32)]

            paddle.incubate.autograd.disable_prim()
            paddle.disable_static()
    """
    if not utils.prim_enabled():
        grad_inputs = backward.gradients(outputs, inputs, grad_outputs)
        # backward.gradients returns a list even when the inputs is a single Tensor.
        # The following code snippet fixes the problem by returning the first
        # element of grad_inputs when the inputs is a single Tensor.
        if (
            isinstance(inputs, framework.Variable)
            and isinstance(grad_inputs, typing.Sequence)
            and len(grad_inputs) > 0
        ):
            return grad_inputs[0]
        else:
            return grad_inputs

    if not isinstance(outputs, (framework.Variable, typing.Sequence)):
        raise TypeError(
            f'Expected outputs is Tensor|Sequence[Tensor], '
            f'but got {type(outputs)}.'
        )

    if not isinstance(inputs, (framework.Variable, typing.Sequence)):
        raise TypeError(
            f'Expected inputs is Tensor|Sequence[Tensor], '
            f'but got {type(inputs)}.'
        )

    ys, xs, ys_bar = (
        utils.as_tensors(outputs),
        utils.as_tensors(inputs),
        utils.as_tensors(grad_outputs),
    )
    block = framework.default_main_program().current_block()
    if any((x is not None and x.block != block) for x in xs + ys):
        raise RuntimeError(
            'Variable in inputs and outputs should be None or in current block of main program'
        )

    # TODO(Tongxin) without any prior knowledge about whether the program
    # is completely lowered to primitive ops, it's mandatory to run the lowering
    # pass once and again. This is obviously inefficient and needs to be
    # optimized.
    primx.orig2prim(block)
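    # Reverse mode is obtained in two passes: linearize builds the forward-mode
    # (JVP) graph, and transpose below converts it into reverse-mode gradients.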
    ad = primx.Transform(block)
    xs_dot, ys_dot = ad.linearize(xs, ys)
    if any(var is None for var in ys_dot):
        raise RuntimeError(
            'Grads cannot be computed. The given outputs do not depend on inputs'
        )
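    # Transpose the linearized graph; xs_bar receives the reverse-mode
    # gradients of the inputs, seeded by ys_bar (all ones when grad_outputs
    # is None, as documented above).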
    ys_bar, xs_bar = ad.transpose(ys_dot, xs_dot, ys_bar)

    # remove xs_dot and their constructor ops
    op_indexes = []
    for var in xs_dot:
        if var is not None:
            op_index = block.ops.index(var.op)
            if op_index < 0:
                raise ValueError(
                    f'op_index should be greater than or equal to 0, but op_index={op_index}.'
                )
            op_indexes.append(op_index)

    ad.erase_ops(sorted(op_indexes))
    ad.erase_dots(xs_dot)

    return xs_bar[0] if isinstance(inputs, framework.Variable) else xs_bar


@framework.static_only
def to_prim(blocks, blacklist=frozenset(), whitelist=frozenset()):
    """Search for non-basic ops which have registered composite rules and replace them with primitive ops.

    The operators in the blacklist will be excluded from the program when lowering into primitives, and only the
    operators in the whitelist will be lowered. The blacklist has higher priority than the whitelist, which means
    an operator that appears in both the blacklist and the whitelist will not be lowered.

    The final set of ops that will be lowered is:
        (blocks.ops & ops that have a decomposition rule & whitelist) - blacklist

    Args:
        blocks(Block|Sequence[Block]): The block or sequence of blocks to be lowered.
        blacklist(frozenset): The operators that will be excluded when lowering into primitives.
        whitelist(frozenset): Only the operators in the whitelist will be lowered into primitives.
    """
    if not core._is_fwd_prim_enabled():
        return
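    # `blocks` may be a single Block or a sequence of Blocks; the enclosing
    # main program is taken from the (first) block.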
    if isinstance(blocks, paddle.fluid.framework.Block):
        logging.info("Atomize composite op to primitive ops begin.")
        main_program = blocks.program
    elif isinstance(blocks, typing.Sequence):
        for item in blocks:
            if not isinstance(item, paddle.fluid.framework.Block):
                raise TypeError(
                    f"Expect block or sequence of blocks, but sequence contains {type(item)}."
                )
        main_program = blocks[0].program
    else:
        raise TypeError(
            f"Expect block or sequence of blocks, but got {type(blocks)}."
        )
    if not isinstance(blacklist, (set, frozenset)):
        raise TypeError(
            f'Expected type of blacklist is set|frozenset, but got {type(blacklist)}.'
        )
    if not isinstance(whitelist, (set, frozenset)):
        raise TypeError(
            f'Expected type of whitelist is set|frozenset, but got {type(whitelist)}.'
        )

    blacklist = prim_config["forward_blacklist"] | blacklist

    with framework.program_guard(main_program):
        print("Lowering composite forward ops begin...")
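
        # Build the op filter. The blacklist takes priority over the whitelist:
        # an op type that appears in both sets will not be lowered.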
        if len(blacklist) > 0 and len(whitelist) > 0:
            filter_ = lambda x: x.type in whitelist and x.type not in blacklist
        elif len(blacklist) > 0 and len(whitelist) == 0:
            filter_ = lambda x: x.type not in blacklist
        elif len(blacklist) == 0 and len(whitelist) > 0:
            filter_ = lambda x: x.type in whitelist
        else:
            filter_ = lambda x: True
        primx._lower_composite(blocks, filter_)
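        # prim_config["composite_ops_record"] collects the composite op types
        # that were replaced during lowering, for the log message below.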
        replace_ops = prim_config["composite_ops_record"]
        print(f"Lowering composite forward ops finish: {replace_ops}")