From 478e4d68820c84356bf88af02d02be8d37deb2f7 Mon Sep 17 00:00:00 2001
From: Youwei Song
Date: Wed, 9 Oct 2019 19:41:10 +0800
Subject: [PATCH] polish append_backward en doc (#20199)

* polish append_backward, test=document_fix

* test=document_fix, test=develop

* test=document_fix, test=develop

* polish append_backward, test=document_fix, test=develop
---
 paddle/fluid/API.spec           |  2 +-
 python/paddle/fluid/backward.py | 47 ++++++++++++++++++---------------
 2 files changed, 27 insertions(+), 22 deletions(-)

diff --git a/paddle/fluid/API.spec b/paddle/fluid/API.spec
index a6c0330d81..005314d207 100755
--- a/paddle/fluid/API.spec
+++ b/paddle/fluid/API.spec
@@ -1041,7 +1041,7 @@ paddle.fluid.optimizer.RecomputeOptimizer.backward (ArgSpec(args=['self', 'loss'
 paddle.fluid.optimizer.RecomputeOptimizer.get_opti_var_name_list (ArgSpec(args=['self'], varargs=None, keywords=None, defaults=None), ('document', '6adf97f83acf6453d4a6a4b1070f3754'))
 paddle.fluid.optimizer.RecomputeOptimizer.load (ArgSpec(args=['self', 'stat_dict'], varargs=None, keywords=None, defaults=None), ('document', '7b2b8ae72011bc4decb67e97623f2c56'))
 paddle.fluid.optimizer.RecomputeOptimizer.minimize (ArgSpec(args=['self', 'loss', 'startup_program', 'parameter_list', 'no_grad_set', 'grad_clip'], varargs=None, keywords=None, defaults=(None, None, None, None)), ('document', '6adf97f83acf6453d4a6a4b1070f3754'))
-paddle.fluid.backward.append_backward (ArgSpec(args=['loss', 'parameter_list', 'no_grad_set', 'callbacks', 'checkpoints'], varargs=None, keywords=None, defaults=(None, None, None, None)), ('document', '52488008103886c793843a3828bacd5e'))
+paddle.fluid.backward.append_backward (ArgSpec(args=['loss', 'parameter_list', 'no_grad_set', 'callbacks', 'checkpoints'], varargs=None, keywords=None, defaults=(None, None, None, None)), ('document', 'c68fe1cb95d90762b57c309cae9b99d9'))
 paddle.fluid.backward.gradients (ArgSpec(args=['targets', 'inputs', 'target_gradients', 'no_grad_set'], varargs=None, keywords=None, defaults=(None, None)), ('document', 'e2097e1e0ed84ae44951437bfe269a1b'))
 paddle.fluid.regularizer.L1DecayRegularizer ('paddle.fluid.regularizer.L1DecayRegularizer', ('document', '34603757e70974d2fcc730643b382925'))
 paddle.fluid.regularizer.L1DecayRegularizer.__init__ (ArgSpec(args=['self', 'regularization_coeff'], varargs=None, keywords=None, defaults=(0.0,)), ('document', '6adf97f83acf6453d4a6a4b1070f3754'))
diff --git a/python/paddle/fluid/backward.py b/python/paddle/fluid/backward.py
index ec1a3721dd..1894ac4152 100644
--- a/python/paddle/fluid/backward.py
+++ b/python/paddle/fluid/backward.py
@@ -936,29 +936,31 @@ def append_backward(loss,
                     callbacks=None,
                     checkpoints=None):
     """
-    Append backward part to main_program.
+    This function appends the backward part to main_program.
 
     A complete neural network training is made up of forward and backward
     propagation. However, when we configure a network, we only need to
-    specify its forwrd part. The backward part is generated automatically
-    according to the forward part by this function.
+    specify its forward part. This function uses the chain rule to automatically
+    generate the backward part according to the forward part.
 
-    In most cases, users do not need to invoke this function manually. It
-    will be automatically invoked by the optimizer's `minimize` function.
+    In most cases, users do not need to invoke this function manually.
+    It will be automatically invoked by the optimizer's `minimize` function.
 
-    Args:
-        loss(Variable): The loss variable of the network.
-        parameter_list(list[string]|None): Names of parameters that need
+    Parameters:
+        loss( :ref:`api_guide_Variable_en` ): The loss variable of the network.
+        parameter_list(list of str, optional): Names of parameters that need
                                    to be updated by optimizers.
                                    If it is None, all parameters
                                    will be updated.
-                                   Default: None
-        no_grad_set(set|None): Variables in the Block 0 whose gradients
+                                   Default: None.
+        no_grad_set(set of str, optional): Variable names in the :ref:`api_guide_Block_en` 0 whose gradients
                                should be ignored. All variables with
                                `stop_gradient=True` from all blocks will
                                be automatically added into this set.
-                               Default: None
-        callbacks(list[callable object]|None): The callbacks are used for
+                               If this parameter is not None, the names in this set will be added to the default set.
+                               Default: None.
+        callbacks(list of callable object, optional): List of callback functions.
+                                               The callbacks are used for
                                                doing some custom jobs during
                                                backward part building. All
                                                callable objects in it will
@@ -967,23 +969,23 @@ def append_backward(loss,
                                                into the program. The callable
                                                object must have two input
                                                parameters: 'block' and 'context'.
-                                               The 'block' is the block which
+                                               The 'block' is the :ref:`api_guide_Block_en` which
                                                the new gradient operator will
                                                be added to. The 'context' is a
                                                map, whose keys are gradient
                                                variable names and values are
-                                               corresponding original variables.
+                                               corresponding original :ref:`api_guide_Variable_en` .
                                                In addition to this, the 'context'
                                                has another special key-value pair:
                                                the key is string '__current_op_desc__'
                                                and the value is the op_desc of the
                                                gradient operator who has just
                                                triggered the callable object.
+                                               Default: None.
 
     Returns:
-        list[(Variable,Variable)]: Pairs of parameter and its
-            corresponding gradients. The key is the parameter and the
-            value is gradient variable.
+        list of tuple ( :ref:`api_guide_Variable_en` , :ref:`api_guide_Variable_en` ): Pairs of parameters and their corresponding gradients.
+        The key is the parameter and the value is the gradient variable.
 
     Raises:
         AssertionError: If `loss` is not an instance of Variable.
@@ -991,17 +993,20 @@ def append_backward(loss,
     Examples:
         .. code-block:: python
 
-            # network configuration code
-            # loss from ...
             import paddle.fluid as fluid
-            x = fluid.layers.data(name='x', shape=[13], dtype='float32')
-            y = fluid.layers.data(name='y', shape=[1], dtype='float32')
+            x = fluid.data(name='x', shape=[None, 13], dtype='float32')
+            y = fluid.data(name='y', shape=[None, 1], dtype='float32')
 
             y_predict = fluid.layers.fc(input=x, size=1, act=None)
             loss = fluid.layers.square_error_cost(input=y_predict, label=y)
 
             avg_loss = fluid.layers.mean(loss)
             param_grad_list = fluid.backward.append_backward(loss=avg_loss)
+            p_g_list1 = fluid.backward.append_backward(loss=avg_loss)  # len(p_g_list1) == 2
+            p_g_list2 = fluid.backward.append_backward(loss=avg_loss, parameter_list=[p_g_list1[0][0].name])  # len(p_g_list2) == 1
+            p_g_list3 = fluid.backward.append_backward(loss=avg_loss, no_grad_set=set([p_g_list1[0][0].name]))  # len(p_g_list3) == 1
+            p_g_list4 = fluid.backward.append_backward(loss=avg_loss, parameter_list=[p_g_list1[0][0].name], no_grad_set=set([p_g_list1[0][0].name]))  # len(p_g_list4) == 0
+
     """
     assert isinstance(loss, framework.Variable)
-- 
GitLab
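
The `callbacks` contract described in the docstring above is easiest to see with a small example, since the patch's example block only exercises `parameter_list` and `no_grad_set`. The sketch below is a minimal illustration of that contract, not part of the patch itself: it assumes, as the docstring states, that each callable is invoked with the keyword arguments `block` and `context` once per appended gradient operator, and that `context['__current_op_desc__']` holds that operator's op_desc. The callback name `log_grad_op` is hypothetical.

.. code-block:: python

    import paddle.fluid as fluid

    def log_grad_op(block, context):
        # 'context' maps gradient variable names to their original variables;
        # the special key '__current_op_desc__' holds the op_desc of the
        # gradient operator that has just been appended (see docstring above).
        op_desc = context.get('__current_op_desc__')
        if op_desc is not None:
            print('appended gradient op: %s' % op_desc.type())

    x = fluid.data(name='x', shape=[None, 13], dtype='float32')
    y = fluid.data(name='y', shape=[None, 1], dtype='float32')
    y_predict = fluid.layers.fc(input=x, size=1, act=None)
    loss = fluid.layers.square_error_cost(input=y_predict, label=y)
    avg_loss = fluid.layers.mean(loss)

    # Each callback in the list runs once for every gradient operator
    # added while the backward part is being built.
    param_grads = fluid.backward.append_backward(loss=avg_loss,
                                                 callbacks=[log_grad_op])

Hooking in through `callbacks`, rather than scanning the program after the call, observes each gradient operator at the moment it is appended, which is exactly what the '__current_op_desc__' entry is there for.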