From 8b24bd4fe851a793521f88630f56e9d4afcf8263 Mon Sep 17 00:00:00 2001
From: "Yang Yang(Tony)"
Date: Wed, 14 Feb 2018 11:56:46 -0800
Subject: [PATCH] Update parallel_do.md

---
 doc/design/parallel_do.md | 7 ++++---
 1 file changed, 4 insertions(+), 3 deletions(-)

diff --git a/doc/design/parallel_do.md b/doc/design/parallel_do.md
index d51b1014d4..221af6b6a4 100644
--- a/doc/design/parallel_do.md
+++ b/doc/design/parallel_do.md
@@ -13,7 +13,7 @@ AddInput(kParameters, "Parameters are duplicated over different devices")
 AddInput(kPlaces, "Devices used for parallel processing");
 AddOutput(kOutputs, "Outputs needed to be merged from different devices").AsDuplicable();
 AddOutput(kParallelScopes,
-          "Container for all local variables in forward pass.");
+          "Scopes for all local variables in forward pass. One scope for each device");
 AddAttr(kParallelBlock, "List of operaters to be executed in parallel");
 ```
 
@@ -33,6 +33,7 @@ In the backward pass
 |||| Compute backward pass in parallel
 | accumulate param@grad from different devices to the first device
 | Merge input@grad from different devices
+| Copy param@grad to the place of parallel_do_op
 ```
 
 This implementation allows to write mixed device program like this
@@ -47,7 +48,7 @@ pd = ParallelDo(gpu_places)
 with pd.do():
     read_input(feature)
     prediction = my_net(feature)
-    write_output(activation)
+    write_output(prediction)
 prediction = pd()
 loss = cross_entropy(prediction, label)
 ```
@@ -98,7 +99,7 @@ looks like this.
 ```python
 pd = ParallelDo(gpu_places)
 with pd.do():
-    feature = pre_fetch(gpu_places)
+    feature = get_data_from_prefetch_queue(gpu_places)
     prediction = my_net(feature)
     write_output(activation)
 ```
-- 
GitLab
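
For readers of this patch: the table amended by the second hunk lists the data-movement steps of the backward pass. Below is a minimal pure-Python sketch of those steps, under the assumption that per-device gradients can be modeled as plain lists; `merge_backward`, `device_param_grads`, and `device_input_grads` are hypothetical names used for illustration, not Paddle identifiers.

```python
# Illustrative stand-in, not the Paddle implementation: gradients on each
# device are modeled as plain Python lists, one entry per device.

def merge_backward(device_param_grads, device_input_grads):
    # Accumulate param@grad from every device onto the first device
    # (element-wise sum across devices).
    param_grad = [sum(col) for col in zip(*device_param_grads)]
    # Merge input@grad: each device holds the gradient for its own input
    # shard, so concatenating the shards restores the full input gradient.
    input_grad = [g for shard in device_input_grads for g in shard]
    # Copy param@grad to the place of the parallel_do op (returning it
    # plays that role in this sketch).
    return param_grad, input_grad

# Two devices, each with a 3-element param gradient and a 2-element input shard.
p, i = merge_backward([[1, 2, 3], [4, 5, 6]], [[10, 20], [30, 40]])
assert p == [5, 7, 9]
assert i == [10, 20, 30, 40]
```

Summation across devices mirrors the table's "accumulate param@grad" step, while concatenation reflects that each device only computes the gradient for its shard of the input.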