diff --git a/paddle/fluid/framework/details/scope_buffered_ssa_graph_executor.cc b/paddle/fluid/framework/details/scope_buffered_ssa_graph_executor.cc
index abc6b9f559ead54537c1f6f5d39811366aba88fd..85898af417e39358bd63fd10a5faffcd7d88fc5d 100644
--- a/paddle/fluid/framework/details/scope_buffered_ssa_graph_executor.cc
+++ b/paddle/fluid/framework/details/scope_buffered_ssa_graph_executor.cc
@@ -27,34 +27,31 @@ namespace framework {
 namespace details {
 ScopeBufferedSSAGraphExecutor::ScopeBufferedSSAGraphExecutor(
     ExecutionStrategy strategy, std::vector<Scope *> local_scopes,
-    std::vector<std::vector<VariableInfo>> var_infos_list,
-    std::vector<platform::Place> places,
+    std::vector<VariableInfo> var_infos, std::vector<platform::Place> places,
     std::unique_ptr<SSAGraphExecutor> &&underlying_executor)
     : strategy_(std::move(strategy)),
       underlying_executor_(std::move(underlying_executor)),
       local_scopes_(std::move(local_scopes)),
-      var_infos_list_(std::move(var_infos_list)),
+      var_infos_(std::move(var_infos)),
       places_(std::move(places)) {}
 
 FeedFetchList ScopeBufferedSSAGraphExecutor::Run(
     const std::vector<std::string> &fetch_tensors) {
   if (drop_scope_counter_ == 0) {
     // Create local scopes.
-    for (size_t i = 0; i < local_scopes_.size(); ++i) {
-      auto &scope = local_scopes_[i];
+    for (auto it = local_scopes_.rbegin(); it != local_scopes_.rend(); ++it) {
+      auto &scope = *it;
       Scope &local_scope = scope->NewScope();
       *scope->Var(details::kLocalExecScopeName)->GetMutable<Scope *>() =
           &local_scope;
 
-      for (auto &var_infos : var_infos_list_) {
-        for (auto &info : var_infos) {
-          if (scope->FindVar(info.name_) != nullptr) {
-            continue;
-          }
-          if (info.persistable_) {  // Persistable
-            InitializeVariable(scope->Var(info.name_), info.type_);
-          } else {
-            InitializeVariable(local_scope.Var(info.name_), info.type_);
-          }
+      for (auto &info : var_infos_) {
+        if (scope->FindVar(info.name_) != nullptr) {
+          continue;
+        }
+        if (info.persistable_) {  // Persistable
+          InitializeVariable(scope->Var(info.name_), info.type_);
+        } else {
+          InitializeVariable(local_scope.Var(info.name_), info.type_);
         }
       }
     }
diff --git a/paddle/fluid/framework/details/scope_buffered_ssa_graph_executor.h b/paddle/fluid/framework/details/scope_buffered_ssa_graph_executor.h
index 51230d4a42abd8efa8dc395db2117405cdb90ffc..5e87e0bf50b51d2b630aba06a5907dd721754d1f 100644
--- a/paddle/fluid/framework/details/scope_buffered_ssa_graph_executor.h
+++ b/paddle/fluid/framework/details/scope_buffered_ssa_graph_executor.h
@@ -38,8 +38,7 @@ class ScopeBufferedSSAGraphExecutor : public SSAGraphExecutor {
  public:
   ScopeBufferedSSAGraphExecutor(
       ExecutionStrategy strategy, std::vector<Scope*> local_scopes,
-      std::vector<std::vector<VariableInfo>> var_info_list,
-      std::vector<platform::Place> places,
+      std::vector<VariableInfo> var_infos, std::vector<platform::Place> places,
       std::unique_ptr<SSAGraphExecutor>&& underlying_executor);
 
   const ir::Graph& Graph() const override {
@@ -54,7 +53,7 @@ class ScopeBufferedSSAGraphExecutor : public SSAGraphExecutor {
   ExecutionStrategy strategy_;
   std::unique_ptr<SSAGraphExecutor> underlying_executor_;
   std::vector<Scope*> local_scopes_;
-  std::vector<std::vector<VariableInfo>> var_infos_list_;
+  std::vector<VariableInfo> var_infos_;
   std::vector<platform::Place> places_;
 };
 }  // namespace details
diff --git a/paddle/fluid/framework/details/threaded_ssa_graph_executor.cc b/paddle/fluid/framework/details/threaded_ssa_graph_executor.cc
index 677a2937945b03fa577317cb4f26e09354d06957..cebf63364da6a5d4588d5613d61d64f68e9fa0fd 100644
--- a/paddle/fluid/framework/details/threaded_ssa_graph_executor.cc
+++ b/paddle/fluid/framework/details/threaded_ssa_graph_executor.cc
@@ -216,7 +216,6 @@ void ThreadedSSAGraphExecutor::RunOp(
     if (LIKELY(!strategy_.dry_run_)) {
       op->Run(strategy_.use_cuda_);
     }
-    VLOG(10) << op << " " << op->Name() << " Done ";
     running_ops_--;
     ready_var_q->Extend(op->Outputs());
     VLOG(10) << op << " " << op->Name() << "Signal posted";
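Note: with this change, ScopeBufferedSSAGraphExecutor receives one flat std::vector<VariableInfo> merged across all graphs instead of a per-graph std::vector<std::vector<VariableInfo>>. Duplicate entries in the merged list are harmless because Run() skips any name that scope->FindVar() already resolves. A minimal standalone sketch of that skip-if-present pattern (toy types, not the real Paddle Scope/VariableInfo):

#include <iostream>
#include <string>
#include <unordered_set>
#include <vector>

struct VariableInfo {  // toy stand-in for details::VariableInfo
  std::string name_;
  bool persistable_;
};

int main() {
  // Merging infos from several graphs can produce duplicates ("w" twice).
  std::vector<VariableInfo> var_infos = {
      {"w", true}, {"x", false}, {"w", true}};

  std::unordered_set<std::string> scope;  // stand-in for Scope::FindVar
  for (auto &info : var_infos) {
    if (scope.count(info.name_) != 0) continue;  // already created: skip
    scope.insert(info.name_);
    std::cout << "init " << info.name_
              << (info.persistable_ ? " (persistable)" : " (local)") << "\n";
  }
  return 0;  // "w" is initialized exactly once
}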
"; running_ops_--; ready_var_q->Extend(op->Outputs()); VLOG(10) << op << " " << op->Name() << "Signal posted"; diff --git a/paddle/fluid/framework/parallel_executor.cc b/paddle/fluid/framework/parallel_executor.cc index 186f0cb8034dc9e2eb1ec0afa40fcf9a944f4b3d..2a9ca3e815bd65332453655366bfe94479007097 100644 --- a/paddle/fluid/framework/parallel_executor.cc +++ b/paddle/fluid/framework/parallel_executor.cc @@ -141,7 +141,6 @@ ParallelExecutor::ParallelExecutor( std::vector> graphs; #if defined(PADDLE_WITH_CUDA) && !defined(_WIN32) if (exec_strategy.type_ == ExecutionStrategy::kParallelGraph) { - VLOG(1) << "kParallelGraph mode!!"; for (size_t i = 0; i < member_->places_.size(); ++i) { std::unique_ptr graph = build_strategy.Apply( main_program, {member_->places_[i]}, loss_var_name, params, @@ -178,8 +177,8 @@ ParallelExecutor::ParallelExecutor( ref_cnt_pass->SetNotOwned(details::kGlobalReferenceCount, &ref_cnts_); ref_cnt_pass->SetNotOwned(details::kCurReferenceCount, &cur_ref_cnts_); ref_cnt_pass->SetNotOwned(details::kGarbageCollector, &gcs_); - graphs[0] = ref_cnt_pass->Apply(std::move(graphs[i])); - graphs[0]->SetNotOwned("garbage_collector", &gcs_); + graphs[i] = ref_cnt_pass->Apply(std::move(graphs[i])); + graphs[i]->SetNotOwned("garbage_collector", &gcs_); } } } @@ -192,6 +191,18 @@ ParallelExecutor::ParallelExecutor( // Step 3. Create vars in each scope. Passes may also create new vars. // skip control vars and empty vars + std::vector var_infos; + for (auto &graph : graphs) { + for (auto &node : graph->Nodes()) { + if (node->IsVar() && !node->IsCtrlVar() && node->Var()) { + var_infos.emplace_back(); + var_infos.back().name_ = node->Var()->Name(); + var_infos.back().type_ = node->Var()->GetType(); + var_infos.back().persistable_ = node->Var()->Persistable(); + } + } + } + /** std::vector> var_infos_list; for (size_t i = 0; i < graphs.size(); ++i) { std::vector var_infos; @@ -203,8 +214,9 @@ ParallelExecutor::ParallelExecutor( var_infos.back().persistable_ = node->Var()->Persistable(); } } - var_infos_list.emplace_back(std::move(var_infos)); + var_infos_list.push_back(std::move(var_infos)); } + **/ // If the loss_var_name is given, the number of graph should be only one. 
diff --git a/paddle/fluid/operators/reader/buffered_reader.cc b/paddle/fluid/operators/reader/buffered_reader.cc
index cfa192f8e17c1bf56dc27be190e4d37341a9c7b0..26ff221dfa0768bd2bcc9e6485a32485f0212ac6 100644
--- a/paddle/fluid/operators/reader/buffered_reader.cc
+++ b/paddle/fluid/operators/reader/buffered_reader.cc
@@ -58,9 +58,7 @@ void BufferedReader::ReadAsync(size_t i) {
     TensorVec &gpu = gpu_buffer_[i];
     gpu.resize(cpu.size());
     for (size_t i = 0; i < cpu.size(); ++i) {
-      VLOG(1) << "launch tensor copy from cpu to cpu, idx: " << i;
       framework::TensorCopySync(cpu[i], place_, &gpu[i]);
-      VLOG(1) << "done " << i;
       gpu[i].set_lod(cpu[i].lod());
     }
   }
diff --git a/paddle/fluid/operators/reader/create_py_reader_op.cc b/paddle/fluid/operators/reader/create_py_reader_op.cc
index 093b0e56b3d975ea02d3248b6a4d4c734231856b..901a92ab5b5c74b071be8b57a7653d90e2a4fb29 100644
--- a/paddle/fluid/operators/reader/create_py_reader_op.cc
+++ b/paddle/fluid/operators/reader/create_py_reader_op.cc
@@ -28,10 +28,8 @@ class PyReader : public framework::FileReader {
   }
 
   void ReadNext(std::vector<framework::LoDTensor>* out) override {
-    VLOG(1) << "come in PyReader::ReadNext function, out: " << out;
     bool success;
     *out = queue_->Pop(&success);
-    VLOG(1) << "call PyReader::ReadNext " << success;
     if (!success) out->clear();
   }
diff --git a/paddle/fluid/operators/reader/open_files_op.cc b/paddle/fluid/operators/reader/open_files_op.cc
index ae37a187259e10388d83d5cf795f9474ee0b7962..38223e069975a08791d58d6ae10e2112b79a61fe 100644
--- a/paddle/fluid/operators/reader/open_files_op.cc
+++ b/paddle/fluid/operators/reader/open_files_op.cc
@@ -115,12 +115,10 @@ class PreemptiveReaderContainer : public IReaderContainer {
   }
 
   void ReadNext(std::vector<framework::LoDTensor>* out) override {
-    VLOG(1) << "flag";
     if (!pending_.empty()) {
       auto future_it = complete_queue_.Pop();
       FutureItem item = future_it->get();
       if (item.exception_) {
-        VLOG(1) << "item has exception!!!";
         for (auto it = futures_.begin(); it != futures_.end(); ++it) {
           if (it != future_it) {
             it->wait();  // Wait all other threads complete.
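Note: the surviving logic in PreemptiveReaderContainer::ReadNext shows the shutdown discipline for the prefetch threads: when the completed future carries an exception, every other outstanding future is waited on before the error propagates, so no worker is destroyed while still running. A simplified sketch of that drain-then-rethrow pattern using std::async (toy code, not the IReaderContainer interface):

#include <future>
#include <iostream>
#include <list>
#include <stdexcept>

int main() {
  std::list<std::future<int>> futures;
  for (int i = 0; i < 4; ++i) {
    futures.push_back(std::async(std::launch::async, [i]() -> int {
      if (i == 2) throw std::runtime_error("read failed");
      return i;
    }));
  }

  try {
    for (auto it = futures.begin(); it != futures.end(); ++it) {
      try {
        std::cout << "got " << it->get() << "\n";
      } catch (...) {
        // Drain all still-valid futures before propagating the error, so no
        // worker thread is abandoned mid-flight.
        for (auto other = futures.begin(); other != futures.end(); ++other) {
          if (other != it && other->valid()) other->wait();
        }
        throw;
      }
    }
  } catch (const std::exception &e) {
    std::cout << "reader stopped: " << e.what() << "\n";
  }
  return 0;
}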