Unverified commit 5574c8cf, authored by wanghuancoder, committed by GitHub

add timeline(recordevent) for new executor, test=develop (#35831)

Parent fab1a029
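This change brackets each execution phase of the new executor with a platform::RecordEvent so the phases appear in the profiler timeline. RecordEvent is RAII-style: the event opens when the object is constructed and closes when it is destroyed, which is why the diff below introduces bare { ... } blocks around InferShape and the compute kernel. A minimal sketch of the pattern follows; the function RunPhases and the event names Phase1/Phase2 are made up for illustration, and only the RecordEvent usage mirrors the diff:

#include "paddle/fluid/platform/profiler.h"

// Hypothetical helper, for illustration only: records one timeline
// span per phase of some two-phase piece of work.
void RunPhases() {
  {
    // The event opens here; its destructor closes it when the scope
    // exits, so the span covers exactly the first phase.
    paddle::platform::RecordEvent phase1_event("Phase1");
    // ... phase 1 work ...
  }
  {
    paddle::platform::RecordEvent phase2_event("Phase2");
    // ... phase 2 work ...
  }
}

The anonymous scopes are the point of the pattern: without them, a RecordEvent declared as a plain local would not close until the end of the enclosing function, and the two spans would overlap instead of nesting cleanly.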
@@ -18,6 +18,7 @@
 #include <unordered_set>

 #include "paddle/fluid/framework/details/share_tensor_buffer_functor.h"
+#include "paddle/fluid/platform/profiler.h"

 PADDLE_DEFINE_EXPORTED_bool(new_executor_use_inplace, true,
                             "Use inplace in new executor");
@@ -304,9 +305,12 @@ void InterpreterCore::RunInstruction(const Instruction& instr_node) {
   VLOG(3) << "RunInstruction: "
           << instr_node.kernel_func_.operator_base_->Type();

-  static_cast<const framework::OperatorWithKernel*>(
-      instr_node.kernel_func_.operator_base_)
-      ->InferShape(instr_node.infershape_ctx_.get());
+  {
+    platform::RecordEvent infershape_event("InferShape");
+    static_cast<const framework::OperatorWithKernel*>(
+        instr_node.kernel_func_.operator_base_)
+        ->InferShape(instr_node.infershape_ctx_.get());
+  }

   if (FLAGS_new_executor_use_inplace) {
     for (auto& pair : instr_node.vec_inplace_in_to_out_) {
@@ -318,8 +322,10 @@ void InterpreterCore::RunInstruction(const Instruction& instr_node) {
       }
     }
   }

-  instr_node.kernel_func_.compute_func_(*instr_node.execution_ctx_.get());
+  {
+    platform::RecordEvent compute_event("Compute");
+    instr_node.kernel_func_.compute_func_(*instr_node.execution_ctx_.get());
+  }
 }

 void InterpreterCore::ExecuteInstructionList(
@@ -350,6 +356,8 @@ void InterpreterCore::RunInstructionAsync(size_t instr_id,
                                           AtomicVectorSizeT* atomic_var_ref,
                                           std::atomic<size_t>* op_run_number) {
   auto& instr_node = vec_instruction_[instr_id];
+  platform::RecordEvent instruction_event(
+      instr_node.kernel_func_.operator_base_->Type());
   event_manager_.WaitEvent(instr_node, place_);

   RunInstruction(instr_node);
...
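With the per-instruction event (named after the op type) wrapping the "InferShape" and "Compute" events, each op should produce one nested group of spans in the timeline. A minimal sketch of how these events might be collected, assuming the fluid profiler API of this period (EnableProfiler/DisableProfiler from paddle/fluid/platform/profiler.h); the executor setup itself is elided:

#include "paddle/fluid/platform/profiler.h"

using paddle::platform::DisableProfiler;
using paddle::platform::EnableProfiler;
using paddle::platform::EventSortingKey;
using paddle::platform::ProfilerState;

int main() {
  // Start collecting host-side events.
  EnableProfiler(ProfilerState::kCPU);
  // ... build and run the new executor here; each op emits an
  //     instruction-level event enclosing "InferShape" and "Compute" ...
  // Sort the report by total time and dump the profile to a file.
  DisableProfiler(EventSortingKey::kTotal, "/tmp/new_executor_profile");
  return 0;
}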