/* Copyright (c) 2022 PaddlePaddle Authors. All Rights Reserved.

Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

    http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License. */

#pragma once

#include <cstdint>
#include <map>
#include <memory>
#include <string>
#include <unordered_map>
#include <vector>

#include "paddle/fluid/platform/profiler/event_node.h"
#include "paddle/fluid/platform/profiler/extra_info.h"

namespace paddle {
namespace platform {

// Plain data record describing one device event: its name, type, time span
// and the device / context / stream ids it is associated with.
//
// Every scalar member carries a default member initializer so that a
// default-constructed node never exposes indeterminate values.
struct DevicePythonNode {
  DevicePythonNode() = default;
  ~DevicePythonNode() = default;
  // record name
  std::string name;
  // record type, one of TracerEventType (value-initialized by default)
  TracerEventType type{};
  // start timestamp of the record (presumably nanoseconds, per the `_ns`
  // suffix -- confirm against the producer)
  uint64_t start_ns{0};
  // end timestamp of the record (same unit as start_ns)
  uint64_t end_ns{0};
  // device id
  uint64_t device_id{0};
  // context id
  uint64_t context_id{0};
  // stream id
  uint64_t stream_id{0};
};

// Plain data record describing one memory event: when it happened, which
// address and place it concerns, how many bytes it added or removed, and the
// allocated / reserved totals and peaks recorded with it.
//
// Every scalar member carries a default member initializer so that a
// default-constructed node never exposes indeterminate values.
struct MemPythonNode {
  MemPythonNode() = default;
  ~MemPythonNode() = default;

  // timestamp of the record
  uint64_t timestamp_ns{0};
  // memory addr of allocation or free
  uint64_t addr{0};
  // memory manipulation type (value-initialized by default)
  TracerMemEventType type{};
  // process id of the record
  uint64_t process_id{0};
  // thread id of the record
  uint64_t thread_id{0};
  // increase bytes after this manipulation, allocation for sign +, free for
  // sign -
  int64_t increase_bytes{0};
  // place
  std::string place;
  // current total allocated memory
  uint64_t current_allocated{0};
  // current total reserved memory
  uint64_t current_reserved{0};
  // peak allocated memory
  uint64_t peak_allocated{0};
  // peak reserved memory
  uint64_t peak_reserved{0};
};

struct HostPythonNode {
  HostPythonNode() = default;
  ~HostPythonNode();
  // record name
  std::string name;
  // record type, one of TracerEventType
  TracerEventType type;
  // start timestamp of the record
  uint64_t start_ns;
  // end timestamp of the record
  uint64_t end_ns;
  // process id of the record
  uint64_t process_id;
  // thread id of the record
  uint64_t thread_id;
90 91 92 93 94
  // input shapes
  std::map<std::string, std::vector<std::vector<int64_t>>> input_shapes;
  std::map<std::string, std::vector<std::string>> dtypes;
  // call stack
  std::string callstack;
95 96 97 98 99 100
  // children node
  std::vector<HostPythonNode*> children_node_ptrs;
  // runtime node
  std::vector<HostPythonNode*> runtime_node_ptrs;
  // device node
  std::vector<DevicePythonNode*> device_node_ptrs;
101 102
  // mem node
  std::vector<MemPythonNode*> mem_node_ptrs;
103 104 105 106 107
};

class ProfilerResult {
 public:
  ProfilerResult() : tree_(nullptr) {}
C
chenjian 已提交
108 109
  explicit ProfilerResult(std::unique_ptr<NodeTrees> tree,
                          const ExtraInfo& extra_info);
110 111
  ~ProfilerResult();
  std::map<uint64_t, HostPythonNode*> GetData() {
C
chenjian 已提交
112
    return thread_event_trees_map_;
113
  }
C
chenjian 已提交
114 115 116 117 118 119 120
  std::unordered_map<std::string, std::string> GetExtraInfo() {
    return extra_info_.GetExtraInfo();
  }

  void Save(const std::string& file_name,
            const std::string format = std::string("json"));

L
liutiexing 已提交
121
  std::shared_ptr<NodeTrees> GetNodeTrees() { return tree_; }
122 123

 private:
C
chenjian 已提交
124
  std::map<uint64_t, HostPythonNode*> thread_event_trees_map_;
L
liutiexing 已提交
125
  std::shared_ptr<NodeTrees> tree_;
C
chenjian 已提交
126 127
  ExtraInfo extra_info_;
  HostPythonNode* CopyTree(HostTraceEventNode* root);
128 129
};

// Only declared in this header. Takes the file name by value and returns an
// owning pointer to a ProfilerResult; presumably reads back a result that was
// written with ProfilerResult::Save -- confirm against the implementation.
std::unique_ptr<ProfilerResult> LoadProfilerResult(std::string filename);

}  // namespace platform
}  // namespace paddle