timeline.py 6.2 KB
Newer Older
X
Xin Pan 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123
#   Copyright (c) 2018 PaddlePaddle Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

import argparse
import json
import sys
import unittest

import google.protobuf.text_format as text_format
import paddle.fluid.proto.profiler.profiler_pb2 as profiler_pb2

# Command-line interface. Both flags default to the empty string; the script
# section later in this file substitutes a path under /tmp for an empty value.
# NOTE(review): no module docstring is visible in this file, so `__doc__` is
# presumably None here and the parser gets no description -- confirm.
parser = argparse.ArgumentParser(description=__doc__)
parser.add_argument(
    '--profile_path', type=str, default='', help='Input profile file name.')
parser.add_argument(
    '--timeline_path', type=str, default='', help='Output timeline file name.')
# Parsed at import time, so the process's command-line arguments are consumed
# as soon as this module is loaded.
args = parser.parse_args()


class _ChromeTraceFormatter(object):
    """Collects trace records and serializes them as Chrome Trace JSON.

    Process-name metadata records and region records are stored in two
    separate lists; on serialization the metadata records come first.

    For details of the file format, see:
    https://github.com/catapult-project/catapult/blob/master/tracing/README.md
    """

    def __init__(self):
        self._events = []
        self._metadata = []

    def _create_event(self, ph, category, name, pid, tid, timestamp):
        """Builds the fields shared by every Chrome Trace event.

        Args:
          ph:  The type of event - usually a single character.
          category: The event category as a string.
          name:  The event name as a string.
          pid:  Identifier of the process generating this event as an integer.
          tid:  Identifier of the thread generating this event as an integer.
          timestamp:  The timestamp of this event as a long integer.

        Returns:
          A new JSON compatible dict holding the given fields.
        """
        return {
            'ph': ph,
            'cat': category,
            'name': name,
            'pid': pid,
            'tid': tid,
            'ts': timestamp,
        }

    def emit_pid(self, name, pid):
        """Records a 'process_name' metadata event for a process.

        Args:
          name:  The process name as a string.
          pid:  Identifier of the process as an integer.
        """
        self._metadata.append({
            'name': 'process_name',
            'ph': 'M',
            'pid': pid,
            'args': {'name': name},
        })

    def emit_region(self, timestamp, duration, pid, tid, category, name, args):
        """Records a region ('X') event with a start time and a duration.

        Args:
          timestamp:  The start timestamp of this region as a long integer.
          duration:  The duration of this region as a long integer.
          pid:  Identifier of the process generating this event as an integer.
          tid:  Identifier of the thread generating this event as an integer.
          category: The event category as a string.
          name:  The event name as a string.
          args:  A JSON-compatible dictionary of event arguments.
        """
        region = self._create_event('X', category, name, pid, tid, timestamp)
        # A list of pairs keeps 'dur' ahead of 'args' in the serialized output.
        region.update([('dur', duration), ('args', args)])
        self._events.append(region)

    def format_to_string(self, pretty=False):
        """Serializes everything recorded so far.

        Args:
          pretty: (Optional.)  If True, produce human-readable JSON output.

        Returns:
          A JSON-formatted string in Chrome Trace format, with metadata
          events listed before region events.
        """
        payload = {'traceEvents': self._metadata + self._events}
        if not pretty:
            return json.dumps(payload, separators=(',', ':'))
        return json.dumps(payload, indent=4, separators=(',', ': '))


class Timeline(object):
    """Turns a profiler ``Profile`` protobuf into a Chrome Trace JSON string.

    Each distinct (device_id, device kind) pair seen in the profile's events
    is assigned its own trace process id; every event is then emitted as a
    region under the process id of its device.

    Args:
      profile_pb: A parsed profiler protobuf exposing an ``events`` sequence.
    """

    def __init__(self, profile_pb):
        self._profile_pb = profile_pb
        # Next process id to hand out.
        self._pid = 0
        # Maps (device_id, "CPU" | "GPUKernel") -> allocated process id.
        self._devices = dict()
        self._chrome_trace = _ChromeTraceFormatter()

    @staticmethod
    def _device_kind(event):
        """Returns "CPU" or "GPUKernel" for an event, or None if unsupported."""
        if event.type == profiler_pb2.Event.CPU:
            return "CPU"
        if event.type == profiler_pb2.Event.GPUKernel:
            return "GPUKernel"
        return None

    def _allocate_pid(self):
        """Returns the next unused process id and advances the counter."""
        cur_pid = self._pid
        self._pid += 1
        return cur_pid

    def _allocate_pids(self):
        """Assigns a process id to every device that appears in the profile.

        Events whose type is neither CPU nor GPUKernel are ignored.
        """
        for event in self._profile_pb.events:
            kind = self._device_kind(event)
            if kind is None:
                continue
            key = (event.device_id, kind)
            if key in self._devices:
                continue
            pid = self._allocate_pid()
            self._devices[key] = pid
            if kind == "CPU":
                process_name = "cpu:block:%d" % (event.device_id)
            else:
                process_name = "gpu:%d" % (event.device_id)
            self._chrome_trace.emit_pid(process_name, pid)

    def _allocate_events(self):
        """Emits one trace region per supported event in the profile.

        Must run after ``_allocate_pids`` so that every device has a pid.

        Raises:
          KeyError: If an event's device has not been allocated a pid.
        """
        for event in self._profile_pb.events:
            kind = self._device_kind(event)
            if kind is None:
                # Mirror _allocate_pids, which allocates no pid for such
                # events; previously this path either raised or silently
                # reused the previous event's device kind.
                continue
            pid = self._devices[(event.device_id, kind)]
            args = {'name': event.name}
            if event.memcopy.bytes > 0:
                # Add to the args rather than replacing them, so the op name
                # is kept alongside the copied byte count.
                args['mem_bytes'] = event.memcopy.bytes
            # TODO(panyx0718): Chrome tracing only handles ms. However, some
            # ops take microseconds. Hence, we keep the ns here.
            self._chrome_trace.emit_region(
                event.start_ns, (event.end_ns - event.start_ns) / 1.0, pid,
                event.sub_device_id, 'Op', event.name, args)

    def generate_chrome_trace(self):
        """Builds the trace from the profile and returns it as a JSON string."""
        self._allocate_pids()
        self._allocate_events()
        return self._chrome_trace.format_to_string()


# Fall back to fixed locations under /tmp when a path flag is omitted or empty.
profile_path = args.profile_path or '/tmp/profile'
timeline_path = args.timeline_path or '/tmp/timeline'

# The profile is a serialized protobuf message, i.e. raw bytes. Read it in
# binary mode so that no text decoding or newline translation is applied
# before it reaches ParseFromString.
with open(profile_path, 'rb') as f:
    profile_s = f.read()
    profile_pb = profiler_pb2.Profile()
    profile_pb.ParseFromString(profile_s)

# Convert the parsed profile and write the Chrome Trace JSON as text.
tl = Timeline(profile_pb)
with open(timeline_path, 'w') as f:
    f.write(tl.generate_chrome_trace())