Skip to content
体验新版
项目
组织
正在加载...
登录
切换导航
打开侧边栏
机器未来
Paddle
提交
0f441075
P
Paddle
项目概览
机器未来
/
Paddle
与 Fork 源项目一致
Fork自
PaddlePaddle / Paddle
通知
1
Star
1
Fork
0
代码
文件
提交
分支
Tags
贡献者
分支图
Diff
Issue
1
列表
看板
标记
里程碑
合并请求
0
Wiki
0
Wiki
分析
仓库
DevOps
项目成员
Pages
P
Paddle
项目概览
项目概览
详情
发布
仓库
仓库
文件
提交
分支
标签
贡献者
分支图
比较
Issue
1
Issue
1
列表
看板
标记
里程碑
合并请求
0
合并请求
0
Pages
分析
分析
仓库分析
DevOps
Wiki
0
Wiki
成员
成员
收起侧边栏
关闭侧边栏
动态
分支图
创建新Issue
提交
Issue看板
提交
0f441075
编写于
1月 05, 2018
作者:
Y
Yibing Liu
浏览文件
操作
浏览文件
下载
电子邮件补丁
差异文件
Confirm the contents in profiling report
上级
770aff2c
变更
3
显示空白变更内容
内联
并排
Showing
3 changed file
with
43 addition
and
16 deletion
+43
-16
paddle/platform/profiler.cc
paddle/platform/profiler.cc
+36
-16
paddle/platform/profiler.h
paddle/platform/profiler.h
+1
-0
paddle/platform/profiler_test.cc
paddle/platform/profiler_test.cc
+6
-0
未找到文件。
paddle/platform/profiler.cc
浏览文件 @
0f441075
...
@@ -3,7 +3,7 @@
...
@@ -3,7 +3,7 @@
licensed under the Apache License, Version 2.0 (the "License");
licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
you may not use this file except in compliance with the License.
You may obtain a copy of the License at
You may obtain a copy of the License at
`
http://www.apache.org/licenses/LICENSE-2.0
http://www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing, software
Unless required by applicable law or agreed to in writing, software
...
@@ -13,6 +13,7 @@ See the License for the specific language governing permissions and
...
@@ -13,6 +13,7 @@ See the License for the specific language governing permissions and
limitations under the License. */
limitations under the License. */
#include "paddle/platform/profiler.h"
#include "paddle/platform/profiler.h"
#include <iomanip>
#include <map>
#include <map>
namespace
paddle
{
namespace
paddle
{
...
@@ -183,7 +184,8 @@ void PopEvent(const std::string& name, DeviceContext* dev_ctx) {
...
@@ -183,7 +184,8 @@ void PopEvent(const std::string& name, DeviceContext* dev_ctx) {
void
ParseEvents
(
std
::
vector
<
std
::
vector
<
Event
>>&
events
)
{
void
ParseEvents
(
std
::
vector
<
std
::
vector
<
Event
>>&
events
)
{
// Event name :: counts :: ave :: min :: max :: total
// Event name :: counts :: ave :: min :: max :: total
std
::
map
<
std
::
string
,
std
::
tuple
<
int
,
double
,
double
>>
events_table
;
std
::
map
<
std
::
string
,
std
::
tuple
<
int
,
double
,
double
,
double
,
double
>>
events_table
;
for
(
size_t
i
=
0
;
i
<
events
.
size
();
i
++
)
{
for
(
size_t
i
=
0
;
i
<
events
.
size
();
i
++
)
{
std
::
list
<
Event
>
pushed_events
;
std
::
list
<
Event
>
pushed_events
;
for
(
size_t
j
=
0
;
j
<
events
[
i
].
size
();
j
++
)
{
for
(
size_t
j
=
0
;
j
<
events
[
i
].
size
();
j
++
)
{
...
@@ -197,18 +199,28 @@ void ParseEvents(std::vector<std::vector<Event>>& events) {
...
@@ -197,18 +199,28 @@ void ParseEvents(std::vector<std::vector<Event>>& events) {
++
rit
;
++
rit
;
}
}
if
(
rit
!=
pushed_events
.
rend
())
{
if
(
rit
!=
pushed_events
.
rend
())
{
Event
pushed_event
=
*
rit
;
double
cpu_time
=
rit
->
CpuElapsedUs
(
events
[
i
][
j
]);
double
cuda_time
=
0
;
#ifdef PADDLE_WITH_CUDA
#ifdef PADDLE_WITH_CUDA
cuda_time
=
rit
->
CudaElapsedUs
(
events
[
i
][
j
]);
double
event_time
=
rit
->
CudaElapsedUs
(
events
[
i
][
j
]);
#else
double
event_time
=
rit
->
CpuElapsedUs
(
events
[
i
][
j
]);
#endif
#endif
if
(
events_table
.
find
(
rit
->
name
())
==
events_table
.
end
())
{
std
::
string
event_name
=
events_table
[
rit
->
name
()]
=
std
::
make_tuple
(
1
,
cpu_time
,
cuda_time
);
"thread"
+
std
::
to_string
(
rit
->
thread_id
())
+
"::"
+
rit
->
name
();
if
(
events_table
.
find
(
event_name
)
==
events_table
.
end
())
{
events_table
[
event_name
]
=
std
::
make_tuple
(
1
,
event_time
,
event_time
,
event_time
,
0
);
}
else
{
}
else
{
std
::
get
<
0
>
(
events_table
[
rit
->
name
()])
+=
1
;
std
::
get
<
0
>
(
events_table
[
event_name
])
+=
1
;
std
::
get
<
1
>
(
events_table
[
rit
->
name
()])
+=
cpu_time
;
// total time
std
::
get
<
2
>
(
events_table
[
rit
->
name
()])
+=
cuda_time
;
std
::
get
<
1
>
(
events_table
[
event_name
])
+=
event_time
;
// min time
if
(
std
::
get
<
2
>
(
events_table
[
event_name
])
>
event_time
)
{
std
::
get
<
2
>
(
events_table
[
event_name
])
=
event_time
;
}
// max time
if
(
std
::
get
<
3
>
(
events_table
[
event_name
])
<
event_time
)
{
std
::
get
<
3
>
(
events_table
[
event_name
])
=
event_time
;
}
}
}
// remove the start marker from the list
// remove the start marker from the list
pushed_events
.
erase
((
++
rit
).
base
());
pushed_events
.
erase
((
++
rit
).
base
());
...
@@ -220,13 +232,21 @@ void ParseEvents(std::vector<std::vector<Event>>& events) {
...
@@ -220,13 +232,21 @@ void ParseEvents(std::vector<std::vector<Event>>& events) {
}
}
}
}
// output events table
// output events table
std
::
cout
<<
"
\n
Events
\t\t
Calls
\t\t
Total CPU time
\t\t
Total GPU time
\n
"
;
std
::
cout
<<
std
::
setw
(
20
)
<<
"Events"
<<
std
::
setw
(
10
)
<<
"Calls"
for
(
std
::
map
<
std
::
string
,
std
::
tuple
<
int
,
double
,
double
>>::
iterator
it
=
<<
std
::
setw
(
10
)
<<
"Total"
<<
std
::
setw
(
10
)
<<
"Min"
<<
std
::
setw
(
10
)
<<
"Max"
<<
std
::
setw
(
10
)
<<
"Ave"
<<
std
::
endl
;
for
(
std
::
map
<
std
::
string
,
std
::
tuple
<
int
,
double
,
double
,
double
,
double
>>::
iterator
it
=
events_table
.
begin
();
events_table
.
begin
();
it
!=
events_table
.
end
();
++
it
)
{
it
!=
events_table
.
end
();
++
it
)
{
std
::
cout
<<
it
->
first
<<
"
\t\t
"
<<
std
::
get
<
0
>
(
it
->
second
)
<<
"
\t\t
"
// average time
<<
std
::
get
<
1
>
(
it
->
second
)
<<
"
\t\t
"
<<
std
::
get
<
2
>
(
it
->
second
)
std
::
get
<
4
>
(
it
->
second
)
=
std
::
get
<
1
>
(
it
->
second
)
/
std
::
get
<
0
>
(
it
->
second
);
<<
std
::
endl
;
std
::
cout
<<
std
::
setw
(
20
)
<<
it
->
first
<<
std
::
setw
(
10
)
<<
std
::
get
<
0
>
(
it
->
second
)
<<
std
::
setw
(
10
)
<<
std
::
get
<
1
>
(
it
->
second
)
<<
std
::
setw
(
10
)
<<
std
::
get
<
2
>
(
it
->
second
)
<<
std
::
setw
(
10
)
<<
std
::
get
<
3
>
(
it
->
second
)
<<
std
::
setw
(
10
)
<<
std
::
get
<
4
>
(
it
->
second
)
<<
std
::
endl
;
}
}
}
}
...
...
paddle/platform/profiler.h
浏览文件 @
0f441075
...
@@ -33,6 +33,7 @@ class Event {
...
@@ -33,6 +33,7 @@ class Event {
std
::
string
kind
()
const
;
std
::
string
kind
()
const
;
std
::
string
name
()
const
{
return
name_
;
}
std
::
string
name
()
const
{
return
name_
;
}
uint32_t
thread_id
()
const
{
return
thread_id_
;
}
bool
has_cuda
()
const
{
return
has_cuda_
;
}
bool
has_cuda
()
const
{
return
has_cuda_
;
}
#ifdef PADDLE_WITH_CUDA
#ifdef PADDLE_WITH_CUDA
...
...
paddle/platform/profiler_test.cc
浏览文件 @
0f441075
...
@@ -94,6 +94,12 @@ TEST(RecordEvent, RecordEvent) {
...
@@ -94,6 +94,12 @@ TEST(RecordEvent, RecordEvent) {
int
counter
=
1
;
int
counter
=
1
;
while
(
counter
!=
i
*
1000
)
counter
++
;
while
(
counter
!=
i
*
1000
)
counter
++
;
}
}
for
(
int
i
=
1
;
i
<
5
;
++
i
)
{
std
::
string
name
=
"evs_op_"
+
std
::
to_string
(
i
);
RecordEvent
record_event
(
name
,
dev_ctx
);
int
counter
=
1
;
while
(
counter
!=
i
*
1000
)
counter
++
;
}
std
::
vector
<
std
::
vector
<
Event
>>
events
=
paddle
::
platform
::
DisableProfiler
();
std
::
vector
<
std
::
vector
<
Event
>>
events
=
paddle
::
platform
::
DisableProfiler
();
int
cuda_startup_count
=
0
;
int
cuda_startup_count
=
0
;
int
start_profiler_count
=
0
;
int
start_profiler_count
=
0
;
...
...
编辑
预览
Markdown
is supported
0%
请重试
或
添加新附件
.
添加附件
取消
You are about to add
0
people
to the discussion. Proceed with caution.
先完成此消息的编辑!
取消
想要评论请
注册
或
登录