Skip to content
体验新版
项目
组织
正在加载...
登录
切换导航
打开侧边栏
MegEngine 天元
MegEngine
提交
11a383bc
MegEngine
项目概览
MegEngine 天元
/
MegEngine
大约 1 年 前同步成功
通知
399
Star
4705
Fork
582
代码
文件
提交
分支
Tags
贡献者
分支图
Diff
Issue
0
列表
看板
标记
里程碑
合并请求
0
DevOps
流水线
流水线任务
计划
Wiki
0
Wiki
分析
仓库
DevOps
项目成员
Pages
MegEngine
项目概览
项目概览
详情
发布
仓库
仓库
文件
提交
分支
标签
贡献者
分支图
比较
Issue
0
Issue
0
列表
看板
标记
里程碑
合并请求
0
合并请求
0
Pages
DevOps
DevOps
流水线
流水线任务
计划
分析
分析
仓库分析
DevOps
Wiki
0
Wiki
成员
成员
收起侧边栏
关闭侧边栏
动态
分支图
创建新Issue
流水线任务
提交
Issue看板
体验新版 GitCode,发现更多精彩内容 >>
提交
11a383bc
编写于
9月 06, 2021
作者:
M
Megvii Engine Team
浏览文件
操作
浏览文件
下载
电子邮件补丁
差异文件
feat(mgb): add tensorboard tool c++ layer interface and python parsing
GitOrigin-RevId: ae98bc887f8509a6c79bdfe4892191ca67f0d9a4
上级
8084e4e2
变更
4
显示空白变更内容
内联
并排
Showing
4 changed file
with
455 addition
and
1 deletion
+455
-1
imperative/python/megengine/tools/README.md
imperative/python/megengine/tools/README.md
+1
-1
imperative/python/megengine/tools/graph_info_analyze.py
imperative/python/megengine/tools/graph_info_analyze.py
+235
-0
src/core/impl/utils/visable_data_set.cpp
src/core/impl/utils/visable_data_set.cpp
+131
-0
src/core/include/megbrain/utils/visable_data_set.h
src/core/include/megbrain/utils/visable_data_set.h
+88
-0
未找到文件。
imperative/python/megengine/tools/README.md
浏览文件 @
11a383bc
imperative/python/megengine/tools/graph_info_analyze.py
0 → 100644
浏览文件 @
11a383bc
#! /usr/bin/env python3
# MegEngine is Licensed under the Apache License, Version 2.0 (the "License")
#
# Copyright (c) 2014-2021 Megvii Inc. All rights reserved.
#
# Unless required by applicable law or agreed to in writing,
# software distributed under the License is distributed on an
# "AS IS" BASIS, WITHOUT ARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
import
argparse
import
json
import
math
import
os
from
megengine.utils.module_stats
import
sizeof_fmt
from
megengine.utils.tensorboard
import
SummaryWriterExtend
def
load_single_graph
(
fpath
):
with
open
(
fpath
)
as
fin
:
data
=
json
.
load
(
fin
)
for
t
in
[
"operator"
,
"var"
]:
data
[
t
]
=
{
int
(
i
):
j
for
i
,
j
in
data
[
t
].
items
()}
gvars
=
data
[
"var"
]
for
oid
,
i
in
data
[
"operator"
].
items
():
i
[
"input"
]
=
list
(
map
(
int
,
i
[
"input"
]))
out
=
i
[
"output"
]
=
list
(
map
(
int
,
i
[
"output"
]))
for
j
in
out
:
gvars
[
j
][
"owner_opr"
]
=
oid
for
var
in
data
[
"var"
].
values
():
mp
=
var
.
get
(
"mem_plan"
,
None
)
if
mp
:
var
[
"shape"
]
=
"{"
+
","
.
join
(
map
(
str
,
mp
[
"layout"
][
"shape"
]))
+
"}"
else
:
var
[
"shape"
]
=
"<?>"
return
data
def
comp_graph_plotter
(
input
,
writer
):
jgraph
=
load_single_graph
(
input
)
all_oprs
=
jgraph
[
"operator"
]
all_vars
=
jgraph
[
"var"
]
for
i
in
all_oprs
:
opr
=
all_oprs
[
i
]
if
opr
[
"type"
]
==
"ImmutableTensor"
:
continue
inputlist
=
[]
for
var
in
opr
[
"input"
]:
inpopr
=
all_oprs
[
all_vars
[
var
][
"owner_opr"
]]
if
inpopr
[
"type"
]
==
"ImmutableTensor"
:
continue
inputlist
.
append
(
all_oprs
[
all_vars
[
var
][
"owner_opr"
]][
"name"
])
writer
.
add_node_raw
(
opr
[
"name"
],
opr
[
"type"
],
inputlist
)
writer
.
add_graph_by_node_raw_list
()
def
load_mem_info
(
fpath
):
with
open
(
fpath
)
as
fin
:
data
=
json
.
load
(
fin
)
oprs
=
data
[
"opr"
]
for
oid
,
i
in
oprs
.
items
():
i
[
"size"
]
=
0
for
oid
,
i
in
data
[
"chunk"
].
items
():
i
[
"size"
]
=
int
(
i
[
"logic_addr_end"
])
-
int
(
i
[
"logic_addr_begin"
])
data
[
"peak_memory"
]
=
0
data
[
"weight_memory"
]
=
0
for
oid
,
i
in
data
[
"chunk"
].
items
():
if
i
[
"type"
]
==
"static_mem"
:
i
[
"owner_opr"
]
=
oprs
[
i
[
"time_begin"
]][
"name"
]
life_begin
=
int
(
i
[
"time_begin"
])
life_end
=
int
(
i
[
"time_end"
])
if
i
[
"overwrite_dest_id"
]
!=
"-1"
:
life_begin
=
life_begin
+
1
if
data
[
"peak_memory"
]
<
int
(
i
[
"logic_addr_end"
]):
data
[
"peak_memory"
]
=
int
(
i
[
"logic_addr_end"
])
for
j
in
range
(
life_begin
,
life_end
):
oprs
[
str
(
j
)][
"size"
]
=
oprs
[
str
(
j
)][
"size"
]
+
i
[
"size"
]
elif
i
[
"type"
]
==
"weight_mem"
:
data
[
"weight_memory"
]
+=
int
(
i
[
"logic_addr_end"
])
-
int
(
i
[
"logic_addr_begin"
]
)
return
data
def
peak_mem_regist
(
input
,
writer
):
jmem
=
load_mem_info
(
input
)
writer
.
add_text
(
"PEAK_MEMORY_SIZE"
,
[
sizeof_fmt
(
jmem
[
"peak_memory"
])
+
"("
+
str
(
jmem
[
"peak_memory"
])
+
" B)"
],
)
writer
.
add_text
(
"WEIGHT_MEMORY_SIZE"
,
[
sizeof_fmt
(
jmem
[
"weight_memory"
])
+
"("
+
str
(
jmem
[
"weight_memory"
])
+
" B)"
],
)
all_oprs
=
jmem
[
"opr"
]
all_chunks
=
jmem
[
"chunk"
]
max_size
=
0
max_size_oprs
=
[]
# get oprs that reach the max memory
for
oid
,
i
in
all_oprs
.
items
():
if
i
[
"size"
]
==
max_size
:
max_size_oprs
.
append
(
int
(
i
[
"id"
]))
elif
i
[
"size"
]
>
max_size
:
max_size
=
i
[
"size"
]
max_size_oprs
.
clear
()
max_size_oprs
.
append
(
int
(
i
[
"id"
]))
# get component of chunks
max_size_oprs
.
sort
()
opr2chunks
=
[]
num
=
len
(
max_size_oprs
)
for
i
in
range
(
num
):
opr2chunks
.
append
([])
for
oid
,
i
in
all_chunks
.
items
():
if
i
[
"type"
]
==
"static_mem"
:
life_begin
=
int
(
i
[
"time_begin"
])
life_end
=
int
(
i
[
"time_end"
])
if
i
[
"overwrite_dest_id"
]
!=
"-1"
:
life_begin
=
life_begin
+
1
if
max_size_oprs
[
0
]
>=
life_end
or
max_size_oprs
[
-
1
]
<
life_begin
:
continue
for
j
in
range
(
num
):
if
max_size_oprs
[
j
]
>=
life_end
:
break
elif
max_size_oprs
[
j
]
>=
life_begin
:
opr2chunks
[
j
].
append
(
i
[
"id"
])
peak_num
=
0
for
i
in
range
(
num
):
suffix_1
=
"PEAK"
+
str
(
peak_num
)
if
i
-
1
>
0
and
opr2chunks
[
i
-
1
]
==
opr2chunks
[
i
]:
continue
max_num
=
0
opr2chunks
[
i
]
=
sorted
(
opr2chunks
[
i
],
key
=
lambda
chunk_id
:
all_chunks
[
chunk_id
][
"size"
],
reverse
=
True
,
)
writer
.
add_text
(
suffix_1
+
"/"
+
"<SUMMARY_INFO>"
,
[
"reached_max_opr_name: "
+
all_oprs
[
str
(
max_size_oprs
[
i
])][
"name"
]],
0
,
)
writer
.
add_text
(
suffix_1
+
"/"
+
"<SUMMARY_INFO>"
,
[
"max_used_size: "
+
sizeof_fmt
(
max_size
)],
1
,
)
for
j
in
opr2chunks
[
i
]:
suffix_2
=
"MAX"
+
str
(
max_num
)
j_size
=
sizeof_fmt
(
all_chunks
[
j
][
"size"
])
j_percent
=
round
(
all_chunks
[
j
][
"size"
]
/
max_size
*
100
,
3
)
writer
.
add_text
(
suffix_1
+
"/"
+
suffix_2
+
"_OPR"
,
[
"percent: "
+
str
(
j_percent
)
+
"%"
],
0
,
)
writer
.
add_text
(
suffix_1
+
"/"
+
suffix_2
+
"_OPR"
,
[
"memory_size: "
+
j_size
],
1
,
)
writer
.
add_text
(
suffix_1
+
"/"
+
suffix_2
+
"_OPR"
,
[
"owner_opr: "
+
all_chunks
[
j
][
"owner_opr"
]],
2
,
)
writer
.
add_node_raw_attributes
(
all_chunks
[
j
][
"owner_opr"
],
{
"memory_"
+
all_chunks
[
j
][
"id"
]:
j_size
,
"memory_percent"
:
str
(
j_percent
)
+
"%"
,
"summary_memory_"
+
str
(
peak_num
):
sizeof_fmt
(
max_size
),
},
)
writer
.
add_node_raw_name_suffix
(
all_chunks
[
j
][
"owner_opr"
],
"_"
+
suffix_1
+
"_"
+
suffix_2
)
max_num
+=
1
peak_num
+=
1
writer
.
add_graph_by_node_raw_list
()
def
convert
(
args
):
file_process_order
=
{
"graph.json"
:
comp_graph_plotter
,
"StaticMemoryInfo.json"
:
peak_mem_regist
,
}
g
=
os
.
walk
(
args
.
input
)
for
path
,
dir_list
,
file_list
in
g
:
out_path
=
path
.
replace
(
args
.
input
,
args
.
output
)
writer
=
SummaryWriterExtend
(
out_path
)
for
key
,
value
in
file_process_order
.
items
():
if
key
in
file_list
:
value
(
os
.
path
.
join
(
path
,
key
),
writer
)
def
main
():
"""`graph_info_analyze.py` is uesed to convert json dumped by `VisableDataSet`
class to logs which can be read by python `tensorboard`.
Now `get_static_memory_alloc_info()` support this feature,it will dump a dir
which can be convert by `graph_info_analyze.py`.
Examples::
graph_info_analyze.py -i <input_dir_name> -o <output_dir_name>
tensorboard --logdir <output_dir_name>
"""
parser
=
argparse
.
ArgumentParser
(
"convert json dumped by c to logs which can be read by python tensorboard"
,
formatter_class
=
argparse
.
ArgumentDefaultsHelpFormatter
,
)
parser
.
add_argument
(
"-i"
,
"--input"
,
required
=
True
,
help
=
"input dirctor name(c tensorboard info)"
)
parser
.
add_argument
(
"-o"
,
"--output"
,
required
=
True
,
help
=
"output dirctor name(python tensorboard info)"
,
)
args
=
parser
.
parse_args
()
convert
(
args
)
if
__name__
==
"__main__"
:
main
()
src/core/impl/utils/visable_data_set.cpp
0 → 100644
浏览文件 @
11a383bc
/**
* \file src/core/impl/utils/tensorboard.cpp
* MegEngine is Licensed under the Apache License, Version 2.0 (the "License")
*
* Copyright (c) 2014-2021 Megvii Inc. All rights reserved.
*
* Unless required by applicable law or agreed to in writing,
* software distributed under the License is distributed on an
* "AS IS" BASIS, WITHOUT ARRANTIES OR CONDITIONS OF ANY KIND, either express or
* implied.
*/
#include "megbrain/utils/visable_data_set.h"
#if MGB_ENABLE_JSON
#include <fstream>
#include <iostream>
using
namespace
mgb
;
#if WIN32
#include <direct.h>
#include <fcntl.h>
#include <io.h>
#define getcwd _getcwd
namespace
{
auto
mkdir
(
const
char
*
path
,
int
)
{
return
_mkdir
(
path
);
}
}
// namespace
#else
#include <sys/stat.h>
#include <sys/types.h>
#include <unistd.h>
#endif
namespace
{
#if defined(IOS)
#pragma message "build test on iOS; need ios_get_mgb_output_dir() to be defined"
extern
"C"
void
ios_get_mgb_output_dir
(
char
**
dir
);
#endif
std
::
string
output_file
(
std
::
string
dir_name
,
const
std
::
string
&
fname
)
{
static
std
::
string
cwd
;
static
std
::
mutex
cwd_mtx
;
MGB_LOCK_GUARD
(
cwd_mtx
);
if
(
cwd
.
empty
())
{
#if defined(IOS)
char
*
buf
=
nullptr
;
ios_get_mgb_output_dir
(
&
buf
);
#else
auto
buf
=
getcwd
(
nullptr
,
0
);
#endif
mgb_assert
(
buf
);
cwd
=
buf
;
free
(
buf
);
dir_name
=
dir_name
+
"/"
;
for
(
size_t
i
=
0
;
i
<
dir_name
.
size
();
i
++
)
{
size_t
pos
=
dir_name
.
find
(
"/"
,
i
);
if
(
pos
<
dir_name
.
size
()
&&
pos
-
i
>
1
)
{
cwd
.
append
(
"/"
+
dir_name
.
substr
(
i
,
pos
-
i
));
mkdir
(
cwd
.
c_str
(),
0755
);
i
=
pos
;
}
}
}
if
(
fname
.
empty
())
return
cwd
;
auto
ret
=
cwd
+
"/"
+
fname
;
FILE
*
fout
=
fopen
(
ret
.
c_str
(),
"w"
);
mgb_assert
(
fout
,
"failed to open %s: %s"
,
ret
.
c_str
(),
strerror
(
errno
));
fclose
(
fout
);
return
ret
;
}
}
// namespace
void
VisableDataSet
::
draw_graph
(
std
::
shared_ptr
<
json
::
Value
>
graph_json
)
{
graph_json
->
writeto_fpath
(
output_file
(
m_logdir
,
"graph.json"
));
}
void
VisableDataSet
::
dump_info
(
Content
&
c
)
{
auto
&&
content_set
=
m_file2content
[
c
.
file_name
()];
content_set
.
insert
(
c
.
content_name
());
auto
&&
value_list
=
m_filecontent2value
[
c
.
file_name
()
+
"/"
+
c
.
content_name
()];
value_list
.
push_back
(
c
.
to_json
());
}
void
VisableDataSet
::
write_to_file
()
{
for
(
auto
&
i
:
m_file2content
)
{
auto
f_objptr
=
json
::
Object
::
make
();
auto
&&
f_obj
=
*
f_objptr
;
for
(
auto
&
c
:
i
.
second
)
{
auto
c_objptr
=
json
::
Object
::
make
();
auto
&&
c_obj
=
*
c_objptr
;
for
(
auto
&
j
:
m_filecontent2value
[
i
.
first
+
"/"
+
c
])
{
c_obj
[(
*
j
).
cast_final_safe
<
json
::
Object
>
()[
"id"
]
->
cast_final_safe
<
json
::
String
>
()
.
get_impl
()]
=
j
;
}
f_obj
[
c
]
=
c_objptr
;
}
f_objptr
->
writeto_fpath
(
output_file
(
m_logdir
,
i
.
first
));
}
}
// const std::string PeakMemoryInfo::content() const {return }
std
::
shared_ptr
<
json
::
Value
>
Chunk
::
to_json
()
const
{
auto
objptr
=
json
::
Object
::
make
();
auto
&&
obj
=
*
objptr
;
obj
[
"id"
]
=
json
::
String
::
make
(
id
());
obj
[
"type"
]
=
json
::
String
::
make
(
m_type
);
obj
[
"time_begin"
]
=
json
::
String
::
make
(
m_time_begin
);
obj
[
"time_end"
]
=
json
::
String
::
make
(
m_time_end
);
obj
[
"logic_addr_begin"
]
=
json
::
String
::
make
(
m_logic_addr_begin
);
obj
[
"logic_addr_end"
]
=
json
::
String
::
make
(
m_logic_addr_end
);
obj
[
"overwrite_dest_id"
]
=
json
::
String
::
make
(
m_overwrite_dest_id
);
return
objptr
;
}
std
::
shared_ptr
<
json
::
Value
>
OprSeq
::
to_json
()
const
{
auto
objptr
=
json
::
Object
::
make
();
auto
&&
obj
=
*
objptr
;
obj
[
"id"
]
=
json
::
String
::
make
(
id
());
obj
[
"name"
]
=
json
::
String
::
make
(
m_name
);
return
objptr
;
}
#endif
\ No newline at end of file
src/core/include/megbrain/utils/visable_data_set.h
0 → 100644
浏览文件 @
11a383bc
/**
* \file src/core/include/megbrain/utils/visable_data_set.h
* MegEngine is Licensed under the Apache License, Version 2.0 (the "License")
*
* Copyright (c) 2014-2021 Megvii Inc. All rights reserved.
*
* Unless required by applicable law or agreed to in writing,
* software distributed under the License is distributed on an
* "AS IS" BASIS, WITHOUT ARRANTIES OR CONDITIONS OF ANY KIND, either express or
* implied.
*/
#pragma once
#include "megbrain/utils/json.h"
#if MGB_ENABLE_JSON
#include <set>
#include "megbrain/plugin/base.h"
#include "megbrain/plugin/static_mem_record.h"
namespace
mgb
{
class
VisableDataSet
:
public
NonCopyableObj
{
private:
const
std
::
string
m_logdir
;
std
::
unordered_map
<
std
::
string
,
std
::
set
<
std
::
string
>>
m_file2content
;
std
::
unordered_map
<
std
::
string
,
std
::
vector
<
std
::
shared_ptr
<
json
::
Value
>>>
m_filecontent2value
;
public:
class
Content
{
private:
std
::
string
m_file_name
;
std
::
string
m_content_name
;
std
::
string
m_id
;
public:
Content
(
std
::
string
file_name
,
std
::
string
content_name
,
std
::
string
id
)
:
m_file_name
(
file_name
),
m_content_name
(
content_name
),
m_id
(
id
)
{}
const
std
::
string
&
file_name
()
const
{
return
m_file_name
;
}
const
std
::
string
&
content_name
()
const
{
return
m_content_name
;
}
const
std
::
string
&
id
()
const
{
return
m_id
;
}
virtual
std
::
shared_ptr
<
json
::
Value
>
to_json
()
const
=
0
;
virtual
~
Content
()
=
default
;
};
VisableDataSet
(
std
::
string
logdir
)
:
m_logdir
(
logdir
)
{}
void
draw_graph
(
std
::
shared_ptr
<
json
::
Value
>
graph_json
);
void
dump_info
(
Content
&
c
);
void
write_to_file
();
};
class
Chunk
:
public
VisableDataSet
::
Content
{
private:
const
char
*
enum_str
[
2
]
=
{
"static_mem"
,
"weight_mem"
};
std
::
string
m_type
,
m_time_begin
,
m_time_end
,
m_logic_addr_begin
,
m_logic_addr_end
,
m_overwrite_dest_id
;
// m_overwriter_dest_id = "-1" means no
// overwrite dest
public:
enum
chunk_type
{
static_mem
,
weight_mem
};
Chunk
(
std
::
string
id
,
chunk_type
type
,
std
::
string
time_begin
,
std
::
string
time_end
,
std
::
string
logic_addr_begin
,
std
::
string
logic_addr_end
,
std
::
string
overwrite_dest_id
)
:
Content
(
"StaticMemoryInfo.json"
,
"chunk"
,
id
),
m_type
(
enum_str
[
type
]),
m_time_begin
(
time_begin
),
m_time_end
(
time_end
),
m_logic_addr_begin
(
logic_addr_begin
),
m_logic_addr_end
(
logic_addr_end
),
m_overwrite_dest_id
(
overwrite_dest_id
)
{}
std
::
shared_ptr
<
json
::
Value
>
to_json
()
const
override
;
};
class
OprSeq
:
public
VisableDataSet
::
Content
{
private:
std
::
string
m_id
,
m_name
;
public:
OprSeq
(
std
::
string
id
,
std
::
string
opr_name
)
:
Content
(
"StaticMemoryInfo.json"
,
"opr"
,
id
),
m_name
(
opr_name
)
{}
std
::
shared_ptr
<
json
::
Value
>
to_json
()
const
override
;
};
}
// namespace mgb
#endif
\ No newline at end of file
编辑
预览
Markdown
is supported
0%
请重试
或
添加新附件
.
添加附件
取消
You are about to add
0
people
to the discussion. Proceed with caution.
先完成此消息的编辑!
取消
想要评论请
注册
或
登录