Skip to content
体验新版
项目
组织
正在加载...
登录
切换导航
打开侧边栏
慢慢CG
Mace
提交
12c3af21
Mace
项目概览
慢慢CG
/
Mace
与 Fork 源项目一致
Fork自
Xiaomi / Mace
通知
1
Star
0
Fork
0
代码
文件
提交
分支
Tags
贡献者
分支图
Diff
Issue
0
列表
看板
标记
里程碑
合并请求
0
DevOps
流水线
流水线任务
计划
Wiki
0
Wiki
分析
仓库
DevOps
项目成员
Pages
Mace
项目概览
项目概览
详情
发布
仓库
仓库
文件
提交
分支
标签
贡献者
分支图
比较
Issue
0
Issue
0
列表
看板
标记
里程碑
合并请求
0
合并请求
0
Pages
DevOps
DevOps
流水线
流水线任务
计划
分析
分析
仓库分析
DevOps
Wiki
0
Wiki
成员
成员
收起侧边栏
关闭侧边栏
动态
分支图
创建新Issue
流水线任务
提交
Issue看板
提交
12c3af21
编写于
2月 27, 2018
作者:
L
Liangliang He
浏览文件
操作
浏览文件
下载
电子邮件补丁
差异文件
Sync mace changes and add latency logging
上级
6bef90cd
变更
2
隐藏空白更改
内联
并排
Showing
2 changed file
with
66 addition
and
78 deletion
+66
-78
BUILD
BUILD
+1
-2
mace_run.cc
mace_run.cc
+65
-76
未找到文件。
BUILD
浏览文件 @
12c3af21
...
...
@@ -15,11 +15,10 @@ cc_binary(
linkstatic
=
1
,
deps
=
[
"//codegen:generated_models"
,
"@mace//:mace_headers"
,
"//external:gflags_nothreads"
,
]
+
if_hexagon_enabled
([
"//lib/hexagon:hexagon"
,
])
+
if_production_mode
([
])
+
if_production_mode
([
"@mace//:mace_prod"
,
"//codegen:generated_opencl_prod"
,
"//codegen:generated_tuning_params"
,
...
...
mace_run.cc
浏览文件 @
12c3af21
...
...
@@ -14,17 +14,19 @@
* --model_data_file=model_data.data \
* --device=OPENCL
*/
#include <cstdlib>
#include <fstream>
#include <malloc.h>
#include <numeric>
#include <iostream>
#include <stdint.h>
#include <sys/time.h>
#include <time.h>
#include <cstdlib>
#include <fstream>
#include <iostream>
#include <numeric>
#include "gflags/gflags.h"
#include "mace/core/public/mace.h"
#include "mace/public/mace.h"
#include "mace/utils/env_time.h"
#include "mace/utils/logging.h"
using
namespace
std
;
using
namespace
mace
;
...
...
@@ -32,22 +34,16 @@ using namespace mace;
namespace
mace
{
namespace
MACE_MODEL_TAG
{
extern
unsigned
char
*
LoadModelData
(
const
char
*
model_data_file
);
extern
const
unsigned
char
*
LoadModelData
(
const
char
*
model_data_file
);
extern
void
UnloadModelData
(
unsigned
char
*
model_data
);
extern
void
UnloadModelData
(
const
unsigned
char
*
model_data
);
extern
NetDef
CreateNet
(
const
unsigned
char
*
model_data
);
extern
const
std
::
string
ModelChecksum
();
}
}
inline
int64_t
NowMicros
()
{
struct
timeval
tv
;
gettimeofday
(
&
tv
,
nullptr
);
return
static_cast
<
int64_t
>
(
tv
.
tv_sec
)
*
1000000
+
tv
.
tv_usec
;
}
}
// namespace MACE_MODEL_TAG
}
// namespace mace
void
ParseShape
(
const
string
&
str
,
vector
<
int64_t
>
*
shape
)
{
string
tmp
=
str
;
...
...
@@ -80,56 +76,46 @@ DeviceType ParseDeviceType(const string &device_str) {
struct
mallinfo
LogMallinfoChange
(
struct
mallinfo
prev
)
{
struct
mallinfo
curr
=
mallinfo
();
if
(
prev
.
arena
!=
curr
.
arena
)
{
std
::
cout
<<
"Non-mmapped space allocated (bytes): "
<<
curr
.
arena
<<
", diff: "
<<
((
int64_t
)
curr
.
arena
-
(
int64_t
)
prev
.
arena
)
<<
std
::
endl
;
LOG
(
INFO
)
<<
"Non-mmapped space allocated (bytes): "
<<
curr
.
arena
<<
", diff: "
<<
((
int64_t
)
curr
.
arena
-
(
int64_t
)
prev
.
arena
);
}
if
(
prev
.
ordblks
!=
curr
.
ordblks
)
{
std
::
cout
<<
"Number of free chunks: "
<<
curr
.
ordblks
<<
", diff: "
<<
((
int64_t
)
curr
.
ordblks
-
(
int64_t
)
prev
.
ordblks
)
<<
std
::
endl
;
LOG
(
INFO
)
<<
"Number of free chunks: "
<<
curr
.
ordblks
<<
", diff: "
<<
((
int64_t
)
curr
.
ordblks
-
(
int64_t
)
prev
.
ordblks
);
}
if
(
prev
.
smblks
!=
curr
.
smblks
)
{
std
::
cout
<<
"Number of free fastbin blocks: "
<<
curr
.
smblks
<<
", diff: "
<<
((
int64_t
)
curr
.
smblks
-
(
int64_t
)
prev
.
smblks
)
<<
std
::
endl
;
LOG
(
INFO
)
<<
"Number of free fastbin blocks: "
<<
curr
.
smblks
<<
", diff: "
<<
((
int64_t
)
curr
.
smblks
-
(
int64_t
)
prev
.
smblks
);
}
if
(
prev
.
hblks
!=
curr
.
hblks
)
{
std
::
cout
<<
"Number of mmapped regions: "
<<
curr
.
hblks
<<
", diff: "
<<
((
int64_t
)
curr
.
hblks
-
(
int64_t
)
prev
.
hblks
)
<<
std
::
endl
;
LOG
(
INFO
)
<<
"Number of mmapped regions: "
<<
curr
.
hblks
<<
", diff: "
<<
((
int64_t
)
curr
.
hblks
-
(
int64_t
)
prev
.
hblks
);
}
if
(
prev
.
hblkhd
!=
curr
.
hblkhd
)
{
std
::
cout
<<
"Space allocated in mmapped regions (bytes): "
<<
curr
.
hblkhd
<<
", diff: "
<<
((
int64_t
)
curr
.
hblkhd
-
(
int64_t
)
prev
.
hblkhd
)
<<
std
::
endl
;
LOG
(
INFO
)
<<
"Space allocated in mmapped regions (bytes): "
<<
curr
.
hblkhd
<<
", diff: "
<<
((
int64_t
)
curr
.
hblkhd
-
(
int64_t
)
prev
.
hblkhd
);
}
if
(
prev
.
usmblks
!=
curr
.
usmblks
)
{
std
::
cout
<<
"Maximum total allocated space (bytes): "
<<
curr
.
usmblks
<<
", diff: "
<<
((
int64_t
)
curr
.
usmblks
-
(
int64_t
)
prev
.
usmblks
)
<<
std
::
endl
;
LOG
(
INFO
)
<<
"Maximum total allocated space (bytes): "
<<
curr
.
usmblks
<<
", diff: "
<<
((
int64_t
)
curr
.
usmblks
-
(
int64_t
)
prev
.
usmblks
);
}
if
(
prev
.
fsmblks
!=
curr
.
fsmblks
)
{
std
::
cout
<<
"Space in freed fastbin blocks (bytes): "
<<
curr
.
fsmblks
<<
", diff: "
<<
((
int64_t
)
curr
.
fsmblks
-
(
int64_t
)
prev
.
fsmblks
)
<<
std
::
endl
;
LOG
(
INFO
)
<<
"Space in freed fastbin blocks (bytes): "
<<
curr
.
fsmblks
<<
", diff: "
<<
((
int64_t
)
curr
.
fsmblks
-
(
int64_t
)
prev
.
fsmblks
);
}
if
(
prev
.
uordblks
!=
curr
.
uordblks
)
{
std
::
cout
<<
"Total allocated space (bytes): "
<<
curr
.
uordblks
LOG
(
INFO
)
<<
"Total allocated space (bytes): "
<<
curr
.
uordblks
<<
", diff: "
<<
((
int64_t
)
curr
.
uordblks
-
(
int64_t
)
prev
.
uordblks
)
<<
std
::
endl
;
<<
((
int64_t
)
curr
.
uordblks
-
(
int64_t
)
prev
.
uordblks
);
}
if
(
prev
.
fordblks
!=
curr
.
fordblks
)
{
std
::
cout
<<
"Total free space (bytes): "
<<
curr
.
fordblks
<<
", diff: "
<<
((
int64_t
)
curr
.
fordblks
-
(
int64_t
)
prev
.
fordblks
)
<<
std
::
endl
;
LOG
(
INFO
)
<<
"Total free space (bytes): "
<<
curr
.
fordblks
<<
", diff: "
<<
((
int64_t
)
curr
.
fordblks
-
(
int64_t
)
prev
.
fordblks
);
}
if
(
prev
.
keepcost
!=
curr
.
keepcost
)
{
std
::
cout
<<
"Top-most, releasable space (bytes): "
<<
curr
.
keepcost
LOG
(
INFO
)
<<
"Top-most, releasable space (bytes): "
<<
curr
.
keepcost
<<
", diff: "
<<
((
int64_t
)
curr
.
keepcost
-
(
int64_t
)
prev
.
keepcost
)
<<
std
::
endl
;
<<
((
int64_t
)
curr
.
keepcost
-
(
int64_t
)
prev
.
keepcost
);
}
return
curr
;
}
...
...
@@ -138,7 +124,9 @@ DEFINE_string(input_shape, "1,224,224,3", "input shape, separated by comma");
DEFINE_string
(
output_shape
,
"1,224,224,2"
,
"output shape, separated by comma"
);
DEFINE_string
(
input_file
,
""
,
"input file name"
);
DEFINE_string
(
output_file
,
""
,
"output file name"
);
DEFINE_string
(
model_data_file
,
""
,
"model data file name, used when EMBED_MODEL_DATA set to 0"
);
DEFINE_string
(
model_data_file
,
""
,
"model data file name, used when EMBED_MODEL_DATA set to 0"
);
DEFINE_string
(
device
,
"OPENCL"
,
"CPU/NEON/OPENCL/HEXAGON"
);
DEFINE_int32
(
round
,
1
,
"round"
);
DEFINE_int32
(
malloc_check_cycle
,
-
1
,
"malloc debug check cycle, -1 to disable"
);
...
...
@@ -147,16 +135,15 @@ int main(int argc, char **argv) {
gflags
::
SetUsageMessage
(
"some usage message"
);
gflags
::
ParseCommandLineFlags
(
&
argc
,
&
argv
,
true
);
std
::
cout
<<
"mace version: "
<<
MaceVersion
()
<<
std
::
endl
<<
"mace git version: "
<<
MaceGitVersion
()
<<
std
::
endl
<<
"model checksum: "
<<
mace
::
MACE_MODEL_TAG
::
ModelChecksum
()
<<
std
::
endl
<<
"input_shape: "
<<
FLAGS_input_shape
<<
std
::
endl
<<
"output_shape: "
<<
FLAGS_output_shape
<<
std
::
endl
<<
"input_file: "
<<
FLAGS_input_file
<<
std
::
endl
<<
"output_file: "
<<
FLAGS_output_file
<<
std
::
endl
<<
"model_data_file: "
<<
FLAGS_model_data_file
<<
std
::
endl
<<
"device: "
<<
FLAGS_device
<<
std
::
endl
<<
"round: "
<<
FLAGS_round
<<
std
::
endl
;
LOG
(
INFO
)
<<
"mace version: "
<<
MaceVersion
()
<<
"mace git version: "
<<
MaceGitVersion
()
<<
"model checksum: "
<<
mace
::
MACE_MODEL_TAG
::
ModelChecksum
()
<<
"input_shape: "
<<
FLAGS_input_shape
<<
"output_shape: "
<<
FLAGS_output_shape
<<
"input_file: "
<<
FLAGS_input_file
<<
"output_file: "
<<
FLAGS_output_file
<<
"model_data_file: "
<<
FLAGS_model_data_file
<<
"device: "
<<
FLAGS_device
<<
"round: "
<<
FLAGS_round
;
vector
<
int64_t
>
input_shape_vec
;
vector
<
int64_t
>
output_shape_vec
;
...
...
@@ -165,18 +152,21 @@ int main(int argc, char **argv) {
// load model
int64_t
t0
=
NowMicros
();
unsigned
char
*
model_data
=
mace
::
MACE_MODEL_TAG
::
LoadModelData
(
FLAGS_model_data_file
.
c_str
());
const
unsigned
char
*
model_data
=
mace
::
MACE_MODEL_TAG
::
LoadModelData
(
FLAGS_model_data_file
.
c_str
());
NetDef
net_def
=
mace
::
MACE_MODEL_TAG
::
CreateNet
(
model_data
);
int64_t
t1
=
NowMicros
();
std
::
cout
<<
"CreateNetDef duration: "
<<
t1
-
t0
<<
" us"
<<
std
::
endl
;
LOG
(
INFO
)
<<
"CreateNetDef latency: "
<<
t1
-
t0
<<
" us"
;
int64_t
init_micros
=
t1
-
t0
;
DeviceType
device_type
=
ParseDeviceType
(
FLAGS_device
);
std
::
cout
<<
"Device Type"
<<
device_type
<<
std
::
endl
;
int64_t
input_size
=
std
::
accumulate
(
input_shape_vec
.
begin
(),
input_shape_vec
.
end
(),
1
,
std
::
multiplies
<
int64_t
>
());
int64_t
output_size
=
std
::
accumulate
(
output_shape_vec
.
begin
(),
output_shape_vec
.
end
(),
1
,
std
::
multiplies
<
int64_t
>
());
LOG
(
INFO
)
<<
"Runing with device type: "
<<
device_type
;
int64_t
input_size
=
std
::
accumulate
(
input_shape_vec
.
begin
(),
input_shape_vec
.
end
(),
1
,
std
::
multiplies
<
int64_t
>
());
int64_t
output_size
=
std
::
accumulate
(
output_shape_vec
.
begin
(),
output_shape_vec
.
end
(),
1
,
std
::
multiplies
<
int64_t
>
());
std
::
unique_ptr
<
float
[]
>
input_data
(
new
float
[
input_size
]);
std
::
unique_ptr
<
float
[]
>
output_data
(
new
float
[
output_size
]);
...
...
@@ -187,12 +177,12 @@ int main(int argc, char **argv) {
input_size
*
sizeof
(
float
));
in_file
.
close
();
}
else
{
std
::
cout
<<
"Open input file failed"
<<
std
::
endl
;
LOG
(
INFO
)
<<
"Open input file failed"
;
return
-
1
;
}
// Init model
std
::
cout
<<
"Run init"
<<
std
::
endl
;
LOG
(
INFO
)
<<
"Run init"
;
t0
=
NowMicros
();
mace
::
MaceEngine
engine
(
&
net_def
,
device_type
);
if
(
device_type
==
DeviceType
::
OPENCL
||
device_type
==
DeviceType
::
HEXAGON
)
{
...
...
@@ -200,39 +190,38 @@ int main(int argc, char **argv) {
}
t1
=
NowMicros
();
init_micros
+=
t1
-
t0
;
std
::
cout
<<
"Net init duration: "
<<
t1
-
t0
<<
" us"
<<
std
::
endl
;
std
::
cout
<<
"Total init duration: "
<<
init_micros
<<
" us"
<<
std
::
endl
;
LOG
(
INFO
)
<<
"Net init latency: "
<<
t1
-
t0
<<
" us"
;
LOG
(
INFO
)
<<
"Total init latency: "
<<
init_micros
<<
" us"
;
std
::
cout
<<
"Warm up"
<<
std
::
endl
;
LOG
(
INFO
)
<<
"Warm up run"
;
t0
=
NowMicros
();
engine
.
Run
(
input_data
.
get
(),
input_shape_vec
,
output_data
.
get
());
t1
=
NowMicros
();
std
::
cout
<<
"1st warm up run duration: "
<<
t1
-
t0
<<
" us"
<<
std
::
endl
;
LOG
(
INFO
)
<<
"1st warm up run latency: "
<<
t1
-
t0
<<
" us"
;
if
(
FLAGS_round
>
0
)
{
std
::
cout
<<
"Run model"
<<
std
::
endl
;
LOG
(
INFO
)
<<
"Run model"
;
t0
=
NowMicros
();
struct
mallinfo
prev
=
mallinfo
();
for
(
int
i
=
0
;
i
<
FLAGS_round
;
++
i
)
{
engine
.
Run
(
input_data
.
get
(),
input_shape_vec
,
output_data
.
get
());
if
(
FLAGS_malloc_check_cycle
>=
1
&&
i
%
FLAGS_malloc_check_cycle
==
0
)
{
std
::
cout
<<
"=== check malloc info change #"
<<
i
<<
" ==="
<<
std
::
endl
;
LOG
(
INFO
)
<<
"=== check malloc info change #"
<<
i
<<
" ==="
;
prev
=
LogMallinfoChange
(
prev
);
}
}
t1
=
NowMicros
();
std
::
cout
<<
"Avg duration: "
<<
(
t1
-
t0
)
/
FLAGS_round
<<
" us"
<<
std
::
endl
;
LOG
(
INFO
)
<<
"Averate latency: "
<<
(
t1
-
t0
)
/
FLAGS_round
<<
" us"
;
}
if
(
output_data
!=
nullptr
)
{
ofstream
out_file
(
FLAGS_output_file
,
ios
::
binary
);
out_file
.
write
((
const
char
*
)
(
output_data
.
get
()),
out_file
.
write
((
const
char
*
)(
output_data
.
get
()),
output_size
*
sizeof
(
float
));
out_file
.
flush
();
out_file
.
close
();
std
::
cout
<<
"Write output file done."
<<
std
::
endl
;
LOG
(
INFO
)
<<
"Write output file done."
;
}
else
{
std
::
cout
<<
"output data is null"
<<
std
::
endl
;
LOG
(
INFO
)
<<
"Output data is null"
;
}
}
编辑
预览
Markdown
is supported
0%
请重试
或
添加新附件
.
添加附件
取消
You are about to add
0
people
to the discussion. Proceed with caution.
先完成此消息的编辑!
取消
想要评论请
注册
或
登录