Skip to content
体验新版
项目
组织
正在加载...
登录
切换导航
打开侧边栏
MegEngine 天元
MegEngine
提交
0ccb965c
MegEngine
项目概览
MegEngine 天元
/
MegEngine
1 年多 前同步成功
通知
404
Star
4705
Fork
582
代码
文件
提交
分支
Tags
贡献者
分支图
Diff
Issue
0
列表
看板
标记
里程碑
合并请求
0
DevOps
流水线
流水线任务
计划
Wiki
0
Wiki
分析
仓库
DevOps
项目成员
Pages
MegEngine
项目概览
项目概览
详情
发布
仓库
仓库
文件
提交
分支
标签
贡献者
分支图
比较
Issue
0
Issue
0
列表
看板
标记
里程碑
合并请求
0
合并请求
0
Pages
DevOps
DevOps
流水线
流水线任务
计划
分析
分析
仓库分析
DevOps
Wiki
0
Wiki
成员
成员
收起侧边栏
关闭侧边栏
动态
分支图
创建新Issue
流水线任务
提交
Issue看板
提交
0ccb965c
编写于
6月 24, 2020
作者:
M
Megvii Engine Team
浏览文件
操作
浏览文件
下载
电子邮件补丁
差异文件
fix(mgb/gopt): fix convert format nchw->nchw4 pass
GitOrigin-RevId: 1813753b144fa70d53f4f97f1a2a509963440d04
上级
1c2a525e
变更
2
隐藏空白更改
内联
并排
Showing
2 changed file
with
178 addition
and
10 deletion
+178
-10
src/gopt/impl/tensor_reformat.cpp
src/gopt/impl/tensor_reformat.cpp
+86
-4
src/gopt/test/inference.cpp
src/gopt/test/inference.cpp
+92
-6
未找到文件。
src/gopt/impl/tensor_reformat.cpp
浏览文件 @
0ccb965c
...
...
@@ -1599,18 +1599,103 @@ std::unique_ptr<EnableNCHW4Pass> EnableNCHW4Pass::make_nchw4_converter(){
}
return
serialization
::
copy_opr_shallow
(
*
opr
,
temp_inp
,
opr
->
config
());
};
auto
replace_pooling_opr
=
[](
OperatorNodeBase
*
opr
,
const
VarNodeArray
&
new_inp
)
{
using
Param
=
opr
::
PoolingForward
::
Param
;
using
Format
=
Param
::
Format
;
mgb_assert
(
opr
->
input
().
size
()
==
new_inp
.
size
());
auto
&
pooling
=
opr
->
cast_final_safe
<
opr
::
PoolingForward
>
();
mgb_assert
(
pooling
.
param
().
format
==
Format
::
NCHW
,
"ConvertFormat Pass only support converting NCHW to NCHW4."
);
if
(
new_inp
[
0
]
->
shape
().
ndim
==
5
)
{
mgb_assert
(
new_inp
[
0
]
->
dtype
().
enumv
()
==
DTypeEnum
::
QuantizedS8
);
auto
new_param
=
pooling
.
param
();
new_param
.
format
=
Format
::
NCHW4
;
auto
new_pooling
=
opr
::
PoolingForward
::
make
(
new_inp
[
0
],
new_param
,
opr
->
config
());
mgb_assert
(
new_pooling
.
shape
().
ndim
==
5
,
"out var of Pooling opr after transform must be 5 (got: "
"%zu)."
,
new_pooling
.
shape
().
ndim
);
return
new_pooling
.
node
()
->
owner_opr
();
}
auto
new_opr
=
serialization
::
copy_opr_shallow
(
*
opr
,
new_inp
,
opr
->
config
());
return
new_opr
;
};
auto
replace_resize_opr
=
[](
OperatorNodeBase
*
opr
,
const
VarNodeArray
&
new_inp
)
{
using
Param
=
opr
::
ResizeForward
::
Param
;
using
Format
=
Param
::
Format
;
mgb_assert
(
opr
->
input
().
size
()
==
new_inp
.
size
());
auto
&
resize
=
opr
->
cast_final_safe
<
opr
::
ResizeForward
>
();
mgb_assert
(
resize
.
param
().
format
==
Format
::
NCHW
,
"ConvertFormat Pass only support converting NCHW to NCHW4."
);
if
(
new_inp
[
0
]
->
shape
().
ndim
==
5
)
{
mgb_assert
(
new_inp
[
0
]
->
dtype
().
enumv
()
==
DTypeEnum
::
QuantizedS8
);
auto
new_param
=
resize
.
param
();
new_param
.
format
=
Format
::
NCHW4
;
auto
new_resize
=
opr
::
ResizeForward
::
make
(
new_inp
[
0
],
new_inp
[
1
],
new_param
,
opr
->
config
());
mgb_assert
(
new_resize
.
shape
().
ndim
==
5
,
"out var of Resize opr after transform must be 5 (got: "
"%zu)."
,
new_resize
.
shape
().
ndim
);
return
new_resize
.
node
()
->
owner_opr
();
}
auto
new_opr
=
serialization
::
copy_opr_shallow
(
*
opr
,
new_inp
,
opr
->
config
());
return
new_opr
;
};
auto
replace_warp_perspective_opr
=
[](
OperatorNodeBase
*
opr
,
const
VarNodeArray
&
new_inp
)
{
using
Param
=
opr
::
WarpPerspective
::
Param
;
using
Format
=
Param
::
Format
;
mgb_assert
(
opr
->
input
().
size
()
==
new_inp
.
size
());
auto
&
warp
=
opr
->
cast_final_safe
<
opr
::
WarpPerspectiveForward
>
();
mgb_assert
(
warp
.
param
().
format
==
Format
::
NCHW
,
"ConvertFormat Pass only support converting NCHW to NCHW4."
);
if
(
new_inp
[
0
]
->
shape
().
ndim
==
5
)
{
mgb_assert
(
new_inp
[
0
]
->
dtype
().
enumv
()
==
DTypeEnum
::
QuantizedS8
);
auto
new_param
=
warp
.
param
();
new_param
.
format
=
Format
::
NCHW4
;
SymbolVar
new_warp
;
if
(
new_inp
.
size
()
==
3
)
{
new_warp
=
opr
::
WarpPerspectiveForward
::
make
(
new_inp
[
0
],
new_inp
[
1
],
nullptr
,
new_inp
[
2
],
new_param
,
opr
->
config
());
}
else
{
mgb_assert
(
new_inp
.
size
()
==
4
);
new_warp
=
opr
::
WarpPerspectiveForward
::
make
(
new_inp
[
0
],
new_inp
[
1
],
new_inp
[
2
],
new_inp
[
3
],
new_param
,
opr
->
config
());
}
mgb_assert
(
new_warp
.
shape
().
ndim
==
5
,
"out var of WarpPerspective opr after transform must be "
"5 (got: "
"%zu)."
,
new_warp
.
shape
().
ndim
);
return
new_warp
.
node
()
->
owner_opr
();
}
auto
new_opr
=
serialization
::
copy_opr_shallow
(
*
opr
,
new_inp
,
opr
->
config
());
return
new_opr
;
};
auto
&&
replace_func
=
ret
->
m_opr_replace_func
;
//! supportted nchw4
replace_func
[
opr
::
Convolution
::
typeinfo
()]
=
replace_conv_opr
;
replace_func
[
opr
::
ConvBias
::
typeinfo
()]
=
replace_conv_bias_opr
;
replace_func
[
opr
::
BatchConvBias
::
typeinfo
()]
=
replace_batch_conv_bias_opr
;
replace_func
[
opr
::
PoolingForward
::
typeinfo
()]
=
replace_pooling_opr
;
replace_func
[
opr
::
ResizeForward
::
typeinfo
()]
=
replace_resize_opr
;
replace_func
[
opr
::
WarpPerspectiveForward
::
typeinfo
()]
=
replace_warp_perspective_opr
;
replace_func
[
opr
::
Elemwise
::
typeinfo
()]
=
replace_elemwise_opr
;
replace_func
[
opr
::
TypeCvt
::
typeinfo
()]
=
replace_elemwise_opr
;
replace_func
[
opr
::
ElemwiseMultiType
::
typeinfo
()]
=
replace_elemwise_opr
;
replace_func
[
opr
::
PowC
::
typeinfo
()]
=
replace_elemwise_opr
;
//! not supported nchw4
replace_func
[
opr
::
PoolingForward
::
typeinfo
()]
=
relayout_inp_to_nchw
;
replace_func
[
opr
::
Concat
::
typeinfo
()]
=
relayout_inp_to_nchw
;
replace_func
[
opr
::
ConvolutionBackwardData
::
typeinfo
()]
=
relayout_inp_to_nchw
;
...
...
@@ -1620,9 +1705,6 @@ std::unique_ptr<EnableNCHW4Pass> EnableNCHW4Pass::make_nchw4_converter(){
replace_func
[
opr
::
Reduce
::
typeinfo
()]
=
relayout_inp_to_nchw
;
replace_func
[
opr
::
AssertEqual
::
typeinfo
()]
=
relayout_inp_to_nchw
;
replace_func
[
opr
::
IncrSubtensor
::
typeinfo
()]
=
relayout_inp_to_nchw
;
replace_func
[
opr
::
ResizeForward
::
typeinfo
()]
=
relayout_inp_to_nchw
;
replace_func
[
opr
::
WarpPerspectiveForward
::
typeinfo
()]
=
relayout_inp_to_nchw
;
replace_func
[
opr
::
WarpAffineForward
::
typeinfo
()]
=
relayout_inp_to_nchw
;
return
ret
;
}
...
...
src/gopt/test/inference.cpp
浏览文件 @
0ccb965c
...
...
@@ -2430,14 +2430,16 @@ TEST(TestGoptInference, ConvertFormatNCHW4GPU) {
auto
w1
=
mkcvar
(
"w1"
,
{
8
,
4
,
3
,
3
},
dtype
::
QuantizedS8
(
2.5
f
)),
b1
=
mkcvar
(
"b1"
,
{
1
,
8
,
1
,
1
},
dtype
::
QuantizedS32
(
6.25
f
));
auto
conv1
=
opr
::
ConvBiasForward
::
make
(
x
,
w1
,
b1
,
param_conv_bias
,
{},
OperatorNodeConfig
{
dtype
::
QuantizedS8
{
2.5
f
}});
x
,
w1
,
b1
,
param_conv_bias
,
{},
OperatorNodeConfig
{
dtype
::
QuantizedS8
{
2.5
f
}});
// group
// icpg != 1 && ocpg != 1
param_conv_bias
.
sparse
=
opr
::
ConvBias
::
Param
::
Sparse
::
GROUP
;
auto
w2
=
mkcvar
(
"w2"
,
{
2
,
4
,
4
,
3
,
3
},
dtype
::
QuantizedS8
(
2.5
f
)),
b2
=
mkcvar
(
"b2"
,
{
1
,
8
,
1
,
1
},
dtype
::
QuantizedS32
(
6.25
f
));
auto
conv2
=
opr
::
ConvBiasForward
::
make
(
conv1
,
w2
,
b2
,
param_conv_bias
,
{},
OperatorNodeConfig
{
dtype
::
QuantizedS8
{
2.5
f
}});
auto
conv2
=
opr
::
ConvBiasForward
::
make
(
conv1
,
w2
,
b2
,
param_conv_bias
,
{},
OperatorNodeConfig
{
dtype
::
QuantizedS8
{
2.5
f
}});
auto
y
=
opr
::
TypeCvt
::
make
(
conv2
,
dtype
::
Float32
());
...
...
@@ -2453,8 +2455,8 @@ TEST(TestGoptInference, ConvertFormatNCHW4GPU) {
graph
->
compile
({{
y_opt
,
{}}})
->
to_json
()
->
writeto_fpath
(
output_file
(
"TestGoptInference.ConvertFormatNCHW4GPU.json"
));
->
writeto_fpath
(
output_file
(
"TestGoptInference.ConvertFormatNCHW4GPU.json"
));
HostTensorND
host_y
,
host_y_opt
;
auto
func
=
graph
->
compile
({
make_callback_copy
(
y
,
host_y
),
...
...
@@ -2465,6 +2467,90 @@ TEST(TestGoptInference, ConvertFormatNCHW4GPU) {
#endif
TEST
(
TestGoptInference
,
ConvertFormatNCHW4NonConvOpr
)
{
auto
cn
=
CompNode
::
load
(
"xpu0"
);
HostTensorGenerator
<
dtype
::
Int8
>
gen
;
auto
graph
=
ComputingGraph
::
make
();
graph
->
options
().
graph_opt_level
=
0
;
auto
mkvar
=
[
&
](
const
char
*
name
,
const
TensorShape
&
shp
,
const
DType
&
dtype
)
{
return
opr
::
TypeCvt
::
make
(
opr
::
Host2DeviceCopy
::
make
(
*
graph
,
gen
(
shp
,
cn
)).
rename
(
name
),
dtype
);
};
auto
mkcvar
=
[
&
](
const
char
*
name
,
const
TensorShape
&
shp
,
const
DType
&
dtype
)
{
return
opr
::
TypeCvt
::
make
(
opr
::
SharedDeviceTensor
::
make
(
*
graph
,
*
gen
(
shp
,
cn
))
.
rename
(
name
),
dtype
);
};
auto
mkcvarf32
=
[
&
](
const
char
*
name
,
const
TensorShape
&
shp
)
{
return
opr
::
SharedDeviceTensor
::
make
(
*
graph
,
*
gen
(
shp
,
cn
))
.
rename
(
name
);
};
auto
x
=
mkvar
(
"x"
,
{
2
,
4
,
16
,
16
},
dtype
::
QuantizedS8
(
2.5
f
));
opr
::
ConvBias
::
Param
param_conv_bias
;
param_conv_bias
.
format
=
opr
::
ConvBias
::
Param
::
Format
::
NCHW
;
param_conv_bias
.
stride_h
=
param_conv_bias
.
stride_w
=
1
;
param_conv_bias
.
pad_h
=
param_conv_bias
.
pad_w
=
1
;
param_conv_bias
.
nonlineMode
=
opr
::
ConvBias
::
Param
::
NonlineMode
::
RELU
;
// dense
param_conv_bias
.
sparse
=
opr
::
ConvBias
::
Param
::
Sparse
::
DENSE
;
auto
w1
=
mkcvar
(
"w1"
,
{
8
,
4
,
3
,
3
},
dtype
::
QuantizedS8
(
2.5
f
)),
b1
=
mkcvar
(
"b1"
,
{
1
,
8
,
1
,
1
},
dtype
::
QuantizedS32
(
6.25
f
));
auto
conv1
=
opr
::
ConvBiasForward
::
make
(
x
,
w1
,
b1
,
param_conv_bias
,
{},
OperatorNodeConfig
{
dtype
::
QuantizedS8
{
2.5
f
}});
// test Resize
auto
shape_of
=
opr
::
GetVarShape
::
make
(
x
);
auto
subtensor
=
opr
::
Subtensor
::
make
(
shape_of
,
{
opr
::
Subtensor
::
AxisIndexer
::
make_interval
(
0
,
x
.
make_scalar
(
2
),
None
,
x
.
make_scalar
(
1
))});
opr
::
Resize
::
Param
param_resize
;
param_resize
.
format
=
opr
::
Resize
::
Param
::
Format
::
NCHW
;
auto
resize
=
opr
::
ResizeForward
::
make
(
conv1
,
subtensor
*
2
,
param_resize
);
// test WarpPerspective
auto
mat
=
mkcvarf32
(
"mat"
,
{
2
,
3
,
3
}),
warp
=
opr
::
WarpPerspectiveForward
::
make
(
resize
,
mat
,
nullptr
,
cg
::
var_from_tensor_shape
(
x
,
{
32
,
32
}));
opr
::
Pooling
::
Param
pool_param
;
pool_param
.
format
=
opr
::
Pooling
::
Param
::
Format
::
NCHW
;
// test Pooling
auto
pool
=
opr
::
Pooling
::
make
(
warp
,
pool_param
);
// group
// icpg != 1 && ocpg != 1
param_conv_bias
.
sparse
=
opr
::
ConvBias
::
Param
::
Sparse
::
GROUP
;
auto
w2
=
mkcvar
(
"w2"
,
{
2
,
4
,
4
,
3
,
3
},
dtype
::
QuantizedS8
(
2.5
f
)),
b2
=
mkcvar
(
"b2"
,
{
1
,
8
,
1
,
1
},
dtype
::
QuantizedS32
(
6.25
f
));
auto
conv2
=
opr
::
ConvBiasForward
::
make
(
pool
,
w2
,
b2
,
param_conv_bias
,
{},
OperatorNodeConfig
{
dtype
::
QuantizedS8
{
2.5
f
}});
auto
add
=
opr
::
ElemwiseMultiType
::
make
(
{
conv1
,
conv2
},
{
opr
::
ElemwiseMultiType
::
Param
::
Mode
::
QADD
},
OperatorNodeConfig
{
dtype
::
QuantizedS8
{
1.2
f
}});
auto
y
=
opr
::
TypeCvt
::
make
(
add
,
dtype
::
Float32
());
SymbolVar
y_opt
;
{
auto
options
=
gopt
::
OptimizeForInferenceOptions
{};
options
.
enable_nchw4
();
unpack_vector
(
gopt
::
optimize_for_inference
({
y
},
options
),
y_opt
);
}
auto
nr_dimshuffle
=
find_opr_num
<
mgb
::
opr
::
Dimshuffle
>
(
y_opt
);
ASSERT_EQ
(
2u
,
nr_dimshuffle
);
ASSERT_EQ
(
opr
::
ConvBias
::
Param
::
Format
::
NCHW4
,
find_opr
<
opr
::
ConvBias
>
(
y_opt
).
param
().
format
);
ASSERT_EQ
(
opr
::
ResizeForward
::
Param
::
Format
::
NCHW4
,
find_opr
<
opr
::
ResizeForward
>
(
y_opt
).
param
().
format
);
ASSERT_EQ
(
opr
::
WarpPerspectiveForward
::
Param
::
Format
::
NCHW4
,
find_opr
<
opr
::
WarpPerspectiveForward
>
(
y_opt
).
param
().
format
);
ASSERT_EQ
(
opr
::
PoolingForward
::
Param
::
Format
::
NCHW4
,
find_opr
<
opr
::
PoolingForward
>
(
y_opt
).
param
().
format
);
}
TEST
(
TestGoptInference
,
ConvertFormatNCHW4
)
{
HostTensorGenerator
<>
gen
;
auto
cn
=
CompNode
::
load
(
"cpu0"
);
...
...
@@ -2479,7 +2565,7 @@ TEST(TestGoptInference, ConvertFormatNCHW4) {
};
auto
x
=
mkvar
(
"x"
,
{
2
,
4
,
16
,
16
});
// ConvBias
// ConvBias
test dense
opr
::
ConvBias
::
Param
param_conv_bias
;
param_conv_bias
.
pad_h
=
param_conv_bias
.
pad_w
=
1
;
param_conv_bias
.
sparse
=
opr
::
ConvBias
::
Param
::
Sparse
::
DENSE
;
...
...
编辑
预览
Markdown
is supported
0%
请重试
或
添加新附件
.
添加附件
取消
You are about to add
0
people
to the discussion. Proceed with caution.
先完成此消息的编辑!
取消
想要评论请
注册
或
登录