Skip to content
体验新版
项目
组织
正在加载...
登录
切换导航
打开侧边栏
机器未来
Paddle
提交
e3f8e5cf
P
Paddle
项目概览
机器未来
/
Paddle
与 Fork 源项目一致
Fork自
PaddlePaddle / Paddle
通知
1
Star
1
Fork
0
代码
文件
提交
分支
Tags
贡献者
分支图
Diff
Issue
1
列表
看板
标记
里程碑
合并请求
0
Wiki
0
Wiki
分析
仓库
DevOps
项目成员
Pages
P
Paddle
项目概览
项目概览
详情
发布
仓库
仓库
文件
提交
分支
标签
贡献者
分支图
比较
Issue
1
Issue
1
列表
看板
标记
里程碑
合并请求
0
合并请求
0
Pages
分析
分析
仓库分析
DevOps
Wiki
0
Wiki
成员
成员
收起侧边栏
关闭侧边栏
动态
分支图
创建新Issue
提交
Issue看板
未验证
提交
e3f8e5cf
编写于
8月 28, 2020
作者:
P
Pei Yang
提交者:
GitHub
8月 28, 2020
浏览文件
操作
浏览文件
下载
电子邮件补丁
差异文件
trt int8 support conv2d_transpose (#26636)
上级
30aab177
变更
3
显示空白变更内容
内联
并排
Showing
3 changed file
with
29 addition
and
10 deletion
+29
-10
paddle/fluid/framework/ir/quant_conv2d_dequant_fuse_pass.cc
paddle/fluid/framework/ir/quant_conv2d_dequant_fuse_pass.cc
+21
-9
paddle/fluid/inference/tensorrt/convert/conv2d_op.cc
paddle/fluid/inference/tensorrt/convert/conv2d_op.cc
+7
-1
python/paddle/fluid/contrib/slim/quantization/quantization_pass.py
...ddle/fluid/contrib/slim/quantization/quantization_pass.py
+1
-0
未找到文件。
paddle/fluid/framework/ir/quant_conv2d_dequant_fuse_pass.cc
浏览文件 @
e3f8e5cf
...
...
@@ -81,7 +81,8 @@ void DeleteQuant(ir::Graph* graph, Scope* scope,
if
(
quantized_op_type
==
"conv2d"
||
quantized_op_type
==
"conv2d_fusion"
||
quantized_op_type
==
"depthwise_conv2d"
||
quantized_op_type
==
"fc"
)
{
quantized_op_type
==
"fc"
||
quantized_op_type
==
"conv2d_transpose"
)
{
op_desc
->
SetAttr
(
"Input_scale"
,
scale_value
);
}
else
if
(
quantized_op_type
==
"mul"
)
{
op_desc
->
SetAttr
(
"X_scale"
,
scale_value
);
...
...
@@ -111,7 +112,8 @@ void FuseDequant(ir::Graph* graph, Scope* scope,
std
::
string
input_name
=
""
;
if
(
quantized_op_type
==
"conv2d"
||
quantized_op_type
==
"depthwise_conv2d"
||
quantized_op_type
==
"conv2d_fusion"
)
{
quantized_op_type
==
"conv2d_fusion"
||
quantized_op_type
==
"conv2d_transpose"
)
{
weight_name
=
"Filter"
;
input_name
=
"Input"
;
}
else
if
(
quantized_op_type
==
"mul"
)
{
...
...
@@ -122,7 +124,8 @@ void FuseDequant(ir::Graph* graph, Scope* scope,
input_name
=
"Input"
;
}
else
{
PADDLE_THROW
(
platform
::
errors
::
Unimplemented
(
"QuantDequantFuse: We only support conv2d, conv2d_fusion, fc, mul for "
"QuantDequantFuse: We only support conv2d, conv2d_fusion, "
"conv2d_transpose, fc, mul for "
"now."
));
}
const
std
::
string
pattern_name
=
"dequant_fuse"
;
...
...
@@ -192,10 +195,12 @@ void FuseDequant(ir::Graph* graph, Scope* scope,
scope
->
Var
(
quantized_op_weight_node
->
Name
())
->
GetMutable
<
LoDTensor
>
();
auto
w_dims
=
weight_tensor
->
dims
();
// If quantized op is fc, weight scale size = 1;
// If quantized op is conv, weight scale size = weight dims[0]
// If quantized op is conv2d, weight scale size = weight dims[0]
// If quantized op is conv2d_transpose, weight scale size = weight dims[1]
bool
valid_scale_size
=
(
weight_scale
.
size
()
==
1
||
weight_scale
.
size
()
==
static_cast
<
size_t
>
(
w_dims
[
0
]));
weight_scale
.
size
()
==
static_cast
<
size_t
>
(
w_dims
[
0
])
||
weight_scale
.
size
()
==
static_cast
<
size_t
>
(
w_dims
[
1
]));
PADDLE_ENFORCE_EQ
(
valid_scale_size
,
true
,
platform
::
errors
::
InvalidArgument
(
...
...
@@ -205,11 +210,17 @@ void FuseDequant(ir::Graph* graph, Scope* scope,
for
(
int
j
=
0
;
j
<
weight_tensor
->
numel
();
j
++
)
{
if
(
weight_scale
.
size
()
==
1
)
{
quantized_weight_data
[
j
]
*=
weight_scale
[
0
];
}
else
{
if
(
quantized_op_type
==
"conv2d_transpose"
)
{
int
inner_size
=
w_dims
[
2
]
*
w_dims
[
3
];
quantized_weight_data
[
j
]
*=
weight_scale
[(
j
/
inner_size
)
%
w_dims
[
1
]];
}
else
{
int
inner_size
=
w_dims
[
1
]
*
w_dims
[
2
]
*
w_dims
[
3
];
quantized_weight_data
[
j
]
*=
weight_scale
[
j
/
inner_size
];
}
}
}
// create new op_desc
auto
base_op_desc
=
*
quantized_op_node
->
Op
()
->
Proto
();
...
...
@@ -220,7 +231,8 @@ void FuseDequant(ir::Graph* graph, Scope* scope,
new_op_desc
.
SetType
(
quantized_op_type
);
new_op_desc
.
SetAttr
(
"enable_int8"
,
true
);
if
(
quantized_op_type
==
"conv2d"
||
quantized_op_type
==
"conv2d_fusion"
||
quantized_op_type
==
"depthwise_conv2d"
)
{
quantized_op_type
==
"depthwise_conv2d"
||
quantized_op_type
==
"conv2d_transpose"
)
{
new_op_desc
.
SetInput
(
"Input"
,
{
new_input
});
new_op_desc
.
SetOutput
(
"Output"
,
{
new_output
});
}
else
if
(
quantized_op_type
==
"fc"
)
{
...
...
@@ -253,7 +265,7 @@ void QuantDequantFusePass::ApplyImpl(ir::Graph* graph) const {
std
::
unordered_set
<
std
::
string
>
quant_types
=
{
"fake_quantize_range_abs_max"
,
"fake_quantize_moving_average_abs_max"
};
std
::
unordered_set
<
std
::
string
>
quantized_op_types
=
{
"conv2d"
,
"mul"
,
"depthwise_conv2d"
,
"fc"
};
"conv2d"
,
"mul"
,
"depthwise_conv2d"
,
"fc"
,
"conv2d_transpose"
};
auto
*
scope
=
param_scope
();
for
(
auto
&
quant_type
:
quant_types
)
{
...
...
paddle/fluid/inference/tensorrt/convert/conv2d_op.cc
浏览文件 @
e3f8e5cf
...
...
@@ -51,7 +51,13 @@ void ConvertConv2d(TensorRTEngine* engine, const framework::proto::OpDesc& op,
if
(
enable_int8
)
{
#if IS_TRT_VERSION_GE(5000)
CHECK
(
op_desc
.
HasAttr
(
"Input_scale"
));
if
(
op_desc
.
Type
()
!=
"conv2d_transpose"
)
{
PADDLE_ENFORCE_EQ
(
op_desc
.
HasAttr
(
"Input_scale"
),
true
,
platform
::
errors
::
InvalidArgument
(
"Input scale not found. TRT int8"
" requires conv/deconv to have "
"input quantization scales."
));
}
float
in_scale
=
BOOST_GET_CONST
(
float
,
op_desc
.
GetAttr
(
"Input_scale"
))
*
127
;
auto
weight_scale
=
...
...
python/paddle/fluid/contrib/slim/quantization/quantization_pass.py
浏览文件 @
e3f8e5cf
...
...
@@ -68,6 +68,7 @@ _out_scale_op_list = [
"scale"
,
"hard_swish"
,
"hard_sigmoid"
,
"conv2d_transpose"
,
]
# list op real input and output names, to avoid processing input such as AxisTensor.
...
...
编辑
预览
Markdown
is supported
0%
请重试
或
添加新附件
.
添加附件
取消
You are about to add
0
people
to the discussion. Proceed with caution.
先完成此消息的编辑!
取消
想要评论请
注册
或
登录