Skip to content
体验新版
项目
组织
正在加载...
登录
切换导航
打开侧边栏
PaddlePaddle
Paddle
提交
ed7956a8
P
Paddle
项目概览
PaddlePaddle
/
Paddle
大约 1 年 前同步成功
通知
2299
Star
20931
Fork
5422
代码
文件
提交
分支
Tags
贡献者
分支图
Diff
Issue
1423
列表
看板
标记
里程碑
合并请求
543
Wiki
0
Wiki
分析
仓库
DevOps
项目成员
Pages
P
Paddle
项目概览
项目概览
详情
发布
仓库
仓库
文件
提交
分支
标签
贡献者
分支图
比较
Issue
1,423
Issue
1,423
列表
看板
标记
里程碑
合并请求
543
合并请求
543
Pages
分析
分析
仓库分析
DevOps
Wiki
0
Wiki
成员
成员
收起侧边栏
关闭侧边栏
动态
分支图
创建新Issue
提交
Issue看板
未验证
提交
ed7956a8
编写于
3月 21, 2021
作者:
G
guofei
提交者:
GitHub
3月 21, 2021
浏览文件
操作
浏览文件
下载
电子邮件补丁
差异文件
Fix skip_quant in QAT (#31704)
* Fix skip_quant in QAT
上级
8c19d7aa
变更
4
隐藏空白更改
内联
并排
Showing
4 changed file
with
60 addition
and
7 deletion
+60
-7
python/paddle/fluid/contrib/slim/quantization/imperative/qat.py
.../paddle/fluid/contrib/slim/quantization/imperative/qat.py
+35
-3
python/paddle/fluid/contrib/slim/quantization/imperative/utils.py
...addle/fluid/contrib/slim/quantization/imperative/utils.py
+6
-0
python/paddle/fluid/contrib/slim/tests/test_imperative_out_scale.py
...dle/fluid/contrib/slim/tests/test_imperative_out_scale.py
+7
-0
python/paddle/fluid/contrib/slim/tests/test_imperative_skip_op.py
...addle/fluid/contrib/slim/tests/test_imperative_skip_op.py
+12
-4
未找到文件。
python/paddle/fluid/contrib/slim/quantization/imperative/qat.py
浏览文件 @
ed7956a8
...
@@ -515,6 +515,8 @@ class ImperativeCalcOutputScale(object):
...
@@ -515,6 +515,8 @@ class ImperativeCalcOutputScale(object):
self
.
_out_scale_dict
[
ops_list
[
op_count
]])
self
.
_out_scale_dict
[
ops_list
[
op_count
]])
op_count
+=
1
op_count
+=
1
self
.
_set_skip_quant_attr
(
inference_program
)
# save the final quantized model that has output scales
# save the final quantized model that has output scales
save_inference_model
(
save_inference_model
(
dirname
=
dirname
,
dirname
=
dirname
,
...
@@ -537,9 +539,12 @@ class ImperativeCalcOutputScale(object):
...
@@ -537,9 +539,12 @@ class ImperativeCalcOutputScale(object):
Init the scale params for calculating output scales and save them in the
Init the scale params for calculating output scales and save them in the
target layer.
target layer.
After the users define the dygraph model, the hooks for calculating output
After the users define the dygraph model, the hooks for calculating output
scales will not execute immediately. If the users load the checkpoint now,
scales will not execute immediately. If the users load parameters from
the scale params have not been created, so they can't be loaded.
checkpoint and save the quantized inference model immediately, the inference
Therefore, define the scale params in the beginning.
model would not be saved successfully. Because the dygraph_to_static requires
that the parameters be created in __init__, but the uniqueness of hook makes it
impossible to create parameters in __init__. To avoid this mistake, we define
the scale parameters in the beginning instead of hook.
"""
"""
def
_create_param
(
in_layer
,
first_name
,
last_name
,
dtype
):
def
_create_param
(
in_layer
,
first_name
,
last_name
,
dtype
):
...
@@ -587,6 +592,33 @@ class ImperativeCalcOutputScale(object):
...
@@ -587,6 +592,33 @@ class ImperativeCalcOutputScale(object):
op_type
=
op_type
.
replace
(
'relu'
,
're_lu'
)
op_type
=
op_type
.
replace
(
'relu'
,
're_lu'
)
return
op_type
in
layer_name
return
op_type
in
layer_name
def
_set_skip_quant_attr
(
self
,
program
):
block
=
program
.
global_block
()
for
op
in
block
.
ops
:
if
self
.
_is_skip_quant_op
(
block
,
op
):
op
.
_set_attr
(
"skip_quant"
,
True
)
def
_is_skip_quant_op
(
self
,
block
,
in_op
):
"""
The input op should skip quantization when both conditions hold:
1. the type of input op should be conv2d, depthwise_conv2d or matmul
2. the previous ops of the input op are not fake_quantize_dequantize ops
"""
def
_find_previous_op
(
block
,
var_name
):
for
op
in
block
.
ops
:
if
var_name
in
op
.
output_arg_names
:
return
op
target_op_types
=
[
"conv2d"
,
"depthwise_conv2d"
,
"matmul"
]
if
in_op
.
type
not
in
target_op_types
:
return
False
previous_ops
=
[
_find_previous_op
(
block
,
arg_name
)
\
for
arg_name
in
in_op
.
input_arg_names
]
return
any
(
op
is
not
None
and
op
.
type
not
in
utils
.
fake_quantize_dequantize_types
\
for
op
in
previous_ops
)
def
_calc_output_scale_hook
(
self
,
layer
,
input
,
output
):
def
_calc_output_scale_hook
(
self
,
layer
,
input
,
output
):
"""
"""
Create the MovingAverageAbsMaxScale layer for the target layer if needed.
Create the MovingAverageAbsMaxScale layer for the target layer if needed.
...
...
python/paddle/fluid/contrib/slim/quantization/imperative/utils.py
浏览文件 @
ed7956a8
...
@@ -52,6 +52,12 @@ supported_quant_layers_map = {
...
@@ -52,6 +52,12 @@ supported_quant_layers_map = {
'LayerNorm'
:
paddle
.
nn
.
LayerNorm
,
'LayerNorm'
:
paddle
.
nn
.
LayerNorm
,
}
}
fake_quantize_dequantize_types
=
[
"fake_quantize_dequantize_abs_max"
,
"fake_quantize_dequantize_channel_wise_abs_max"
,
"fake_quantize_dequantize_moving_average_abs_max"
]
out_scale_layers_list
=
(
out_scale_layers_list
=
(
paddle
.
nn
.
Conv2D
,
paddle
.
nn
.
Linear
,
paddle
.
nn
.
MaxPool2D
,
paddle
.
nn
.
Conv2D
,
paddle
.
nn
.
Linear
,
paddle
.
nn
.
MaxPool2D
,
paddle
.
nn
.
BatchNorm
,
paddle
.
nn
.
BatchNorm2D
,
paddle
.
nn
.
SyncBatchNorm
,
paddle
.
nn
.
BatchNorm
,
paddle
.
nn
.
BatchNorm2D
,
paddle
.
nn
.
SyncBatchNorm
,
...
...
python/paddle/fluid/contrib/slim/tests/test_imperative_out_scale.py
浏览文件 @
ed7956a8
...
@@ -393,12 +393,16 @@ class TestImperativeOutSclae(unittest.TestCase):
...
@@ -393,12 +393,16 @@ class TestImperativeOutSclae(unittest.TestCase):
if
'fake'
in
op
.
type
:
if
'fake'
in
op
.
type
:
static_ops
.
remove
(
op
)
static_ops
.
remove
(
op
)
op_count
=
0
for
i
in
range
(
len
(
dynamic_ops
)):
for
i
in
range
(
len
(
dynamic_ops
)):
if
dynamic_ops
[
i
].
has_attr
(
"out_threshold"
):
if
dynamic_ops
[
i
].
has_attr
(
"out_threshold"
):
op_count
+=
1
self
.
assertTrue
(
dynamic_ops
[
i
].
type
==
static_ops
[
i
].
type
)
self
.
assertTrue
(
dynamic_ops
[
i
].
type
==
static_ops
[
i
].
type
)
self
.
assertTrue
(
dynamic_ops
[
i
].
attr
(
"out_threshold"
)
==
self
.
assertTrue
(
dynamic_ops
[
i
].
attr
(
"out_threshold"
)
==
static_ops
[
i
].
attr
(
"out_threshold"
))
static_ops
[
i
].
attr
(
"out_threshold"
))
self
.
assertTrue
(
op_count
==
13
)
class
TestSaveQuanztizedModelFromCheckPoint
(
unittest
.
TestCase
):
class
TestSaveQuanztizedModelFromCheckPoint
(
unittest
.
TestCase
):
def
test_save_quantized_model
(
self
):
def
test_save_quantized_model
(
self
):
...
@@ -459,11 +463,14 @@ class TestSaveQuanztizedModelFromCheckPoint(unittest.TestCase):
...
@@ -459,11 +463,14 @@ class TestSaveQuanztizedModelFromCheckPoint(unittest.TestCase):
if
'fake'
in
op
.
type
:
if
'fake'
in
op
.
type
:
static_ops
.
remove
(
op
)
static_ops
.
remove
(
op
)
op_count
=
0
for
i
in
range
(
len
(
dynamic_ops
)):
for
i
in
range
(
len
(
dynamic_ops
)):
if
dynamic_ops
[
i
].
has_attr
(
"out_threshold"
):
if
dynamic_ops
[
i
].
has_attr
(
"out_threshold"
):
op_count
+=
1
self
.
assertTrue
(
dynamic_ops
[
i
].
type
==
static_ops
[
i
].
type
)
self
.
assertTrue
(
dynamic_ops
[
i
].
type
==
static_ops
[
i
].
type
)
self
.
assertTrue
(
dynamic_ops
[
i
].
attr
(
"out_threshold"
)
==
self
.
assertTrue
(
dynamic_ops
[
i
].
attr
(
"out_threshold"
)
==
static_ops
[
i
].
attr
(
"out_threshold"
))
static_ops
[
i
].
attr
(
"out_threshold"
))
self
.
assertTrue
(
op_count
==
13
)
class
TestSaveQuantizedModel_Warning
(
unittest
.
TestCase
):
class
TestSaveQuantizedModel_Warning
(
unittest
.
TestCase
):
...
...
python/paddle/fluid/contrib/slim/tests/test_imperative_skip_op.py
浏览文件 @
ed7956a8
...
@@ -200,9 +200,12 @@ class TestImperativeOutSclae(unittest.TestCase):
...
@@ -200,9 +200,12 @@ class TestImperativeOutSclae(unittest.TestCase):
params_filename
=
"lenet"
+
INFER_PARAMS_SUFFIX
))
params_filename
=
"lenet"
+
INFER_PARAMS_SUFFIX
))
model_ops
=
inference_program
.
global_block
().
ops
model_ops
=
inference_program
.
global_block
().
ops
conv2d_count
,
mul_count
=
0
,
0
conv2d_count
,
matmul_count
=
0
,
0
conv2d_skip_count
,
matmul_skip_count
=
0
,
0
for
i
,
op
in
enumerate
(
model_ops
):
for
i
,
op
in
enumerate
(
model_ops
):
if
op
.
type
==
'conv2d'
:
if
op
.
type
==
'conv2d'
:
if
op
.
has_attr
(
"skip_quant"
):
conv2d_skip_count
+=
1
if
conv2d_count
>
0
:
if
conv2d_count
>
0
:
self
.
assertTrue
(
self
.
assertTrue
(
'fake_quantize_dequantize'
in
model_ops
[
i
-
1
].
type
)
'fake_quantize_dequantize'
in
model_ops
[
i
-
1
].
type
)
...
@@ -211,14 +214,19 @@ class TestImperativeOutSclae(unittest.TestCase):
...
@@ -211,14 +214,19 @@ class TestImperativeOutSclae(unittest.TestCase):
'fake_quantize_dequantize'
not
in
model_ops
[
i
-
1
].
type
)
'fake_quantize_dequantize'
not
in
model_ops
[
i
-
1
].
type
)
conv2d_count
+=
1
conv2d_count
+=
1
if
op
.
type
==
'mul'
:
if
op
.
type
==
'matmul'
:
if
mul_count
>
0
:
if
op
.
has_attr
(
"skip_quant"
):
matmul_skip_count
+=
1
if
matmul_count
>
0
:
self
.
assertTrue
(
self
.
assertTrue
(
'fake_quantize_dequantize'
in
model_ops
[
i
-
1
].
type
)
'fake_quantize_dequantize'
in
model_ops
[
i
-
1
].
type
)
else
:
else
:
self
.
assertTrue
(
self
.
assertTrue
(
'fake_quantize_dequantize'
not
in
model_ops
[
i
-
1
].
type
)
'fake_quantize_dequantize'
not
in
model_ops
[
i
-
1
].
type
)
mul_count
+=
1
matmul_count
+=
1
self
.
assertTrue
(
conv2d_skip_count
==
1
)
self
.
assertTrue
(
matmul_skip_count
==
1
)
if
__name__
==
'__main__'
:
if
__name__
==
'__main__'
:
...
...
编辑
预览
Markdown
is supported
0%
请重试
或
添加新附件
.
添加附件
取消
You are about to add
0
people
to the discussion. Proceed with caution.
先完成此消息的编辑!
取消
想要评论请
注册
或
登录