Skip to content
体验新版
项目
组织
正在加载...
登录
切换导航
打开侧边栏
BaiXuePrincess
Paddle
提交
42d2915a
P
Paddle
项目概览
BaiXuePrincess
/
Paddle
与 Fork 源项目一致
Fork自
PaddlePaddle / Paddle
通知
1
Star
1
Fork
0
代码
文件
提交
分支
Tags
贡献者
分支图
Diff
Issue
0
列表
看板
标记
里程碑
合并请求
0
Wiki
0
Wiki
分析
仓库
DevOps
项目成员
Pages
P
Paddle
项目概览
项目概览
详情
发布
仓库
仓库
文件
提交
分支
标签
贡献者
分支图
比较
Issue
0
Issue
0
列表
看板
标记
里程碑
合并请求
0
合并请求
0
Pages
分析
分析
仓库分析
DevOps
Wiki
0
Wiki
成员
成员
收起侧边栏
关闭侧边栏
动态
分支图
创建新Issue
提交
Issue看板
未验证
提交
42d2915a
编写于
8月 28, 2020
作者:
C
ceci3
提交者:
GitHub
8月 28, 2020
浏览文件
操作
浏览文件
下载
电子邮件补丁
差异文件
[2.0 API] add SyncBatchNorm.convert_sync_batch_norm (#26688)
* add cnvert,test=develop
上级
68e0560c
变更
4
隐藏空白更改
内联
并排
Showing
4 changed file
with
117 addition
and
77 deletion
+117
-77
python/paddle/fluid/tests/unittests/test_batch_norm_op_v2.py
python/paddle/fluid/tests/unittests/test_batch_norm_op_v2.py
+25
-0
python/paddle/fluid/tests/unittests/test_layers.py
python/paddle/fluid/tests/unittests/test_layers.py
+1
-1
python/paddle/fluid/tests/unittests/test_sync_batch_norm_op.py
...n/paddle/fluid/tests/unittests/test_sync_batch_norm_op.py
+16
-0
python/paddle/nn/layer/norm.py
python/paddle/nn/layer/norm.py
+75
-76
未找到文件。
python/paddle/fluid/tests/unittests/test_batch_norm_op_v2.py
浏览文件 @
42d2915a
...
@@ -85,10 +85,35 @@ class TestBatchNorm(unittest.TestCase):
...
@@ -85,10 +85,35 @@ class TestBatchNorm(unittest.TestCase):
y
=
bn
(
fluid
.
dygraph
.
to_variable
(
x
))
y
=
bn
(
fluid
.
dygraph
.
to_variable
(
x
))
return
y
.
numpy
()
return
y
.
numpy
()
def compute_v3(x, is_test, trainable_statistics):
    """Run ``x`` through ``fluid.dygraph.BatchNorm`` with frozen constant scale/shift.

    The scale is initialised to 1.0 and the bias to 0.0, both marked
    non-trainable. ``p`` and ``shape`` are taken from the enclosing scope.
    Returns the layer output as a numpy array.
    """
    with fluid.dygraph.guard(p):
        # Non-trainable scale fixed at 1.0.
        scale_attr = fluid.ParamAttr(
            initializer=fluid.initializer.Constant(1.0), trainable=False)
        # Non-trainable bias fixed at 0.0.
        shift_attr = fluid.ParamAttr(
            initializer=fluid.initializer.Constant(0.0), trainable=False)
        bn = fluid.dygraph.BatchNorm(
            shape[1],
            is_test=is_test,
            param_attr=scale_attr,
            bias_attr=shift_attr,
            trainable_statistics=trainable_statistics)
        inputs = fluid.dygraph.to_variable(x)
        y = bn(inputs)
    return y.numpy()
def compute_v4(x):
    """Run ``x`` through ``paddle.nn.BatchNorm2d`` built with ``weight_attr=False`` and ``bias_attr=False``.

    ``p`` and ``shape`` are taken from the enclosing scope.
    Returns the layer output as a numpy array.
    """
    with fluid.dygraph.guard(p):
        num_channels = shape[1]
        bn = paddle.nn.BatchNorm2d(
            num_channels, weight_attr=False, bias_attr=False)
        inputs = fluid.dygraph.to_variable(x)
        y = bn(inputs)
    return y.numpy()
x
=
np
.
random
.
randn
(
*
shape
).
astype
(
"float32"
)
x
=
np
.
random
.
randn
(
*
shape
).
astype
(
"float32"
)
y1
=
compute_v1
(
x
,
False
,
False
)
y1
=
compute_v1
(
x
,
False
,
False
)
y2
=
compute_v2
(
x
)
y2
=
compute_v2
(
x
)
y3
=
compute_v3
(
x
,
False
,
False
)
y4
=
compute_v4
(
x
)
self
.
assertTrue
(
np
.
allclose
(
y1
,
y2
))
self
.
assertTrue
(
np
.
allclose
(
y1
,
y2
))
self
.
assertTrue
(
np
.
allclose
(
y3
,
y4
))
def
test_static
(
self
):
def
test_static
(
self
):
places
=
[
fluid
.
CPUPlace
()]
places
=
[
fluid
.
CPUPlace
()]
...
...
python/paddle/fluid/tests/unittests/test_layers.py
浏览文件 @
42d2915a
...
@@ -299,7 +299,7 @@ class TestLayer(LayerTest):
...
@@ -299,7 +299,7 @@ class TestLayer(LayerTest):
my_syncbn
=
paddle
.
nn
.
SyncBatchNorm
(
3
)
my_syncbn
=
paddle
.
nn
.
SyncBatchNorm
(
3
)
dy_ret
=
my_syncbn
(
base
.
to_variable
(
t
))
dy_ret
=
my_syncbn
(
base
.
to_variable
(
t
))
dy_ret_value
=
dy_ret
.
numpy
()
dy_ret_value
=
dy_ret
.
numpy
()
self
.
assertTrue
(
np
.
array_equal
(
static_ret
,
static_ret
))
self
.
assertTrue
(
np
.
array_equal
(
static_ret
,
dy_ret_value
))
def
test_relu
(
self
):
def
test_relu
(
self
):
with
self
.
static_graph
():
with
self
.
static_graph
():
...
...
python/paddle/fluid/tests/unittests/test_sync_batch_norm_op.py
浏览文件 @
42d2915a
...
@@ -221,5 +221,21 @@ class TestDygraphSyncBatchNormAPIError(unittest.TestCase):
...
@@ -221,5 +221,21 @@ class TestDygraphSyncBatchNormAPIError(unittest.TestCase):
self
.
assertRaises
(
TypeError
,
my_sync_batch_norm
,
x2
)
self
.
assertRaises
(
TypeError
,
my_sync_batch_norm
,
x2
)
class TestConvertSyncBatchNorm(unittest.TestCase):
    """Checks that ``SyncBatchNorm.convert_sync_batchnorm`` replaces BatchNorm layers."""

    def test_convert(self):
        """Every ``BatchNorm2d`` in the model must become a ``SyncBatchNorm``."""
        # This test only runs on CUDA builds; otherwise it returns early.
        if not core.is_compiled_with_cuda():
            return

        with program_guard(Program(), Program()):
            model = paddle.nn.Sequential(
                paddle.nn.Conv2d(3, 5, 3), paddle.nn.BatchNorm2d(5))

            # Record the BatchNorm positions BEFORE converting: the conversion
            # returns the same container with its sublayers swapped in place,
            # so scanning `model` afterwards would find no BatchNorm2d and the
            # assertions below would never execute.
            bn_indices = [
                idx for idx, sublayer in enumerate(model.sublayers())
                if isinstance(sublayer, paddle.nn.BatchNorm2d)
            ]
            self.assertTrue(bn_indices)

            sync_model = paddle.nn.SyncBatchNorm.convert_sync_batchnorm(model)
            for idx in bn_indices:
                self.assertIsInstance(sync_model[idx],
                                      paddle.nn.SyncBatchNorm)
if
__name__
==
'__main__'
:
if
__name__
==
'__main__'
:
unittest
.
main
()
unittest
.
main
()
python/paddle/nn/layer/norm.py
浏览文件 @
42d2915a
...
@@ -27,6 +27,7 @@
...
@@ -27,6 +27,7 @@
# TODO: define normalization api
# TODO: define normalization api
import
six
from
...fluid.dygraph.nn
import
InstanceNorm
from
...fluid.dygraph.nn
import
InstanceNorm
from
...fluid.dygraph
import
BatchNorm
#DEFINE_ALIAS
from
...fluid.dygraph
import
BatchNorm
#DEFINE_ALIAS
...
@@ -36,7 +37,6 @@ from ...fluid.dygraph import BatchNorm #DEFINE_ALIAS
...
@@ -36,7 +37,6 @@ from ...fluid.dygraph import BatchNorm #DEFINE_ALIAS
from
...fluid.dygraph
import
SpectralNorm
#DEFINE_ALIAS
from
...fluid.dygraph
import
SpectralNorm
#DEFINE_ALIAS
from
...fluid.dygraph
import
layers
from
...fluid.dygraph
import
layers
from
...framework
import
get_default_dtype
,
set_default_dtype
from
...framework
import
get_default_dtype
,
set_default_dtype
from
...fluid.framework
import
in_dygraph_mode
from
...fluid.framework
import
in_dygraph_mode
...
@@ -50,6 +50,7 @@ from ..functional import batch_norm, layer_norm, instance_norm
...
@@ -50,6 +50,7 @@ from ..functional import batch_norm, layer_norm, instance_norm
import
numpy
as
np
import
numpy
as
np
import
numbers
import
numbers
import
warnings
import
warnings
from
...fluid.dygraph.base
import
no_grad
__all__
=
[
__all__
=
[
'BatchNorm'
,
'GroupNorm'
,
'LayerNorm'
,
'SpectralNorm'
,
'InstanceNorm'
,
'BatchNorm'
,
'GroupNorm'
,
'LayerNorm'
,
'SpectralNorm'
,
'InstanceNorm'
,
...
@@ -566,17 +567,28 @@ class _BatchNormBase(layers.Layer):
...
@@ -566,17 +567,28 @@ class _BatchNormBase(layers.Layer):
param_shape
=
[
num_features
]
param_shape
=
[
num_features
]
# create parameter
# create parameter
self
.
weight
=
self
.
create_parameter
(
if
weight_attr
==
False
:
attr
=
self
.
_weight_attr
,
self
.
weight
=
self
.
create_parameter
(
shape
=
param_shape
,
attr
=
None
,
shape
=
param_shape
,
default_initializer
=
Constant
(
1.0
))
default_initializer
=
Constant
(
1.0
))
self
.
weight
.
stop_gradient
=
True
self
.
weight
.
stop_gradient
=
(
self
.
_weight_attr
is
False
)
or
(
else
:
self
.
_weight_attr
and
self
.
_weight_attr
.
learning_rate
==
0.
)
self
.
weight
=
self
.
create_parameter
(
attr
=
self
.
_weight_attr
,
shape
=
param_shape
,
default_initializer
=
Constant
(
1.0
))
self
.
weight
.
stop_gradient
=
self
.
_weight_attr
!=
None
and
self
.
_weight_attr
.
learning_rate
==
0.
self
.
bias
=
self
.
create_parameter
(
if
bias_attr
==
False
:
attr
=
self
.
_bias_attr
,
shape
=
param_shape
,
is_bias
=
True
)
self
.
bias
=
self
.
create_parameter
(
self
.
bias
.
stop_gradient
=
(
self
.
_bias_attr
is
False
)
or
(
attr
=
None
,
self
.
_bias_attr
and
self
.
_bias_attr
.
learning_rate
==
0.
)
shape
=
param_shape
,
default_initializer
=
Constant
(
0.0
),
is_bias
=
True
)
self
.
bias
.
stop_gradient
=
True
else
:
self
.
bias
=
self
.
create_parameter
(
attr
=
self
.
_bias_attr
,
shape
=
param_shape
,
is_bias
=
True
)
self
.
bias
.
stop_gradient
=
self
.
_bias_attr
!=
None
and
self
.
_bias_attr
.
learning_rate
==
0.
moving_mean_name
=
None
moving_mean_name
=
None
moving_variance_name
=
None
moving_variance_name
=
None
...
@@ -611,6 +623,7 @@ class _BatchNormBase(layers.Layer):
...
@@ -611,6 +623,7 @@ class _BatchNormBase(layers.Layer):
self
.
_epsilon
=
epsilon
self
.
_epsilon
=
epsilon
self
.
_fuse_with_relu
=
False
self
.
_fuse_with_relu
=
False
self
.
_track_running_stats
=
track_running_stats
self
.
_track_running_stats
=
track_running_stats
self
.
_name
=
name
def
_check_input_dim
(
self
,
input
):
def
_check_input_dim
(
self
,
input
):
raise
NotImplementedError
(
"BatchNorm Base error"
)
raise
NotImplementedError
(
"BatchNorm Base error"
)
...
@@ -898,7 +911,7 @@ class BatchNorm3d(_BatchNormBase):
...
@@ -898,7 +911,7 @@ class BatchNorm3d(_BatchNormBase):
len
(
input
.
shape
)))
len
(
input
.
shape
)))
class
SyncBatchNorm
(
layers
.
Layer
):
class
SyncBatchNorm
(
_BatchNormBase
):
"""
"""
This interface is used to construct a callable object of the ``SyncBatchNorm`` class.
This interface is used to construct a callable object of the ``SyncBatchNorm`` class.
It implements the function of the Cross-GPU Synchronized Batch Normalization Layer, and can
It implements the function of the Cross-GPU Synchronized Batch Normalization Layer, and can
...
@@ -984,72 +997,16 @@ class SyncBatchNorm(layers.Layer):
...
@@ -984,72 +997,16 @@ class SyncBatchNorm(layers.Layer):
def
__init__
(
self
,
def
__init__
(
self
,
num_features
,
num_features
,
epsilon
=
1e-05
,
momentum
=
0.9
,
momentum
=
0.9
,
track_running_stats
=
True
,
epsilon
=
1e-05
,
weight_attr
=
None
,
weight_attr
=
None
,
bias_attr
=
None
,
bias_attr
=
None
,
data_format
=
'NCHW'
,
data_format
=
'NCHW'
,
track_running_stats
=
True
,
name
=
None
):
name
=
None
):
super
(
SyncBatchNorm
,
self
).
__init__
()
super
(
SyncBatchNorm
,
self
.
_weight_attr
=
weight_attr
self
).
__init__
(
num_features
,
momentum
,
epsilon
,
weight_attr
,
self
.
_bias_attr
=
bias_attr
bias_attr
,
data_format
,
track_running_stats
,
name
)
self
.
_num_features
=
num_features
self
.
_data_layout
=
data_format
self
.
_momentum
=
momentum
self
.
_epsilon
=
epsilon
self
.
_track_running_stats
=
track_running_stats
if
self
.
_track_running_stats
==
False
:
warnings
.
warn
(
"moving mean and moving variance will be calculated whether `track_running_stats` is set to `True` or `False`, we will fix it in the next version."
)
param_shape
=
[
self
.
_num_features
]
# create parameter
if
weight_attr
==
False
:
self
.
weight
=
self
.
create_parameter
(
attr
=
None
,
shape
=
param_shape
,
default_initializer
=
Constant
(
1.0
))
self
.
weight
.
stop_gradient
=
True
else
:
self
.
weight
=
self
.
create_parameter
(
attr
=
self
.
_weight_attr
,
shape
=
param_shape
,
default_initializer
=
Constant
(
1.0
))
self
.
weight
.
stop_gradient
=
self
.
_weight_attr
!=
None
and
self
.
_weight_attr
.
learning_rate
==
0.
if
bias_attr
==
False
:
self
.
bias
=
self
.
create_parameter
(
attr
=
None
,
shape
=
param_shape
,
default_initializer
=
Constant
(
0.0
),
is_bias
=
True
)
self
.
bias
.
stop_gradient
=
True
else
:
self
.
bias
=
self
.
create_parameter
(
attr
=
self
.
_bias_attr
,
shape
=
param_shape
,
is_bias
=
True
)
self
.
bias
.
stop_gradient
=
self
.
_weight_attr
!=
None
and
self
.
_weight_attr
.
learning_rate
==
0.
self
.
_mean
=
self
.
create_parameter
(
attr
=
ParamAttr
(
name
=
None
,
initializer
=
Constant
(
0.0
),
trainable
=
False
,
do_model_average
=
True
),
shape
=
param_shape
,
dtype
=
self
.
_dtype
)
self
.
_mean
.
stop_gradient
=
True
self
.
_variance
=
self
.
create_parameter
(
attr
=
ParamAttr
(
name
=
None
,
initializer
=
Constant
(
1.0
),
trainable
=
False
,
do_model_average
=
True
),
shape
=
param_shape
,
dtype
=
self
.
_dtype
)
self
.
_variance
.
stop_gradient
=
True
def
forward
(
self
,
x
):
def
forward
(
self
,
x
):
# create output
# create output
...
@@ -1063,7 +1020,7 @@ class SyncBatchNorm(layers.Layer):
...
@@ -1063,7 +1020,7 @@ class SyncBatchNorm(layers.Layer):
if
in_dygraph_mode
():
if
in_dygraph_mode
():
attrs
=
(
"momentum"
,
self
.
_momentum
,
"epsilon"
,
self
.
_epsilon
,
attrs
=
(
"momentum"
,
self
.
_momentum
,
"epsilon"
,
self
.
_epsilon
,
"is_test"
,
not
self
.
training
,
"data_layout"
,
"is_test"
,
not
self
.
training
,
"data_layout"
,
self
.
_data_
layou
t
,
"use_mkldnn"
,
False
,
"fuse_with_relu"
,
self
.
_data_
forma
t
,
"use_mkldnn"
,
False
,
"fuse_with_relu"
,
False
,
"use_global_stats"
,
False
,
'trainable_statistics'
,
False
,
"use_global_stats"
,
False
,
'trainable_statistics'
,
False
)
False
)
sync_batch_norm_out
,
_
,
_
,
_
,
_
,
_
=
core
.
ops
.
sync_batch_norm
(
sync_batch_norm_out
,
_
,
_
,
_
,
_
,
_
=
core
.
ops
.
sync_batch_norm
(
...
@@ -1073,13 +1030,13 @@ class SyncBatchNorm(layers.Layer):
...
@@ -1073,13 +1030,13 @@ class SyncBatchNorm(layers.Layer):
return
sync_batch_norm_out
return
sync_batch_norm_out
check_variable_and_dtype
(
x
,
'input'
,
[
'float16'
,
'float32'
,
'float64'
],
check_variable_and_dtype
(
x
,
'input'
,
[
'float16'
,
'float32'
,
'float64'
],
'BatchNorm'
)
'
Sync
BatchNorm'
)
attrs
=
{
attrs
=
{
"momentum"
:
self
.
_momentum
,
"momentum"
:
self
.
_momentum
,
"epsilon"
:
self
.
_epsilon
,
"epsilon"
:
self
.
_epsilon
,
"is_test"
:
not
self
.
training
,
"is_test"
:
not
self
.
training
,
"data_layout"
:
self
.
_data_
layou
t
,
"data_layout"
:
self
.
_data_
forma
t
,
"use_mkldnn"
:
False
,
"use_mkldnn"
:
False
,
"fuse_with_relu"
:
False
,
"fuse_with_relu"
:
False
,
"use_global_stats"
:
False
,
"use_global_stats"
:
False
,
...
@@ -1112,3 +1069,45 @@ class SyncBatchNorm(layers.Layer):
...
@@ -1112,3 +1069,45 @@ class SyncBatchNorm(layers.Layer):
self
.
_helper
.
append_op
(
self
.
_helper
.
append_op
(
type
=
"sync_batch_norm"
,
inputs
=
inputs
,
outputs
=
outputs
,
attrs
=
attrs
)
type
=
"sync_batch_norm"
,
inputs
=
inputs
,
outputs
=
outputs
,
attrs
=
attrs
)
return
sync_batch_norm_out
return
sync_batch_norm_out
@classmethod
def convert_sync_batchnorm(cls, layer):
    """
    Helper function to convert :class:`paddle.nn.BatchNorm*d` layers in the model to :class:`paddle.nn.SyncBatchNorm` layers.

    Parameters:
        layer(paddle.nn.Layer): model containing one or more `BatchNorm*d` layers.

    Returns:
        The original model with converted SyncBatchNorm layers. Every `BatchNorm*d` layer found in the model is replaced by a SyncBatchNorm layer.

    Examples:

        .. code-block:: python

            import paddle
            import paddle.nn as nn

            paddle.disable_static()
            model = nn.Sequential(nn.Conv2d(3, 5, 3), nn.BatchNorm2d(5))
            sync_model = nn.SyncBatchNorm.convert_sync_batchnorm(model)

    """
    layer_output = layer
    if isinstance(layer, _BatchNormBase):
        # Pass everything after num_features by keyword: the constructor
        # order is (num_features, momentum, epsilon, weight_attr, bias_attr,
        # data_format, track_running_stats, name), so positional passing in
        # a different order silently swaps momentum/epsilon and feeds the
        # name into track_running_stats.
        layer_output = SyncBatchNorm(
            layer._num_features,
            momentum=layer._momentum,
            epsilon=layer._epsilon,
            weight_attr=layer._weight_attr,
            bias_attr=layer._bias_attr,
            data_format=layer._data_format,
            track_running_stats=layer._track_running_stats,
            name=layer._name)

        # Reuse the source layer's scale/shift only when both were created
        # from real attributes (i.e. neither was disabled with False).
        if layer._weight_attr != False and layer._bias_attr != False:
            with no_grad():
                layer_output.weight = layer.weight
                layer_output.bias = layer.bias
        # The running statistics are always carried over.
        layer_output._mean = layer._mean
        layer_output._variance = layer._variance

    # NOTE(review): if named_sublayers() yields nested descendants (dotted
    # names) rather than direct children only, deeper models may need this
    # loop restricted to direct children -- confirm against the Layer API.
    for name, sublayer in layer.named_sublayers():
        layer_output.add_sublayer(name, cls.convert_sync_batchnorm(sublayer))
    return layer_output
编辑
预览
Markdown
is supported
0%
请重试
或
添加新附件
.
添加附件
取消
You are about to add
0
people
to the discussion. Proceed with caution.
先完成此消息的编辑!
取消
想要评论请
注册
或
登录