Skip to content
体验新版
项目
组织
正在加载...
登录
切换导航
打开侧边栏
机器未来
Paddle
提交
a32d4200
P
Paddle
项目概览
机器未来
/
Paddle
与 Fork 源项目一致
Fork自
PaddlePaddle / Paddle
通知
1
Star
1
Fork
0
代码
文件
提交
分支
Tags
贡献者
分支图
Diff
Issue
1
列表
看板
标记
里程碑
合并请求
0
Wiki
0
Wiki
分析
仓库
DevOps
项目成员
Pages
P
Paddle
项目概览
项目概览
详情
发布
仓库
仓库
文件
提交
分支
标签
贡献者
分支图
比较
Issue
1
Issue
1
列表
看板
标记
里程碑
合并请求
0
合并请求
0
Pages
分析
分析
仓库分析
DevOps
Wiki
0
Wiki
成员
成员
收起侧边栏
关闭侧边栏
动态
分支图
创建新Issue
提交
Issue看板
提交
a32d4200
编写于
3月 07, 2019
作者:
F
flame
提交者:
nhzlx
3月 20, 2019
浏览文件
操作
浏览文件
下载
电子邮件补丁
差异文件
cherry-pick from feature/anakin-engine: batch norm (#16110)
* use anakin batch norm and scale implement fluid batch norm
上级
0945b97f
变更
2
隐藏空白更改
内联
并排
Showing
2 changed file
with
50 addition
and
48 deletion
+50
-48
paddle/fluid/inference/anakin/convert/batch_norm.cc
paddle/fluid/inference/anakin/convert/batch_norm.cc
+50
-47
paddle/fluid/inference/anakin/convert/test_batch_norm_op.cc
paddle/fluid/inference/anakin/convert/test_batch_norm_op.cc
+0
-1
未找到文件。
paddle/fluid/inference/anakin/convert/batch_norm.cc
浏览文件 @
a32d4200
...
@@ -41,16 +41,15 @@ void BatchNormOpConverter::operator()(const framework::proto::OpDesc &op,
...
@@ -41,16 +41,15 @@ void BatchNormOpConverter::operator()(const framework::proto::OpDesc &op,
auto
output
=
op_desc
.
Output
(
"Y"
).
front
();
auto
output
=
op_desc
.
Output
(
"Y"
).
front
();
auto
op_name
=
op_desc
.
Type
()
+
":"
+
op_desc
.
Output
(
"Y"
).
front
();
auto
op_name
=
op_desc
.
Type
()
+
":"
+
op_desc
.
Output
(
"Y"
).
front
();
engine_
->
AddOp
(
op_name
,
"Scale"
,
{
inputs
[
"X"
]},
{
output
});
engine_
->
AddOpAttr
(
op_name
,
"bias_term"
,
true
);
engine_
->
AddOpAttr
(
op_name
,
"axis"
,
1
);
engine_
->
AddOpAttr
(
op_name
,
"num_axes"
,
1
);
bool
is_test
=
boost
::
get
<
bool
>
(
op_desc
.
GetAttr
(
"is_test"
));
bool
is_test
=
boost
::
get
<
bool
>
(
op_desc
.
GetAttr
(
"is_test"
));
PADDLE_ENFORCE
(
is_test
);
auto
epsilon
=
boost
::
get
<
float
>
(
op_desc
.
GetAttr
(
"epsilon"
));
float
epsilon
=
boost
::
get
<
float
>
(
op_desc
.
GetAttr
(
"epsilon"
));
engine_
->
AddOpAttr
(
op_name
,
"epsilon"
,
epsilon
);
auto
bn_op_name
=
op_name
+
":bn"
;
auto
bn_output
=
bn_op_name
+
"_output"
;
engine_
->
AddOp
(
bn_op_name
,
"BatchNorm"
,
{
inputs
[
"X"
]},
{
bn_output
});
engine_
->
AddOpAttr
(
bn_op_name
,
"epsilon"
,
epsilon
);
auto
scale_op_name
=
op_name
+
":scale"
;
auto
get_lod_tensor
=
[
this
,
&
scope
,
&
op_name
](
const
std
::
string
&
var_name
,
auto
get_lod_tensor
=
[
this
,
&
scope
,
&
op_name
](
const
std
::
string
&
var_name
,
framework
::
LoDTensor
*
tensor
)
{
framework
::
LoDTensor
*
tensor
)
{
auto
*
v
=
scope
.
FindVar
(
var_name
);
auto
*
v
=
scope
.
FindVar
(
var_name
);
...
@@ -69,50 +68,54 @@ void BatchNormOpConverter::operator()(const framework::proto::OpDesc &op,
...
@@ -69,50 +68,54 @@ void BatchNormOpConverter::operator()(const framework::proto::OpDesc &op,
get_lod_tensor
(
inputs
[
"Scale"
],
&
scale_t
);
get_lod_tensor
(
inputs
[
"Scale"
],
&
scale_t
);
get_lod_tensor
(
inputs
[
"Variance"
],
&
variance_t
);
get_lod_tensor
(
inputs
[
"Variance"
],
&
variance_t
);
auto
*
bias
=
bias_t
.
mutable_data
<
float
>
(
platform
::
CPUPlace
());
auto
fill_shape
=
[](
size_t
n
,
std
::
vector
<
int
>
shape
)
{
auto
*
mean
=
mean_t
.
mutable_data
<
float
>
(
platform
::
CPUPlace
());
shape
.
insert
(
shape
.
begin
(),
1
);
auto
*
scale
=
scale_t
.
mutable_data
<
float
>
(
platform
::
CPUPlace
());
if
(
shape
.
size
()
<
n
)
{
auto
*
variance
=
variance_t
.
mutable_data
<
float
>
(
platform
::
CPUPlace
());
shape
.
insert
(
shape
.
end
(),
n
-
shape
.
size
(),
1
);
framework
::
LoDTensor
combile_scale_t
;
framework
::
LoDTensor
combile_bias_t
;
combile_scale_t
.
Resize
(
scale_t
.
dims
());
combile_bias_t
.
Resize
(
bias_t
.
dims
());
auto
*
combile_scale
=
combile_scale_t
.
mutable_data
<
float
>
(
platform
::
CPUPlace
());
auto
*
combile_bias
=
combile_bias_t
.
mutable_data
<
float
>
(
platform
::
CPUPlace
());
size_t
elem_num
=
combile_scale_t
.
memory_size
()
/
sizeof
(
float
);
for
(
size_t
i
=
0
;
i
<
elem_num
;
i
++
)
{
combile_scale
[
i
]
=
scale
[
i
]
/
sqrtf
(
variance
[
i
]
+
epsilon
);
combile_bias
[
i
]
=
bias
[
i
]
-
mean
[
i
]
*
combile_scale
[
i
];
}
auto
fill_shape
=
[](
size_t
n
,
std
::
vector
<
int
>
*
shape
)
{
shape
->
insert
(
shape
->
begin
(),
1
);
if
(
shape
->
size
()
<
n
)
{
shape
->
insert
(
shape
->
end
(),
n
-
shape
->
size
(),
1
);
}
}
return
shape
;
};
};
auto
scale_shape
=
framework
::
vectorize2int
(
combile_scale_t
.
dims
());
Shape
shape1
(
fill_shape
(
4
,
framework
::
vectorize2int
(
mean_t
.
dims
())));
auto
bias_shape
=
framework
::
vectorize2int
(
combile_bias_t
.
dims
());
Shape
shape2
(
fill_shape
(
4
,
framework
::
vectorize2int
(
variance_t
.
dims
())));
fill_shape
(
4
,
&
scale_shape
);
fill_shape
(
4
,
&
bias_shape
);
Shape
weight1_shape
(
scale_shape
);
Shape
weight2_shape
(
bias_shape
);
auto
*
weight1
=
auto
*
weight1
=
GraphGlobalMem
<
NV
>::
Global
().
template
new_block
<
AK_FLOAT
>(
weight1_shape
);
GraphGlobalMem
<
NV
>::
Global
().
template
new_block
<
AK_FLOAT
>(
shape1
);
auto
*
scale_data
=
static_cast
<
float
*>
(
weight1
->
h_tensor
().
mutable_data
());
auto
*
mean_data
=
static_cast
<
float
*>
(
weight1
->
h_tensor
().
mutable_data
());
std
::
copy_n
(
combile_scale_t
.
data
<
float
>
(),
combile_scale_t
.
numel
(),
std
::
copy_n
(
mean_t
.
data
<
float
>
(),
mean_t
.
numel
(),
mean_data
);
scale_data
);
engine_
->
AddOpAttr
(
bn_op_name
,
"weight_1"
,
*
weight1
);
engine_
->
AddOpAttr
(
op_name
,
"weight_1"
,
*
weight1
);
auto
*
weight2
=
auto
*
weight2
=
GraphGlobalMem
<
NV
>::
Global
().
template
new_block
<
AK_FLOAT
>(
weight2_shape
);
GraphGlobalMem
<
NV
>::
Global
().
template
new_block
<
AK_FLOAT
>(
shape2
);
auto
*
bias_data
=
static_cast
<
float
*>
(
weight2
->
h_tensor
().
mutable_data
());
auto
*
variance_data
=
std
::
copy_n
(
combile_bias_t
.
data
<
float
>
(),
combile_bias_t
.
numel
(),
bias_data
);
static_cast
<
float
*>
(
weight2
->
h_tensor
().
mutable_data
());
engine_
->
AddOpAttr
(
op_name
,
"weight_2"
,
*
weight2
);
std
::
copy_n
(
variance_t
.
data
<
float
>
(),
variance_t
.
numel
(),
variance_data
);
engine_
->
AddOpAttr
(
bn_op_name
,
"weight_2"
,
*
weight2
);
Shape
shape3
(
std
::
vector
<
int
>
({
1
,
1
,
1
,
1
}));
auto
*
weight3
=
GraphGlobalMem
<
NV
>::
Global
().
template
new_block
<
AK_FLOAT
>(
shape3
);
auto
*
alpha_data
=
static_cast
<
float
*>
(
weight3
->
h_tensor
().
mutable_data
());
float
weight3_data
[]
=
{
1
};
std
::
copy
(
std
::
begin
(
weight3_data
),
std
::
end
(
weight3_data
),
alpha_data
);
engine_
->
AddOpAttr
(
bn_op_name
,
"weight_3"
,
*
weight3
);
Shape
scale_shape
(
fill_shape
(
4
,
framework
::
vectorize2int
(
scale_t
.
dims
())));
auto
*
scale
=
GraphGlobalMem
<
NV
>::
Global
().
template
new_block
<
AK_FLOAT
>(
scale_shape
);
auto
*
scale_data
=
static_cast
<
float
*>
(
scale
->
h_tensor
().
mutable_data
());
std
::
copy_n
(
scale_t
.
data
<
float
>
(),
scale_t
.
numel
(),
scale_data
);
Shape
bias_shape
(
fill_shape
(
4
,
framework
::
vectorize2int
(
bias_t
.
dims
())));
auto
*
bias
=
GraphGlobalMem
<
NV
>::
Global
().
template
new_block
<
AK_FLOAT
>(
bias_shape
);
auto
*
bias_data
=
static_cast
<
float
*>
(
bias
->
h_tensor
().
mutable_data
());
std
::
copy_n
(
bias_t
.
data
<
float
>
(),
bias_t
.
numel
(),
bias_data
);
engine_
->
AddOp
(
scale_op_name
,
"Scale"
,
{
bn_output
},
{
output
});
engine_
->
AddOpAttr
(
scale_op_name
,
"axis"
,
1
);
engine_
->
AddOpAttr
(
scale_op_name
,
"num_axes"
,
1
);
engine_
->
AddOpAttr
(
scale_op_name
,
"bias_term"
,
true
);
engine_
->
AddOpAttr
(
scale_op_name
,
"weight_1"
,
*
scale
);
engine_
->
AddOpAttr
(
scale_op_name
,
"weight_2"
,
*
bias
);
}
}
}
// namespace anakin
}
// namespace anakin
...
...
paddle/fluid/inference/anakin/convert/test_batch_norm_op.cc
浏览文件 @
a32d4200
...
@@ -54,7 +54,6 @@ TEST(batch_norm_op, test) {
...
@@ -54,7 +54,6 @@ TEST(batch_norm_op, test) {
float
eps
=
1e-5
f
;
float
eps
=
1e-5
f
;
desc
.
SetAttr
(
"epsilon"
,
eps
);
desc
.
SetAttr
(
"epsilon"
,
eps
);
desc
.
SetAttr
(
"is_test"
,
true
);
desc
.
SetAttr
(
"is_test"
,
true
);
// desc.SetAttr("momentum", 0.8f);
validator
.
SetOp
(
*
desc
.
Proto
());
validator
.
SetOp
(
*
desc
.
Proto
());
...
...
编辑
预览
Markdown
is supported
0%
请重试
或
添加新附件
.
添加附件
取消
You are about to add
0
people
to the discussion. Proceed with caution.
先完成此消息的编辑!
取消
想要评论请
注册
或
登录