Skip to content
体验新版
项目
组织
正在加载...
登录
切换导航
打开侧边栏
magicwindyyd
mindspore
提交
12eaaf71
M
mindspore
项目概览
magicwindyyd
/
mindspore
与 Fork 源项目一致
Fork自
MindSpore / mindspore
通知
1
Star
1
Fork
0
代码
文件
提交
分支
Tags
贡献者
分支图
Diff
Issue
0
列表
看板
标记
里程碑
合并请求
0
Wiki
0
Wiki
分析
仓库
DevOps
项目成员
Pages
M
mindspore
项目概览
项目概览
详情
发布
仓库
仓库
文件
提交
分支
标签
贡献者
分支图
比较
Issue
0
Issue
0
列表
看板
标记
里程碑
合并请求
0
合并请求
0
Pages
分析
分析
仓库分析
DevOps
Wiki
0
Wiki
成员
成员
收起侧边栏
关闭侧边栏
动态
分支图
创建新Issue
提交
Issue看板
提交
12eaaf71
编写于
4月 14, 2020
作者:
H
huanghui
浏览文件
操作
浏览文件
下载
电子邮件补丁
差异文件
mul_add_fusion pass supports when add's 2nd is mul
上级
c176bbe4
变更
3
隐藏空白更改
内联
并排
Showing
3 changed files
with
66 additions
and
25 deletions
+66
-25
mindspore/ccsrc/pre_activate/ascend/ir_fusion/mul_add_fusion.cc
...ore/ccsrc/pre_activate/ascend/ir_fusion/mul_add_fusion.cc
+37
-20
tests/ut/cpp/pre_activate/ascend/ir_fusion/mul_add_fusion_test.cc
.../cpp/pre_activate/ascend/ir_fusion/mul_add_fusion_test.cc
+22
-2
tests/ut/cpp/python_input/gtest_input/pre_activate/mul_add_fusion_test.py
...hon_input/gtest_input/pre_activate/mul_add_fusion_test.py
+7
-3
未找到文件。
mindspore/ccsrc/pre_activate/ascend/ir_fusion/mul_add_fusion.cc
浏览文件 @
12eaaf71
...
@@ -24,40 +24,57 @@
...
@@ -24,40 +24,57 @@
#include "pre_activate/common/helper.h"
#include "pre_activate/common/helper.h"
namespace
mindspore
{
namespace
mindspore
{
// Searches the inputs of `add` for a Mul node that is safe to fold into a fused node.
//
// Inputs are scanned from index 1 upward (index 0 is skipped; presumably it holds the
// primitive -- confirm against CNode's input layout). The first input that is a CNode,
// whose name equals prim::kPrimMul->name(), and for which opt::IsUsedByOthers(graph, cnode)
// returns false is reported through the output parameters.
//
// Parameters:
//   graph     - graph handed to opt::IsUsedByOthers; must not be null.
//   add       - node whose inputs are searched; must not be null.
//   mul       - output, receives the matching Mul node; must not be null.
//   mul_index - output, receives the index of that node within add's inputs; must not be null.
//
// Returns true when a match was found and both outputs were written. Returns false
// otherwise, in which case neither output is modified.
bool GetMul(const FuncGraphPtr &graph, const CNodePtr &add, CNodePtr *mul, size_t *mul_index) {
  MS_EXCEPTION_IF_NULL(graph);
  MS_EXCEPTION_IF_NULL(add);
  // Both output pointers are dereferenced on the success path, so reject null up front
  // instead of crashing only when a match happens to be found.
  MS_EXCEPTION_IF_NULL(mul);
  MS_EXCEPTION_IF_NULL(mul_index);
  for (size_t index = 1; index < add->size(); ++index) {
    auto input = add->input(index);
    MS_EXCEPTION_IF_NULL(input);
    if (!input->isa<CNode>()) {
      continue;
    }
    auto cnode = input->cast<CNodePtr>();
    MS_EXCEPTION_IF_NULL(cnode);
    if (AnfAlgo::GetCNodeName(cnode) != prim::kPrimMul->name()) {
      continue;
    }
    // A Mul that has other users cannot be selected; keep looking at the remaining inputs.
    if (opt::IsUsedByOthers(graph, cnode)) {
      continue;
    }
    *mul = cnode;
    *mul_index = index;
    return true;
  }
  return false;
}
namespace
opt
{
namespace
opt
{
const
BaseRef
MulAddFusion
::
DefinePattern
()
const
{
const
BaseRef
MulAddFusion
::
DefinePattern
()
const
{
VarPtr
mul_x_
=
std
::
make_shared
<
Var
>
();
VarPtr
x
=
std
::
make_shared
<
Var
>
();
VarPtr
mul_y_
=
std
::
make_shared
<
Var
>
();
VarPtr
y
=
std
::
make_shared
<
Var
>
();
VarPtr
add_y_
=
std
::
make_shared
<
Var
>
();
VectorRef
pattern
({
prim
::
kPrimTensorAdd
,
x
,
y
});
return
pattern
;
VectorRef
mul
({
prim
::
kPrimMul
,
mul_x_
,
mul_y_
});
VectorRef
add
({
prim
::
kPrimTensorAdd
,
mul
,
add_y_
});
return
add
;
}
}
const
AnfNodePtr
MulAddFusion
::
Process
(
const
FuncGraphPtr
&
graph
,
const
AnfNodePtr
&
node
,
const
EquivPtr
&
equiv
)
const
{
const
AnfNodePtr
MulAddFusion
::
Process
(
const
FuncGraphPtr
&
graph
,
const
AnfNodePtr
&
node
,
const
EquivPtr
&
)
const
{
if
(
graph
==
nullptr
||
node
==
nullptr
||
equiv
==
nullptr
)
{
if
(
graph
==
nullptr
||
node
==
nullptr
)
{
return
nullptr
;
return
nullptr
;
}
}
auto
add
=
node
->
cast
<
CNodePtr
>
();
auto
add
=
node
->
cast
<
CNodePtr
>
();
if
(
add
==
nullptr
||
add
->
inputs
().
size
()
!=
kAddInputNum
)
{
if
(
add
==
nullptr
||
add
->
inputs
().
size
()
!=
kAddInputNum
)
{
return
nullptr
;
return
nullptr
;
}
}
auto
mul_anf
=
add
->
input
(
1
);
CNodePtr
mul
=
nullptr
;
if
(
mul_anf
==
nullptr
)
{
size_t
mul_index
=
0
;
return
nullptr
;
if
(
!
GetMul
(
graph
,
add
,
&
mul
,
&
mul_index
)
||
mul
==
nullptr
||
mul_index
==
0
)
{
}
MS_LOG
(
DEBUG
)
<<
"Cannot find used-by-only-one-op Mul in Add's inputs"
;
auto
mul
=
mul_anf
->
cast
<
CNodePtr
>
();
if
(
mul
==
nullptr
||
mul
->
inputs
().
size
()
!=
kMulInputNum
)
{
return
nullptr
;
}
if
(
IsUsedByOthers
(
graph
,
mul
))
{
MS_LOG
(
DEBUG
)
<<
"Mul is used by more then two nodes, cannot fuse"
;
return
nullptr
;
return
nullptr
;
}
}
auto
prim
=
std
::
make_shared
<
Primitive
>
(
kFusedMulAddOpName
);
auto
prim
=
std
::
make_shared
<
Primitive
>
(
kFusedMulAddOpName
);
std
::
vector
<
AnfNodePtr
>
inputs
=
{
NewValueNode
(
prim
),
mul
->
input
(
1
),
mul
->
input
(
2
),
add
->
input
(
2
)};
std
::
vector
<
AnfNodePtr
>
inputs
=
{
NewValueNode
(
prim
)};
for
(
size_t
index
=
1
;
index
<
mul
->
size
();
++
index
)
{
inputs
.
push_back
(
mul
->
input
(
index
));
}
inputs
.
push_back
(
add
->
input
(
add
->
size
()
-
mul_index
));
auto
fusion_node
=
graph
->
NewCNode
(
inputs
);
auto
fusion_node
=
graph
->
NewCNode
(
inputs
);
fusion_node
->
set_scope
(
add
->
scope
());
fusion_node
->
set_scope
(
add
->
scope
());
fusion_node
->
set_abstract
(
add
->
abstract
());
fusion_node
->
set_abstract
(
add
->
abstract
());
...
...
tests/ut/cpp/pre_activate/ascend/ir_fusion/mul_add_fusion_test.cc
浏览文件 @
12eaaf71
...
@@ -28,8 +28,28 @@ class TestHWMulAddFusion : public BackendCommon {
...
@@ -28,8 +28,28 @@ class TestHWMulAddFusion : public BackendCommon {
UT
::
PyFuncGraphFetcher
get_py_fun_
;
UT
::
PyFuncGraphFetcher
get_py_fun_
;
};
};
TEST_F
(
TestHWMulAddFusion
,
test_mul_add_fusion
)
{
TEST_F
(
TestHWMulAddFusion
,
test_mul_add_fusion1
)
{
FuncGraphPtr
g
=
get_py_fun_
.
CallAndParseRet
(
"test_mul_add_fusion"
,
"before"
);
FuncGraphPtr
g
=
get_py_fun_
.
CallAndParseRet
(
"test_mul_add_fusion"
,
"before1"
);
std
::
vector
<
int
>
shp
{
2
,
32
,
224
,
224
};
auto
x_abstract
=
std
::
make_shared
<
abstract
::
AbstractTensor
>
(
kFloat32
,
shp
);
AbstractBasePtrList
args_spec_list
;
for
(
size_t
i
=
0
;
i
<
3
;
++
i
)
{
args_spec_list
.
push_back
(
x_abstract
);
}
auto
fg
=
GetKernelGraph
(
g
,
args_spec_list
);
auto
optimizer
=
std
::
make_shared
<
opt
::
GraphOptimizer
>
();
auto
pm
=
std
::
make_shared
<
opt
::
PassManager
>
();
pm
->
AddPass
(
std
::
make_shared
<
opt
::
MulAddFusion
>
());
optimizer
->
AddPassManager
(
pm
);
FuncGraphPtr
new_graph
=
optimizer
->
Optimize
(
fg
);
FuncGraphPtr
g_after
=
get_py_fun_
.
CallAndParseRet
(
"test_mul_add_fusion"
,
"after"
);
EXPECT_TRUE
(
CheckEqualGraph
(
g_after
,
new_graph
));
}
TEST_F
(
TestHWMulAddFusion
,
test_mul_add_fusion2
)
{
FuncGraphPtr
g
=
get_py_fun_
.
CallAndParseRet
(
"test_mul_add_fusion"
,
"before2"
);
std
::
vector
<
int
>
shp
{
2
,
32
,
224
,
224
};
std
::
vector
<
int
>
shp
{
2
,
32
,
224
,
224
};
auto
x_abstract
=
std
::
make_shared
<
abstract
::
AbstractTensor
>
(
kFloat32
,
shp
);
auto
x_abstract
=
std
::
make_shared
<
abstract
::
AbstractTensor
>
(
kFloat32
,
shp
);
AbstractBasePtrList
args_spec_list
;
AbstractBasePtrList
args_spec_list
;
...
...
tests/ut/cpp/python_input/gtest_input/pre_activate/mul_add_fusion_test.py
浏览文件 @
12eaaf71
...
@@ -21,7 +21,6 @@ fused_mul_add = Primitive('FusedMulAdd')
...
@@ -21,7 +21,6 @@ fused_mul_add = Primitive('FusedMulAdd')
make_tuple
=
Primitive
(
'make_tuple'
)
make_tuple
=
Primitive
(
'make_tuple'
)
tuple_getitem
=
Primitive
(
'tuple_getitem'
)
tuple_getitem
=
Primitive
(
'tuple_getitem'
)
class
FnDict
:
class
FnDict
:
def
__init__
(
self
):
def
__init__
(
self
):
self
.
fnDict
=
{}
self
.
fnDict
=
{}
...
@@ -32,16 +31,21 @@ class FnDict:
...
@@ -32,16 +31,21 @@ class FnDict:
def
__getitem__
(
self
,
name
):
def
__getitem__
(
self
,
name
):
return
self
.
fnDict
[
name
]
return
self
.
fnDict
[
name
]
def
test_mul_add_fusion
(
tag
):
def
test_mul_add_fusion
(
tag
):
fns
=
FnDict
()
fns
=
FnDict
()
@
fns
@
fns
def
before
(
x
,
y
,
z
):
def
before
1
(
x
,
y
,
z
):
res
=
mul
(
x
,
y
)
res
=
mul
(
x
,
y
)
res
=
add
(
res
,
z
)
res
=
add
(
res
,
z
)
return
res
return
res
@fns
def before2(x, y, z):
    # Same operations as the original: mul(x, y) is passed as the second argument of add.
    product = mul(x, y)
    return add(z, product)
@
fns
@
fns
def
after
(
x
,
y
,
z
):
def
after
(
x
,
y
,
z
):
res
=
fused_mul_add
(
x
,
y
,
z
)
res
=
fused_mul_add
(
x
,
y
,
z
)
...
...
编辑
预览
Markdown
is supported
0%
请重试
或
添加新附件
.
添加附件
取消
You are about to add
0
people
to the discussion. Proceed with caution.
先完成此消息的编辑!
取消
想要评论请
注册
或
登录