Skip to content
体验新版
项目
组织
正在加载...
登录
切换导航
打开侧边栏
BaiXuePrincess
Paddle
提交
88c30b75
P
Paddle
项目概览
BaiXuePrincess
/
Paddle
与 Fork 源项目一致
Fork自
PaddlePaddle / Paddle
通知
1
Star
1
Fork
0
代码
文件
提交
分支
Tags
贡献者
分支图
Diff
Issue
0
列表
看板
标记
里程碑
合并请求
0
Wiki
0
Wiki
分析
仓库
DevOps
项目成员
Pages
P
Paddle
项目概览
项目概览
详情
发布
仓库
仓库
文件
提交
分支
标签
贡献者
分支图
比较
Issue
0
Issue
0
列表
看板
标记
里程碑
合并请求
0
合并请求
0
Pages
分析
分析
仓库分析
DevOps
Wiki
0
Wiki
成员
成员
收起侧边栏
关闭侧边栏
动态
分支图
创建新Issue
提交
Issue看板
未验证
提交
88c30b75
编写于
1月 19, 2021
作者:
H
hutuxian
提交者:
GitHub
1月 19, 2021
浏览文件
操作
浏览文件
下载
电子邮件补丁
差异文件
Ascend Framework Part3: Ascend Parser (#30391) (#30549)
上级
6f563ace
变更
2
隐藏空白更改
内联
并排
Showing
2 changed file
with
768 addition
and
0 deletion
+768
-0
python/paddle/distributed/fleet/meta_optimizers/ascend/ascend_optimizer.py
...tributed/fleet/meta_optimizers/ascend/ascend_optimizer.py
+179
-0
python/paddle/distributed/fleet/meta_optimizers/ascend/ascend_parser.py
...distributed/fleet/meta_optimizers/ascend/ascend_parser.py
+589
-0
未找到文件。
python/paddle/distributed/fleet/meta_optimizers/ascend/ascend_optimizer.py
0 → 100644
浏览文件 @
88c30b75
# Copyright (c) 2021 PaddlePaddle Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
import
paddle.fluid.framework
as
framework
from
paddle.fluid.optimizer
import
Optimizer
import
paddle.fluid.core
as
core
import
numpy
as
np
import
ascend_parser
class
AscendIRParser
(
object
):
def
__init__
(
self
):
self
.
graph_idx
=
0
def
_construct_input_map
(
self
,
input_varlist
):
ret_map
=
{}
ge_in_operator
=
[]
for
id
,
var
in
enumerate
(
input_varlist
):
if
var
.
is_data
:
# input data
ge_input
=
core
.
GEOperatorFactory
.
create_operator
(
var
.
name
,
"Data"
).
set_attr_int32
(
"index"
,
id
)
ret_map
[
var
.
name
]
=
ge_input
ge_in_operator
.
append
(
ge_input
)
else
:
# param, learning ...
ge_input
=
core
.
GEOperatorFactory
.
create_operator
(
var
.
name
,
"Variable"
)
ge_input
.
update_output_desc
(
"y"
,
core
.
GETensorDesc
(
core
.
GEShape
(
var
.
shape
),
core
.
GEFormat
.
FORMAT_ND
,
core
.
GEDataType
.
DT_FLOAT
))
ret_map
[
var
.
name
]
=
ge_input
return
ge_in_operator
,
ret_map
def
parse_op
(
self
,
op
):
if
op
.
type
in
ascend_parser
.
registerd_op
:
print
(
"Op[%s] has been registered, begin to parse it"
%
(
op
.
type
))
op_parser
=
self
.
parser_factory
.
create_parse
(
ascend_parser
.
registerd_op
[
op
.
type
])
op_parser
.
apply
(
op
)
else
:
print
(
"Op[%s] has not been registered, so we have to skip it"
%
(
op
.
type
))
def
_parse_program
(
self
,
graph_name
,
program
,
input_varlist
=
[],
fetch_list
=
[]):
begin_graph_idx
=
self
.
graph_idx
ge_in_operator
=
[]
ge_out_operator
=
[]
self
.
var2geop
=
{}
block
=
program
.
global_block
()
if
len
(
block
.
ops
)
==
0
:
print
(
"There is no ops in program %s"
%
(
graph_name
))
return
[]
graph
=
core
.
GEGraph
(
graph_name
)
ge_in_operator
,
self
.
var2geop
=
self
.
_construct_input_map
(
input_varlist
)
self
.
parser_factory
=
ascend_parser
.
AscendParserFactory
(
graph
,
self
.
var2geop
)
for
i
,
curop
in
list
(
enumerate
(
block
.
ops
)):
self
.
parse_op
(
curop
)
# Set fetch_var for GE
for
e
in
fetch_list
:
name
=
e
if
not
isinstance
(
e
,
str
):
name
=
e
.
name
ge_out_operator
.
append
(
self
.
var2geop
[
name
])
# (Debug) If you want to print back prop vars, append/assign the varname in ge_out_operator here, such as:
# if graph_name == "main":
# ge_out_operator.append(self.var2geop["reduce_sum_0.tmp_0@GRAD"])
# Add ops that may be input of a graph, such as const.
for
varname
,
geop
in
self
.
var2geop
.
items
():
if
varname
.
startswith
(
"geinput"
):
ge_in_operator
.
append
(
geop
)
graph
.
set_inputs
(
ge_in_operator
).
set_outputs
(
ge_out_operator
)
# Remove ops of origin program
op_num
=
len
(
block
.
ops
)
for
i
in
range
(
op_num
-
1
,
-
1
,
-
1
):
block
.
_remove_op
(
i
)
input_varlist
=
[
var
for
var
in
input_varlist
if
var
.
is_data
]
block
.
append_op
(
type
=
"ascend_trigger"
,
inputs
=
{
"FeedList"
:
input_varlist
},
outputs
=
{
"FetchList"
:
fetch_list
},
attrs
=
{
'graph_idx'
:
self
.
graph_idx
})
self
.
graph_idx
+=
1
return
graph
def
parse_program
(
self
,
startup_program
,
main_program
,
input_varlist
,
fetch_list
):
startup_graph
=
self
.
_parse_program
(
"startup"
,
startup_program
)
main_graph
=
self
.
_parse_program
(
"main"
,
main_program
,
input_varlist
,
fetch_list
)
return
startup_graph
,
main_graph
# AscendOptimizer is a wrapper for basic optimizer now
# We will make it part of fleet meta_optimizer in the future
class
AscendOptimizer
(
Optimizer
):
def
__init__
(
self
,
optimizer
,
fetch_list
=
[]):
self
.
inner_opt
=
optimizer
self
.
fetch_list
=
fetch_list
def
__del__
(
self
):
core
.
ge_finalize
()
def
_can_apply
(
self
):
if
not
self
.
user_defined_strategy
.
ascend
:
return
False
# TODO(hutuxian): other check here
return
True
def
_disable_strategy
(
self
,
dist_strategy
):
dist_strategy
.
ascend
=
False
dist_strategy
.
ascend_configs
=
{}
def
_get_input_varlist
(
program
):
ret_list
=
[]
for
var
in
program
.
list_vars
():
if
var
.
is_data
or
var
.
persistable
:
ret_list
.
append
(
var
)
return
ret_list
def
minimize
(
self
,
loss
,
startup_program
=
None
,
parameter_list
=
None
,
no_grad_set
=
None
):
minimized
=
self
.
inner_opt
.
minimize
(
loss
,
startup_program
=
startup_program
)
self
.
ascend_instance
=
core
.
AscendInstance
()
# Config about Graph Engine can be found in https://support.huaweicloud.com/
config
=
{
"ge.exec.deviceId"
:
"0"
,
"ge.graphRunMode"
:
"1"
,
"ge.exec.precision_mode"
:
"must_keep_origin_dtype"
}
core
.
ge_initialize
(
config
)
# Init Session
self
.
ascend_instance
.
init_global_resources
()
main_block
=
loss
.
block
self
.
parser
=
AscendIRParser
()
input_varlist
=
_get_input_varlist
(
main_block
.
program
)
startup_graph
,
main_graph
=
self
.
parser
.
parse_program
(
startup_program
,
main_block
.
program
,
input_varlist
,
self
.
fetch_list
)
self
.
ascend_instance
.
add_ascend_subgraph
(
0
,
startup_graph
)
self
.
ascend_instance
.
add_ascend_subgraph
(
1
,
main_graph
)
return
minimized
python/paddle/distributed/fleet/meta_optimizers/ascend/ascend_parser.py
0 → 100644
浏览文件 @
88c30b75
# Copyright (c) 2021 PaddlePaddle Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
import
paddle.fluid.framework
as
framework
from
paddle.fluid.optimizer
import
Optimizer
import
paddle.fluid.core
as
core
import
numpy
as
np
registerd_op
=
{
"elementwise_add"
:
"AddParser"
,
"matmul"
:
"MatMulParser"
,
"mul"
:
"MulParser"
,
"relu"
:
"ReluParser"
,
"softmax_with_cross_entropy"
:
"SoftmaxWithCrossEntropyParser"
,
"shape"
:
"ShapeParser"
,
"fill_constant"
:
"FillConstantParser"
,
"reduce_sum"
:
"ReduceSumParser"
,
"reduce_sum_grad"
:
"ReduceSumGradParser"
,
"matmul_grad"
:
"MatMulGradParser"
,
"mul_grad"
:
"MulGradParser"
,
"reshape2"
:
"ReshapeParser"
,
"scale"
:
"ScaleParser"
,
"relu_grad"
:
"ReluGradParser"
,
"softmax_with_cross_entropy_grad"
:
"SoftmaxWithCrossEntropyGradParser"
,
"truncated_gaussian_random"
:
"TruncatedNormalParser"
,
"sgd"
:
"SGDParser"
}
global_cnt
=
-
1
global_input_cnt
=
-
1
class
AscendHelper
(
object
):
def
__init__
(
self
):
self
.
dtype2ge_map
=
{
0
:
core
.
GEDataType
.
DT_BOOL
,
1
:
core
.
GEDataType
.
DT_INT16
,
2
:
core
.
GEDataType
.
DT_INT32
,
3
:
core
.
GEDataType
.
DT_INT64
,
4
:
core
.
GEDataType
.
DT_FLOAT16
,
5
:
core
.
GEDataType
.
DT_FLOAT
,
6
:
core
.
GEDataType
.
DT_DOUBLE
}
self
.
dtype2np_map
=
{
0
:
"bool"
,
1
:
"int16"
,
2
:
"int32"
,
3
:
"int64"
,
4
:
"float16"
,
5
:
"float32"
,
6
:
"float64"
}
def
dtype2ge
(
self
,
dtype
):
assert
dtype
in
self
.
dtype2ge_map
,
"dtype[%d] is not supported %d"
%
(
dtype
)
return
self
.
dtype2ge_map
[
dtype
]
def
dtype2np
(
self
,
index
):
assert
index
in
self
.
dtype2np_map
,
"index[%d] is not supported %d"
%
(
dtype
)
return
self
.
dtype2np_map
[
index
]
class
AscendParserFactory
(
object
):
def
__init__
(
self
,
graph
,
var2geop
):
self
.
graph
=
graph
self
.
var2geop
=
var2geop
def
create_parse
(
self
,
parser_class
):
try
:
parser
=
globals
()[
parser_class
](
self
.
graph
,
self
.
var2geop
)
return
parser
except
:
raise
ValueError
(
"parser class %s does not exist"
%
parser_class
)
class
AscendParserBase
(
object
):
def
__init__
(
self
,
graph
,
var2geop
):
self
.
graph
=
graph
self
.
var2geop
=
var2geop
self
.
op
=
None
self
.
ascend_helper
=
AscendHelper
()
def
_get_ge_input
(
self
,
input_var_name
):
assert
input_var_name
in
self
.
var2geop
,
"var %s not created before"
%
(
input_var_name
)
return
self
.
var2geop
[
input_var_name
]
def
update_output
(
self
,
geop_list
,
index_list
):
output_num
=
len
(
self
.
op
.
output_names
)
assert
output_num
==
len
(
index_list
),
"Parser[%s]'s output number[%d] is not equal to parameters number[%d]"
%
(
self
.
parser_name
,
len
(
index_list
),
output_num
)
for
output_id
in
range
(
output_num
):
arguments
=
self
.
op
.
output
(
self
.
op
.
output_names
[
output_id
])
print
(
"%d argument: %s"
%
(
output_id
,
str
(
arguments
)))
if
len
(
arguments
)
>
0
:
assert
len
(
arguments
)
==
len
(
index_list
[
output_id
]
),
"Parser[%s]'s %dth argument number[%d] is not equal to paddle's number[%d]"
%
(
self
.
parser_name
,
output_id
,
len
(
index_list
[
output_id
]),
len
(
arguments
))
for
i
in
range
(
len
(
arguments
)):
print
(
"assgin index_list[%d][%d] to %s"
%
(
output_id
,
i
,
arguments
[
i
]))
self
.
var2geop
[
arguments
[
i
]]
=
geop_list
[
index_list
[
output_id
][
i
]]
for
geop
in
geop_list
:
self
.
graph
.
add_op
(
geop
)
def
apply
(
self
,
op
):
self
.
op
=
op
assert
self
.
op
.
type
==
self
.
parser_name
,
"op [%s] != parser_name[%s]"
%
(
self
.
op
.
type
,
self
.
parser_name
)
print
(
"begin to parse op %s"
%
(
self
.
parser_name
))
geop_list
,
index_list
=
self
.
_apply
()
self
.
update_output
(
geop_list
,
index_list
)
def
_mark_as_input
(
self
,
ge_tensor
):
global
global_input_cnt
global_input_cnt
+=
1
self
.
var2geop
[
"geinput."
+
str
(
global_input_cnt
)]
=
ge_tensor
def
_accumulated_op_id
(
self
):
global
global_cnt
global_cnt
+=
1
return
"."
+
str
(
global_cnt
)
def
_create_ge_tensor
(
self
,
shape
,
dtype
,
value
):
tensor_desc
=
core
.
GETensorDesc
(
core
.
GEShape
(
shape
),
core
.
GEFormat
.
FORMAT_ND
,
self
.
ascend_helper
.
dtype2ge
(
dtype
))
tensor
=
core
.
GETensor
(
tensor_desc
)
data
=
(
value
*
np
.
ones
((
shape
))).
reshape
(
shape
).
astype
(
self
.
ascend_helper
.
dtype2np
(
dtype
))
buf
=
data
.
tobytes
()
data_8
=
np
.
frombuffer
(
buf
,
dtype
=
np
.
uint8
)
tensor
.
set_data
(
data_8
)
return
tensor
class
AddParser
(
AscendParserBase
):
def
__init__
(
self
,
graph
,
var2geop
):
super
(
AddParser
,
self
).
__init__
(
graph
,
var2geop
)
self
.
parser_name
=
"elementwise_add"
def
_apply
(
self
):
x
=
self
.
_get_ge_input
(
self
.
op
.
input_arg_names
[
0
])
y
=
self
.
_get_ge_input
(
self
.
op
.
input_arg_names
[
1
])
add
=
core
.
GEOperatorFactory
.
create_operator
(
"add"
+
self
.
_accumulated_op_id
(),
"Add"
).
set_input
(
"x1"
,
x
).
set_input
(
"x2"
,
y
)
return
[
add
],
[[
0
]]
class
ReduceSumParser
(
AscendParserBase
):
def
__init__
(
self
,
graph
,
var2geop
):
super
(
ReduceSumParser
,
self
).
__init__
(
graph
,
var2geop
)
self
.
parser_name
=
"reduce_sum"
def
_apply
(
self
):
x
=
self
.
_get_ge_input
(
self
.
op
.
input_arg_names
[
0
])
axes
=
self
.
op
.
attr
(
"dim"
)
keep_dims
=
self
.
op
.
attr
(
"keep_dim"
)
reduce_sum
=
core
.
GEOperatorFactory
.
create_operator
(
"reduce_sum"
+
self
.
_accumulated_op_id
(),
"ReduceSumD"
).
set_input
(
"x"
,
x
,
0
).
set_attr_vec_int32
(
"axes"
,
axes
).
set_attr_bool
(
"keep_dims"
,
keep_dims
)
return
[
reduce_sum
],
[[
0
]]
class
ReduceSumGradParser
(
AscendParserBase
):
def
__init__
(
self
,
graph
,
var2geop
):
super
(
ReduceSumGradParser
,
self
).
__init__
(
graph
,
var2geop
)
self
.
parser_name
=
"reduce_sum_grad"
def
_apply
(
self
):
x
=
self
.
_get_ge_input
(
self
.
op
.
input_arg_names
[
0
])
input
=
self
.
_get_ge_input
(
self
.
op
.
input_arg_names
[
1
])
shape_tensor
=
core
.
GEOperatorFactory
.
create_operator
(
"shape"
+
self
.
_accumulated_op_id
(),
"Shape"
).
set_input
(
"x"
,
input
,
0
)
axis_const
=
core
.
GEOperatorFactory
.
create_operator
(
"const"
+
self
.
_accumulated_op_id
(),
"Const"
).
set_attr_tensor
(
"value"
,
self
.
_create_ge_tensor
([
1
],
2
,
-
1
))
self
.
_mark_as_input
(
axis_const
)
broadcast
=
core
.
GEOperatorFactory
.
create_operator
(
"broadcast_to_d"
+
self
.
_accumulated_op_id
(),
"BroadcastTo"
).
set_input
(
"x"
,
x
).
set_input
(
"shape"
,
shape_tensor
)
# unsqueeze cannot get right result, but ExpandDims seems have the same functionality.
reduce_sum_grad
=
core
.
GEOperatorFactory
.
create_operator
(
"expand"
+
self
.
_accumulated_op_id
(),
"ExpandDims"
).
set_input
(
"x"
,
broadcast
).
set_input
(
"axis"
,
axis_const
)
return
[
shape_tensor
,
axis_const
,
broadcast
,
reduce_sum_grad
],
[[
3
]]
class
MatMulParser
(
AscendParserBase
):
def
__init__
(
self
,
graph
,
var2geop
):
super
(
MatMulParser
,
self
).
__init__
(
graph
,
var2geop
)
self
.
parser_name
=
"matmul"
def
_apply
(
self
):
x1
=
self
.
_get_ge_input
(
self
.
op
.
input_arg_names
[
0
])
x2
=
self
.
_get_ge_input
(
self
.
op
.
input_arg_names
[
1
])
matmul
=
core
.
GEOperatorFactory
.
create_operator
(
"matmul"
+
self
.
_accumulated_op_id
(),
"MatMul"
).
set_input
(
"x1"
,
x1
).
set_input
(
"x2"
,
x2
)
return
[
matmul
],
[[
0
]]
class
MatMulGradParser
(
AscendParserBase
):
def
__init__
(
self
,
graph
,
var2geop
):
super
(
MatMulGradParser
,
self
).
__init__
(
graph
,
var2geop
)
self
.
parser_name
=
"matmul_grad"
def
_apply
(
self
):
out_grad
=
self
.
_get_ge_input
(
self
.
op
.
input_arg_names
[
0
])
x
=
self
.
_get_ge_input
(
self
.
op
.
input_arg_names
[
1
])
y
=
self
.
_get_ge_input
(
self
.
op
.
input_arg_names
[
2
])
x_grad
=
core
.
GEOperatorFactory
.
create_operator
(
self
.
parser_name
+
self
.
_accumulated_op_id
(),
"MatMul"
).
set_input
(
"x1"
,
out_grad
).
set_input
(
"x2"
,
y
).
set_attr_bool
(
"transpose_x1"
,
False
).
set_attr_bool
(
"transpose_x2"
,
True
)
y_grad
=
core
.
GEOperatorFactory
.
create_operator
(
self
.
parser_name
+
self
.
_accumulated_op_id
(),
"MatMul"
).
set_input
(
"x1"
,
x
).
set_input
(
"x2"
,
out_grad
).
set_attr_bool
(
"transpose_x1"
,
True
).
set_attr_bool
(
"transpose_x2"
,
False
)
return
[
x_grad
,
y_grad
],
[[
0
],
[
1
]]
class
MulGradParser
(
AscendParserBase
):
def
__init__
(
self
,
graph
,
var2geop
):
super
(
MulGradParser
,
self
).
__init__
(
graph
,
var2geop
)
self
.
parser_name
=
"mul_grad"
def
_apply
(
self
):
out_grad
=
self
.
_get_ge_input
(
self
.
op
.
input_arg_names
[
0
])
x
=
self
.
_get_ge_input
(
self
.
op
.
input_arg_names
[
1
])
y
=
self
.
_get_ge_input
(
self
.
op
.
input_arg_names
[
2
])
x_grad
=
core
.
GEOperatorFactory
.
create_operator
(
self
.
parser_name
+
self
.
_accumulated_op_id
(),
"MatMul"
).
set_input
(
"x1"
,
out_grad
).
set_input
(
"x2"
,
y
).
set_attr_bool
(
"transpose_x1"
,
False
).
set_attr_bool
(
"transpose_x2"
,
True
)
y_grad
=
core
.
GEOperatorFactory
.
create_operator
(
self
.
parser_name
+
self
.
_accumulated_op_id
(),
"MatMul"
).
set_input
(
"x1"
,
x
).
set_input
(
"x2"
,
out_grad
).
set_attr_bool
(
"transpose_x1"
,
True
).
set_attr_bool
(
"transpose_x2"
,
False
)
return
[
x_grad
,
y_grad
],
[[
0
],
[
1
]]
class
MulParser
(
AscendParserBase
):
def
__init__
(
self
,
graph
,
var2geop
):
super
(
MulParser
,
self
).
__init__
(
graph
,
var2geop
)
self
.
parser_name
=
"mul"
def
_apply
(
self
):
x
=
self
.
_get_ge_input
(
self
.
op
.
input_arg_names
[
0
])
y
=
self
.
_get_ge_input
(
self
.
op
.
input_arg_names
[
1
])
matmul
=
core
.
GEOperatorFactory
.
create_operator
(
"mul"
+
self
.
_accumulated_op_id
(),
"MatMul"
).
set_input
(
"x1"
,
x
).
set_input
(
"x2"
,
y
)
return
[
matmul
],
[[
0
]]
class
ReluParser
(
AscendParserBase
):
def
__init__
(
self
,
graph
,
var2geop
):
super
(
ReluParser
,
self
).
__init__
(
graph
,
var2geop
)
self
.
parser_name
=
"relu"
def
_apply
(
self
):
x
=
self
.
_get_ge_input
(
self
.
op
.
input_arg_names
[
0
])
relu
=
core
.
GEOperatorFactory
.
create_operator
(
"relu"
+
self
.
_accumulated_op_id
(),
"Relu"
).
set_input
(
"x"
,
x
)
return
[
relu
],
[[
0
]]
class
ReluGradParser
(
AscendParserBase
):
def
__init__
(
self
,
graph
,
var2geop
):
super
(
ReluGradParser
,
self
).
__init__
(
graph
,
var2geop
)
self
.
parser_name
=
"relu_grad"
def
_apply
(
self
):
out
=
self
.
_get_ge_input
(
self
.
op
.
input_arg_names
[
0
])
out_grad
=
self
.
_get_ge_input
(
self
.
op
.
input_arg_names
[
1
])
relu_grad
=
core
.
GEOperatorFactory
.
create_operator
(
self
.
parser_name
+
self
.
_accumulated_op_id
(),
"ReluGrad"
).
set_input
(
"gradients"
,
out_grad
).
set_input
(
"features"
,
out
)
return
[
relu_grad
],
[[
0
]]
class
SoftmaxWithCrossEntropyParser
(
AscendParserBase
):
def
__init__
(
self
,
graph
,
var2geop
):
super
(
SoftmaxWithCrossEntropyParser
,
self
).
__init__
(
graph
,
var2geop
)
self
.
parser_name
=
"softmax_with_cross_entropy"
def
_apply
(
self
):
label
=
self
.
_get_ge_input
(
self
.
op
.
input_arg_names
[
0
])
logits
=
self
.
_get_ge_input
(
self
.
op
.
input_arg_names
[
1
])
cls_num
=
self
.
op
.
block
.
var
(
self
.
op
.
input_arg_names
[
1
]).
shape
[
1
]
softmax
=
core
.
GEOperatorFactory
.
create_operator
(
"softmax"
+
self
.
_accumulated_op_id
(),
"SoftmaxV2"
).
set_input
(
"x"
,
logits
)
label
=
core
.
GEOperatorFactory
.
create_operator
(
"cast"
+
self
.
_accumulated_op_id
(),
"Cast"
).
set_input
(
"x"
,
label
).
set_attr_int32
(
"dst_type"
,
3
)
tensoron
=
self
.
_create_ge_tensor
([
1
],
5
,
1
)
on_const
=
core
.
GEOperatorFactory
.
create_operator
(
"const"
+
self
.
_accumulated_op_id
(),
"Const"
).
set_attr_tensor
(
"value"
,
tensoron
)
self
.
_mark_as_input
(
on_const
)
tensoroff
=
self
.
_create_ge_tensor
([
1
],
5
,
0
)
off_const
=
core
.
GEOperatorFactory
.
create_operator
(
"const"
+
self
.
_accumulated_op_id
(),
"Const"
).
set_attr_tensor
(
"value"
,
tensoroff
)
self
.
_mark_as_input
(
off_const
)
onehot
=
core
.
GEOperatorFactory
.
create_operator
(
"onehot"
+
self
.
_accumulated_op_id
(),
"OneHotD"
).
set_input
(
"x"
,
label
).
set_input
(
"on_value"
,
on_const
).
set_input
(
"off_value"
,
off_const
).
set_attr_int32
(
"depth"
,
cls_num
)
squeeze
=
core
.
GEOperatorFactory
.
create_operator
(
"mul"
+
self
.
_accumulated_op_id
(),
"Squeeze"
).
set_input
(
"x"
,
onehot
)
loss
=
core
.
GEOperatorFactory
.
create_operator
(
"loss"
+
self
.
_accumulated_op_id
(),
"SoftmaxCrossEntropyWithLogits"
).
set_input
(
"features"
,
logits
).
set_input
(
"labels"
,
squeeze
)
return
[
label
,
softmax
,
on_const
,
off_const
,
onehot
,
squeeze
,
loss
],
[[
6
],
[
1
]]
class
SoftmaxWithCrossEntropyGradParser
(
AscendParserBase
):
def
__init__
(
self
,
graph
,
var2geop
):
super
(
SoftmaxWithCrossEntropyGradParser
,
self
).
__init__
(
graph
,
var2geop
)
self
.
parser_name
=
"softmax_with_cross_entropy_grad"
def
_apply
(
self
):
label
=
self
.
_get_ge_input
(
self
.
op
.
input_arg_names
[
0
])
loss_grad
=
self
.
_get_ge_input
(
self
.
op
.
input_arg_names
[
1
])
softmax
=
self
.
_get_ge_input
(
self
.
op
.
input_arg_names
[
2
])
cls_num
=
self
.
op
.
block
.
var
(
self
.
op
.
input_arg_names
[
2
]).
shape
[
1
]
tensoron
=
self
.
_create_ge_tensor
([
1
],
5
,
1
)
on_const
=
core
.
GEOperatorFactory
.
create_operator
(
"const"
+
self
.
_accumulated_op_id
(),
"Const"
).
set_attr_tensor
(
"value"
,
tensoron
)
self
.
_mark_as_input
(
on_const
)
tensoroff
=
self
.
_create_ge_tensor
([
1
],
5
,
0
)
off_const
=
core
.
GEOperatorFactory
.
create_operator
(
"const"
+
self
.
_accumulated_op_id
(),
"Const"
).
set_attr_tensor
(
"value"
,
tensoroff
)
self
.
_mark_as_input
(
off_const
)
label
=
core
.
GEOperatorFactory
.
create_operator
(
"cast"
+
self
.
_accumulated_op_id
(),
"Cast"
).
set_input
(
"x"
,
label
).
set_attr_int32
(
"dst_type"
,
3
)
onehot
=
core
.
GEOperatorFactory
.
create_operator
(
"onehot"
+
self
.
_accumulated_op_id
(),
"OneHotD"
).
set_input
(
"x"
,
label
).
set_input
(
"on_value"
,
on_const
).
set_input
(
"off_value"
,
off_const
).
set_attr_int32
(
"depth"
,
cls_num
)
# the fuck onehot will add a demension, so must call squeeze afterward
squeeze
=
core
.
GEOperatorFactory
.
create_operator
(
"mul"
+
self
.
_accumulated_op_id
(),
"Squeeze"
).
set_input
(
"x"
,
onehot
)
sub
=
core
.
GEOperatorFactory
.
create_operator
(
"sub"
+
self
.
_accumulated_op_id
(),
"Sub"
).
set_input
(
"x1"
,
softmax
).
set_input
(
"x2"
,
squeeze
)
grad
=
core
.
GEOperatorFactory
.
create_operator
(
"mul"
+
self
.
_accumulated_op_id
(),
"Mul"
).
set_input
(
"x1"
,
loss_grad
).
set_input
(
"x2"
,
sub
)
return
[
on_const
,
off_const
,
label
,
onehot
,
squeeze
,
sub
,
grad
],
[[
-
1
]]
class
ShapeParser
(
AscendParserBase
):
def
__init__
(
self
,
graph
,
var2geop
):
super
(
ShapeParser
,
self
).
__init__
(
graph
,
var2geop
)
self
.
parser_name
=
"shape"
def
_apply
(
self
):
x
=
self
.
_get_ge_input
(
self
.
op
.
input_arg_names
[
0
])
shape
=
core
.
GEOperatorFactory
.
create_operator
(
"shape"
+
self
.
_accumulated_op_id
(),
"Shape"
).
set_input
(
"x"
,
x
)
return
[
shape
],
[[
0
]]
class
FillConstantParser
(
AscendParserBase
):
def
__init__
(
self
,
graph
,
var2geop
):
super
(
FillConstantParser
,
self
).
__init__
(
graph
,
var2geop
)
self
.
parser_name
=
"fill_constant"
def
_apply
(
self
):
shape
=
self
.
op
.
attr
(
"shape"
)
dtype
=
self
.
op
.
attr
(
"dtype"
)
value
=
self
.
op
.
attr
(
"value"
)
print
(
"shape: "
,
shape
)
print
(
"dtype: "
,
dtype
)
print
(
"value: "
,
value
)
tensor
=
self
.
_create_ge_tensor
(
shape
,
dtype
,
value
)
const
=
core
.
GEOperatorFactory
.
create_operator
(
"const"
+
self
.
_accumulated_op_id
(),
"Const"
).
set_attr_tensor
(
"value"
,
tensor
)
self
.
_mark_as_input
(
const
)
if
self
.
op
.
block
.
var
(
self
.
op
.
output
(
'Out'
)[
0
]).
persistable
:
print
(
"%s fill_constant"
%
(
self
.
op
.
output
(
'Out'
)[
0
]))
var
=
core
.
GEOperatorFactory
.
create_operator
(
self
.
op
.
output
(
'Out'
)[
0
],
"Variable"
)
var
.
update_output_desc
(
"y"
,
core
.
GETensorDesc
(
core
.
GEShape
(
shape
),
core
.
GEFormat
.
FORMAT_ND
,
core
.
GEDataType
.
DT_FLOAT
))
assign
=
core
.
GEOperatorFactory
.
create_operator
(
"assign"
+
self
.
_accumulated_op_id
(),
"Assign"
).
set_input
(
"value"
,
const
).
set_input
(
"ref"
,
var
)
return
[
const
],
[[
0
]]
else
:
print
(
"self.op.output('Out')[0] is not persistable in fill_constant"
)
return
[
const
],
[[
0
]]
class
SGDParser
(
AscendParserBase
):
def
__init__
(
self
,
graph
,
var2geop
):
super
(
SGDParser
,
self
).
__init__
(
graph
,
var2geop
)
self
.
parser_name
=
"sgd"
def
_apply
(
self
):
grad
=
self
.
_get_ge_input
(
self
.
op
.
input_arg_names
[
0
])
lr
=
self
.
_get_ge_input
(
self
.
op
.
input_arg_names
[
1
])
param
=
self
.
_get_ge_input
(
self
.
op
.
input_arg_names
[
2
])
sgd
=
core
.
GEOperatorFactory
.
create_operator
(
"momentum"
+
self
.
_accumulated_op_id
(),
"ApplyGradientDescent"
).
set_input
(
"var"
,
param
).
set_input
(
"alpha"
,
lr
).
set_input
(
"delta"
,
grad
)
return
[
sgd
],
[[
0
]]
class
TruncatedNormalParser
(
AscendParserBase
):
def
__init__
(
self
,
graph
,
var2geop
):
super
(
TruncatedNormalParser
,
self
).
__init__
(
graph
,
var2geop
)
self
.
parser_name
=
"truncated_gaussian_random"
def
_apply
(
self
):
shape
=
self
.
op
.
attr
(
"shape"
)
dtype
=
self
.
op
.
attr
(
"dtype"
)
mean
=
self
.
op
.
attr
(
"mean"
)
std
=
self
.
op
.
attr
(
"std"
)
seed
=
self
.
op
.
attr
(
"seed"
)
tensor1
=
self
.
_create_ge_tensor
([
len
(
shape
)],
2
,
shape
)
shape_tensor
=
core
.
GEOperatorFactory
.
create_operator
(
"const"
+
self
.
_accumulated_op_id
(),
"Const"
).
set_attr_tensor
(
"value"
,
tensor1
)
tensor2
=
self
.
_create_ge_tensor
([
1
],
dtype
,
mean
)
mean_tensor
=
core
.
GEOperatorFactory
.
create_operator
(
"const"
+
self
.
_accumulated_op_id
(),
"Const"
).
set_attr_tensor
(
"value"
,
tensor2
)
tensor3
=
self
.
_create_ge_tensor
([
1
],
dtype
,
std
)
std_tensor
=
core
.
GEOperatorFactory
.
create_operator
(
"const"
+
self
.
_accumulated_op_id
(),
"Const"
).
set_attr_tensor
(
"value"
,
tensor3
)
tensor4
=
self
.
_create_ge_tensor
([
1
],
dtype
,
mean
-
2
*
std
)
min_tensor
=
core
.
GEOperatorFactory
.
create_operator
(
"const"
+
self
.
_accumulated_op_id
(),
"Const"
).
set_attr_tensor
(
"value"
,
tensor4
)
tensor5
=
self
.
_create_ge_tensor
([
1
],
dtype
,
mean
+
2
*
std
)
max_tensor
=
core
.
GEOperatorFactory
.
create_operator
(
"const"
+
self
.
_accumulated_op_id
(),
"Const"
).
set_attr_tensor
(
"value"
,
tensor5
)
self
.
_mark_as_input
(
shape_tensor
)
self
.
_mark_as_input
(
mean_tensor
)
self
.
_mark_as_input
(
std_tensor
)
self
.
_mark_as_input
(
min_tensor
)
self
.
_mark_as_input
(
max_tensor
)
truncated_normal
=
core
.
GEOperatorFactory
.
create_operator
(
"truncated_normal"
+
self
.
_accumulated_op_id
(),
"ParameterizedTruncatedNormal"
).
set_input
(
"shape"
,
shape_tensor
).
set_input
(
"means"
,
mean_tensor
).
set_input
(
"stdevs"
,
std_tensor
).
set_input
(
"min"
,
min_tensor
).
set_input
(
"max"
,
max_tensor
).
set_attr_int32
(
"seed"
,
0
)
## wirte the output of truncatedNormal from startup_program to main_program
if
self
.
op
.
block
.
var
(
self
.
op
.
output
(
'Out'
)[
0
]).
persistable
:
print
(
"%s is Persistable in truncated_normal"
%
(
self
.
op
.
output
(
'Out'
)[
0
]))
#var = core.GEOperatorFactory.create_operator(self.op.output('Out')[0], "Variable").set_input("x", truncated_normal)
var
=
core
.
GEOperatorFactory
.
create_operator
(
self
.
op
.
output
(
'Out'
)[
0
],
"Variable"
)
var
.
update_output_desc
(
"y"
,
core
.
GETensorDesc
(
core
.
GEShape
(
shape
),
core
.
GEFormat
.
FORMAT_ND
,
core
.
GEDataType
.
DT_FLOAT
))
assign
=
core
.
GEOperatorFactory
.
create_operator
(
"assign"
+
self
.
_accumulated_op_id
(),
"Assign"
).
set_input
(
"value"
,
truncated_normal
).
set_input
(
"ref"
,
var
)
return
[
shape_tensor
,
mean_tensor
,
std_tensor
,
min_tensor
,
max_tensor
,
truncated_normal
],
[[
-
1
]]
else
:
print
(
"self.op.output('Out')[0] is not persistable in truncated_noraml"
)
return
[
truncated_normal
],
[[
0
]]
#[assign]
class
ScaleParser
(
AscendParserBase
):
def
__init__
(
self
,
graph
,
var2geop
):
super
(
ScaleParser
,
self
).
__init__
(
graph
,
var2geop
)
self
.
parser_name
=
"scale"
def
_apply
(
self
):
x
=
self
.
_get_ge_input
(
self
.
op
.
input_arg_names
[
0
])
scale
=
self
.
op
.
attr
(
"scale"
)
#self.get_ge_input(self.op.input_arg_names[1])
bias
=
self
.
op
.
attr
(
"bias"
)
bias_after_scale
=
self
.
op
.
attr
(
"bias_after_scale"
)
if
bias_after_scale
:
scale_value
=
core
.
GEOperatorFactory
.
create_operator
(
"scale"
+
self
.
_accumulated_op_id
(),
"Power"
).
set_input
(
"x"
,
x
).
set_attr_float
(
"power"
,
1.0
).
set_attr_float
(
"scale"
,
scale
).
set_attr_float
(
"shift"
,
bias
)
else
:
x_add_bias
=
core
.
GEOperatorFactory
.
create_operator
(
"adds"
+
self
.
_accumulated_op_id
(),
"Adds"
).
set_input
(
"x"
,
x
).
set_attr_float
(
"value"
,
bias
)
#set_input("x2", bias)
scale_value
=
core
.
GEOperatorFactory
.
create_operator
(
"scale"
+
self
.
_accumulated_op_id
(),
"Power"
).
set_input
(
"x"
,
x_add_bias
).
set_attr_float
(
"power"
,
1.0
).
set_attr_float
(
"scale"
,
scale
).
set_attr_float
(
"shift"
,
0.0
)
#tensor_zeros = core.GEOperatorFactory.create_operator("zeroslike" + self.getid(), "ZerosLike").set_input("x", x)
#bias_ = self.create_ge_tensor([1], 5, bias)
#const_bias = core.GEOperatorFactory.create_operator("const" + self.getid(), "Const").set_attr_tensor("value", tensor_bias)
return
[
scale_value
],
[[
0
]]
class
ReshapeParser
(
AscendParserBase
):
def
__init__
(
self
,
graph
,
var2geop
):
super
(
ReshapeParser
,
self
).
__init__
(
graph
,
var2geop
)
self
.
parser_name
=
"reshape2"
def
_apply
(
self
):
print
(
"swbuf:"
,
self
.
op
.
input_arg_names
)
shape
=
self
.
op
.
attr
(
"shape"
)
axis
=
0
if
shape
[
0
]
==
-
1
:
axis
=
1
shape
=
shape
[
1
:]
print
(
"shape: "
,
shape
)
data_x1_shape
=
self
.
_get_ge_input
(
self
.
op
.
input_arg_names
[
0
])
tensor
=
self
.
_create_ge_tensor
([
len
(
shape
)],
2
,
shape
)
const_shape
=
core
.
GEOperatorFactory
.
create_operator
(
"shape"
+
self
.
_accumulated_op_id
(),
"Const"
).
set_attr_tensor
(
"value"
,
tensor
)
reshape
=
core
.
GEOperatorFactory
.
create_operator
(
"reshape"
+
self
.
_accumulated_op_id
(),
"Reshape"
).
set_input
(
"x"
,
data_x1_shape
).
set_input
(
"shape"
,
const_shape
).
set_attr_int32
(
"axis"
,
axis
)
return
[
reshape
,
reshape
],
[[
0
],
[
1
]]
编辑
预览
Markdown
is supported
0%
请重试
或
添加新附件
.
添加附件
取消
You are about to add
0
people
to the discussion. Proceed with caution.
先完成此消息的编辑!
取消
想要评论请
注册
或
登录