BaiXuePrincess / Paddle (forked from PaddlePaddle / Paddle)

Unverified commit 339aefac
Authored Nov 09, 2022 by zhaoyingli; committed by GitHub on Nov 09, 2022
manage no shape var type (#47775)
Parent 692a9632
Showing 8 changed files with 42 additions and 85 deletions (+42 -85)
python/paddle/distributed/auto_parallel/completion.py    +4  -8
python/paddle/distributed/auto_parallel/dist_context.py  +4  -15
python/paddle/distributed/auto_parallel/dist_op.py       +11 -33
python/paddle/distributed/auto_parallel/dist_tensor.py   +3  -13
python/paddle/distributed/auto_parallel/engine.py        +1  -1
python/paddle/distributed/auto_parallel/interface.py     +6  -7
python/paddle/distributed/auto_parallel/partitioner.py   +9  -7
python/paddle/distributed/auto_parallel/utils.py         +4  -1
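This commit consolidates the auto-parallel "shape-less variable" checks. Previously each module compared a variable's type inline against `core.VarDesc.VarType.READER`, `LOD_TENSOR_ARRAY`, and `STEP_SCOPES` (with slightly different subsets at different call sites, and in one spot comparing `tensor_desc.type` without the call parentheses), while `utils.py` and `partitioner.py` each kept their own `__not_shape_var_type__` list. The list is now renamed to `__no_shape_var_type__`, defined once in `utils.py`, extended with `FEED_MINIBATCH` and `FETCH_LIST`, and imported everywhere else. A minimal, self-contained sketch of the consolidated pattern (the helper name is illustrative, not part of the commit):

```python
from paddle.fluid import core

# The shared list, exactly as defined in utils.py after this commit.
__no_shape_var_type__ = [
    core.VarDesc.VarType.READER,
    core.VarDesc.VarType.STEP_SCOPES,
    core.VarDesc.VarType.LOD_TENSOR_ARRAY,
    core.VarDesc.VarType.FEED_MINIBATCH,
    core.VarDesc.VarType.FETCH_LIST,
]


def tensor_shape_or_empty(var):
    """Return var.shape, or [] for variable types that carry no shape."""
    if var.type in __no_shape_var_type__:
        return []
    return var.shape
```

Every hunk below is an instance of this pattern: a multi-line `or` chain collapses into one membership test, and shape-less variables uniformly get an empty shape.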
python/paddle/distributed/auto_parallel/completion.py

```diff
@@ -18,7 +18,7 @@ import logging
 from paddle.fluid import core
 from .utils import is_naive_data_parallel, get_logger
-from .utils import is_gradient_clip_op, __not_shape_var_type__
+from .utils import is_gradient_clip_op, __no_shape_var_type__
 from .operators import find_compatible_distributed_operator_impls
 from .dist_context import _node_id
 from .dist_attribute import TensorDistributedAttribute
@@ -151,11 +151,7 @@ class Completer:
             return False
         tensor_desc = tensor_node.var()
         # Skip reader tensor
-        if (
-            tensor_desc.type() == core.VarDesc.VarType.READER
-            or tensor_desc.type == core.VarDesc.VarType.LOD_TENSOR_ARRAY
-            or tensor_desc.type == core.VarDesc.VarType.STEP_SCOPES
-        ):
+        if tensor_desc.type() in __no_shape_var_type__:
             return False
         tensor_dist_attr = self._dist_context.get_tensor_dist_attr_for_graph(
             tensor_node
@@ -621,7 +617,7 @@ class Completer:
                 ):
                     if (
-                        tensor_node.var().type() in __not_shape_var_type__
+                        tensor_node.var().type() in __no_shape_var_type__
                         or len(tensor_node.var().shape()) != 1
                     ):
                         flag = False
@@ -633,7 +629,7 @@ class Completer:
                 ):
                     if (
-                        tensor_node.var().type() in __not_shape_var_type__
+                        tensor_node.var().type() in __no_shape_var_type__
                         or len(tensor_node.var().shape()) != 1
                     ):
                         flag = False
```
python/paddle/distributed/auto_parallel/dist_context.py

```diff
@@ -22,7 +22,7 @@ from .dist_tensor import DistributedTensor
 from .dist_op import DistributedOperator
 from .process_mesh import ProcessMesh
 from .utils import _copy_dist_attr_to_cpp
-from .utils import is_loss_grad_op
+from .utils import is_loss_grad_op, __no_shape_var_type__
 
 
 # There always exists a default context for user. And user can set it to another one.
@@ -862,11 +862,7 @@ class DistributedContext:
         for dist_tensor in self._dist_tensors_for_program.values():
             serial_tensor = dist_tensor.serial_tensor
             dist_attr = dist_tensor.dist_attr
-            if (
-                serial_tensor.type == core.VarDesc.VarType.READER
-                or serial_tensor.type == core.VarDesc.VarType.LOD_TENSOR_ARRAY
-                or serial_tensor.type == core.VarDesc.VarType.STEP_SCOPES
-            ):
+            if serial_tensor.type in __no_shape_var_type__:
                 tensor_shape = []
             else:
                 tensor_shape = serial_tensor.shape
@@ -896,10 +892,7 @@ class DistributedContext:
                 else:
                     if (
                         dist_op.get_serial_input(arg_name).type
-                        == core.VarDesc.VarType.READER
-                        or dist_op.get_serial_input(arg_name).type
-                        == core.VarDesc.VarType.LOD_TENSOR_ARRAY
-                        or dist_op.serial_op.type == "create_py_reader"
+                        in __no_shape_var_type__
                     ):
                         tensor_shape = []
                     else:
@@ -923,11 +916,7 @@ class DistributedContext:
             for arg_name in serial_op.output_arg_names:
                 if (
                     dist_op.get_serial_output(arg_name).type
-                    == core.VarDesc.VarType.READER
-                    or dist_op.get_serial_output(arg_name).type
-                    == core.VarDesc.VarType.LOD_TENSOR_ARRAY
-                    or dist_op.get_serial_output(arg_name).type
-                    == core.VarDesc.VarType.STEP_SCOPES
+                    in __no_shape_var_type__
                 ):
                     tensor_shape = []
                 else:
```
python/paddle/distributed/auto_parallel/dist_op.py

```diff
@@ -14,12 +14,15 @@
 import copy
 
 import paddle
 from paddle.fluid import core
 from paddle.fluid.framework import Variable
 from .dist_attribute import OperatorDistributedAttribute
 from .dist_attribute import append_op_input_suffix
 from .dist_attribute import append_op_output_suffix
-from .utils import convert_to_shard_spec, verify_shard_spec
+from .utils import (
+    convert_to_shard_spec,
+    verify_shard_spec,
+    __no_shape_var_type__,
+)
 
 
 class DistributedOperator:
@@ -73,10 +76,7 @@ class DistributedOperator:
             if tensor is None:
                 tensor_shape = []
             else:
-                if (
-                    tensor.type == core.VarDesc.VarType.READER
-                    or tensor.type == core.VarDesc.VarType.LOD_TENSOR_ARRAY
-                ):
+                if tensor.type in __no_shape_var_type__:
                     tensor_shape = []
                 else:
                     tensor_shape = tensor.shape
@@ -87,11 +87,7 @@ class DistributedOperator:
             )
         for tensor_name in self._serial_op.output_arg_names:
             tensor = self._serial_op.block._var_recursive(tensor_name)
-            if (
-                tensor.type == core.VarDesc.VarType.READER
-                or tensor.type == core.VarDesc.VarType.LOD_TENSOR_ARRAY
-                or tensor.type == core.VarDesc.VarType.STEP_SCOPES
-            ):
+            if tensor.type in __no_shape_var_type__:
                 tensor_shape = []
             else:
                 tensor_shape = tensor.shape
@@ -151,10 +147,7 @@ class DistributedOperator:
         for name in self.serial_op.input_arg_names:
             input_dist_attr = self.dist_attr.get_input_dist_attr(name)
             dims_mapping = input_dist_attr.dims_mapping
-            if (
-                self.get_serial_input(name).type
-                == core.VarDesc.VarType.LOD_TENSOR_ARRAY
-            ):
+            if self.get_serial_input(name).type in __no_shape_var_type__:
                 shape = []
             else:
                 shape = self.get_serial_input(name).shape
@@ -174,12 +167,7 @@ class DistributedOperator:
        for name in self.serial_op.output_arg_names:
             output_dist_attr = self.dist_attr.get_output_dist_attr(name)
             dims_mapping = output_dist_attr.dims_mapping
-            if (
-                self.get_serial_output(name).type
-                == core.VarDesc.VarType.LOD_TENSOR_ARRAY
-                or self.get_serial_output(name).type
-                == core.VarDesc.VarType.STEP_SCOPES
-            ):
+            if self.get_serial_output(name).type in __no_shape_var_type__:
                 shape = []
             else:
                 shape = self.get_serial_output(name).shape
@@ -337,12 +325,7 @@ class DistributedOperatorHelper:
             if tensor is None:
                 tensor_shape = []
             else:
-                if (
-                    tensor.type == core.VarDesc.VarType.READER
-                    or tensor.type == core.VarDesc.VarType.LOD_TENSOR_ARRAY
-                    or tensor.type == core.VarDesc.VarType.STEP_SCOPES
-                ):
+                if tensor.type in __no_shape_var_type__:
                     tensor_shape = []
                 else:
                     tensor_shape = tensor.shape
@@ -368,12 +351,7 @@ class DistributedOperatorHelper:
             if tensor is None:
                 tensor_shape = []
             else:
-                if (
-                    tensor.type == core.VarDesc.VarType.READER
-                    or tensor.type == core.VarDesc.VarType.LOD_TENSOR_ARRAY
-                    or tensor.type == core.VarDesc.VarType.STEP_SCOPES
-                ):
+                if tensor.type in __no_shape_var_type__:
                     tensor_shape = []
                 else:
                     tensor_shape = tensor.shape
```
python/paddle/distributed/auto_parallel/dist_tensor.py

```diff
@@ -16,10 +16,9 @@ import copy
 import inspect
 
 import paddle
 from paddle.fluid import core
 from paddle.fluid.framework import Parameter, Block, Variable
 from .dist_attribute import TensorDistributedAttribute
-from .utils import _linear_idx2coordinate
+from .utils import _linear_idx2coordinate, __no_shape_var_type__
 
 
 class DistributedTensor:
@@ -208,12 +207,7 @@ class DistributedTensor:
     def _init_default_dist_attr(self):
         if self._dist_attr.dims_mapping is None:
-            if (
-                self.serial_tensor.type == core.VarDesc.VarType.READER
-                or self.serial_tensor.type
-                == core.VarDesc.VarType.LOD_TENSOR_ARRAY
-                or self.serial_tensor.type == core.VarDesc.VarType.STEP_SCOPES
-            ):
+            if self.serial_tensor.type in __no_shape_var_type__:
                 tensor_shape = []
             else:
                 tensor_shape = self._serial_tensor.shape
@@ -221,11 +215,7 @@ class DistributedTensor:
         self._dist_attr.dims_mapping = tensor_dims_mapping
 
     def validate_dist_attr(self):
-        if (
-            self.serial_tensor.type == core.VarDesc.VarType.READER
-            or self.serial_tensor.type == core.VarDesc.VarType.LOD_TENSOR_ARRAY
-            or self.serial_tensor.type == core.VarDesc.VarType.STEP_SCOPES
-        ):
+        if self.serial_tensor.type in __no_shape_var_type__:
             return True
         tensor_shape = self.serial_tensor.shape
         if len(tensor_shape) != len(self.dist_attr.dims_mapping):
```
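The `validate_dist_attr` change above is a fast path: a shape-less variable has no shape to reconcile with its `dims_mapping`, so validation can return `True` immediately. A standalone sketch of that logic (a hypothetical free function, not Paddle's actual method):

```python
def dims_mapping_is_valid(var_type, shape, dims_mapping, no_shape_types):
    # Shape-less variable types (READER, STEP_SCOPES, ...) have nothing
    # to validate, mirroring the early `return True` in the hunk above.
    if var_type in no_shape_types:
        return True
    # Otherwise each tensor dimension needs exactly one mapping entry.
    return len(shape) == len(dims_mapping)
```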
python/paddle/distributed/auto_parallel/engine.py

```diff
@@ -580,7 +580,7 @@ class Engine:
                         metric.compute(*(outputs + self._labels))
                     )
                 )
-        else:
+        elif mode == "train":
             assert isinstance(
                 self._loss, Variable
             ), "the type of `loss` of the Engine arguments should be Variable."
```
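One behavioral note on the engine.py hunk above: switching `else:` to `elif mode == "train":` narrows the assertion, so only the training path demands that `self._loss` be a `Variable`, and other modes fall through the chain. A condensed sketch of the narrowed guard (free-standing form, names illustrative):

```python
from paddle.fluid.framework import Variable


def check_loss_for_mode(loss, mode):
    # After this commit the assertion is train-only; eval/predict style
    # modes no longer require a loss Variable here.
    if mode == "train":
        assert isinstance(
            loss, Variable
        ), "the type of `loss` of the Engine arguments should be Variable."
```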
python/paddle/distributed/auto_parallel/interface.py

```diff
@@ -13,13 +13,16 @@
 # limitations under the License.
 
 import paddle
 from paddle.fluid import core
 from .process_mesh import ProcessMesh
 from .process_mesh import get_current_process_mesh
 from .dist_context import get_default_distributed_context
 from .dist_tensor import DistributedTensor
 from .dist_op import DistributedOperatorHelper
-from .utils import verify_shard_spec, convert_to_dims_mapping
+from .utils import (
+    verify_shard_spec,
+    convert_to_dims_mapping,
+    __no_shape_var_type__,
+)
 
 
 def shard_tensor(x, process_mesh=None, shard_spec=None):
@@ -79,11 +82,7 @@ def shard_tensor(x, process_mesh=None, shard_spec=None):
     dist_tensor = DistributedTensor(x)
     serial_tensor = dist_tensor.serial_tensor
     dist_tensor.dist_attr.process_mesh = process_mesh
-    if (
-        serial_tensor.type == core.VarDesc.VarType.READER
-        or serial_tensor.type == core.VarDesc.VarType.LOD_TENSOR_ARRAY
-        or serial_tensor.type == core.VarDesc.VarType.STEP_SCOPES
-    ):
+    if serial_tensor.type in __no_shape_var_type__:
         tensor_shape = []
     else:
         tensor_shape = serial_tensor.shape
```
python/paddle/distributed/auto_parallel/partitioner.py

```diff
@@ -22,14 +22,16 @@ from paddle.distributed.auto_parallel.operators.common import (
 )
 from paddle.distributed.auto_parallel.dist_context import DistributedContext
 from .dist_attribute import OperatorDistributedAttribute
-from .utils import is_backward_op, is_forward_op, is_loss_op, is_optimize_op
 from .operators.common import BACKWARD_ONLY_DIST_OPS
+from .utils import (
+    is_backward_op,
+    is_forward_op,
+    is_loss_op,
+    is_optimize_op,
+    __no_shape_var_type__,
+)
 
 __varname_not_in_block__ = ["lod_tensor_blocking_queue"]
-__not_shape_var_type__ = [
-    core.VarDesc.VarType.READER,
-    core.VarDesc.VarType.STEP_SCOPES,
-]
 
 
 class Partitioner:
@@ -363,7 +365,7 @@ class Partitioner:
         var_dist_attrs = [
             self._dist_context.get_tensor_dist_attr_for_program(var)
             for var in vars_
-            if (var.type not in __not_shape_var_type__)
+            if (var.type not in __no_shape_var_type__)
         ]
 
         all_ops_annotated = all(
@@ -468,7 +470,7 @@ def _partition_var(
     """
     src_var = src_block.var(src_varname)
 
-    if src_var.type in __not_shape_var_type__:
+    if src_var.type in __no_shape_var_type__:
         persist = getattr(src_var, 'persistable', False)
         new_var = dst_block.create_var(
             type=src_var.type,
```
python/paddle/distributed/auto_parallel/utils.py

```diff
@@ -33,9 +33,12 @@ from paddle.distributed.auto_parallel.dist_attribute import (
     OperatorDistributedAttribute,
 )
 
-__not_shape_var_type__ = [
+__no_shape_var_type__ = [
     core.VarDesc.VarType.READER,
     core.VarDesc.VarType.STEP_SCOPES,
+    core.VarDesc.VarType.LOD_TENSOR_ARRAY,
+    core.VarDesc.VarType.FEED_MINIBATCH,
+    core.VarDesc.VarType.FETCH_LIST,
 ]
 
 __not_naive_data_parallel_op__ = ["expand_v2"]
```
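With the canonical list now living in utils.py, call sites import it directly, as the hunks above do with `from .utils import __no_shape_var_type__`. Note that partitioner.py previously kept its own two-entry copy (READER, STEP_SCOPES); switching to the shared five-entry list means `_partition_var` now also treats LOD_TENSOR_ARRAY, FEED_MINIBATCH, and FETCH_LIST variables as shape-less. A quick usage sketch from outside the package (import path as in this commit; the leading underscores do not prevent an explicit import):

```python
from paddle.fluid import core
from paddle.distributed.auto_parallel.utils import __no_shape_var_type__

# The two former partitioner-local entries plus the three added here.
assert core.VarDesc.VarType.READER in __no_shape_var_type__
assert core.VarDesc.VarType.FETCH_LIST in __no_shape_var_type__
```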