Skip to content
体验新版
项目
组织
正在加载...
登录
切换导航
打开侧边栏
Crayon鑫
Paddle
提交
0360e583
P
Paddle
项目概览
Crayon鑫
/
Paddle
与 Fork 源项目一致
Fork自
PaddlePaddle / Paddle
通知
1
Star
1
Fork
0
代码
文件
提交
分支
Tags
贡献者
分支图
Diff
Issue
1
列表
看板
标记
里程碑
合并请求
0
Wiki
0
Wiki
分析
仓库
DevOps
项目成员
Pages
P
Paddle
项目概览
项目概览
详情
发布
仓库
仓库
文件
提交
分支
标签
贡献者
分支图
比较
Issue
1
Issue
1
列表
看板
标记
里程碑
合并请求
0
合并请求
0
Pages
分析
分析
仓库分析
DevOps
Wiki
0
Wiki
成员
成员
收起侧边栏
关闭侧边栏
动态
分支图
创建新Issue
提交
Issue看板
提交
0360e583
编写于
8月 06, 2020
作者:
S
sandyhouse
浏览文件
操作
浏览文件
下载
电子邮件补丁
差异文件
bug fix, test=develop
上级
63b58dc2
变更
2
显示空白变更内容
内联
并排
Showing
2 changed file
with
50 addition
and
35 deletion
+50
-35
paddle/fluid/framework/section_worker.cc
paddle/fluid/framework/section_worker.cc
+23
-5
python/paddle/fluid/optimizer.py
python/paddle/fluid/optimizer.py
+27
-30
未找到文件。
paddle/fluid/framework/section_worker.cc
浏览文件 @
0360e583
...
@@ -194,10 +194,17 @@ void SectionWorker::TrainFiles() {
...
@@ -194,10 +194,17 @@ void SectionWorker::TrainFiles() {
dev_ctx_
->
Wait
();
dev_ctx_
->
Wait
();
batch_timer
.
Pause
();
batch_timer
.
Pause
();
VLOG
(
0
)
<<
"batch time: "
<<
batch_timer
.
ElapsedUS
();
VLOG
(
0
)
<<
"batch time: "
<<
batch_timer
.
ElapsedUS
();
{
std
::
unique_lock
<
std
::
mutex
>
lk
(
thread_mutex
);
if
(
threads_completed
)
{
return
;
}
}
}
}
}
else
{
}
else
{
while
(
true
)
{
while
(
true
)
{
// forward pass:
// forward pass:
bool
local_completed
=
false
;
int
real_microbatch_num
=
0
;
int
real_microbatch_num
=
0
;
for
(
int
i
=
0
;
i
<
num_microbatches_
;
++
i
)
{
for
(
int
i
=
0
;
i
<
num_microbatches_
;
++
i
)
{
{
{
...
@@ -217,6 +224,7 @@ void SectionWorker::TrainFiles() {
...
@@ -217,6 +224,7 @@ void SectionWorker::TrainFiles() {
VLOG
(
3
)
<<
"thread "
<<
thread_id_
<<
" completed."
;
VLOG
(
3
)
<<
"thread "
<<
thread_id_
<<
" completed."
;
lk
.
unlock
();
lk
.
unlock
();
threads_completed
=
false
;
threads_completed
=
false
;
local_completed
=
true
;
break
;
break
;
}
}
lk
.
unlock
();
lk
.
unlock
();
...
@@ -282,6 +290,9 @@ void SectionWorker::TrainFiles() {
...
@@ -282,6 +290,9 @@ void SectionWorker::TrainFiles() {
}
}
}
}
dev_ctx_
->
Wait
();
dev_ctx_
->
Wait
();
if
(
local_completed
)
{
return
;
}
}
}
}
}
}
}
...
@@ -479,6 +490,7 @@ void SectionWorker::TrainFilesWithProfiler() {
...
@@ -479,6 +490,7 @@ void SectionWorker::TrainFilesWithProfiler() {
if
(
real_microbatch_num
==
0
)
{
if
(
real_microbatch_num
==
0
)
{
batch_timer
.
Pause
();
batch_timer
.
Pause
();
VLOG
(
0
)
<<
"batch time: "
<<
batch_timer
.
ElapsedUS
();
VLOG
(
0
)
<<
"batch time: "
<<
batch_timer
.
ElapsedUS
();
return
;
}
}
// update pass
// update pass
int
op_idx
=
0
;
int
op_idx
=
0
;
...
@@ -528,14 +540,15 @@ void SectionWorker::TrainFilesWithProfiler() {
...
@@ -528,14 +540,15 @@ void SectionWorker::TrainFilesWithProfiler() {
<<
"]:START["
<<
micro_start
.
tv_sec
*
1e6
+
micro_start
.
tv_usec
<<
"]:START["
<<
micro_start
.
tv_sec
*
1e6
+
micro_start
.
tv_usec
<<
"]:END["
<<
micro_end
.
tv_sec
*
1e6
+
micro_end
.
tv_usec
<<
"]"
<<
std
::
endl
;
<<
"]:END["
<<
micro_end
.
tv_sec
*
1e6
+
micro_end
.
tv_usec
<<
"]"
<<
std
::
endl
;
}
}
struct
timeval
wait_start
;
struct
timeval
wait_end
;
gettimeofday
(
&
wait_start
,
NULL
);
dev_ctx_
->
Wait
();
dev_ctx_
->
Wait
();
gettimeofday
(
&
wait_end
,
NULL
);
VLOG
(
0
)
<<
"device wait: "
<<
wait_end
.
tv_sec
*
1e6
+
wait_end
.
tv_usec
-
wait_start
.
tv_sec
*
1e6
-
wait_start
.
tv_usec
;
batch_timer
.
Pause
();
batch_timer
.
Pause
();
VLOG
(
0
)
<<
"batch time: "
<<
batch_timer
.
ElapsedUS
();
VLOG
(
0
)
<<
"batch time: "
<<
batch_timer
.
ElapsedUS
();
{
std
::
unique_lock
<
std
::
mutex
>
lk
(
thread_mutex
);
if
(
threads_completed
)
{
return
;
}
}
}
}
}
else
{
}
else
{
struct
timeval
start
;
struct
timeval
start
;
...
@@ -545,6 +558,7 @@ void SectionWorker::TrainFilesWithProfiler() {
...
@@ -545,6 +558,7 @@ void SectionWorker::TrainFilesWithProfiler() {
cudaEvent_t
cu_start
,
cu_stop
;
cudaEvent_t
cu_start
,
cu_stop
;
cudaEventCreate
(
&
cu_start
);
cudaEventCreate
(
&
cu_start
);
cudaEventCreate
(
&
cu_stop
);
cudaEventCreate
(
&
cu_stop
);
bool
local_completed
=
false
;
while
(
true
)
{
while
(
true
)
{
// forward pass:
// forward pass:
int
real_microbatch_num
=
0
;
int
real_microbatch_num
=
0
;
...
@@ -563,6 +577,7 @@ void SectionWorker::TrainFilesWithProfiler() {
...
@@ -563,6 +577,7 @@ void SectionWorker::TrainFilesWithProfiler() {
VLOG
(
3
)
<<
"thread "
<<
thread_id_
<<
" local_batch_id_ "
VLOG
(
3
)
<<
"thread "
<<
thread_id_
<<
" local_batch_id_ "
<<
local_batch_id_
<<
" batch_id_ "
<<
batch_id_
;
<<
local_batch_id_
<<
" batch_id_ "
<<
batch_id_
;
if
(
threads_completed
)
{
if
(
threads_completed
)
{
local_completed
=
true
;
VLOG
(
3
)
<<
"thread "
<<
thread_id_
<<
" completed."
;
VLOG
(
3
)
<<
"thread "
<<
thread_id_
<<
" completed."
;
lk
.
unlock
();
lk
.
unlock
();
VLOG
(
0
)
<<
"============timeline============"
;
VLOG
(
0
)
<<
"============timeline============"
;
...
@@ -742,6 +757,9 @@ void SectionWorker::TrainFilesWithProfiler() {
...
@@ -742,6 +757,9 @@ void SectionWorker::TrainFilesWithProfiler() {
<<
"]:END["
<<
micro_end
.
tv_sec
*
1e6
+
micro_end
.
tv_usec
<<
"]"
<<
std
::
endl
;
<<
"]:END["
<<
micro_end
.
tv_sec
*
1e6
+
micro_end
.
tv_usec
<<
"]"
<<
std
::
endl
;
}
}
dev_ctx_
->
Wait
();
dev_ctx_
->
Wait
();
if
(
local_completed
)
{
return
;
}
}
}
}
}
}
}
...
...
python/paddle/fluid/optimizer.py
浏览文件 @
0360e583
...
@@ -3772,30 +3772,31 @@ class PipelineOptimizer(object):
...
@@ -3772,30 +3772,31 @@ class PipelineOptimizer(object):
return
programs
return
programs
#def _find_post_op(self, ops, cur_op, var_name):
def
_find_post_op
(
self
,
ops
,
cur_op
,
var_name
):
# """
"""
# Find the real post op that has variable named var_name as input.
Find the real post op that has variable named var_name as input.
# Args:
Args:
# ops (list): A list of ops.
ops (list): A list of ops.
# cur_op (Operator): Current operator which has variable named
cur_op (Operator): Current operator which has variable named
# var_name as output.
var_name as output.
# var_name (string): Variable name.
var_name (string): Variable name.
# """
"""
# post_op = []
post_op
=
[]
# before = True
before
=
True
# for op in ops:
for
op
in
ops
:
# if op == cur_op:
if
op
==
cur_op
:
# before = False
before
=
False
# continue
continue
# if before:
if
before
:
# continue
continue
# for in_var_name in op.input_arg_names:
for
in_var_name
in
op
.
input_arg_names
:
# if in_var_name == var_name:
if
in_var_name
==
var_name
:
# post_op.append(op)
post_op
.
append
(
op
)
# if post_op:
break
# return post_op[0]
if
post_op
:
# return None
return
post_op
[
0
]
return
None
def
_find_real_prev_op
(
self
,
ops
,
cur_op
,
var_name
):
def
_find_real_prev_op
(
self
,
ops
,
cur_op
,
var_name
):
"""
"""
...
@@ -4009,12 +4010,8 @@ class PipelineOptimizer(object):
...
@@ -4009,12 +4010,8 @@ class PipelineOptimizer(object):
assert
'@RENAME@'
in
name
assert
'@RENAME@'
in
name
assert
len
(
op
.
desc
.
output_arg_names
())
==
1
assert
len
(
op
.
desc
.
output_arg_names
())
==
1
out_name
=
op
.
desc
.
output_arg_names
()[
0
]
out_name
=
op
.
desc
.
output_arg_names
()[
0
]
assert
core
.
grad_var_suffix
()
in
out_name
post_op
=
self
.
_find_post_op
(
block
.
ops
,
op
,
out_name
)
param_name
=
self
.
_strip_grad_suffix
(
out_name
)
device
=
post_op
.
attr
(
self
.
_op_device_key
)
assert
param_name
in
self
.
_param_device_map
device
=
self
.
_param_device_map
[
param_name
]
#post_op = self._find_post_op(block.ops, op, out_name)
#device = post_op.attr(self._op_device_key)
assert
device
assert
device
op
.
_set_attr
(
self
.
_op_device_key
,
device
)
op
.
_set_attr
(
self
.
_op_device_key
,
device
)
continue
continue
...
...
编辑
预览
Markdown
is supported
0%
请重试
或
添加新附件
.
添加附件
取消
You are about to add
0
people
to the discussion. Proceed with caution.
先完成此消息的编辑!
取消
想要评论请
注册
或
登录