Skip to content
体验新版
项目
组织
正在加载...
登录
切换导航
打开侧边栏
PaddlePaddle
ERNIE
提交
9f63e261
E
ERNIE
项目概览
PaddlePaddle
/
ERNIE
大约 1 年 前同步成功
通知
109
Star
5997
Fork
1270
代码
文件
提交
分支
Tags
贡献者
分支图
Diff
Issue
29
列表
看板
标记
里程碑
合并请求
0
Wiki
0
Wiki
分析
仓库
DevOps
项目成员
Pages
E
ERNIE
项目概览
项目概览
详情
发布
仓库
仓库
文件
提交
分支
标签
贡献者
分支图
比较
Issue
29
Issue
29
列表
看板
标记
里程碑
合并请求
0
合并请求
0
Pages
分析
分析
仓库分析
DevOps
Wiki
0
Wiki
成员
成员
收起侧边栏
关闭侧边栏
动态
分支图
创建新Issue
提交
Issue看板
提交
9f63e261
编写于
7月 10, 2019
作者:
Z
zhengya01
浏览文件
操作
浏览文件
下载
电子邮件补丁
差异文件
add ce for ERNIE
上级
a171e58e
变更
6
隐藏空白更改
内联
并排
Showing
6 changed files
with
165 additions
and
1 deletion
+165
-1
ERNIE/.run_ce.sh
ERNIE/.run_ce.sh
+43
-0
ERNIE/__init__.py
ERNIE/__init__.py
+0
-0
ERNIE/_ce.py
ERNIE/_ce.py
+67
-0
ERNIE/finetune_args.py
ERNIE/finetune_args.py
+3
-0
ERNIE/run_classifier.py
ERNIE/run_classifier.py
+24
-1
ERNIE/utils/cards.py
ERNIE/utils/cards.py
+28
-0
未找到文件。
ERNIE/.run_ce.sh
0 → 100644
浏览文件 @
9f63e261
set
-eux
export
FLAGS_sync_nccl_allreduce
=
1
MODEL_PATH
=
ERNIE_1.0.1
TASK_DATA_PATH
=
task_data
# Run run_classifier.py once on the XNLI data under ${TASK_DATA_PATH}, starting
# from the parameters under ${MODEL_PATH}, with --enable_ce set, a fixed
# --random_seed and --shuffle false. The GPUs used are whatever
# CUDA_VISIBLE_DEVICES is exported as when this function is called.
# Output goes to stdout so the caller can pipe it into _ce.py.
train() {
    python -u run_classifier.py \
        --use_cuda true \
        --do_train true \
        --do_val true \
        --do_test true \
        --verbose true \
        --batch_size 8192 \
        --in_tokens true \
        --init_pretraining_params ${MODEL_PATH}/params \
        --train_set ${TASK_DATA_PATH}/xnli/train.tsv \
        --dev_set ${TASK_DATA_PATH}/xnli/dev.tsv \
        --test_set ${TASK_DATA_PATH}/xnli/test.tsv \
        --vocab_path config/vocab.txt \
        --label_map ${TASK_DATA_PATH}/xnli/label_map.json \
        --ernie_config_path config/ernie_config.json \
        --checkpoints ./checkpoints \
        --save_steps 2000 \
        --weight_decay 0.01 \
        --warmup_proportion 0.0 \
        --validation_steps 25 \
        --epoch 1 \
        --max_seq_len 512 \
        --learning_rate 1e-4 \
        --skip_steps 10 \
        --num_iteration_per_drop_scope 1 \
        --num_labels 3 \
        --random_seed 100 \
        --enable_ce \
        --shuffle false
}
export
CUDA_VISIBLE_DEVICES
=
0
train | python _ce.py
export
CUDA_VISIBLE_DEVICES
=
0,1,2,3
train | python _ce.py
ERNIE/__init__.py
0 → 100644
浏览文件 @
9f63e261
ERNIE/_ce.py
0 → 100644
浏览文件 @
9f63e261
#### This file is only used for continuous evaluation (CE) tests!
import
os
import
sys
sys
.
path
.
insert
(
0
,
os
.
environ
[
'ceroot'
])
from
kpi
import
CostKpi
,
DurationKpi
,
AccKpi
#### NOTE: kpi.py should be shared across models in some way!
# One KPI object per (metric, card count) pair. The first argument is the KPI
# name; it has to match the name printed on the "kpis\t<name>\t<value>" lines
# of the training log, because log_to_ce() looks trackers up by `kpi.name`.
# NOTE(review): the second and third positional arguments are presumably the
# allowed relative difference and the number of leading records to skip --
# confirm against the constructor signatures in kpi.py.
train_loss_card1_kpi = CostKpi('train_loss_card1', 0.03, 0, actived=True)
train_acc_card1_kpi = AccKpi('train_acc_card1', 0.06, 0, actived=True)
train_duration_card1_kpi = DurationKpi(
    'train_duration_card1', 0.01, 0, actived=True)

train_loss_card4_kpi = CostKpi('train_loss_card4', 0.01, 0, actived=True)
train_acc_card4_kpi = AccKpi('train_acc_card4', 0.02, 0, actived=True)
train_duration_card4_kpi = DurationKpi(
    'train_duration_card4', 0.02, 0, actived=True)

# Every KPI that log_to_ce() is able to record; a KPI name found in the log
# but missing from this list makes log_to_ce() raise KeyError.
tracking_kpis = [
    train_loss_card1_kpi,
    train_acc_card1_kpi,
    train_duration_card1_kpi,
    train_loss_card4_kpi,
    train_acc_card4_kpi,
    train_duration_card4_kpi,
]
def parse_log(log):
    """Yield ``(kpi_name, kpi_value)`` pairs found in a training log.

    The log is split on newlines; each line is stripped and split on tab
    characters. A line is a KPI record when it has exactly three fields
    and the first field is the literal ``kpis``: the second field is the
    KPI name and the third is converted with ``float``. Every other line
    is ignored.

    The field list of every line is echoed to stdout, and KPI records are
    echoed a second time with a ``-----`` prefix.

    Args:
        log: Full training output as a single string.

    Yields:
        Tuples of ``(name, value)`` in the order the records appear.

    Raises:
        ValueError: If the value field of a KPI record is not a valid
            float literal.
    """
    for raw_line in log.split('\n'):
        fields = raw_line.strip().split('\t')
        print(fields)
        # Anything that is not a three-field "kpis" record is skipped.
        if len(fields) != 3 or fields[0] != 'kpis':
            continue
        print("-----%s" % fields)
        _, name, value = fields
        yield name, float(value)
def log_to_ce(log):
    """Record every KPI found in ``log`` on its tracker and persist it.

    Trackers are taken from the module-level ``tracking_kpis`` list and
    indexed by their ``name`` attribute. Each ``(name, value)`` pair
    produced by ``parse_log`` is echoed to stdout, added to the matching
    tracker with ``add_record`` and then persisted with ``persist``.

    Args:
        log: Full training output as a single string.

    Raises:
        KeyError: If the log contains a KPI name that has no entry in
            ``tracking_kpis``.
    """
    trackers = {kpi.name: kpi for kpi in tracking_kpis}

    for kpi_name, kpi_value in parse_log(log):
        print(kpi_name, kpi_value)
        tracker = trackers[kpi_name]
        tracker.add_record(kpi_value)
        tracker.persist()
if __name__ == '__main__':
    # The whole training log is read from stdin; .run_ce.sh pipes the
    # output of the training run into this script.
    log = sys.stdin.read()
    # Echo the raw log between marker lines before parsing it.
    print("*****")
    print(log)
    print("****")
    log_to_ce(log)
ERNIE/finetune_args.py
浏览文件 @
9f63e261
...
@@ -74,4 +74,7 @@ run_type_g.add_arg("do_train", bool, True, "Whether to pe
...
@@ -74,4 +74,7 @@ run_type_g.add_arg("do_train", bool, True, "Whether to pe
run_type_g
.
add_arg
(
"do_val"
,
bool
,
True
,
"Whether to perform evaluation on dev data set."
)
run_type_g
.
add_arg
(
"do_val"
,
bool
,
True
,
"Whether to perform evaluation on dev data set."
)
run_type_g
.
add_arg
(
"do_test"
,
bool
,
True
,
"Whether to perform evaluation on test data set."
)
run_type_g
.
add_arg
(
"do_test"
,
bool
,
True
,
"Whether to perform evaluation on test data set."
)
run_type_g
.
add_arg
(
"metrics"
,
bool
,
True
,
"Whether to perform evaluation on test data set."
)
run_type_g
.
add_arg
(
"metrics"
,
bool
,
True
,
"Whether to perform evaluation on test data set."
)
run_type_g
.
add_arg
(
"shuffle"
,
bool
,
True
,
""
)
parser
.
add_argument
(
"--enable_ce"
,
action
=
'store_true'
,
help
=
"The flag indicating whether to run the task for continuous evaluation."
)
# yapf: enable
# yapf: enable
ERNIE/run_classifier.py
浏览文件 @
9f63e261
...
@@ -29,6 +29,7 @@ from finetune.classifier import create_model, evaluate
...
@@ -29,6 +29,7 @@ from finetune.classifier import create_model, evaluate
from
optimization
import
optimization
from
optimization
import
optimization
from
utils.args
import
print_arguments
,
check_cuda
from
utils.args
import
print_arguments
,
check_cuda
from
utils.init
import
init_pretraining_params
,
init_checkpoint
from
utils.init
import
init_pretraining_params
,
init_checkpoint
from
utils.cards
import
get_cards
from
finetune_args
import
parser
from
finetune_args
import
parser
args
=
parser
.
parse_args
()
args
=
parser
.
parse_args
()
...
@@ -67,7 +68,7 @@ def main(args):
...
@@ -67,7 +68,7 @@ def main(args):
input_file
=
args
.
train_set
,
input_file
=
args
.
train_set
,
batch_size
=
args
.
batch_size
,
batch_size
=
args
.
batch_size
,
epoch
=
args
.
epoch
,
epoch
=
args
.
epoch
,
shuffle
=
Tru
e
,
shuffle
=
args
.
shuffl
e
,
phase
=
"train"
)
phase
=
"train"
)
num_train_examples
=
reader
.
get_num_examples
(
args
.
train_set
)
num_train_examples
=
reader
.
get_num_examples
(
args
.
train_set
)
...
@@ -85,6 +86,8 @@ def main(args):
...
@@ -85,6 +86,8 @@ def main(args):
print
(
"Num warmup steps: %d"
%
warmup_steps
)
print
(
"Num warmup steps: %d"
%
warmup_steps
)
train_program
=
fluid
.
Program
()
train_program
=
fluid
.
Program
()
if
args
.
random_seed
is
not
None
and
args
.
enable_ce
:
train_program
.
random_seed
=
args
.
random_seed
with
fluid
.
program_guard
(
train_program
,
startup_prog
):
with
fluid
.
program_guard
(
train_program
,
startup_prog
):
with
fluid
.
unique_name
.
guard
():
with
fluid
.
unique_name
.
guard
():
...
@@ -187,6 +190,7 @@ def main(args):
...
@@ -187,6 +190,7 @@ def main(args):
if
warmup_steps
>
0
:
if
warmup_steps
>
0
:
graph_vars
[
"learning_rate"
]
=
scheduled_lr
graph_vars
[
"learning_rate"
]
=
scheduled_lr
ce_info
=
[]
time_begin
=
time
.
time
()
time_begin
=
time
.
time
()
while
True
:
while
True
:
try
:
try
:
...
@@ -213,6 +217,7 @@ def main(args):
...
@@ -213,6 +217,7 @@ def main(args):
(
current_epoch
,
current_example
,
num_train_examples
,
(
current_epoch
,
current_example
,
num_train_examples
,
steps
,
outputs
[
"loss"
],
outputs
[
"accuracy"
],
steps
,
outputs
[
"loss"
],
outputs
[
"accuracy"
],
args
.
skip_steps
/
used_time
))
args
.
skip_steps
/
used_time
))
ce_info
.
append
([
outputs
[
"loss"
],
outputs
[
"accuracy"
],
used_time
])
time_begin
=
time
.
time
()
time_begin
=
time
.
time
()
if
steps
%
args
.
save_steps
==
0
:
if
steps
%
args
.
save_steps
==
0
:
...
@@ -246,6 +251,24 @@ def main(args):
...
@@ -246,6 +251,24 @@ def main(args):
fluid
.
io
.
save_persistables
(
exe
,
save_path
,
train_program
)
fluid
.
io
.
save_persistables
(
exe
,
save_path
,
train_program
)
train_pyreader
.
reset
()
train_pyreader
.
reset
()
break
break
if
args
.
enable_ce
:
card_num
=
get_cards
()
ce_loss
=
0
ce_acc
=
0
ce_time
=
0
try
:
ce_loss
=
ce_info
[
-
2
][
0
]
ce_acc
=
ce_info
[
-
2
][
1
]
ce_time
=
ce_info
[
-
2
][
2
]
except
:
print
(
"ce info error"
)
print
(
"kpis
\t
train_duration_card%s
\t
%s"
%
(
card_num
,
ce_time
))
print
(
"kpis
\t
train_loss_card%s
\t
%f"
%
(
card_num
,
ce_loss
))
print
(
"kpis
\t
train_acc_card%s
\t
%f"
%
(
card_num
,
ce_acc
))
# final eval on dev set
# final eval on dev set
if
args
.
do_val
:
if
args
.
do_val
:
...
...
ERNIE/utils/cards.py
0 → 100644
浏览文件 @
9f63e261
# Copyright (c) 2019 PaddlePaddle Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
import
os
def get_cards():
    """Return the number of GPU cards listed in ``CUDA_VISIBLE_DEVICES``.

    The variable is read from the process environment and split on
    commas. Blank entries (produced by a trailing comma, doubled commas,
    or a value that contains only whitespace) are ignored so that they
    are not counted as cards.

    Returns:
        int: Number of non-blank comma-separated entries; 0 when the
        variable is unset or empty.
    """
    visible = os.environ.get('CUDA_VISIBLE_DEVICES', '')
    # Count only entries that contain something other than whitespace.
    return sum(1 for card in visible.split(',') if card.strip())
编辑
预览
Markdown
is supported
0%
请重试
或
添加新附件
.
添加附件
取消
You are about to add
0
people
to the discussion. Proceed with caution.
先完成此消息的编辑!
取消
想要评论请
注册
或
登录