Skip to content
体验新版
项目
组织
正在加载...
登录
切换导航
打开侧边栏
PaddlePaddle
PaddleClas
提交
1d17c637
P
PaddleClas
项目概览
PaddlePaddle
/
PaddleClas
大约 1 年 前同步成功
通知
115
Star
4999
Fork
1114
代码
文件
提交
分支
Tags
贡献者
分支图
Diff
Issue
19
列表
看板
标记
里程碑
合并请求
6
Wiki
0
Wiki
分析
仓库
DevOps
项目成员
Pages
P
PaddleClas
项目概览
项目概览
详情
发布
仓库
仓库
文件
提交
分支
标签
贡献者
分支图
比较
Issue
19
Issue
19
列表
看板
标记
里程碑
合并请求
6
合并请求
6
Pages
分析
分析
仓库分析
DevOps
Wiki
0
Wiki
成员
成员
收起侧边栏
关闭侧边栏
动态
分支图
创建新Issue
提交
Issue看板
提交
1d17c637
编写于
3月 08, 2022
作者:
D
dongshuilong
浏览文件
操作
浏览文件
下载
电子邮件补丁
差异文件
fix shufflenet_bs1536, mv3 slim train, static env num_workers=8, resnet50 bs256 bug
上级
abbe1b85
变更
11
隐藏空白更改
内联
并排
Showing
11 changed files
with
80 additions
and
8 deletions
+80
-8
test_tipc/benchmark_train.sh
test_tipc/benchmark_train.sh
+5
-1
test_tipc/config/ShuffleNet/ShuffleNetV2_x1_0_train_infer_python.txt
...onfig/ShuffleNet/ShuffleNetV2_x1_0_train_infer_python.txt
+2
-2
test_tipc/static/ResNet50/N1C1/ResNet50_bs256_fp16_SingleP_DP.sh
...pc/static/ResNet50/N1C1/ResNet50_bs256_fp16_SingleP_DP.sh
+13
-0
test_tipc/static/ResNet50/N1C1/ResNet50_bs256_fp32_SingleP_DP.sh
...pc/static/ResNet50/N1C1/ResNet50_bs256_fp32_SingleP_DP.sh
+17
-0
test_tipc/static/ResNet50/N1C1/ResNet50_bs64_fp16_SingleP_DP.sh
...ipc/static/ResNet50/N1C1/ResNet50_bs64_fp16_SingleP_DP.sh
+1
-1
test_tipc/static/ResNet50/N1C1/ResNet50_bs64_fp32_SingleP_DP.sh
...ipc/static/ResNet50/N1C1/ResNet50_bs64_fp32_SingleP_DP.sh
+1
-1
test_tipc/static/ResNet50/N1C8/ResNet50_bs256_fp16_MultiP_DP.sh
...ipc/static/ResNet50/N1C8/ResNet50_bs256_fp16_MultiP_DP.sh
+13
-0
test_tipc/static/ResNet50/N1C8/ResNet50_bs256_fp32_MultiP_DP.sh
...ipc/static/ResNet50/N1C8/ResNet50_bs256_fp32_MultiP_DP.sh
+13
-0
test_tipc/static/ResNet50/N1C8/ResNet50_bs64_fp16_MultiP_DP.sh
...tipc/static/ResNet50/N1C8/ResNet50_bs64_fp16_MultiP_DP.sh
+1
-1
test_tipc/static/ResNet50/N1C8/ResNet50_bs64_fp32_MultiP_DP.sh
...tipc/static/ResNet50/N1C8/ResNet50_bs64_fp32_MultiP_DP.sh
+1
-1
test_tipc/static/ResNet50/benchmark_common/run_benchmark.sh
test_tipc/static/ResNet50/benchmark_common/run_benchmark.sh
+13
-1
未找到文件。
test_tipc/benchmark_train.sh
浏览文件 @
1d17c637
...
...
@@ -69,7 +69,7 @@ PARAMS=$3
IFS
=
$'
\n
'
# parser params from train_benchmark.txt
sed
-i
's/ -o DataLoader.Train.sampler.shuffle=False//g'
$FILENAME
sed
-i
's/ -o DataLoader.Train.loader.num_workers=0//g'
$FILENAME
sed
-i
's/ -o DataLoader.Train.loader.num_workers=0/
-o Global.print_batch_step=1
/g'
$FILENAME
sed
-i
's/-o DataLoader.Train.loader.use_shared_memory=False/-o Global.eval_during_train=False/g'
$FILENAME
dataline
=
`
cat
$FILENAME
`
# parser params
...
...
@@ -117,10 +117,14 @@ line_profile=13
line_eval_py
=
24
line_export_py
=
30
line_norm_train
=
16
line_pact_train
=
17
line_fgpm_train
=
18
func_sed_params
"
$FILENAME
"
"
${
line_eval_py
}
"
"null"
func_sed_params
"
$FILENAME
"
"
${
line_export_py
}
"
"null"
func_sed_params
"
$FILENAME
"
"
${
line_python
}
"
"
$python
"
func_sed_params
"
$FILENAME
"
"
${
line_pact_train
}
"
"null"
func_sed_params
"
$FILENAME
"
"
${
line_fgpm_train
}
"
"null"
# if params
if
[
!
-n
"
$PARAMS
"
]
;
then
...
...
test_tipc/config/ShuffleNet/ShuffleNetV2_x1_0_train_infer_python.txt
浏览文件 @
1d17c637
...
...
@@ -53,8 +53,8 @@ null:null
===========================train_benchmark_params==========================
batch_size:256|1536
fp_items:fp32
epoch:
1
epoch:
2
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
===========================infer_benchmark_params==========================
random_infer_input:[{float32,[3,224,224]}]
\ No newline at end of file
random_infer_input:[{float32,[3,224,224]}]
test_tipc/static/ResNet50/N1C1/ResNet50_bs256_fp16_SingleP_DP.sh
0 → 100644
浏览文件 @
1d17c637
model_item
=
ResNet50
bs_item
=
256
fp_item
=
fp16
run_process_type
=
SingleP
run_mode
=
DP
device_num
=
N1C1
max_epochs
=
1
num_workers
=
8
# get data
bash test_tipc/static/
${
model_item
}
/benchmark_common/prepare.sh
# run
bash test_tipc/static/
${
model_item
}
/benchmark_common/run_benchmark.sh
${
model_item
}
${
bs_item
}
${
fp_item
}
${
run_process_type
}
${
run_mode
}
${
device_num
}
${
max_epochs
}
${
num_workers
}
2>&1
;
test_tipc/static/ResNet50/N1C1/ResNet50_bs256_fp32_SingleP_DP.sh
0 → 100644
浏览文件 @
1d17c637
model_item
=
ResNet50
bs_item
=
256
fp_item
=
fp32
run_process_type
=
SingleP
run_mode
=
DP
device_num
=
N1C1
max_epochs
=
1
num_workers
=
8
# get data
bash test_tipc/static/
${
model_item
}
/benchmark_common/prepare.sh
# run
bash test_tipc/static/
${
model_item
}
/benchmark_common/run_benchmark.sh
${
model_item
}
${
bs_item
}
${
fp_item
}
${
run_process_type
}
${
run_mode
}
${
device_num
}
${
max_epochs
}
${
num_workers
}
2>&1
;
# run profiling
sleep
10
;
export
PROFILING
=
true
bash test_tipc/static/
${
model_item
}
/benchmark_common/run_benchmark.sh
${
model_item
}
${
bs_item
}
${
fp_item
}
${
run_process_type
}
${
run_mode
}
${
device_num
}
${
max_epochs
}
${
num_workers
}
2>&1
;
test_tipc/static/ResNet50/N1C1/ResNet50_bs64_fp16_SingleP_DP.sh
浏览文件 @
1d17c637
...
...
@@ -5,7 +5,7 @@ run_process_type=SingleP
run_mode
=
DP
device_num
=
N1C1
max_epochs
=
1
num_workers
=
4
num_workers
=
8
# get data
bash test_tipc/static/
${
model_item
}
/benchmark_common/prepare.sh
...
...
test_tipc/static/ResNet50/N1C1/ResNet50_bs64_fp32_SingleP_DP.sh
浏览文件 @
1d17c637
...
...
@@ -5,7 +5,7 @@ run_process_type=SingleP
run_mode
=
DP
device_num
=
N1C1
max_epochs
=
1
num_workers
=
4
num_workers
=
8
# get data
bash test_tipc/static/
${
model_item
}
/benchmark_common/prepare.sh
...
...
test_tipc/static/ResNet50/N1C8/ResNet50_bs256_fp16_MultiP_DP.sh
0 → 100644
浏览文件 @
1d17c637
model_item
=
ResNet50
bs_item
=
256
fp_item
=
fp16
run_process_type
=
MultiP
run_mode
=
DP
device_num
=
N1C8
max_epochs
=
1
num_workers
=
8
# get data
bash test_tipc/static/
${
model_item
}
/benchmark_common/prepare.sh
# run
bash test_tipc/static/
${
model_item
}
/benchmark_common/run_benchmark.sh
${
model_item
}
${
bs_item
}
${
fp_item
}
${
run_process_type
}
${
run_mode
}
${
device_num
}
${
max_epochs
}
${
num_workers
}
2>&1
;
test_tipc/static/ResNet50/N1C8/ResNet50_bs256_fp32_MultiP_DP.sh
0 → 100644
浏览文件 @
1d17c637
model_item
=
ResNet50
bs_item
=
256
fp_item
=
fp32
run_process_type
=
MultiP
run_mode
=
DP
device_num
=
N1C8
max_epochs
=
1
num_workers
=
8
# get data
bash test_tipc/static/
${
model_item
}
/benchmark_common/prepare.sh
# run
bash test_tipc/static/
${
model_item
}
/benchmark_common/run_benchmark.sh
${
model_item
}
${
bs_item
}
${
fp_item
}
${
run_process_type
}
${
run_mode
}
${
device_num
}
${
max_epochs
}
${
num_workers
}
2>&1
;
test_tipc/static/ResNet50/N1C8/ResNet50_bs64_fp16_MultiP_DP.sh
浏览文件 @
1d17c637
...
...
@@ -5,7 +5,7 @@ run_process_type=MultiP
run_mode
=
DP
device_num
=
N1C8
max_epochs
=
1
num_workers
=
4
num_workers
=
8
# get data
bash test_tipc/static/
${
model_item
}
/benchmark_common/prepare.sh
...
...
test_tipc/static/ResNet50/N1C8/ResNet50_bs64_fp32_MultiP_DP.sh
浏览文件 @
1d17c637
...
...
@@ -5,7 +5,7 @@ run_process_type=MultiP
run_mode
=
DP
device_num
=
N1C8
max_epochs
=
1
num_workers
=
4
num_workers
=
8
# get data
bash test_tipc/static/
${
model_item
}
/benchmark_common/prepare.sh
...
...
test_tipc/static/ResNet50/benchmark_common/run_benchmark.sh
浏览文件 @
1d17c637
...
...
@@ -46,7 +46,7 @@ function _train(){
log_file
=
${
profiling_log_file
}
fi
train_cmd
=
"
${
config_file
}
-o DataLoader.Train.sampler.batch_size=
${
base_batch_size
}
-o Global.epochs=
${
max_epochs
}
-o DataLoader.Train.loader.num_workers=
${
num_workers
}
${
profiling_config
}
"
train_cmd
=
"
${
config_file
}
-o DataLoader.Train.sampler.batch_size=
${
base_batch_size
}
-o Global.epochs=
${
max_epochs
}
-o DataLoader.Train.loader.num_workers=
${
num_workers
}
${
profiling_config
}
-o Global.eval_during_train=False
"
# 以下为通用执行命令,无特殊可不用修改
case
${
run_process_type
}
in
SingleP
)
...
...
@@ -69,7 +69,19 @@ function _train(){
fi
cd
../
}
function
_set_env
(){
#开启gc
export
FLAGS_eager_delete_tensor_gb
=
0.0
export
FLAGS_fraction_of_gpu_memory_to_use
=
0.98
####
export
FLAGS_cudnn_exhaustive_search
=
1
export
FLAGS_conv_workspace_size_limit
=
4000
#MB
}
source
${
BENCHMARK_ROOT
}
/scripts/run_model.sh
# 在该脚本中会对符合benchmark规范的log使用analysis.py 脚本进行性能数据解析;如果不联调只想要产出训练log可以注掉本行,提交时需打开
_set_params
$@
# _train # 如果只产出训练log,不解析,可取消注释
_set_env
_run
# 该函数在run_model.sh中,执行时会调用_train; 如果不联调只产出训练log可以注掉本行,提交时需打开
编辑
预览
Markdown
is supported
0%
请重试
或
添加新附件
.
添加附件
取消
You are about to add
0
people
to the discussion. Proceed with caution.
先完成此消息的编辑!
取消
想要评论请
注册
或
登录