提交 8aed9831 编写于 作者: D dongshuilong

add pure and amp fp16 for benchmark r50

上级 10fbf55c
# Benchmark case settings. All eight values are forwarded, in this order,
# as positional arguments to run_benchmark.sh below.
model_item=ResNet50
bs_item=128
fp_item=amp_fp16
run_process_type=SingleP
run_mode=DP
device_num=N1C1
max_epochs=1
num_workers=8

# Get data: run this model's benchmark_common/prepare.sh.
bash "test_tipc/static/${model_item}/benchmark_common/prepare.sh"

# Run the benchmark; stderr is merged into stdout. Every expansion is quoted
# so each setting always arrives as exactly one argument.
bash "test_tipc/static/${model_item}/benchmark_common/run_benchmark.sh" \
  "${model_item}" "${bs_item}" "${fp_item}" "${run_process_type}" \
  "${run_mode}" "${device_num}" "${max_epochs}" "${num_workers}" 2>&1
# Benchmark case settings. All eight values are forwarded, in this order,
# as positional arguments to run_benchmark.sh below.
model_item=ResNet50
bs_item=128
fp_item=fp32
run_process_type=SingleP
run_mode=DP
device_num=N1C1
max_epochs=1
num_workers=8

# Get data: run this model's benchmark_common/prepare.sh.
bash "test_tipc/static/${model_item}/benchmark_common/prepare.sh"

# Run the benchmark; stderr is merged into stdout. Every expansion is quoted
# so each setting always arrives as exactly one argument.
bash "test_tipc/static/${model_item}/benchmark_common/run_benchmark.sh" \
  "${model_item}" "${bs_item}" "${fp_item}" "${run_process_type}" \
  "${run_mode}" "${device_num}" "${max_epochs}" "${num_workers}" 2>&1

# Run profiling: wait 10 seconds, export PROFILING=true so the child script
# can see it, then repeat the same invocation.
sleep 10
export PROFILING=true
bash "test_tipc/static/${model_item}/benchmark_common/run_benchmark.sh" \
  "${model_item}" "${bs_item}" "${fp_item}" "${run_process_type}" \
  "${run_mode}" "${device_num}" "${max_epochs}" "${num_workers}" 2>&1
# Benchmark case settings. All eight values are forwarded, in this order,
# as positional arguments to run_benchmark.sh below.
model_item=ResNet50
bs_item=128
fp_item=pure_fp16
run_process_type=SingleP
run_mode=DP
device_num=N1C1
max_epochs=1
num_workers=8

# Get data: run this model's benchmark_common/prepare.sh.
bash "test_tipc/static/${model_item}/benchmark_common/prepare.sh"

# Run the benchmark; stderr is merged into stdout. Every expansion is quoted
# so each setting always arrives as exactly one argument.
bash "test_tipc/static/${model_item}/benchmark_common/run_benchmark.sh" \
  "${model_item}" "${bs_item}" "${fp_item}" "${run_process_type}" \
  "${run_mode}" "${device_num}" "${max_epochs}" "${num_workers}" 2>&1
model_item=ResNet50
bs_item=256
fp_item=fp16
fp_item=amp_fp16
run_process_type=SingleP
run_mode=DP
device_num=N1C1
......
# Benchmark case settings. All eight values are forwarded, in this order,
# as positional arguments to run_benchmark.sh below.
model_item=ResNet50
bs_item=256
fp_item=pure_fp16
run_process_type=SingleP
run_mode=DP
device_num=N1C1
max_epochs=1
num_workers=8

# Get data: run this model's benchmark_common/prepare.sh.
bash "test_tipc/static/${model_item}/benchmark_common/prepare.sh"

# Run the benchmark; stderr is merged into stdout. Every expansion is quoted
# so each setting always arrives as exactly one argument.
bash "test_tipc/static/${model_item}/benchmark_common/run_benchmark.sh" \
  "${model_item}" "${bs_item}" "${fp_item}" "${run_process_type}" \
  "${run_mode}" "${device_num}" "${max_epochs}" "${num_workers}" 2>&1
model_item=ResNet50
bs_item=64
fp_item=fp16
fp_item=amp_fp16
run_process_type=SingleP
run_mode=DP
device_num=N1C1
......
# Benchmark case settings. All eight values are forwarded, in this order,
# as positional arguments to run_benchmark.sh below.
model_item=ResNet50
bs_item=64
fp_item=pure_fp16
run_process_type=SingleP
run_mode=DP
device_num=N1C1
max_epochs=1
num_workers=8

# Get data: run this model's benchmark_common/prepare.sh.
bash "test_tipc/static/${model_item}/benchmark_common/prepare.sh"

# Run the benchmark; stderr is merged into stdout. Every expansion is quoted
# so each setting always arrives as exactly one argument.
bash "test_tipc/static/${model_item}/benchmark_common/run_benchmark.sh" \
  "${model_item}" "${bs_item}" "${fp_item}" "${run_process_type}" \
  "${run_mode}" "${device_num}" "${max_epochs}" "${num_workers}" 2>&1
# Benchmark case settings. All eight values are forwarded, in this order,
# as positional arguments to run_benchmark.sh below.
model_item=ResNet50
bs_item=128
fp_item=amp_fp16
run_process_type=MultiP
run_mode=DP
device_num=N1C8
max_epochs=8
num_workers=8

# Get data: run this model's benchmark_common/prepare.sh.
bash "test_tipc/static/${model_item}/benchmark_common/prepare.sh"

# Run the benchmark; stderr is merged into stdout. Every expansion is quoted
# so each setting always arrives as exactly one argument.
bash "test_tipc/static/${model_item}/benchmark_common/run_benchmark.sh" \
  "${model_item}" "${bs_item}" "${fp_item}" "${run_process_type}" \
  "${run_mode}" "${device_num}" "${max_epochs}" "${num_workers}" 2>&1
# Benchmark case settings. All eight values are forwarded, in this order,
# as positional arguments to run_benchmark.sh below.
model_item=ResNet50
bs_item=128
fp_item=fp32
run_process_type=MultiP
run_mode=DP
device_num=N1C8
max_epochs=8
num_workers=8

# Get data: run this model's benchmark_common/prepare.sh.
bash "test_tipc/static/${model_item}/benchmark_common/prepare.sh"

# Run the benchmark; stderr is merged into stdout. Every expansion is quoted
# so each setting always arrives as exactly one argument.
bash "test_tipc/static/${model_item}/benchmark_common/run_benchmark.sh" \
  "${model_item}" "${bs_item}" "${fp_item}" "${run_process_type}" \
  "${run_mode}" "${device_num}" "${max_epochs}" "${num_workers}" 2>&1
# Benchmark case settings. All eight values are forwarded, in this order,
# as positional arguments to run_benchmark.sh below.
model_item=ResNet50
bs_item=128
fp_item=pure_fp16
run_process_type=MultiP
run_mode=DP
device_num=N1C8
max_epochs=8
num_workers=8

# Get data: run this model's benchmark_common/prepare.sh.
bash "test_tipc/static/${model_item}/benchmark_common/prepare.sh"

# Run the benchmark; stderr is merged into stdout. Every expansion is quoted
# so each setting always arrives as exactly one argument.
bash "test_tipc/static/${model_item}/benchmark_common/run_benchmark.sh" \
  "${model_item}" "${bs_item}" "${fp_item}" "${run_process_type}" \
  "${run_mode}" "${device_num}" "${max_epochs}" "${num_workers}" 2>&1
model_item=ResNet50
bs_item=256
fp_item=fp16
fp_item=amp_fp16
run_process_type=MultiP
run_mode=DP
device_num=N1C8
......
# Benchmark case settings. All eight values are forwarded, in this order,
# as positional arguments to run_benchmark.sh below.
model_item=ResNet50
bs_item=256
fp_item=pure_fp16
run_process_type=MultiP
run_mode=DP
device_num=N1C8
max_epochs=8
num_workers=8

# Get data: run this model's benchmark_common/prepare.sh.
bash "test_tipc/static/${model_item}/benchmark_common/prepare.sh"

# Run the benchmark; stderr is merged into stdout. Every expansion is quoted
# so each setting always arrives as exactly one argument.
bash "test_tipc/static/${model_item}/benchmark_common/run_benchmark.sh" \
  "${model_item}" "${bs_item}" "${fp_item}" "${run_process_type}" \
  "${run_mode}" "${device_num}" "${max_epochs}" "${num_workers}" 2>&1
model_item=ResNet50
bs_item=64
fp_item=fp16
fp_item=amp_fp16
run_process_type=MultiP
run_mode=DP
device_num=N1C8
......
# Benchmark case settings. All eight values are forwarded, in this order,
# as positional arguments to run_benchmark.sh below.
model_item=ResNet50
bs_item=64
fp_item=pure_fp16
run_process_type=MultiP
run_mode=DP
device_num=N1C8
max_epochs=8
num_workers=8

# Get data: run this model's benchmark_common/prepare.sh.
bash "test_tipc/static/${model_item}/benchmark_common/prepare.sh"

# Run the benchmark; stderr is merged into stdout. Every expansion is quoted
# so each setting always arrives as exactly one argument.
bash "test_tipc/static/${model_item}/benchmark_common/run_benchmark.sh" \
  "${model_item}" "${bs_item}" "${fp_item}" "${run_process_type}" \
  "${run_mode}" "${device_num}" "${max_epochs}" "${num_workers}" 2>&1
# Benchmark case settings. All eight values are forwarded, in this order,
# as positional arguments to run_benchmark.sh below.
model_item=ResNet50
bs_item=128
fp_item=amp_fp16
run_process_type=MultiP
run_mode=DP
device_num=N4C32
max_epochs=32
num_workers=8

# Get data: run this model's benchmark_common/prepare.sh.
bash "test_tipc/static/${model_item}/benchmark_common/prepare.sh"

# Run the benchmark; stderr is merged into stdout. Every expansion is quoted
# so each setting always arrives as exactly one argument.
bash "test_tipc/static/${model_item}/benchmark_common/run_benchmark.sh" \
  "${model_item}" "${bs_item}" "${fp_item}" "${run_process_type}" \
  "${run_mode}" "${device_num}" "${max_epochs}" "${num_workers}" 2>&1
# Benchmark case settings. All eight values are forwarded, in this order,
# as positional arguments to run_benchmark.sh below.
model_item=ResNet50
bs_item=128
fp_item=fp32
run_process_type=MultiP
run_mode=DP
device_num=N4C32
max_epochs=32
num_workers=8

# Get data: run this model's benchmark_common/prepare.sh.
bash "test_tipc/static/${model_item}/benchmark_common/prepare.sh"

# Run the benchmark; stderr is merged into stdout. Every expansion is quoted
# so each setting always arrives as exactly one argument.
bash "test_tipc/static/${model_item}/benchmark_common/run_benchmark.sh" \
  "${model_item}" "${bs_item}" "${fp_item}" "${run_process_type}" \
  "${run_mode}" "${device_num}" "${max_epochs}" "${num_workers}" 2>&1
# Benchmark case settings. All eight values are forwarded, in this order,
# as positional arguments to run_benchmark.sh below.
model_item=ResNet50
bs_item=128
fp_item=pure_fp16
run_process_type=MultiP
run_mode=DP
device_num=N4C32
max_epochs=32
num_workers=8

# Get data: run this model's benchmark_common/prepare.sh.
bash "test_tipc/static/${model_item}/benchmark_common/prepare.sh"

# Run the benchmark; stderr is merged into stdout. Every expansion is quoted
# so each setting always arrives as exactly one argument.
bash "test_tipc/static/${model_item}/benchmark_common/run_benchmark.sh" \
  "${model_item}" "${bs_item}" "${fp_item}" "${run_process_type}" \
  "${run_mode}" "${device_num}" "${max_epochs}" "${num_workers}" 2>&1
# Benchmark case settings. All eight values are forwarded, in this order,
# as positional arguments to run_benchmark.sh below.
model_item=ResNet50
bs_item=256
fp_item=amp_fp16
run_process_type=MultiP
run_mode=DP
device_num=N4C32
max_epochs=32
num_workers=8

# Get data: run this model's benchmark_common/prepare.sh.
bash "test_tipc/static/${model_item}/benchmark_common/prepare.sh"

# Run the benchmark; stderr is merged into stdout. Every expansion is quoted
# so each setting always arrives as exactly one argument.
bash "test_tipc/static/${model_item}/benchmark_common/run_benchmark.sh" \
  "${model_item}" "${bs_item}" "${fp_item}" "${run_process_type}" \
  "${run_mode}" "${device_num}" "${max_epochs}" "${num_workers}" 2>&1
# Benchmark case settings. All eight values are forwarded, in this order,
# as positional arguments to run_benchmark.sh below.
model_item=ResNet50
bs_item=256
fp_item=fp32
run_process_type=MultiP
run_mode=DP
device_num=N4C32
max_epochs=32
num_workers=8

# Get data: run this model's benchmark_common/prepare.sh.
bash "test_tipc/static/${model_item}/benchmark_common/prepare.sh"

# Run the benchmark; stderr is merged into stdout. Every expansion is quoted
# so each setting always arrives as exactly one argument.
bash "test_tipc/static/${model_item}/benchmark_common/run_benchmark.sh" \
  "${model_item}" "${bs_item}" "${fp_item}" "${run_process_type}" \
  "${run_mode}" "${device_num}" "${max_epochs}" "${num_workers}" 2>&1
# Benchmark case settings. All eight values are forwarded, in this order,
# as positional arguments to run_benchmark.sh below.
model_item=ResNet50
bs_item=256
fp_item=pure_fp16
run_process_type=MultiP
run_mode=DP
device_num=N4C32
max_epochs=32
num_workers=8

# Get data: run this model's benchmark_common/prepare.sh.
bash "test_tipc/static/${model_item}/benchmark_common/prepare.sh"

# Run the benchmark; stderr is merged into stdout. Every expansion is quoted
# so each setting always arrives as exactly one argument.
bash "test_tipc/static/${model_item}/benchmark_common/run_benchmark.sh" \
  "${model_item}" "${bs_item}" "${fp_item}" "${run_process_type}" \
  "${run_mode}" "${device_num}" "${max_epochs}" "${num_workers}" 2>&1
# Benchmark case settings. All eight values are forwarded, in this order,
# as positional arguments to run_benchmark.sh below.
model_item=ResNet50
bs_item=64
fp_item=amp_fp16
run_process_type=MultiP
run_mode=DP
device_num=N4C32
max_epochs=32
num_workers=8

# Get data: run this model's benchmark_common/prepare.sh.
bash "test_tipc/static/${model_item}/benchmark_common/prepare.sh"

# Run the benchmark; stderr is merged into stdout. Every expansion is quoted
# so each setting always arrives as exactly one argument.
bash "test_tipc/static/${model_item}/benchmark_common/run_benchmark.sh" \
  "${model_item}" "${bs_item}" "${fp_item}" "${run_process_type}" \
  "${run_mode}" "${device_num}" "${max_epochs}" "${num_workers}" 2>&1
# Benchmark case settings. All eight values are forwarded, in this order,
# as positional arguments to run_benchmark.sh below.
model_item=ResNet50
bs_item=64
fp_item=fp32
run_process_type=MultiP
run_mode=DP
device_num=N4C32
max_epochs=32
num_workers=8

# Get data: run this model's benchmark_common/prepare.sh.
bash "test_tipc/static/${model_item}/benchmark_common/prepare.sh"

# Run the benchmark; stderr is merged into stdout. Every expansion is quoted
# so each setting always arrives as exactly one argument.
bash "test_tipc/static/${model_item}/benchmark_common/run_benchmark.sh" \
  "${model_item}" "${bs_item}" "${fp_item}" "${run_process_type}" \
  "${run_mode}" "${device_num}" "${max_epochs}" "${num_workers}" 2>&1
# Benchmark case settings. All eight values are forwarded, in this order,
# as positional arguments to run_benchmark.sh below.
model_item=ResNet50
bs_item=64
fp_item=pure_fp16
run_process_type=MultiP
run_mode=DP
device_num=N4C32
max_epochs=32
num_workers=8

# Get data: run this model's benchmark_common/prepare.sh.
bash "test_tipc/static/${model_item}/benchmark_common/prepare.sh"

# Run the benchmark; stderr is merged into stdout. Every expansion is quoted
# so each setting always arrives as exactly one argument.
bash "test_tipc/static/${model_item}/benchmark_common/run_benchmark.sh" \
  "${model_item}" "${bs_item}" "${fp_item}" "${run_process_type}" \
  "${run_mode}" "${device_num}" "${max_epochs}" "${num_workers}" 2>&1
......@@ -35,8 +35,10 @@ function _train(){
if [ ${fp_item} = "fp32" ]; then
config_file="-c ppcls/configs/ImageNet/ResNet/ResNet50.yaml"
else
elif [ ${fp_item} = "amp_fp16" ]; then
config_file="-c ppcls/configs/ImageNet/ResNet/ResNet50_amp_O1.yaml"
elif [ ${fp_item} = "pure_fp16" ]; then
config_file="-c ppcls/configs/ImageNet/ResNet/ResNet50_amp_O2.yaml"
fi
if [ ${profiling} = "false" ]; then
profiling_config=""
......
Markdown is supported
0% .
You are about to add 0 people to the discussion. Proceed with caution.
先完成此消息的编辑!
想要评论请 注册