未验证 提交 e01c7e87 编写于 作者: W Walter 提交者: GitHub

Merge pull request #1757 from RainFrost1/benchmark_bug

fix static r50 N1C8 benchmark
# Static ResNet50 benchmark case: bs_item=128, fp_item=amp_fp16,
# run_mode=DP, device_num=N1C1.
model_item="ResNet50"
bs_item="128"
fp_item="amp_fp16"
run_mode="DP"
device_num="N1C1"
max_epochs="1"
num_workers="8"

# Fetch the data through the model's shared prepare script.
bash "test_tipc/static/${model_item}/benchmark_common/prepare.sh"

# Launch the benchmark; stderr is merged into stdout.
bash "test_tipc/static/${model_item}/benchmark_common/run_benchmark.sh" \
  "${model_item}" "${bs_item}" "${fp_item}" "${run_mode}" \
  "${device_num}" "${max_epochs}" "${num_workers}" 2>&1
# Static ResNet50 benchmark case: bs_item=128, fp_item=fp32,
# run_mode=DP, device_num=N1C1. The benchmark is launched twice:
# once as-is, then again with PROFILING=true exported.
model_item="ResNet50"
bs_item="128"
fp_item="fp32"
run_mode="DP"
device_num="N1C1"
max_epochs="1"
num_workers="8"

# Fetch the data through the model's shared prepare script.
bash "test_tipc/static/${model_item}/benchmark_common/prepare.sh"

# First pass: regular benchmark run; stderr is merged into stdout.
bash "test_tipc/static/${model_item}/benchmark_common/run_benchmark.sh" \
  "${model_item}" "${bs_item}" "${fp_item}" "${run_mode}" \
  "${device_num}" "${max_epochs}" "${num_workers}" 2>&1

# Second pass: wait 10 seconds, then repeat the same invocation with
# PROFILING exported to the child process.
sleep 10
export PROFILING="true"
bash "test_tipc/static/${model_item}/benchmark_common/run_benchmark.sh" \
  "${model_item}" "${bs_item}" "${fp_item}" "${run_mode}" \
  "${device_num}" "${max_epochs}" "${num_workers}" 2>&1
# Static ResNet50 benchmark case: bs_item=128, fp_item=pure_fp16,
# run_mode=DP, device_num=N1C1.
model_item="ResNet50"
bs_item="128"
fp_item="pure_fp16"
run_mode="DP"
device_num="N1C1"
max_epochs="1"
num_workers="8"

# Fetch the data through the model's shared prepare script.
bash "test_tipc/static/${model_item}/benchmark_common/prepare.sh"

# Launch the benchmark; stderr is merged into stdout.
bash "test_tipc/static/${model_item}/benchmark_common/run_benchmark.sh" \
  "${model_item}" "${bs_item}" "${fp_item}" "${run_mode}" \
  "${device_num}" "${max_epochs}" "${num_workers}" 2>&1
model_item=ResNet50 model_item=ResNet50
bs_item=256 bs_item=256
fp_item=fp16 fp_item=amp_fp16
run_mode=DP run_mode=DP
device_num=N1C1 device_num=N1C1
max_epochs=1 max_epochs=1
......
# Static ResNet50 benchmark case: bs_item=256, fp_item=pure_fp16,
# run_mode=DP, device_num=N1C1.
model_item="ResNet50"
bs_item="256"
fp_item="pure_fp16"
run_mode="DP"
device_num="N1C1"
max_epochs="1"
num_workers="8"

# Fetch the data through the model's shared prepare script.
bash "test_tipc/static/${model_item}/benchmark_common/prepare.sh"

# Launch the benchmark; stderr is merged into stdout.
bash "test_tipc/static/${model_item}/benchmark_common/run_benchmark.sh" \
  "${model_item}" "${bs_item}" "${fp_item}" "${run_mode}" \
  "${device_num}" "${max_epochs}" "${num_workers}" 2>&1
model_item=ResNet50 model_item=ResNet50
bs_item=64 bs_item=64
fp_item=fp16 fp_item=amp_fp16
run_mode=DP run_mode=DP
device_num=N1C1 device_num=N1C1
max_epochs=1 max_epochs=1
......
# Static ResNet50 benchmark case: bs_item=64, fp_item=pure_fp16,
# run_mode=DP, device_num=N1C1.
model_item="ResNet50"
bs_item="64"
fp_item="pure_fp16"
run_mode="DP"
device_num="N1C1"
max_epochs="1"
num_workers="8"

# Fetch the data through the model's shared prepare script.
bash "test_tipc/static/${model_item}/benchmark_common/prepare.sh"

# Launch the benchmark; stderr is merged into stdout.
bash "test_tipc/static/${model_item}/benchmark_common/run_benchmark.sh" \
  "${model_item}" "${bs_item}" "${fp_item}" "${run_mode}" \
  "${device_num}" "${max_epochs}" "${num_workers}" 2>&1
# Static ResNet50 benchmark case: bs_item=128, fp_item=amp_fp16,
# run_mode=DP, device_num=N1C8, max_epochs=8.
model_item="ResNet50"
bs_item="128"
fp_item="amp_fp16"
run_mode="DP"
device_num="N1C8"
max_epochs="8"
num_workers="8"

# Fetch the data through the model's shared prepare script.
bash "test_tipc/static/${model_item}/benchmark_common/prepare.sh"

# Launch the benchmark; stderr is merged into stdout.
bash "test_tipc/static/${model_item}/benchmark_common/run_benchmark.sh" \
  "${model_item}" "${bs_item}" "${fp_item}" "${run_mode}" \
  "${device_num}" "${max_epochs}" "${num_workers}" 2>&1
# Static ResNet50 benchmark case: bs_item=128, fp_item=fp32,
# run_mode=DP, device_num=N1C8, max_epochs=8.
model_item="ResNet50"
bs_item="128"
fp_item="fp32"
run_mode="DP"
device_num="N1C8"
max_epochs="8"
num_workers="8"

# Fetch the data through the model's shared prepare script.
bash "test_tipc/static/${model_item}/benchmark_common/prepare.sh"

# Launch the benchmark; stderr is merged into stdout.
bash "test_tipc/static/${model_item}/benchmark_common/run_benchmark.sh" \
  "${model_item}" "${bs_item}" "${fp_item}" "${run_mode}" \
  "${device_num}" "${max_epochs}" "${num_workers}" 2>&1
# Static ResNet50 benchmark case: bs_item=128, fp_item=pure_fp16,
# run_mode=DP, device_num=N1C8, max_epochs=8.
model_item="ResNet50"
bs_item="128"
fp_item="pure_fp16"
run_mode="DP"
device_num="N1C8"
max_epochs="8"
num_workers="8"

# Fetch the data through the model's shared prepare script.
bash "test_tipc/static/${model_item}/benchmark_common/prepare.sh"

# Launch the benchmark; stderr is merged into stdout.
bash "test_tipc/static/${model_item}/benchmark_common/run_benchmark.sh" \
  "${model_item}" "${bs_item}" "${fp_item}" "${run_mode}" \
  "${device_num}" "${max_epochs}" "${num_workers}" 2>&1
model_item=ResNet50 model_item=ResNet50
bs_item=256 bs_item=256
fp_item=fp16 fp_item=amp_fp16
run_mode=DP run_mode=DP
device_num=N1C8 device_num=N1C8
max_epochs=1 max_epochs=8
num_workers=8 num_workers=8
# get data # get data
......
...@@ -3,7 +3,7 @@ bs_item=256 ...@@ -3,7 +3,7 @@ bs_item=256
fp_item=fp32 fp_item=fp32
run_mode=DP run_mode=DP
device_num=N1C8 device_num=N1C8
max_epochs=1 max_epochs=8
num_workers=8 num_workers=8
# get data # get data
......
# Static ResNet50 benchmark case: bs_item=256, fp_item=pure_fp16,
# run_mode=DP, device_num=N1C8, max_epochs=8.
model_item="ResNet50"
bs_item="256"
fp_item="pure_fp16"
run_mode="DP"
device_num="N1C8"
max_epochs="8"
num_workers="8"

# Fetch the data through the model's shared prepare script.
bash "test_tipc/static/${model_item}/benchmark_common/prepare.sh"

# Launch the benchmark; stderr is merged into stdout.
bash "test_tipc/static/${model_item}/benchmark_common/run_benchmark.sh" \
  "${model_item}" "${bs_item}" "${fp_item}" "${run_mode}" \
  "${device_num}" "${max_epochs}" "${num_workers}" 2>&1
model_item=ResNet50 model_item=ResNet50
bs_item=64 bs_item=64
fp_item=fp16 fp_item=amp_fp16
run_mode=DP run_mode=DP
device_num=N1C8 device_num=N1C8
max_epochs=1 max_epochs=8
num_workers=8 num_workers=8
# get data # get data
......
...@@ -3,7 +3,7 @@ bs_item=64 ...@@ -3,7 +3,7 @@ bs_item=64
fp_item=fp32 fp_item=fp32
run_mode=DP run_mode=DP
device_num=N1C8 device_num=N1C8
max_epochs=1 max_epochs=8
num_workers=8 num_workers=8
# get data # get data
......
# Static ResNet50 benchmark case: bs_item=64, fp_item=pure_fp16,
# run_mode=DP, device_num=N1C8, max_epochs=8.
model_item="ResNet50"
bs_item="64"
fp_item="pure_fp16"
run_mode="DP"
device_num="N1C8"
max_epochs="8"
num_workers="8"

# Fetch the data through the model's shared prepare script.
bash "test_tipc/static/${model_item}/benchmark_common/prepare.sh"

# Launch the benchmark; stderr is merged into stdout.
bash "test_tipc/static/${model_item}/benchmark_common/run_benchmark.sh" \
  "${model_item}" "${bs_item}" "${fp_item}" "${run_mode}" \
  "${device_num}" "${max_epochs}" "${num_workers}" 2>&1
# Static ResNet50 benchmark case: bs_item=128, fp_item=amp_fp16,
# run_mode=DP, device_num=N4C32, max_epochs=32.
model_item="ResNet50"
bs_item="128"
fp_item="amp_fp16"
run_mode="DP"
device_num="N4C32"
max_epochs="32"
num_workers="8"

# Fetch the data through the model's shared prepare script.
bash "test_tipc/static/${model_item}/benchmark_common/prepare.sh"

# Launch the benchmark; stderr is merged into stdout.
bash "test_tipc/static/${model_item}/benchmark_common/run_benchmark.sh" \
  "${model_item}" "${bs_item}" "${fp_item}" "${run_mode}" \
  "${device_num}" "${max_epochs}" "${num_workers}" 2>&1
# Static ResNet50 benchmark case: bs_item=128, fp_item=fp32,
# run_mode=DP, device_num=N4C32, max_epochs=32.
model_item="ResNet50"
bs_item="128"
fp_item="fp32"
run_mode="DP"
device_num="N4C32"
max_epochs="32"
num_workers="8"

# Fetch the data through the model's shared prepare script.
bash "test_tipc/static/${model_item}/benchmark_common/prepare.sh"

# Launch the benchmark; stderr is merged into stdout.
bash "test_tipc/static/${model_item}/benchmark_common/run_benchmark.sh" \
  "${model_item}" "${bs_item}" "${fp_item}" "${run_mode}" \
  "${device_num}" "${max_epochs}" "${num_workers}" 2>&1
# Static ResNet50 benchmark case: bs_item=128, fp_item=pure_fp16,
# run_mode=DP, device_num=N4C32, max_epochs=32.
model_item="ResNet50"
bs_item="128"
fp_item="pure_fp16"
run_mode="DP"
device_num="N4C32"
max_epochs="32"
num_workers="8"

# Fetch the data through the model's shared prepare script.
bash "test_tipc/static/${model_item}/benchmark_common/prepare.sh"

# Launch the benchmark; stderr is merged into stdout.
bash "test_tipc/static/${model_item}/benchmark_common/run_benchmark.sh" \
  "${model_item}" "${bs_item}" "${fp_item}" "${run_mode}" \
  "${device_num}" "${max_epochs}" "${num_workers}" 2>&1
# Static ResNet50 benchmark case: bs_item=256, fp_item=amp_fp16,
# run_mode=DP, device_num=N4C32, max_epochs=32.
model_item="ResNet50"
bs_item="256"
fp_item="amp_fp16"
run_mode="DP"
device_num="N4C32"
max_epochs="32"
num_workers="8"

# Fetch the data through the model's shared prepare script.
bash "test_tipc/static/${model_item}/benchmark_common/prepare.sh"

# Launch the benchmark; stderr is merged into stdout.
bash "test_tipc/static/${model_item}/benchmark_common/run_benchmark.sh" \
  "${model_item}" "${bs_item}" "${fp_item}" "${run_mode}" \
  "${device_num}" "${max_epochs}" "${num_workers}" 2>&1
# Static ResNet50 benchmark case: bs_item=256, fp_item=fp32,
# run_mode=DP, device_num=N4C32, max_epochs=32.
model_item="ResNet50"
bs_item="256"
fp_item="fp32"
run_mode="DP"
device_num="N4C32"
max_epochs="32"
num_workers="8"

# Fetch the data through the model's shared prepare script.
bash "test_tipc/static/${model_item}/benchmark_common/prepare.sh"

# Launch the benchmark; stderr is merged into stdout.
bash "test_tipc/static/${model_item}/benchmark_common/run_benchmark.sh" \
  "${model_item}" "${bs_item}" "${fp_item}" "${run_mode}" \
  "${device_num}" "${max_epochs}" "${num_workers}" 2>&1
# Static ResNet50 benchmark case: bs_item=256, fp_item=pure_fp16,
# run_mode=DP, device_num=N4C32, max_epochs=32.
model_item="ResNet50"
bs_item="256"
fp_item="pure_fp16"
run_mode="DP"
device_num="N4C32"
max_epochs="32"
num_workers="8"

# Fetch the data through the model's shared prepare script.
bash "test_tipc/static/${model_item}/benchmark_common/prepare.sh"

# Launch the benchmark; stderr is merged into stdout.
bash "test_tipc/static/${model_item}/benchmark_common/run_benchmark.sh" \
  "${model_item}" "${bs_item}" "${fp_item}" "${run_mode}" \
  "${device_num}" "${max_epochs}" "${num_workers}" 2>&1
# Static ResNet50 benchmark case: bs_item=64, fp_item=amp_fp16,
# run_mode=DP, device_num=N4C32, max_epochs=32.
model_item="ResNet50"
bs_item="64"
fp_item="amp_fp16"
run_mode="DP"
device_num="N4C32"
max_epochs="32"
num_workers="8"

# Fetch the data through the model's shared prepare script.
bash "test_tipc/static/${model_item}/benchmark_common/prepare.sh"

# Launch the benchmark; stderr is merged into stdout.
bash "test_tipc/static/${model_item}/benchmark_common/run_benchmark.sh" \
  "${model_item}" "${bs_item}" "${fp_item}" "${run_mode}" \
  "${device_num}" "${max_epochs}" "${num_workers}" 2>&1
# Static ResNet50 benchmark case: bs_item=64, fp_item=fp32,
# run_mode=DP, device_num=N4C32, max_epochs=32.
model_item="ResNet50"
bs_item="64"
fp_item="fp32"
run_mode="DP"
device_num="N4C32"
max_epochs="32"
num_workers="8"

# Fetch the data through the model's shared prepare script.
bash "test_tipc/static/${model_item}/benchmark_common/prepare.sh"

# Launch the benchmark; stderr is merged into stdout.
bash "test_tipc/static/${model_item}/benchmark_common/run_benchmark.sh" \
  "${model_item}" "${bs_item}" "${fp_item}" "${run_mode}" \
  "${device_num}" "${max_epochs}" "${num_workers}" 2>&1
# Static ResNet50 benchmark case: bs_item=64, fp_item=pure_fp16,
# run_mode=DP, device_num=N4C32, max_epochs=32.
model_item="ResNet50"
bs_item="64"
fp_item="pure_fp16"
run_mode="DP"
device_num="N4C32"
max_epochs="32"
num_workers="8"

# Fetch the data through the model's shared prepare script.
bash "test_tipc/static/${model_item}/benchmark_common/prepare.sh"

# Launch the benchmark; stderr is merged into stdout.
bash "test_tipc/static/${model_item}/benchmark_common/run_benchmark.sh" \
  "${model_item}" "${bs_item}" "${fp_item}" "${run_mode}" \
  "${device_num}" "${max_epochs}" "${num_workers}" 2>&1
...@@ -34,8 +34,10 @@ function _train(){ ...@@ -34,8 +34,10 @@ function _train(){
if [ ${fp_item} = "fp32" ]; then if [ ${fp_item} = "fp32" ]; then
config_file="-c ppcls/configs/ImageNet/ResNet/ResNet50.yaml" config_file="-c ppcls/configs/ImageNet/ResNet/ResNet50.yaml"
else elif [ ${fp_item} = "amp_fp16" ]; then
config_file="-c ppcls/configs/ImageNet/ResNet/ResNet50_amp_O1.yaml" config_file="-c ppcls/configs/ImageNet/ResNet/ResNet50_amp_O1.yaml"
elif [ ${fp_item} = "pure_fp16" ]; then
config_file="-c ppcls/configs/ImageNet/ResNet/ResNet50_amp_O2.yaml"
fi fi
if [ ${profiling} = "false" ]; then if [ ${profiling} = "false" ]; then
profiling_config="" profiling_config=""
......
Markdown is supported
0% .
You are about to add 0 people to the discussion. Proceed with caution.
先完成此消息的编辑!
想要评论请 注册