diff --git a/test_tipc/static/mask_rcnn_r50_1x_coco/N1C1/mask_rcnn_r50_1x_coco_bs2_fp32_DP.sh b/test_tipc/static/mask_rcnn_r50_1x_coco/N1C1/mask_rcnn_r50_1x_coco_bs2_fp32_DP.sh index 65878fd7010418c4f9ff5c3b60d83f60d6c10184..626555aca6b08e79a053fe99048c92a743af32f2 100644 --- a/test_tipc/static/mask_rcnn_r50_1x_coco/N1C1/mask_rcnn_r50_1x_coco_bs2_fp32_DP.sh +++ b/test_tipc/static/mask_rcnn_r50_1x_coco/N1C1/mask_rcnn_r50_1x_coco_bs2_fp32_DP.sh @@ -4,7 +4,7 @@ fp_item=fp32 run_mode=DP device_num=N1C1 max_iter=100 -num_workers=2 +num_workers=8 # get data bash test_tipc/static/${model_item}/benchmark_common/prepare.sh diff --git a/test_tipc/static/mask_rcnn_r50_1x_coco/N1C8/mask_rcnn_r50_1x_coco_bs2_fp32_DP.sh b/test_tipc/static/mask_rcnn_r50_1x_coco/N1C8/mask_rcnn_r50_1x_coco_bs2_fp32_DP.sh index 4109e021e991e6bc14f866b5d7ba104775ff8c54..54f8c485ad621917b16475502a29d2343f539ff2 100644 --- a/test_tipc/static/mask_rcnn_r50_1x_coco/N1C8/mask_rcnn_r50_1x_coco_bs2_fp32_DP.sh +++ b/test_tipc/static/mask_rcnn_r50_1x_coco/N1C8/mask_rcnn_r50_1x_coco_bs2_fp32_DP.sh @@ -4,7 +4,7 @@ fp_item=fp32 run_mode=DP device_num=N1C8 max_iter=100 -num_workers=2 +num_workers=8 # get data bash test_tipc/static/${model_item}/benchmark_common/prepare.sh diff --git a/test_tipc/static/mask_rcnn_r50_1x_coco/benchmark_common/run_benchmark.sh b/test_tipc/static/mask_rcnn_r50_1x_coco/benchmark_common/run_benchmark.sh index 2bfed8bcefbc374c3e11cf1f874816ca31d800fe..355fd4734e422790523b3454a258b69370af7f21 100644 --- a/test_tipc/static/mask_rcnn_r50_1x_coco/benchmark_common/run_benchmark.sh +++ b/test_tipc/static/mask_rcnn_r50_1x_coco/benchmark_common/run_benchmark.sh @@ -32,6 +32,7 @@ function _train(){ export FLAGS_eager_delete_tensor_gb=0.0 export FLAGS_fraction_of_gpu_memory_to_use=0.98 export FLAGS_memory_fraction_of_eager_deletion=1.0 + export FLAGS_conv_workspace_size_limit=500 cd ./static batch_size=${base_batch_size} # 如果模型跑多卡单进程时,请在_train函数中计算出多卡需要的bs echo "current CUDA_VISIBLE_DEVICES=${CUDA_VISIBLE_DEVICES}, model_name=${model_name}, device_num=${device_num}, is profiling=${profiling}" @@ -49,8 +50,8 @@ function _train(){ use_fp16_cmd="" fi - train_cmd="-c configs/mask_rcnn_r50_1x.yml -o LearningRate.base_lr=0.001 snapshot_iter=100000 \ - TrainReader.batch_size=${batch_size} \ + train_cmd="-c configs/mask_rcnn_r50_1x.yml \ + -o TrainReader.batch_size=${batch_size} \ max_iters=${max_iter} log_iter=1 \ TrainReader.worker_num=${num_workers} ${use_fp16_cmd} \ --is_profiler=${is_profiler} "