Merge pull request #16687 from luotao1/reduce_inference_ci_time

reduce all analyzer_test ci elapsed time

Merge pull request #16687 from luotao1/reduce_inference_ci_time
reduce all analyzer_test ci elapsed time
4048a268 · Tao Luo · GitHub · c6720990 · d5c8d4ac · 4048a268
显示空白变更内容
内联并排

Showing 1 changed file with 10 additions and 2 deletions

paddle/fluid/inference/tests/api/tester_helper.h +10 -2

未找到文件。
--- a/paddle/fluid/inference/tests/api/tester_helper.h
+++ b/paddle/fluid/inference/tests/api/tester_helper.h
@@ -55,6 +55,9 @@ DEFINE_bool(record_benchmark, false,
 DEFINE_double(accuracy, 1e-3, "Result Accuracy.");
 DEFINE_double(quantized_accuracy, 1e-2, "Result Quantized Accuracy.");
 DEFINE_bool(zero_copy, false, "Use ZeroCopy to speedup Feed/Fetch.");
+DEFINE_bool(warmup, false,
+            "Use warmup to calculate elapsed_time more accurately. "
+            "To reduce CI time, it sets false in default.");

 DECLARE_bool(profile);
 DECLARE_int32(paddle_num_threads);
@@ -367,7 +370,9 @@ void TestOneThreadPrediction(
    const std::vector<std::vector<PaddleTensor>> &inputs,
    std::vector<std::vector<PaddleTensor>> *outputs, bool use_analysis = true) {
  auto predictor = CreateTestPredictor(config, use_analysis);
+  if (FLAGS_warmup) {
    PredictionWarmUp(predictor.get(), inputs, outputs, 1, 0);
+  }
  PredictionRun(predictor.get(), inputs, outputs, 1, 0);
 }

@@ -395,7 +400,10 @@ void TestMultiThreadPrediction(
            ->SetMkldnnThreadID(static_cast<int>(tid) + 1);
      }
 #endif
-      PredictionWarmUp(predictor.get(), inputs, &outputs_tid, num_threads, tid);
+      if (FLAGS_warmup) {
+        PredictionWarmUp(predictor.get(), inputs, &outputs_tid, num_threads,
+                         tid);
+      }
      PredictionRun(predictor.get(), inputs, &outputs_tid, num_threads, tid);
    });
  }