diff --git a/deploy/pdserving/README.md b/deploy/pdserving/README.md index 55e03c4c2654f336ed942ae03e61e88b61940006..6989502c820e0941a777704e99701359bb74c988 100644 --- a/deploy/pdserving/README.md +++ b/deploy/pdserving/README.md @@ -163,43 +163,41 @@ The recognition model is the same. The predicted performance data will be automatically written into the `PipelineServingLogs/pipeline.tracer` file. - Tested on 200 real pictures, and limited the detection long side to 960. The average QPS on T4 GPU can reach around 23: + Tested on 200 real pictures, and limited the detection long side to 960. The average QPS on T4 GPU can reach around 62.0: ``` - - 2021-05-13 03:42:36,895 ==================== TRACER ====================== - 2021-05-13 03:42:36,975 Op(rec): - 2021-05-13 03:42:36,976 in[14.472382882882883 ms] - 2021-05-13 03:42:36,976 prep[9.556855855855856 ms] - 2021-05-13 03:42:36,976 midp[59.921905405405404 ms] - 2021-05-13 03:42:36,976 postp[15.345945945945946 ms] - 2021-05-13 03:42:36,976 out[1.9921216216216215 ms] - 2021-05-13 03:42:36,976 idle[0.16254943864471572] - 2021-05-13 03:42:36,976 Op(det): - 2021-05-13 03:42:36,976 in[315.4468035714286 ms] - 2021-05-13 03:42:36,976 prep[69.5980625 ms] - 2021-05-13 03:42:36,976 midp[18.989535714285715 ms] - 2021-05-13 03:42:36,976 postp[18.857803571428573 ms] - 2021-05-13 03:42:36,977 out[3.1337544642857145 ms] - 2021-05-13 03:42:36,977 idle[0.7477961159203756] - 2021-05-13 03:42:36,977 DAGExecutor: - 2021-05-13 03:42:36,977 Query count[224] - 2021-05-13 03:42:36,977 QPS[22.4 q/s] - 2021-05-13 03:42:36,977 Succ[0.9910714285714286] - 2021-05-13 03:42:36,977 Error req[169, 170] - 2021-05-13 03:42:36,977 Latency: - 2021-05-13 03:42:36,977 ave[535.1678348214285 ms] - 2021-05-13 03:42:36,977 .50[172.651 ms] - 2021-05-13 03:42:36,977 .60[187.904 ms] - 2021-05-13 03:42:36,977 .70[245.675 ms] - 2021-05-13 03:42:36,977 .80[526.684 ms] - 2021-05-13 03:42:36,977 .90[854.596 ms] - 2021-05-13 03:42:36,977 .95[1722.728 ms] - 2021-05-13 03:42:36,977 .99[3990.292 ms] - 2021-05-13 03:42:36,978 Channel (server worker num[10]): - 2021-05-13 03:42:36,978 chl0(In: ['@DAGExecutor'], Out: ['det']) size[0/0] - 2021-05-13 03:42:36,979 chl1(In: ['det'], Out: ['rec']) size[6/0] - 2021-05-13 03:42:36,979 chl2(In: ['rec'], Out: ['@DAGExecutor']) size[0/0] + 2022-05-12 03:56:46,461 ==================== TRACER ====================== + 2022-05-12 03:56:46,860 Op(det): + 2022-05-12 03:56:46,860 in[80.32286641221374 ms] + 2022-05-12 03:56:46,860 prep[74.27364885496183 ms] + 2022-05-12 03:56:46,860 midp[33.41587786259542 ms] + 2022-05-12 03:56:46,860 postp[20.935980916030534 ms] + 2022-05-12 03:56:46,860 out[1.551145038167939 ms] + 2022-05-12 03:56:46,860 idle[0.3889510617728378] + 2022-05-12 03:56:46,860 Op(rec): + 2022-05-12 03:56:46,860 in[15.46498846153846 ms] + 2022-05-12 03:56:46,861 prep[22.565715384615384 ms] + 2022-05-12 03:56:46,861 midp[91.42518076923076 ms] + 2022-05-12 03:56:46,861 postp[11.678453846153847 ms] + 2022-05-12 03:56:46,861 out[1.1200576923076924 ms] + 2022-05-12 03:56:46,861 idle[0.11658723106110291] + 2022-05-12 03:56:46,862 DAGExecutor: + 2022-05-12 03:56:46,862 Query count[620] + 2022-05-12 03:56:46,862 QPS[62.0 q/s] + 2022-05-12 03:56:46,862 Succ[0.4193548387096774] + 2022-05-12 03:56:46,862 Latency: + 2022-05-12 03:56:46,863 ave[165.54603709677417 ms] + 2022-05-12 03:56:46,863 .50[77.863 ms] + 2022-05-12 03:56:46,863 .60[158.414 ms] + 2022-05-12 03:56:46,863 .70[237.28 ms] + 2022-05-12 03:56:46,863 .80[316.022 ms] + 2022-05-12 03:56:46,863 .90[424.416 ms] + 2022-05-12 03:56:46,863 .95[515.566 ms] + 2022-05-12 03:56:46,863 .99[762.256 ms] + 2022-05-12 03:56:46,863 Channel (server worker num[10]): + 2022-05-12 03:56:46,864 chl0(In: ['@DAGExecutor'], Out: ['det']) size[0/0] + 2022-05-12 03:56:46,864 chl1(In: ['det'], Out: ['rec']) size[2/0] + 2022-05-12 03:56:46,865 chl2(In: ['rec'], Out: ['@DAGExecutor']) size[0/0] ``` diff --git a/deploy/pdserving/README_CN.md b/deploy/pdserving/README_CN.md index 0891611db5f39d322473354f7d988b10afa78cbd..761d63fa2a8892d6b95b80df34e6124c82fe7bfd 100644 --- a/deploy/pdserving/README_CN.md +++ b/deploy/pdserving/README_CN.md @@ -162,42 +162,41 @@ python3 -m paddle_serving_client.convert --dirname ./ch_PP-OCRv3_rec_infer/ \ 预测性能数据会被自动写入 `PipelineServingLogs/pipeline.tracer` 文件中。 - 在200张真实图片上测试,把检测长边限制为960。T4 GPU 上 QPS 均值可达到23左右: + 在200张真实图片上测试,把检测长边限制为960。T4 GPU 上 QPS 均值可达到62左右: ``` - 2021-05-13 03:42:36,895 ==================== TRACER ====================== - 2021-05-13 03:42:36,975 Op(rec): - 2021-05-13 03:42:36,976 in[14.472382882882883 ms] - 2021-05-13 03:42:36,976 prep[9.556855855855856 ms] - 2021-05-13 03:42:36,976 midp[59.921905405405404 ms] - 2021-05-13 03:42:36,976 postp[15.345945945945946 ms] - 2021-05-13 03:42:36,976 out[1.9921216216216215 ms] - 2021-05-13 03:42:36,976 idle[0.16254943864471572] - 2021-05-13 03:42:36,976 Op(det): - 2021-05-13 03:42:36,976 in[315.4468035714286 ms] - 2021-05-13 03:42:36,976 prep[69.5980625 ms] - 2021-05-13 03:42:36,976 midp[18.989535714285715 ms] - 2021-05-13 03:42:36,976 postp[18.857803571428573 ms] - 2021-05-13 03:42:36,977 out[3.1337544642857145 ms] - 2021-05-13 03:42:36,977 idle[0.7477961159203756] - 2021-05-13 03:42:36,977 DAGExecutor: - 2021-05-13 03:42:36,977 Query count[224] - 2021-05-13 03:42:36,977 QPS[22.4 q/s] - 2021-05-13 03:42:36,977 Succ[0.9910714285714286] - 2021-05-13 03:42:36,977 Error req[169, 170] - 2021-05-13 03:42:36,977 Latency: - 2021-05-13 03:42:36,977 ave[535.1678348214285 ms] - 2021-05-13 03:42:36,977 .50[172.651 ms] - 2021-05-13 03:42:36,977 .60[187.904 ms] - 2021-05-13 03:42:36,977 .70[245.675 ms] - 2021-05-13 03:42:36,977 .80[526.684 ms] - 2021-05-13 03:42:36,977 .90[854.596 ms] - 2021-05-13 03:42:36,977 .95[1722.728 ms] - 2021-05-13 03:42:36,977 .99[3990.292 ms] - 2021-05-13 03:42:36,978 Channel (server worker num[10]): - 2021-05-13 03:42:36,978 chl0(In: ['@DAGExecutor'], Out: ['det']) size[0/0] - 2021-05-13 03:42:36,979 chl1(In: ['det'], Out: ['rec']) size[6/0] - 2021-05-13 03:42:36,979 chl2(In: ['rec'], Out: ['@DAGExecutor']) size[0/0] + 2022-05-12 03:56:46,461 ==================== TRACER ====================== + 2022-05-12 03:56:46,860 Op(det): + 2022-05-12 03:56:46,860 in[80.32286641221374 ms] + 2022-05-12 03:56:46,860 prep[74.27364885496183 ms] + 2022-05-12 03:56:46,860 midp[33.41587786259542 ms] + 2022-05-12 03:56:46,860 postp[20.935980916030534 ms] + 2022-05-12 03:56:46,860 out[1.551145038167939 ms] + 2022-05-12 03:56:46,860 idle[0.3889510617728378] + 2022-05-12 03:56:46,860 Op(rec): + 2022-05-12 03:56:46,860 in[15.46498846153846 ms] + 2022-05-12 03:56:46,861 prep[22.565715384615384 ms] + 2022-05-12 03:56:46,861 midp[91.42518076923076 ms] + 2022-05-12 03:56:46,861 postp[11.678453846153847 ms] + 2022-05-12 03:56:46,861 out[1.1200576923076924 ms] + 2022-05-12 03:56:46,861 idle[0.11658723106110291] + 2022-05-12 03:56:46,862 DAGExecutor: + 2022-05-12 03:56:46,862 Query count[620] + 2022-05-12 03:56:46,862 QPS[62.0 q/s] + 2022-05-12 03:56:46,862 Succ[0.4193548387096774] + 2022-05-12 03:56:46,862 Latency: + 2022-05-12 03:56:46,863 ave[165.54603709677417 ms] + 2022-05-12 03:56:46,863 .50[77.863 ms] + 2022-05-12 03:56:46,863 .60[158.414 ms] + 2022-05-12 03:56:46,863 .70[237.28 ms] + 2022-05-12 03:56:46,863 .80[316.022 ms] + 2022-05-12 03:56:46,863 .90[424.416 ms] + 2022-05-12 03:56:46,863 .95[515.566 ms] + 2022-05-12 03:56:46,863 .99[762.256 ms] + 2022-05-12 03:56:46,863 Channel (server worker num[10]): + 2022-05-12 03:56:46,864 chl0(In: ['@DAGExecutor'], Out: ['det']) size[0/0] + 2022-05-12 03:56:46,864 chl1(In: ['det'], Out: ['rec']) size[2/0] + 2022-05-12 03:56:46,865 chl2(In: ['rec'], Out: ['@DAGExecutor']) size[0/0] ``` diff --git a/deploy/pdserving/imgs/c++_qps.png b/deploy/pdserving/imgs/c++_qps.png new file mode 100644 index 0000000000000000000000000000000000000000..dc406acd624ea3f5fd51a56ae7c6d299c8211b48 Binary files /dev/null and b/deploy/pdserving/imgs/c++_qps.png differ