benchmark.py 2.4 KB
Newer Older
D
Dong Daxiang 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13
# Copyright (c) 2020 PaddlePaddle Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
B
barrierye 已提交
14 15
# pylint: disable=doc-string-missing

16 17
from paddle_serving_client import Client
from paddle_serving_client.utils import MultiThreadRunner
H
HexToString 已提交
18
from paddle_serving_client.utils import benchmark_args, show_latency
19 20 21 22 23 24 25
import time
import paddle
import sys
import requests

# Benchmark options shared by the whole script; the code below reads
# attributes such as ``request``, ``model``, ``endpoint`` and ``thread``.
# NOTE(review): presumably parsed from the command line -- confirm in
# paddle_serving_client.utils.benchmark_args.
args = benchmark_args()

B
barrierye 已提交
26

27
def single_func(idx, resource):
    """Run one worker's timed pass over the UCI housing training set.

    Every training sample is sent, one sample per request, to the serving
    endpoint selected by ``args.request`` and the whole pass is timed.

    Args:
        idx: Not used by this function; supplied by the runner that calls it.
        resource: Not used by this function; supplied by the runner.

    Returns:
        ``[[elapsed_seconds], [total_number]]`` where ``total_number`` is the
        number of samples produced by one pass of the reader.

    Raises:
        ValueError: If ``args.request`` is neither ``"rpc"`` nor ``"http"``.
    """
    # Fail loudly on an unsupported request type instead of falling through
    # and implicitly returning None to the runner.
    if args.request not in ("rpc", "http"):
        raise ValueError(
            "unsupported request type: {!r} (expected 'rpc' or 'http')".format(
                args.request))

    # One reader serves both the sample count and the timed loop: each call
    # to train_reader() starts a fresh pass over the data.
    train_reader = paddle.batch(
        paddle.reader.shuffle(
            paddle.dataset.uci_housing.train(), buf_size=500),
        batch_size=1)
    total_number = sum(1 for _ in train_reader())

    if args.request == "rpc":
        client = Client()
        client.load_client_config(args.model)
        client.connect([args.endpoint])
        start = time.time()
        for data in train_reader():
            # The prediction result is discarded; only the timing matters.
            client.predict(feed={"x": data[0][0]}, fetch=["price"])
        end = time.time()
    else:
        # "http" request type. The URL is loop-invariant, so build it once.
        url = 'http://{}/uci/prediction'.format(args.endpoint)
        start = time.time()
        for data in train_reader():
            # The response is discarded; only the timing matters.
            requests.post(url, data={"x": data[0]})
        end = time.time()

    return [[end - start], [total_number]]
55

B
barrierye 已提交
56

H
HexToString 已提交
57
# Run single_func on args.thread workers and report aggregate timing.
start = time.time()
multi_thread_runner = MultiThreadRunner()
result = multi_thread_runner.run(single_func, args.thread, {})
end = time.time()
total_cost = end - start

# result[0] holds one elapsed time per worker (the first element returned by
# single_func); average them across workers.
avg_cost = sum(result[0][i] for i in range(args.thread)) / args.thread

# result[1] holds the second element returned by single_func, i.e. the number
# of samples each worker sent.
# NOTE(review): assumes the runner merges per-worker results position by
# position, the same way result[0] is indexed above -- confirm.
total_number = sum(result[1][i] for i in range(args.thread))

print("total cost: {}s".format(total_cost))
print("each thread cost: {}s. ".format(avg_cost))
# Throughput is the number of samples actually sent divided by wall-clock
# time; the previous batch_size * thread formula ignored the request count.
print("qps: {}samples/s".format(total_number / total_cost))
# NOTE(review): result[1] contains per-worker sample counts, not per-request
# latencies, so the statistics printed here are not real latencies. Fixing
# this needs single_func to also return a latency list -- confirm and follow
# up.
show_latency(result[1])