# web_service.py
# Copyright (c) 2020 PaddlePaddle Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#!flask/bin/python
# pylint: disable=doc-string-missing

from flask import Flask, request, abort
from multiprocessing import Pool, Process
from paddle_serving_server import OpMaker, OpSeqMaker, Server
from paddle_serving_client import Client
from contextlib import closing
import socket


class WebService(object):
    """Serve a Paddle Serving model over HTTP through a Flask application.

    The service exposes ``POST /<name>/prediction``. Requests are answered
    either through a client connected to an RPC server started in a child
    process (``run_rpc_service``) or by an in-process predictor
    (``run_debugger_service``).

    ``model_config``, ``workdir``, ``port``, ``device``, ``port_list``,
    ``mem_optim`` and ``ir_optim`` are not created in ``__init__``; they are
    set by ``load_model_config`` and ``prepare_server``, so those two methods
    must be called before any of the ``run_*`` methods.
    """

    def __init__(self, name="default_service"):
        """Store the service name, used as the first URL path segment."""
        self.name = name

    def load_model_config(self, model_config):
        """Remember the model configuration location for later use.

        The value is passed to ``Server.load_model_config`` and is also used
        as the directory containing ``serving_server_conf.prototxt``.
        """
        self.model_config = model_config

    def _launch_rpc_service(self):
        """Build the reader -> infer -> response pipeline and run the server.

        Used as the target of the child process created in
        ``run_rpc_service``. Reads the attributes set by ``prepare_server``
        and ``load_model_config``.
        """
        op_maker = OpMaker()
        read_op = op_maker.create('general_reader')
        general_infer_op = op_maker.create('general_infer')
        general_response_op = op_maker.create('general_response')
        op_seq_maker = OpSeqMaker()
        op_seq_maker.add_op(read_op)
        op_seq_maker.add_op(general_infer_op)
        op_seq_maker.add_op(general_response_op)
        server = Server()
        server.set_op_sequence(op_seq_maker.get_op_sequence())
        server.set_num_threads(16)
        server.set_memory_optimize(self.mem_optim)
        server.set_ir_optimize(self.ir_optim)
        server.load_model_config(self.model_config)
        # The RPC server listens on the internally chosen port, not on the
        # public HTTP port stored in self.port.
        server.prepare_server(
            workdir=self.workdir, port=self.port_list[0], device=self.device)
        server.run_server()

    def port_is_available(self, port):
        """Return True when no TCP connection can be made to ``port``.

        A connection attempt to ``0.0.0.0:<port>`` is made with a 2 second
        timeout; any non-zero ``connect_ex`` result (refused, timed out, ...)
        is treated as "nothing is listening, the port is free".
        """
        with closing(socket.socket(socket.AF_INET, socket.SOCK_STREAM)) as sock:
            sock.settimeout(2)
            result = sock.connect_ex(('0.0.0.0', port))
        return result != 0

    def prepare_server(self,
                       workdir="",
                       port=9393,
                       device="cpu",
                       mem_optim=True,
                       ir_optim=False):
        """Record the server settings and pick a port for the RPC server.

        Args:
            workdir: forwarded to ``Server.prepare_server``.
            port: port the Flask application listens on (``run_web_service``).
            device: forwarded to ``Server.prepare_server``.
            mem_optim: forwarded to ``Server.set_memory_optimize``.
            ir_optim: forwarded to ``Server.set_ir_optimize``.

        The RPC port is the first port in ``12000..12999`` for which
        ``port_is_available`` returns True; it is stored as the single
        element of ``self.port_list``. If none of them is free the list
        stays empty and the later ``self.port_list[0]`` lookups raise
        ``IndexError``.
        """
        self.workdir = workdir
        self.port = port
        self.device = device
        default_port = 12000
        self.port_list = []
        self.mem_optim = mem_optim
        self.ir_optim = ir_optim
        for i in range(1000):
            if self.port_is_available(default_port + i):
                self.port_list.append(default_port + i)
                break

    def _launch_web_service(self):
        """Create the RPC client and connect it to the local RPC server."""
        self.client = Client()
        self.client.load_client_config("{}/serving_server_conf.prototxt".format(
            self.model_config))
        self.client.connect(["0.0.0.0:{}".format(self.port_list[0])])

    def get_prediction(self, request):
        """Run one prediction for a JSON request and return the response dict.

        The JSON body must be an object with a ``"feed"`` and a ``"fetch"``
        entry; anything else is rejected with HTTP 400 via ``abort``.

        Returns:
            ``{"result": <postprocess output>}`` on success, or
            ``{"result": <error message>}`` when a ``ValueError`` is raised
            while processing (for example for an empty feed).
        """
        payload = request.json
        # Reject empty bodies and bodies that are not JSON objects: indexing
        # a list or string with "feed" would otherwise fail with an
        # unhandled exception.
        if not payload or not isinstance(payload, dict):
            abort(400)
        # Both keys are read below; a missing "feed" used to surface as an
        # uncaught KeyError instead of a 400 response.
        if "fetch" not in payload or "feed" not in payload:
            abort(400)
        try:
            feed, fetch = self.preprocess(payload["feed"], payload["fetch"])
            if isinstance(feed, dict) and "fetch" in feed:
                del feed["fetch"]
            if len(feed) == 0:
                raise ValueError("empty input")
            fetch_map = self.client.predict(feed=feed, fetch=fetch)
            # postprocess receives the feed as stored in the request, not
            # the value returned by preprocess.
            result = self.postprocess(
                feed=payload["feed"], fetch=fetch, fetch_map=fetch_map)
            result = {"result": result}
        except ValueError as err:
            result = {"result": str(err)}
        return result

    def _print_service_address(self):
        """Print the public prediction URL built from the local host name."""
        localIP = socket.gethostbyname(socket.gethostname())
        print("web service address:")
        print("http://{}:{}/{}/prediction".format(localIP, self.port,
                                                  self.name))

    def _build_app(self, init_backend):
        """Create the Flask app with the prediction route.

        Args:
            init_backend: zero-argument callable that sets ``self.client``;
                it is registered to run before the first request is handled.

        NOTE(review): ``before_first_request`` was removed in Flask 2.3, so
        this requires an older Flask release.
        """
        app_instance = Flask(__name__)

        @app_instance.before_first_request
        def init():
            init_backend()

        service_name = "/" + self.name + "/prediction"

        @app_instance.route(service_name, methods=["POST"])
        def run():
            return self.get_prediction(request)

        return app_instance

    def run_rpc_service(self):
        """Start the RPC server in a child process and build the Flask app.

        The Flask app is only created here (stored in ``self.app_instance``);
        it starts serving when ``run_web_service`` is called.
        """
        self._print_service_address()
        p_rpc = Process(target=self._launch_rpc_service)
        p_rpc.start()

        self.app_instance = self._build_app(self._launch_web_service)

    def run_debugger_service(self):
        """Build the Flask app backed by an in-process local predictor.

        No RPC server process is started; ``self.client`` becomes a
        ``Debugger`` instance on the first request.
        """
        self._print_service_address()
        self.app_instance = self._build_app(self._launch_local_predictor)

    def _launch_local_predictor(self):
        """Create the local predictor and load the model (GPU disabled)."""
        # Imported lazily so the dependency is only needed in debugger mode.
        from paddle_serving_app.local_predict import Debugger
        self.client = Debugger()
        self.client.load_model_config(
            "{}".format(self.model_config), gpu=False, profile=False)

    def run_web_service(self):
        """Serve the Flask app on all interfaces, single process, unthreaded."""
        self.app_instance.run(host="0.0.0.0",
                              port=self.port,
                              threaded=False,
                              processes=1)

    def get_app_instance(self):
        """Return the Flask app created by one of the ``run_*_service`` calls."""
        return self.app_instance

    def preprocess(self, feed=[], fetch=[]):
        """Hook to transform the request before prediction; identity here.

        Subclasses may override it to return a modified ``(feed, fetch)``
        pair. The default arguments are shared list objects and are returned
        as-is, so callers must not mutate them.
        """
        return feed, fetch

    def postprocess(self, feed=[], fetch=[], fetch_map=None):
        """Hook to transform the prediction result before it is returned.

        The default implementation replaces every value of ``fetch_map`` with
        ``value.tolist()`` in place and returns the same mapping. A real
        mapping must be supplied; the ``None`` default cannot be iterated.
        """
        for key in fetch_map:
            fetch_map[key] = fetch_map[key].tolist()
        return fetch_map