提交 51229597 编写于 作者: D dongdaxiang

add tolist to gpu web service

上级 548a0fc5
...@@ -90,77 +90,26 @@ class WebService(object): ...@@ -90,77 +90,26 @@ class WebService(object):
self.client = Client() self.client = Client()
self.client.load_client_config("{}/serving_server_conf.prototxt".format( self.client.load_client_config("{}/serving_server_conf.prototxt".format(
self.model_config)) self.model_config))
endpoints = ""
client.connect([endpoint]) if gpu_num > 0:
while True:
request_json = inputqueue.get()
try:
feed, fetch = self.preprocess(request_json,
request_json["fetch"])
if isinstance(feed, list):
fetch_map_batch = client.predict(
feed_batch=feed, fetch=fetch)
fetch_map_batch = self.postprocess(
feed=request_json,
fetch=fetch,
fetch_map=fetch_map_batch)
for key in fetch_map_batch:
fetch_map_batch[key] = fetch_map_batch[key].tolist()
result = {"result": fetch_map_batch}
elif isinstance(feed, dict):
if "fetch" in feed:
del feed["fetch"]
fetch_map = client.predict(feed=feed, fetch=fetch)
for key in fetch_map:
fetch_map[key] = fetch_map[key][0].tolist()
result = self.postprocess(
feed=request_json, fetch=fetch, fetch_map=fetch_map)
self.output_queue.put(result)
except ValueError:
self.output_queue.put(-1)
def _launch_web_service(self, gpu_num):
app_instance = Flask(__name__)
service_name = "/" + self.name + "/prediction"
self.input_queues = []
self.output_queue = Queue()
for i in range(gpu_num): for i in range(gpu_num):
self.input_queues.append(Queue()) endpoints += "127.0.0.1:{},".format(self.port + i + 1)
else:
producer_list = [] endpoints = "127.0.0.1:{}".format(self.port + 1)
for i, input_q in enumerate(self.input_queues): self.client.connect([endpoints])
producer_processes = Process(
target=self.producers,
args=(
input_q,
"0.0.0.0:{}".format(self.port + 1 + i), ))
producer_list.append(producer_processes)
for p in producer_list:
p.start()
client = Client()
client.load_client_config("{}/serving_server_conf.prototxt".format(
self.model_config))
client.connect(["0.0.0.0:{}".format(self.port + 1)])
self.idx = 0
def get_prediction(): def get_prediction(self, request):
if not request.json: if not request.json:
abort(400) abort(400)
if "fetch" not in request.json: if "fetch" not in request.json:
abort(400) abort(400)
feed, fetch = self.preprocess(request.json, request.json["fetch"])
self.input_queues[self.idx].put(request.json) fetch_map_batch = self.client.predict(feed=feed, fetch=fetch)
fetch_map_batch = self.postprocess(
self.idx += 1 feed=request.json, fetch=fetch, fetch_map=fetch_map_batch)
if self.idx >= len(self.gpus): for key in fetch_map_batch:
self.idx = 0 fetch_map_batch[key] = fetch_map_batch[key].tolist()
result = self.output_queue.get() result = {"result": fetch_map_batch}
if not isinstance(result, dict) and result == -1:
result = {"result": "Request Value Error"}
return result return result
def run_server(self): def run_server(self):
......
Markdown is supported
0% .
You are about to add 0 people to the discussion. Proceed with caution.
先完成此消息的编辑!
想要评论请 注册