Commit 92d334c8 authored by TeslaZhao

fix bad code style in other .py files by yapf

Parent de926182
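A commit like this is generated by running yapf over the Python sources. A minimal sketch of such a run, assuming a PEP 8 base style and an 80-column limit (the repository's actual `.style.yapf`, if any, is not shown in this diff, and the target directory below is hypothetical):

```python
# Sketch only: re-run yapf over a source tree the way a style-fix
# commit like this one is produced. Style options and target directory
# are assumptions, not the repository's real configuration.
import subprocess

subprocess.run(
    [
        "yapf",
        "--in-place",    # rewrite files on disk instead of printing a diff
        "--recursive",   # descend into packages and subdirectories
        "--style", "{based_on_style: pep8, column_limit: 80}",
        "python/",       # hypothetical source directory
    ],
    check=True)  # raise if yapf exits nonzero
```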
@@ -54,8 +54,8 @@ class OpMaker(object):

     def create(self, node_type, engine_name=None, inputs=[], outputs=[]):
         if node_type not in self.op_dict:
-            raise Exception(
-                "Op type {} is not supported right now".format(node_type))
+            raise Exception("Op type {} is not supported right now".format(
+                node_type))
         node = server_sdk.DAGNode()
         # node.name will be used as the infer engine name
         if engine_name:
@@ -104,8 +104,8 @@ class OpSeqMaker(object):
         if node.dependencies[0].name != self.workflow.nodes[-1].name:
             raise Exception(
                 'You must add op in order in OpSeqMaker. The previous op is {}, but the current op is followed by {}.'
-                .format(node.dependencies[0].name,
-                        self.workflow.nodes[-1].name))
+                .format(node.dependencies[0].name, self.workflow.nodes[
+                    -1].name))
         self.workflow.nodes.extend([node])

     def get_op_sequence(self):
@@ -308,8 +308,8 @@ class Server(object):
                 self.model_config_paths[node.name] = path
             print("You have specified multiple model paths, please ensure "
                   "that the input and output of multiple models are the same.")
-            workflow_oi_config_path = list(
-                self.model_config_paths.items())[0][1]
+            workflow_oi_config_path = list(self.model_config_paths.items())[0][
+                1]
         else:
             raise Exception("The type of model_config_paths must be str or "
                             "dict({op: model_path}), not {}.".format(
@@ -569,20 +569,20 @@ class MultiLangServerServiceServicer(multi_lang_general_model_service_pb2_grpc.
                     tensor.data = model_result[name].tobytes()
                 else:
                     if v_type == 0:  # int64
-                        tensor.int64_data.extend(
-                            model_result[name].reshape(-1).tolist())
+                        tensor.int64_data.extend(model_result[name].reshape(-1)
+                                                 .tolist())
                     elif v_type == 1:  # float32
-                        tensor.float_data.extend(
-                            model_result[name].reshape(-1).tolist())
+                        tensor.float_data.extend(model_result[name].reshape(-1)
+                                                 .tolist())
                     elif v_type == 2:  # int32
-                        tensor.int_data.extend(
-                            model_result[name].reshape(-1).tolist())
+                        tensor.int_data.extend(model_result[name].reshape(-1)
+                                               .tolist())
                     else:
                         raise Exception("error type.")
                 tensor.shape.extend(list(model_result[name].shape))
                 if name in self.lod_tensor_set_:
-                    tensor.lod.extend(
-                        model_result["{}.lod".format(name)].tolist())
+                    tensor.lod.extend(model_result["{}.lod".format(name)]
+                                      .tolist())
                 inst.tensor_array.append(tensor)
             model_output.insts.append(inst)
             model_output.engine_name = model_name
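The `reshape(-1).tolist()` pattern that yapf re-wraps here flattens an ndarray row-major before `extend()`, because protobuf repeated scalar fields are flat; the original dimensions travel separately in `tensor.shape`. A self-contained illustration, with plain lists standing in for the proto message:

```python
# Plain lists stand in for tensor.int64_data / tensor.shape here.
import numpy as np

arr = np.arange(6, dtype=np.int64).reshape(2, 3)

int64_data = []
int64_data.extend(arr.reshape(-1).tolist())  # flatten row-major, then extend
shape = list(arr.shape)                      # shape is carried separately

assert int64_data == [0, 1, 2, 3, 4, 5]
assert shape == [2, 3]
```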
@@ -601,7 +601,8 @@ class MultiLangServerServiceServicer(multi_lang_general_model_service_pb2_grpc.
     def Inference(self, request, context):
         feed_dict, fetch_names, is_python, log_id = \
             self._unpack_inference_request(request)
-        ret = self.bclient_.predict(feed=feed_dict,
-                                    fetch=fetch_names,
-                                    need_variant_tag=True,
-                                    log_id=log_id)
+        ret = self.bclient_.predict(
+            feed=feed_dict,
+            fetch=fetch_names,
+            need_variant_tag=True,
+            log_id=log_id)
@@ -684,11 +685,12 @@ class MultiLangServer(object):
         default_port = 12000
         self.port_list_ = []
         for i in range(1000):
-            if default_port + i != port and self._port_is_available(
-                    default_port + i):
+            if default_port + i != port and self._port_is_available(default_port
+                                                                    + i):
                 self.port_list_.append(default_port + i)
                 break
-        self.bserver_.prepare_server(workdir=workdir,
-                                     port=self.port_list_[0],
-                                     device=device,
-                                     cube_conf=cube_conf)
+        self.bserver_.prepare_server(
+            workdir=workdir,
+            port=self.port_list_[0],
+            device=device,
+            cube_conf=cube_conf)
@@ -704,8 +706,8 @@ class MultiLangServer(object):
         return result != 0

     def run_server(self):
-        p_bserver = Process(target=self._launch_brpc_service,
-                            args=(self.bserver_, ))
+        p_bserver = Process(
+            target=self._launch_brpc_service, args=(self.bserver_, ))
         p_bserver.start()
         options = [('grpc.max_send_message_length', self.body_size_),
                    ('grpc.max_receive_message_length', self.body_size_)]
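`_port_is_available` itself lies outside these hunks, but the `return result != 0` context line implies a `connect_ex`-style probe: `connect_ex` returns 0 when something already answers on the port, so nonzero means the port is free. A sketch reconstructed from that context, not copied from the repository:

```python
import socket
from contextlib import closing


def _port_is_available(port):
    # connect_ex() returns 0 if the connection succeeds, i.e. the port
    # is already taken; any nonzero error code means it is available.
    with closing(socket.socket(socket.AF_INET, socket.SOCK_STREAM)) as sock:
        sock.settimeout(2)
        result = sock.connect_ex(("127.0.0.1", port))
    return result != 0
```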
......
@@ -40,52 +40,46 @@ from concurrent import futures

 def serve_args():
     parser = argparse.ArgumentParser("serve")
-    parser.add_argument("--thread",
-                        type=int,
-                        default=2,
-                        help="Concurrency of server")
-    parser.add_argument("--model",
-                        type=str,
-                        default="",
-                        help="Model for serving")
-    parser.add_argument("--port",
-                        type=int,
-                        default=9292,
-                        help="Port of the starting gpu")
-    parser.add_argument("--workdir",
-                        type=str,
-                        default="workdir",
-                        help="Working dir of current service")
-    parser.add_argument("--device",
-                        type=str,
-                        default="gpu",
-                        help="Type of device")
+    parser.add_argument(
+        "--thread", type=int, default=2, help="Concurrency of server")
+    parser.add_argument(
+        "--model", type=str, default="", help="Model for serving")
+    parser.add_argument(
+        "--port", type=int, default=9292, help="Port of the starting gpu")
+    parser.add_argument(
+        "--workdir",
+        type=str,
+        default="workdir",
+        help="Working dir of current service")
+    parser.add_argument(
+        "--device", type=str, default="gpu", help="Type of device")
     parser.add_argument("--gpu_ids", type=str, default="", help="gpu ids")
-    parser.add_argument("--name",
-                        type=str,
-                        default="None",
-                        help="Default service name")
-    parser.add_argument("--mem_optim_off",
-                        default=False,
-                        action="store_true",
-                        help="Memory optimize")
-    parser.add_argument("--ir_optim",
-                        default=False,
-                        action="store_true",
-                        help="Graph optimize")
-    parser.add_argument("--max_body_size",
-                        type=int,
-                        default=512 * 1024 * 1024,
-                        help="Limit sizes of messages")
-    parser.add_argument("--use_multilang",
-                        default=False,
-                        action="store_true",
-                        help="Use Multi-language-service")
-    parser.add_argument("--product_name",
-                        type=str,
-                        default=None,
-                        help="product_name for authentication")
-    parser.add_argument("--container_id",
-                        type=str,
-                        default=None,
-                        help="container_id for authentication")
+    parser.add_argument(
+        "--name", type=str, default="None", help="Default service name")
+    parser.add_argument(
+        "--mem_optim_off",
+        default=False,
+        action="store_true",
+        help="Memory optimize")
+    parser.add_argument(
+        "--ir_optim", default=False, action="store_true", help="Graph optimize")
+    parser.add_argument(
+        "--max_body_size",
+        type=int,
+        default=512 * 1024 * 1024,
+        help="Limit sizes of messages")
+    parser.add_argument(
+        "--use_multilang",
+        default=False,
+        action="store_true",
+        help="Use Multi-language-service")
+    parser.add_argument(
+        "--product_name",
+        type=str,
+        default=None,
+        help="product_name for authentication")
+    parser.add_argument(
+        "--container_id",
+        type=str,
+        default=None,
+        help="container_id for authentication")
@@ -108,8 +102,8 @@ class OpMaker(object):

     def create(self, node_type, engine_name=None, inputs=[], outputs=[]):
         if node_type not in self.op_dict:
-            raise Exception(
-                "Op type {} is not supported right now".format(node_type))
+            raise Exception("Op type {} is not supported right now".format(
+                node_type))
         node = server_sdk.DAGNode()
         # node.name will be used as the infer engine name
         if engine_name:
@@ -158,8 +152,8 @@ class OpSeqMaker(object):
         if node.dependencies[0].name != self.workflow.nodes[-1].name:
             raise Exception(
                 'You must add op in order in OpSeqMaker. The previous op is {}, but the current op is followed by {}.'
-                .format(node.dependencies[0].name,
-                        self.workflow.nodes[-1].name))
+                .format(node.dependencies[0].name, self.workflow.nodes[
+                    -1].name))
         self.workflow.nodes.extend([node])

     def get_op_sequence(self):
@@ -372,8 +366,8 @@ class Server(object):
                 self.model_config_paths[node.name] = path
             print("You have specified multiple model paths, please ensure "
                   "that the input and output of multiple models are the same.")
-            workflow_oi_config_path = list(
-                self.model_config_paths.items())[0][1]
+            workflow_oi_config_path = list(self.model_config_paths.items())[0][
+                1]
         else:
             raise Exception("The type of model_config_paths must be str or "
                             "dict({op: model_path}), not {}.".format(
@@ -636,20 +630,20 @@ class MultiLangServerServiceServicer(multi_lang_general_model_service_pb2_grpc.
                     tensor.data = model_result[name].tobytes()
                 else:
                     if v_type == 0:  # int64
-                        tensor.int64_data.extend(
-                            model_result[name].reshape(-1).tolist())
+                        tensor.int64_data.extend(model_result[name].reshape(-1)
+                                                 .tolist())
                     elif v_type == 1:  # float32
-                        tensor.float_data.extend(
-                            model_result[name].reshape(-1).tolist())
+                        tensor.float_data.extend(model_result[name].reshape(-1)
+                                                 .tolist())
                     elif v_type == 2:  # int32
-                        tensor.int_data.extend(
-                            model_result[name].reshape(-1).tolist())
+                        tensor.int_data.extend(model_result[name].reshape(-1)
+                                               .tolist())
                     else:
                         raise Exception("error type.")
                 tensor.shape.extend(list(model_result[name].shape))
                 if name in self.lod_tensor_set_:
-                    tensor.lod.extend(
-                        model_result["{}.lod".format(name)].tolist())
+                    tensor.lod.extend(model_result["{}.lod".format(name)]
+                                      .tolist())
                 inst.tensor_array.append(tensor)
             model_output.insts.append(inst)
             model_output.engine_name = model_name
@@ -668,7 +662,8 @@ class MultiLangServerServiceServicer(multi_lang_general_model_service_pb2_grpc.
     def Inference(self, request, context):
         feed_dict, fetch_names, is_python, log_id \
             = self._unpack_inference_request(request)
-        ret = self.bclient_.predict(feed=feed_dict,
-                                    fetch=fetch_names,
-                                    need_variant_tag=True,
-                                    log_id=log_id)
+        ret = self.bclient_.predict(
+            feed=feed_dict,
+            fetch=fetch_names,
+            need_variant_tag=True,
+            log_id=log_id)
@@ -748,11 +743,12 @@ class MultiLangServer(object):
         default_port = 12000
         self.port_list_ = []
         for i in range(1000):
-            if default_port + i != port and self._port_is_available(
-                    default_port + i):
+            if default_port + i != port and self._port_is_available(default_port
+                                                                    + i):
                 self.port_list_.append(default_port + i)
                 break
-        self.bserver_.prepare_server(workdir=workdir,
-                                     port=self.port_list_[0],
-                                     device=device,
-                                     cube_conf=cube_conf)
+        self.bserver_.prepare_server(
+            workdir=workdir,
+            port=self.port_list_[0],
+            device=device,
+            cube_conf=cube_conf)
@@ -768,8 +764,8 @@ class MultiLangServer(object):
         return result != 0

     def run_server(self):
-        p_bserver = Process(target=self._launch_brpc_service,
-                            args=(self.bserver_, ))
+        p_bserver = Process(
+            target=self._launch_brpc_service, args=(self.bserver_, ))
         p_bserver.start()
         options = [('grpc.max_send_message_length', self.body_size_),
                    ('grpc.max_receive_message_length', self.body_size_)]
......
@@ -99,11 +99,11 @@ def start_multi_card(args):  # pylint: disable=doc-string-missing
     else:
         gpu_processes = []
         for i, gpu_id in enumerate(gpus):
-            p = Process(target=start_gpu_card_model, args=(
-                i,
-                gpu_id,
-                args,
-            ))
+            p = Process(
+                target=start_gpu_card_model, args=(
+                    i,
+                    gpu_id,
+                    args, ))
            gpu_processes.append(p)
        for p in gpu_processes:
            p.start()
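The loop above is a standard one-process-per-GPU fan-out: each `(index, gpu_id)` pair gets its own `Process` running `start_gpu_card_model`. A self-contained sketch of the pattern with a stub worker (the real worker body and its join logic are not part of this hunk):

```python
from multiprocessing import Process


def start_gpu_card_model(index, gpu_id, args):
    # Stub worker: the real one configures and launches a serving
    # instance bound to the given GPU card.
    print("worker {} bound to GPU {}".format(index, gpu_id))


if __name__ == "__main__":
    gpus = ["0", "1"]  # hypothetical card ids
    gpu_processes = [
        Process(target=start_gpu_card_model, args=(i, gpu_id, None))
        for i, gpu_id in enumerate(gpus)
    ]
    for p in gpu_processes:
        p.start()
    for p in gpu_processes:
        p.join()  # wait for the workers; the hunk above only starts them
```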
@@ -125,9 +125,8 @@ if __name__ == "__main__":
            gpu_ids = os.environ["CUDA_VISIBLE_DEVICES"]
    if len(gpu_ids) > 0:
        web_service.set_gpus(gpu_ids)
-    web_service.prepare_server(workdir=args.workdir,
-                               port=args.port,
-                               device=args.device)
+    web_service.prepare_server(
+        workdir=args.workdir, port=args.port, device=args.device)
    web_service.run_rpc_service()

    app_instance = Flask(__name__)
......