提交 45114dd6，作者：TeslaZhao

Distribute Serving for Foundation Models

上级 2cd5c109
...@@ -350,8 +350,8 @@ def start_gpu_card_model(gpu_mode, port, args): # pylint: disable=doc-string-mi
    general_infer_op = op_maker.create(infer_op_name)
    op_seq_maker.add_op(general_infer_op)
    general_response_op = op_maker.create('GeneralResponseOp')
    op_seq_maker.add_op(general_response_op)
else:
    # for the master serving of distributed model only add one general_remote op.
    if args.dist_worker_serving_endpoints is None:
......
Markdown is supported
0% .
You are about to add 0 people to the discussion. Proceed with caution.
先完成此消息的编辑!
想要评论请 注册