提交 d1da04bc 编写于 作者: T TeslaZhao

Distribute Serving for Foundation Models

上级 25ca1469
...@@ -268,7 +268,7 @@ class PaddleInferenceEngine : public EngineCore { ...@@ -268,7 +268,7 @@ class PaddleInferenceEngine : public EngineCore {
config.EnableGpuMultiStream(); config.EnableGpuMultiStream();
} }
} }
config.EnableTensorRtEngine(1 << 20, config.EnableTensorRtEngine(1 << 25,
max_batch, max_batch,
min_subgraph_size, min_subgraph_size,
precision_type, precision_type,
......
Markdown is supported
0% .
You are about to add 0 people to the discussion. Proceed with caution.
先完成此消息的编辑!
想要评论请 注册