diff --git a/doc/Serving_Configure_CN.md b/doc/Serving_Configure_CN.md index 3a5b449d599f989a9b3e360e29d63560b838a277..ca68bcf52cc7559d2cfa3ae00f9bfc29cd39295e 100644 --- a/doc/Serving_Configure_CN.md +++ b/doc/Serving_Configure_CN.md @@ -401,6 +401,11 @@ op: #ir_optim, 开启TensorRT时,必须同时设置ir_optim=True,否则无效 ir_optim: True + + #precision, 预测精度,降低预测精度可提升预测速度 + #GPU 支持: "fp32"(default), "fp16", "int8"; + #CPU 支持: "fp32"(default), "fp16", "bf16"(mkldnn); 不支持: "int8" + precision: "fp32" ``` ### 单机多卡