diff --git a/doc/Serving_Configure_CN.md b/doc/Serving_Configure_CN.md index ca68bcf52cc7559d2cfa3ae00f9bfc29cd39295e..06407e4280f326ec52d7c8f7fd598f0cf266c17f 100644 --- a/doc/Serving_Configure_CN.md +++ b/doc/Serving_Configure_CN.md @@ -366,8 +366,13 @@ op: #use_mkldnn #use_mkldnn: True - #ir_optim + #ir_optim, 开启TensorRT时,必须同时设置ir_optim=True,否则无效 ir_optim: True + + #precision, 预测精度,降低预测精度可提升预测速度 + #GPU 支持: "fp32"(default), "fp16", "int8"; + #CPU 支持: "fp32"(default), "fp16", "bf16"(mkldnn); 不支持: "int8" + precision: "fp32" rec: #并发数,is_thread_op=True时,为线程并发;否则为进程并发 concurrency: 3