diff --git a/doc/Serving_Configure_EN.md b/doc/Serving_Configure_EN.md index ddf81ea7652356fd3b7a65af4f1ba1a4c55f6db0..d586db6d0314f5af7d0fc2b217b389552a5034a2 100644 --- a/doc/Serving_Configure_EN.md +++ b/doc/Serving_Configure_EN.md @@ -397,6 +397,9 @@ op: #ir_optim, When running on TensorRT,must set ir_optim=True ir_optim: True + #Number of CPU compute threads. Enabling it in CPU scenarios reduces the response time of a single request + #thread_num: 10 + #precsion, Decrease accuracy can increase speed #GPU 支持: "fp32"(default), "fp16", "int8"; #CPU 支持: "fp32"(default), "fp16", "bf16"(mkldnn); 不支持: "int8" @@ -435,6 +438,9 @@ op: #ir_optim, When running on TensorRT,must set ir_optim=True ir_optim: True + #Number of CPU compute threads. Enabling it in CPU scenarios reduces the response time of a single request + #thread_num: 10 + #precsion, Decrease accuracy can increase speed #GPU 支持: "fp32"(default), "fp16", "int8"; #CPU 支持: "fp32"(default), "fp16", "bf16"(mkldnn); 不支持: "int8"