diff --git a/doc/Serving_Configure_EN.md b/doc/Serving_Configure_EN.md index b725c8aa51df927c3c45cbe324fa04006a1953e2..eedb3acbde8d2a64a5638106f6ee01b818396cbd 100644 --- a/doc/Serving_Configure_EN.md +++ b/doc/Serving_Configure_EN.md @@ -424,6 +424,11 @@ op: #ir_optim, When running on TensorRT,must set ir_optim=True ir_optim: True + + #precision, lowering precision can increase speed + #GPU supports: "fp32"(default), "fp16", "int8"; + #CPU supports: "fp32"(default), "fp16", "bf16"(mkldnn); not supported: "int8" + precision: "fp32" ``` ### Single-machine and multi-card inference