Unverified commit 7c1bc000, authored by Yuanle Liu, committed via GitHub

fix trt inference fp16 io (#54032)

上级 07223e34
......@@ -27,6 +27,7 @@ limitations under the License. */
#include "paddle/fluid/inference/tensorrt/helper.h"
#include "paddle/fluid/inference/tensorrt/op_teller.h"
#include "paddle/fluid/inference/utils/singleton.h"
#include "paddle/phi/common/data_type.h"
namespace paddle {
namespace inference {
......@@ -305,7 +306,7 @@ class OpConverter {
platform::errors::InvalidArgument("TensorRT engine only takes "
"LoDTensor as input"));
nvinfer1::DataType in_dtype = FluidDataType2TRT(var->GetDataType());
if (engine->WithFp16() && !engine->WithInt8() &&
if (engine->precision() == phi::DataType::FLOAT16 &&
in_dtype == nvinfer1::DataType::kFLOAT &&
engine->EnableLowPrecisionIO()) {
in_dtype = nvinfer1::DataType::kHALF;
......
Markdown is supported
0% .
You are about to add 0 people to the discussion. Proceed with caution.
先完成此消息的编辑!
想要评论请 注册