diff --git a/paddle/fluid/inference/api/analysis_predictor.cc b/paddle/fluid/inference/api/analysis_predictor.cc index 5dced520f337bbf8d89375a13251df80d34da494..2fe3dbe13e71afa1ca4ead1495490507cc4a16bc 100644 --- a/paddle/fluid/inference/api/analysis_predictor.cc +++ b/paddle/fluid/inference/api/analysis_predictor.cc @@ -1365,7 +1365,9 @@ void AnalysisPredictor::OptimizeInferenceProgram() { #if defined(_WIN32) argument_->PartiallyRelease(); #else - if (config_.mkldnn_enabled() || config_.tensorrt_engine_enabled()) { + if (config_.mkldnn_enabled() || + (config_.tensorrt_engine_enabled() && + config_.tensorrt_precision_mode_ == AnalysisConfig::Precision::kInt8)) { argument_->PartiallyRelease(); } else { argument_.reset(nullptr);