Unverified commit 56e72b20, authored by JingZhuangzhuang, committed via GitHub

modify infer gpu memory strategy (#41427)

* modify infer gpu memory strategy

* modify infer gpu memory strategy
Parent commit: 53409bcd
......@@ -1061,13 +1061,6 @@ std::unique_ptr<PaddlePredictor> CreatePaddlePredictor<
gflags.push_back("--cudnn_deterministic=True");
}
// TODO(wilber): jetson tx2 may fail to run the model due to insufficient memory
// under the native_best_fit strategy. Modify the default allocation strategy to
// auto_growth. todo, find a more appropriate way to solve the problem.
#ifdef WITH_NV_JETSON
gflags.push_back("--allocator_strategy=auto_growth");
#endif
// TODO(Shixiaowei02): Add a mandatory scheme to use the thread local
// allocator when multi-stream is enabled.
if (config.thread_local_stream_enabled()) {
......
......@@ -364,11 +364,7 @@ PADDLE_DEFINE_EXPORTED_double(
* Example:
* Note: For selecting allocator policy of PaddlePaddle.
*/
#ifdef PADDLE_ON_INFERENCE
static constexpr char kDefaultAllocatorStrategy[] = "naive_best_fit";
#else
static constexpr char kDefaultAllocatorStrategy[] = "auto_growth";
#endif
PADDLE_DEFINE_EXPORTED_string(
allocator_strategy, kDefaultAllocatorStrategy,
"The allocation strategy, enum in [naive_best_fit, auto_growth]. "
......
Markdown is supported
0% .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
To comment, please register.