Unverified commit d114d2b2, authored by Yu Yang and committed by GitHub

Merge pull request #10076 from reyoung/feature/FLAGS_eager_deletion_scope

Eager destruct local scope
......@@ -26,6 +26,11 @@ DEFINE_bool(benchmark, false,
"Default cuda is asynchronous device, set to True will"
"force op run in synchronous mode.");
DEFINE_bool(
eager_delete_scope, true,
"Delete local scope eagerly. It will reduce GPU memory usage but "
"slow down the destruction of variables.(around 1% performance harm)");
namespace paddle {
namespace framework {
......@@ -97,7 +102,7 @@ void Scope::DeleteScope(Scope* scope) const {
   PADDLE_ENFORCE(it != this->kids_.end(), "Cannot find %p as kid scope", scope);
   this->kids_.erase(it);
   // When making memory benchmark on Fluid, we have to delete scope sync.
-  if (FLAGS_benchmark) {
+  if (FLAGS_benchmark || FLAGS_eager_delete_scope) {
     delete scope;
   } else {
     Async([scope] { delete scope; });
......
......@@ -107,7 +107,8 @@ def __bootstrap__():
     os.environ['OMP_NUM_THREADS'] = str(num_threads)
     read_env_flags = [
-        'use_pinned_memory', 'check_nan_inf', 'benchmark', 'warpctc_dir'
+        'use_pinned_memory', 'check_nan_inf', 'benchmark', 'warpctc_dir',
+        'eager_delete_scope'
     ]
     if core.is_compiled_with_cuda():
         read_env_flags += ['fraction_of_gpu_memory_to_use']
......
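Since `eager_delete_scope` is now listed in `read_env_flags`, it should be controllable the same way as the other flags in that list, i.e. through a `FLAGS_`-prefixed environment variable set before `paddle.fluid` is imported. The snippet below is a minimal sketch of that usage; the environment-variable mapping and the `'false'` value follow the usual gflags convention and are assumptions on my part, not something shown in this diff.

```python
# Sketch only: assumes the Fluid bootstrap maps each name in read_env_flags
# to a FLAGS_<name> environment variable (standard gflags convention).
import os

# Must be set before paddle.fluid is imported, because __bootstrap__()
# reads the environment only once at import time.
os.environ['FLAGS_eager_delete_scope'] = 'false'  # opt back into async scope deletion

import paddle.fluid as fluid  # noqa: E402  (import after setting the flag)

# With the flag off, Scope::DeleteScope should fall back to deleting local
# scopes asynchronously, unless FLAGS_benchmark forces synchronous deletion.
```

Leaving the flag at its default (`true`) keeps the behaviour introduced by this PR: local scopes are destroyed synchronously, trading roughly 1% of destruction performance for lower GPU memory usage, as the flag description above states.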