From ce48236587548b6b0ab61831be4394f698ef20c5 Mon Sep 17 00:00:00 2001
From: whs <wanghaoshuang@baidu.com>
Date: Fri, 27 May 2022 14:06:32 +0800
Subject: [PATCH] Refine temp directory of ACT (#1145)

1. fix temp work dir not found error
2. move temp work dir to final directory formated by pid and datetime
3. remove temp work dir of ACT when job is done
4. remove temp work dir of quant_post_hpo when job is done
---
 paddleslim/auto_compression/compressor.py | 40 ++++++++++++++---------
 paddleslim/quant/quant_post_hpo.py        | 21 ++++++++++--
 2 files changed, 43 insertions(+), 18 deletions(-)

diff --git a/paddleslim/auto_compression/compressor.py b/paddleslim/auto_compression/compressor.py
index df764017..2102c43c 100644
--- a/paddleslim/auto_compression/compressor.py
+++ b/paddleslim/auto_compression/compressor.py
@@ -20,6 +20,7 @@ import inspect
 import shutil
 from collections import namedtuple
 from collections.abc import Iterable
+from time import gmtime, strftime
 import platform
 import paddle
 import paddle.distributed.fleet as fleet
@@ -67,7 +68,8 @@ class AutoCompression:
                 When all parameters are saved in a single file, set it
                 as filename. If parameters are saved in separate files,
                 set it as 'None'. Default : 'None'.
-            save_dir(str): The path to save compressed model.
+            save_dir(str): The path to save compressed model. The models in this directory will be overwrited
+                after calling 'compress()' function.
             train_data_loader(Python Generator, Paddle.io.DataLoader): The
                 Generator or Dataloader provides train data, and it could
                 return a batch every time.
@@ -108,11 +110,9 @@ class AutoCompression:
         if params_filename == 'None':
             params_filename = None
         self.params_filename = params_filename
-        base_path = os.path.basename(os.path.normpath(save_dir))
-        parent_path = os.path.abspath(os.path.join(save_dir, os.pardir))
-        base_path = base_path + '_temp'
-        self.save_dir = os.path.join(parent_path, base_path)
         self.final_dir = save_dir
+        if not os.path.exists(self.final_dir):
+            os.makedirs(self.final_dir)
         self.strategy_config = strategy_config
         self.train_config = train_config
         self.train_dataloader = train_dataloader
@@ -355,6 +355,13 @@ class AutoCompression:
         return program_info
 
     def compress(self):
+        # create a new temp directory in final dir
+        s_datetime = strftime("%Y-%m-%d-%H:%M:%S", gmtime())
+        tmp_base_name = "_".join(["tmp", str(os.getpid()), s_datetime])
+        self.tmp_dir = os.path.join(self.final_dir, tmp_base_name)
+        if not os.path.exists(self.tmp_dir):
+            os.makedirs(self.tmp_dir)
+
         for strategy_idx, (
                 strategy,
                 config) in enumerate(zip(self._strategy, self._config)):
@@ -371,7 +378,7 @@ class AutoCompression:
                 self.single_strategy_compress(quant_strategy[0],
                                               quant_config[0], strategy_idx)
         tmp_model_path = os.path.join(
-            self.save_dir, 'strategy_{}'.format(str(strategy_idx + 1)))
+            self.tmp_dir, 'strategy_{}'.format(str(strategy_idx + 1)))
         final_model_path = os.path.join(self.final_dir)
         if not os.path.exists(final_model_path):
             os.makedirs(final_model_path)
@@ -382,6 +389,7 @@ class AutoCompression:
         if paddle.distributed.get_rank() == 0:
             shutil.move(tmp_model_file, final_model_file)
             shutil.move(tmp_params_file, final_params_file)
+            shutil.rmtree(self.tmp_dir)
             _logger.info(
                 "==> Finished the ACT process and the final model is saved in:{}".
                 format(final_model_path))
@@ -395,7 +403,7 @@ class AutoCompression:
                 self._exe,
                 model_dir=self.model_dir,
                 quantize_model_path=os.path.join(
-                    self.save_dir, 'strategy_{}'.format(str(strategy_idx + 1))),
+                    self.tmp_dir, 'strategy_{}'.format(str(strategy_idx + 1))),
                 data_loader=self.train_dataloader,
                 model_filename=self.model_filename,
                 params_filename=self.params_filename,
@@ -425,7 +433,7 @@ class AutoCompression:
                 self._places,
                 model_dir=self.model_dir,
                 quantize_model_path=os.path.join(
-                    self.save_dir, 'strategy_{}'.format(str(strategy_idx + 1))),
+                    self.tmp_dir, 'strategy_{}'.format(str(strategy_idx + 1))),
                 train_dataloader=self.train_dataloader,
                 eval_dataloader=self.eval_dataloader,
                 eval_function=self.eval_function,
@@ -452,7 +460,7 @@ class AutoCompression:
                 model_dir = self.model_dir
             else:
                 model_dir = os.path.join(
-                    self.save_dir, 'strategy_{}'.format(str(strategy_idx)))
+                    self.tmp_dir, 'strategy_{}'.format(str(strategy_idx)))
 
             [inference_program, feed_target_names, fetch_targets]= paddle.fluid.io.load_inference_model( \
                 dirname=model_dir, \
@@ -528,7 +536,7 @@ class AutoCompression:
                         if metric > best_metric:
                             paddle.static.save(
                                 program=test_program_info.program._program,
-                                model_path=os.path.join(self.save_dir,
+                                model_path=os.path.join(self.tmp_dir,
                                                         'best_model'))
                             best_metric = metric
                             if self.metric_before_compressed is not None and float(
@@ -555,12 +563,12 @@ class AutoCompression:
             test_program_info.program,
             paddle.static.CompiledProgram) else test_program_info.program
 
-        if os.path.exists(os.path.join(self.save_dir, 'best_model.pdparams')):
+        if os.path.exists(os.path.join(self.tmp_dir, 'best_model.pdparams')):
             paddle.static.load(test_program,
-                               os.path.join(self.save_dir, 'best_model'))
-            os.remove(os.path.join(self.save_dir, 'best_model.pdmodel'))
-            os.remove(os.path.join(self.save_dir, 'best_model.pdopt'))
-            os.remove(os.path.join(self.save_dir, 'best_model.pdparams'))
+                               os.path.join(self.tmp_dir, 'best_model'))
+            os.remove(os.path.join(self.tmp_dir, 'best_model.pdmodel'))
+            os.remove(os.path.join(self.tmp_dir, 'best_model.pdopt'))
+            os.remove(os.path.join(self.tmp_dir, 'best_model.pdparams'))
 
         if 'qat' in strategy:
             float_program, int8_program = convert(test_program_info.program._program, self._places, self._quant_config, \
@@ -568,7 +576,7 @@ class AutoCompression:
                                           save_int8=True)
             test_program_info.program = float_program
 
-        model_dir = os.path.join(self.save_dir,
+        model_dir = os.path.join(self.tmp_dir,
                                  'strategy_{}'.format(str(strategy_idx + 1)))
         if not os.path.exists(model_dir):
             os.makedirs(model_dir)
diff --git a/paddleslim/quant/quant_post_hpo.py b/paddleslim/quant/quant_post_hpo.py
index a6ff710f..08cbcfa8 100755
--- a/paddleslim/quant/quant_post_hpo.py
+++ b/paddleslim/quant/quant_post_hpo.py
@@ -24,6 +24,8 @@ import paddle.fluid as fluid
 import logging
 import argparse
 import functools
+import shutil
+import glob
 from scipy.stats import wasserstein_distance
 
 # smac
@@ -36,6 +38,20 @@ from smac.scenario.scenario import Scenario
 from paddleslim.common import get_logger
 from paddleslim.quant import quant_post
 
+SMAC_TMP_FILE_PATTERN = "smac3-output*"
+
+
+def remove(path):
+    """Remove files or directories matched by regex.
+    Args:
+        path(str): regular expressions to match the files and directories.
+    """
+    for p in glob.glob(path):
+        if os.path.isdir(p):
+            shutil.rmtree(p)
+        else:
+            os.remove(p)
+
 
 class QuantConfig:
     """quant config"""
@@ -472,7 +488,7 @@ def quant_post_hpo(
             bias_correction=bias_correct, \
             batch_size=batch_size, \
             batch_nums=batch_num)
-
+        shutil.rmtree(g_quant_model_cache_path)
         return
 
     cs.add_hyperparameters(hyper_params)
@@ -486,7 +502,6 @@ def quant_post_hpo(
         "limit_resources": "False",
         "memory_limit": 4096  # adapt this to reasonable value for your hardware
     })
-
     # To optimize, we pass the function to the SMAC-object
     smac = SMAC4HPO(
         scenario=scenario, rng=np.random.RandomState(42), tae_runner=quantize)
@@ -504,4 +519,6 @@ def quant_post_hpo(
 
     inc_value = smac.get_tae_runner().run(incumbent, 1)[1]
     print("Optimized Value: %.8f" % inc_value)
+    shutil.rmtree(g_quant_model_cache_path)
+    remove(SMAC_TMP_FILE_PATTERN)
     print("quantize completed")
-- 
GitLab