add transformer prune unittest (#1362)

* add act unittest

add transformer prune unittest (#1362)
* add act unittest
50ec7275 · ceci3 · GitHub · c3c6ef19 · 50ec7275 · 50ec7275
8 changed files
--- a/paddleslim/auto_compression/compressor.py
+++ b/paddleslim/auto_compression/compressor.py
@@ -640,6 +640,11 @@ class AutoCompression:
                    model_filename=self.model_filename,
                    params_filename=self.params_filename,
                    executor=self._exe)
+            if self.eval_function is None:
+                # If eval_function is None, ptq_hpo uses the EMD distance to evaluate the quantized model, so it needs a dataloader without labels.
+                eval_dataloader = self.train_dataloader
+            else:
+                eval_dataloader = self.eval_dataloader
            post_quant_hpo.quant_post_hpo(
                self._exe,
                self._places,
@@ -647,7 +652,7 @@ class AutoCompression:
                quantize_model_path=os.path.join(
                    self.tmp_dir, 'strategy_{}'.format(str(strategy_idx + 1))),
                train_dataloader=self.train_dataloader,
-                eval_dataloader=self.eval_dataloader,
+                eval_dataloader=eval_dataloader,
                eval_function=self.eval_function,
                model_filename=self.model_filename,
                params_filename=self.params_filename,

--- a/paddleslim/auto_compression/utils/fake_ptq.py
+++ b/paddleslim/auto_compression/utils/fake_ptq.py
@@ -47,7 +47,9 @@ def post_quant_fake(executor,
        set(_weight_supported_quantizable_op_type +
            _act_supported_quantizable_op_type + _dynamic_quantize_op_type))
    _place = executor.place
-    _scope = paddle.static.global_scope()
+    _scope = paddle.static.Scope()
+
+    with paddle.static.scope_guard(_scope):
        if is_full_quantize:
            _quantizable_op_type = _support_quantize_op_type
        else:

--- a/tests/act/qat_dist_train.yaml
+++ b/tests/act/qat_dist_train.yaml
@@ -10,7 +10,7 @@ Distillation:

 TrainConfig:
  epochs: 1
-  eval_iter: 1070
+  eval_iter: 1
  learning_rate: 2.0e-5
  optimizer_builder:
    optimizer: 

--- a/tests/act/test_act_api.py
+++ b/tests/act/test_act_api.py
@@ -125,7 +125,7 @@ class TestLoadONNXModel(ACTBase):
    def __init__(self, *args, **kwargs):
        super(TestLoadONNXModel, self).__init__(*args, **kwargs)
        os.system(
-            'wget https://paddle-slim-models.bj.bcebos.com/act/yolov5s.onnx')
+            'wget -q https://paddle-slim-models.bj.bcebos.com/act/yolov5s.onnx')
        self.model_dir = 'yolov5s.onnx'

    def test_compress(self):

--- a/tests/act/test_act_sparse.py
+++ b/tests/act/test_act_sparse.py
+import os
+import sys
+import unittest
+sys.path.append("../../")
+import numpy as np
+import paddle
+from paddle.io import Dataset
+from paddleslim.auto_compression import AutoCompression
+paddle.enable_static()
+
+
+class RandomEvalDataset(Dataset):
+    """Unlabeled dataset that yields randomly generated float32 images.
+
+    Every lookup draws a fresh random array, so reading the same index twice
+    does not return the same sample.
+    """
+
+    def __init__(self, num_samples, image_shape=(3, 398, 224), class_num=10):
+        """Store the dataset size and the shape of each generated image.
+
+        Args:
+            num_samples: Value reported by ``len()``.
+            image_shape: Shape of each generated image. The default is a
+                tuple so that no mutable object is shared between instances.
+            class_num: Stored on the instance; not used when generating
+                samples.
+        """
+        self.num_samples = num_samples
+        self.image_shape = image_shape
+        self.class_num = class_num
+
+    def __getitem__(self, idx):
+        """Return a random float32 array of ``image_shape``; ``idx`` is ignored."""
+        return np.random.random(self.image_shape).astype('float32')
+
+    def __len__(self):
+        """Return the configured number of samples."""
+        return self.num_samples
+
+
+class ACTSparse(unittest.TestCase):
+    """End-to-end AutoCompression run on the ppseg_lite_portrait model.
+
+    The training data is randomly generated and unlabeled.
+    """
+
+    def __init__(self, *args, **kwargs):
+        """Fetch the model if it is missing, then build the dataset and config."""
+        super(ACTSparse, self).__init__(*args, **kwargs)
+        # Download and unpack the inference model only when its directory is
+        # not already present in the current working directory.
+        # NOTE: the os.system return codes are not checked.
+        if not os.path.exists('ppseg_lite_portrait_398x224_with_softmax'):
+            os.system(
+                "wget -q https://paddleseg.bj.bcebos.com/dygraph/ppseg/ppseg_lite_portrait_398x224_with_softmax.tar.gz"
+            )
+            os.system(
+                'tar -xzvf ppseg_lite_portrait_398x224_with_softmax.tar.gz')
+        self.create_dataloader()
+        self.get_train_config()
+
+    def create_dataloader(self):
+        """Create the random dataset; the DataLoader itself is built in test_demo."""
+        # define a random dataset
+        self.eval_dataset = RandomEvalDataset(32)
+
+    def get_train_config(self):
+        """Build the in-memory config dict that is passed to AutoCompression."""
+        self.train_config = {
+            'TrainConfig': {
+                'epochs': 1,
+                'eval_iter': 1,
+                'learning_rate': 5.0e-03,
+                'optimizer_builder': {
+                    'optimizer': {
+                        'type': 'SGD'
+                    },
+                    "weight_decay": 0.0005,
+                }
+            }
+        }
+
+    def test_demo(self):
+        # Static-graph placeholder for the image batch; the loader below
+        # feeds it with samples from the random dataset.
+        # NOTE(review): assumes the model's input is named 'x' -- confirm.
+        image = paddle.static.data(
+            name='x', shape=[-1, 3, 398, 224], dtype='float32')
+        # Despite the attribute name, eval_dataset is used as training data.
+        train_loader = paddle.io.DataLoader(
+            self.eval_dataset, feed_list=[image], batch_size=4)
+
+        # No eval dataloader and no eval callback are supplied here.
+        ac = AutoCompression(
+            model_dir="./ppseg_lite_portrait_398x224_with_softmax",
+            model_filename="model.pdmodel",
+            params_filename="model.pdiparams",
+            input_shapes=[1, 3, 398, 224],
+            config=self.train_config,
+            save_dir="ppliteseg_output",
+            train_dataloader=train_loader,
+            deploy_hardware='SD710')
+        ac.compress()
+        # Remove the output directory; not reached if compress() raises.
+        os.system('rm -rf ppliteseg_output')
+
+
+# Run the test cases in this file when it is executed as a script.
+if __name__ == '__main__':
+    unittest.main()
--- a/tests/act/test_demo.py
+++ b/tests/act/test_demo.py
@@ -31,10 +31,12 @@ class ImageNetDataset(DatasetFolder):
 class ACTDemo(unittest.TestCase):
    def __init__(self, *args, **kwargs):
        super(ACTDemo, self).__init__(*args, **kwargs)
+        if not os.path.exists('MobileNetV1_infer'):
            os.system(
                'wget https://paddle-imagenet-models-name.bj.bcebos.com/dygraph/inference/MobileNetV1_infer.tar'
            )
            os.system('tar -xf MobileNetV1_infer.tar')
+        if not os.path.exists('ILSVRC2012_data_demo'):
            os.system(
                'wget https://sys-p0.bj.bcebos.com/slim_ci/ILSVRC2012_data_demo.tar.gz'
            )

--- a/tests/act/test_eval_function.py
+++ b/tests/act/test_eval_function.py
+import os
+import sys
+import unittest
+import numpy as np
+sys.path.append("../../")
+import paddle
+from PIL import Image
+from paddle.vision.datasets import DatasetFolder
+from paddle.vision.transforms import transforms
+from paddleslim.auto_compression import AutoCompression
+paddle.enable_static()
+
+
+class ImageNetDataset(DatasetFolder):
+    """ImageNet-style dataset read from ``train_list.txt`` / ``val_list.txt``.
+
+    In ``'train'`` mode each sample is an image only; in any other mode each
+    sample is an ``(image, label)`` pair.
+    """
+
+    def __init__(self, data_dir, image_size=224, mode='train'):
+        """Build the preprocessing pipeline and load the sample list.
+
+        Args:
+            data_dir: Directory holding the list files; image paths found in
+                the list files are joined onto it.
+            image_size: Size passed to ``CenterCrop``.
+            mode: ``'train'`` reads ``train_list.txt`` and shuffles it; any
+                other value reads ``val_list.txt`` in file order.
+        """
+        super(ImageNetDataset, self).__init__(data_dir)
+        self.data_dir = data_dir
+        self.mode = mode
+        normalize = transforms.Normalize(
+            mean=[123.675, 116.28, 103.53], std=[58.395, 57.120, 57.375])
+        self.transform = transforms.Compose([
+            transforms.Resize(256), transforms.CenterCrop(image_size),
+            transforms.Transpose(), normalize
+        ])
+        list_name = 'train_list.txt' if mode == 'train' else 'val_list.txt'
+        with open(os.path.join(data_dir, list_name)) as flist:
+            lines = [line.strip() for line in flist]
+        if mode == 'train':
+            np.random.shuffle(lines)
+        # Each line is split on whitespace; __getitem__ unpacks the result
+        # as (relative image path, label).
+        self.samples = [line.split() for line in lines]
+
+    def _load_rgb(self, img_path):
+        """Open an image under ``data_dir``, convert it to RGB and transform it."""
+        # The context manager closes the file; convert() returns a separate
+        # image object, so it stays usable after the file is closed.
+        with Image.open(os.path.join(self.data_dir, img_path)) as img:
+            rgb = img.convert('RGB')
+        return self.transform(rgb)
+
+    def __getitem__(self, idx):
+        """Return the transformed image, plus an int64 label outside train mode."""
+        img_path, label = self.samples[idx]
+        image = self._load_rgb(img_path)
+        if self.mode == 'train':
+            return image
+        return image, np.array([label]).astype('int64')
+
+    def __len__(self):
+        """Return the number of entries read from the list file."""
+        return len(self.samples)
+
+
+class ACTEvalFunction(unittest.TestCase):
+    """AutoCompression run on MobileNetV1 that is scored by a user eval callback."""
+
+    def __init__(self, *args, **kwargs):
+        """Download the model and the demo dataset when they are not present."""
+        super(ACTEvalFunction, self).__init__(*args, **kwargs)
+        # Each archive is fetched and unpacked only if its target directory
+        # is missing from the current working directory.
+        if not os.path.exists('MobileNetV1_infer'):
+            os.system(
+                'wget -q https://paddle-imagenet-models-name.bj.bcebos.com/dygraph/inference/MobileNetV1_infer.tar'
+            )
+            os.system('tar -xf MobileNetV1_infer.tar')
+        if not os.path.exists('ILSVRC2012_data_demo'):
+            os.system(
+                'wget -q https://sys-p0.bj.bcebos.com/slim_ci/ILSVRC2012_data_demo.tar.gz'
+            )
+            os.system('tar -xf ILSVRC2012_data_demo.tar.gz')
+
+    def test_demo(self):
+        # Default mode is 'train', so this dataset yields images without labels.
+        train_dataset = ImageNetDataset("./ILSVRC2012_data_demo/ILSVRC2012/")
+        image = paddle.static.data(
+            name='inputs', shape=[None] + [3, 224, 224], dtype='float32')
+        # NOTE(review): declared as float32 although the validation dataset
+        # produces int64 labels and eval_function casts them to int64 --
+        # confirm the intended dtype.
+        label = paddle.static.data(
+            name='labels', shape=[None] + [1], dtype='float32')
+        train_loader = paddle.io.DataLoader(
+            train_dataset, feed_list=[image], batch_size=32, return_list=False)
+
+        # NOTE(review): reader_wrapper is defined but never called in this test.
+        def reader_wrapper(reader, input_name):
+            def gen():
+                for i, (imgs, label) in enumerate(reader()):
+                    yield {input_name: imgs}
+
+            return gen
+
+        # Builds the validation loader. Only batch_size is used: data_dir,
+        # crop_size, resize_size and place are ignored and the dataset path
+        # is hard-coded.
+        def eval_reader(data_dir,
+                        batch_size,
+                        crop_size,
+                        resize_size,
+                        place=None):
+            val_dataset = ImageNetDataset(
+                "./ILSVRC2012_data_demo/ILSVRC2012/", mode='val')
+            val_loader = paddle.io.DataLoader(
+                val_dataset,
+                feed_list=[image, label],
+                batch_size=batch_size,
+                shuffle=False,
+                drop_last=False,
+                num_workers=0,
+                return_list=False)
+            return val_loader
+
+        # Evaluation callback handed to AutoCompression. It runs the given
+        # program over the validation loader and returns the first averaged
+        # metric (top-1 accuracy in the single-input branch).
+        def eval_function(exe, compiled_test_program, test_feed_names,
+                          test_fetch_list):
+            val_loader = eval_reader(
+                './ILSVRC2012_data_demo/ILSVRC2012/',
+                batch_size=32,
+                crop_size=224,
+                resize_size=256)
+
+            results = []
+            print('Evaluating...')
+            for batch_id, data in enumerate(val_loader):
+                # Each batch is read as data[0][<feed variable name>].
+                image = data[0]['inputs']
+                label = data[0]['labels']
+                # top1_acc, top5_acc
+                if len(test_feed_names) == 1:
+                    # The program takes only the image: compute top-1 and
+                    # top-5 accuracy here from the fetched predictions.
+                    image = np.array(image)
+                    label = np.array(label).astype('int64')
+                    pred = exe.run(compiled_test_program,
+                                   feed={test_feed_names[0]: image},
+                                   fetch_list=test_fetch_list)
+                    pred = np.array(pred[0])
+                    label = np.array(label)
+                    # argsort is ascending, so the last columns hold the
+                    # highest-scoring class indices.
+                    sort_array = pred.argsort(axis=1)
+                    top_1_pred = sort_array[:, -1:][:, ::-1]
+                    top_1 = np.mean(label == top_1_pred)
+                    top_5_pred = sort_array[:, -5:][:, ::-1]
+                    acc_num = 0
+                    for i in range(len(label)):
+                        if label[i][0] in top_5_pred[i]:
+                            acc_num += 1
+                    top_5 = float(acc_num) / len(label)
+                    results.append([top_1, top_5])
+                else:
+                    # Evaluate an "eval model" whose inputs are image and label and whose outputs are top-1 and top-5 accuracy.
+                    image = np.array(image)
+                    label = np.array(label).astype('int64')
+                    result = exe.run(compiled_test_program,
+                                     feed={
+                                         test_feed_names[0]: image,
+                                         test_feed_names[1]: label
+                                     },
+                                     fetch_list=test_fetch_list)
+                    result = [np.mean(r) for r in result]
+                    results.append(result)
+                if batch_id % 100 == 0:
+                    print('Eval iter: ', batch_id)
+            # Average each metric over all batches.
+            result = np.mean(np.array(results), axis=0)
+            return result[0]
+
+        # The config path is relative to the current working directory.
+        ac = AutoCompression(
+            model_dir="./MobileNetV1_infer",
+            model_filename="inference.pdmodel",
+            params_filename="inference.pdiparams",
+            save_dir="MobileNetV1_eval_quant",
+            config='./qat_dist_train.yaml',
+            train_dataloader=train_loader,
+            eval_callback=eval_function)
+        ac.compress()
+        # Remove the output directory; not reached if compress() raises.
+        os.system('rm -rf MobileNetV1_eval_quant')
+
+
+# Run the test cases in this file when it is executed as a script.
+if __name__ == '__main__':
+    unittest.main()
--- a/tests/act/test_nlp_ac.py
+++ b/tests/act/test_nlp_ac.py
+import os
+import sys
+sys.path.append("../../")
+import numpy as np
+import unittest
+import paddle
+from paddle.io import Dataset
+from paddleslim.common import load_config
+from paddleslim.auto_compression.compressor import AutoCompression
+
+
+class RandomDataset(Dataset):
+    """Unlabeled synthetic dataset of ``(input_ids, token_type_ids)`` pairs."""
+
+    def __init__(self, num_samples, sample_shape=(128, )):
+        """Store the dataset size and the shape of each generated array.
+
+        Args:
+            num_samples: Value reported by ``len()``.
+            sample_shape: Shape of each generated array. The default is a
+                tuple so that no mutable object is shared between instances.
+        """
+        self.num_samples = num_samples
+        self.sample_shape = sample_shape
+
+    def __getitem__(self, idx):
+        """Return two int64 arrays of ``sample_shape``; ``idx`` is ignored.
+
+        NOTE: ``np.random.random`` draws from [0.0, 1.0), so the cast to
+        int64 truncates every element to 0.
+        """
+        input_ids = np.random.random(self.sample_shape).astype('int64')
+        token_type_ids = np.random.random(self.sample_shape).astype('int64')
+        return input_ids, token_type_ids
+
+    def __len__(self):
+        """Return the configured number of samples."""
+        return self.num_samples
+
+
+class RandomEvalDataset(Dataset):
+    """Synthetic dataset of ``(input_ids, token_type_ids, labels)`` triples."""
+
+    def __init__(self, num_samples, sample_shape=(128, )):
+        """Store the dataset size and the shape of each generated array.
+
+        Args:
+            num_samples: Value reported by ``len()``.
+            sample_shape: Shape of the two id arrays. The default is a tuple
+                so that no mutable object is shared between instances.
+        """
+        self.num_samples = num_samples
+        self.sample_shape = sample_shape
+
+    def __getitem__(self, idx):
+        """Return two int64 id arrays and a one-element label; ``idx`` is ignored.
+
+        NOTE: ``np.random.random`` draws from [0.0, 1.0), so the cast to
+        int64 truncates every id to 0. The label is always 1.
+        """
+        input_ids = np.random.random(self.sample_shape).astype('int64')
+        token_type_ids = np.random.random(self.sample_shape).astype('int64')
+        labels = np.ones([1]).astype('int64')
+        return input_ids, token_type_ids, labels
+
+    def __len__(self):
+        """Return the configured number of samples."""
+        return self.num_samples
+
+
+### select transformer_prune and qat
+class NLPAutoCompress(unittest.TestCase):
+    """End-to-end AutoCompression run on the afqmc model with synthetic data."""
+
+    def __init__(self, *args, **kwargs):
+        """Enable static mode, fetch the model if missing, build datasets and config."""
+        super(NLPAutoCompress, self).__init__(*args, **kwargs)
+        paddle.enable_static()
+        # Download and unpack the model only when the 'afqmc' directory is
+        # not already present in the current working directory.
+        if not os.path.exists('afqmc'):
+            os.system(
+                'wget -q https://bj.bcebos.com/v1/paddle-slim-models/act/afqmc.tar'
+            )
+            os.system('tar -xf afqmc.tar')
+        self.create_dataset()
+        self.get_train_config()
+
+    def create_dataset(self):
+        """Create the synthetic train (unlabeled) and eval (labeled) datasets."""
+        self.fake_dataset = RandomDataset(32)
+        self.fake_eval_dataset = RandomEvalDataset(32)
+
+    def get_train_config(self):
+        """Build the in-memory config dict that is passed to AutoCompression."""
+        self.train_config = {
+            'TrainConfig': {
+                'epochs': 1,
+                'eval_iter': 1,
+                'learning_rate': 2.0e-5,
+                'optimizer_builder': {
+                    'optimizer': {
+                        'type': 'AdamW'
+                    },
+                    'weight_decay': 0.01
+                },
+            }
+        }
+
+    def test_nlp(self):
+        # Static-graph placeholders; -1 leaves the dimension unspecified.
+        input_ids = paddle.static.data(
+            name='input_ids', shape=[-1, -1], dtype='int64')
+        token_type_ids = paddle.static.data(
+            name='token_type_ids', shape=[-1, -1], dtype='int64')
+        labels = paddle.static.data(name='labels', shape=[-1], dtype='int64')
+        # The training loader feeds the two model inputs only.
+        train_loader = paddle.io.DataLoader(
+            self.fake_dataset,
+            feed_list=[input_ids, token_type_ids],
+            batch_size=32,
+            return_list=False)
+        # The evaluation loader additionally feeds the labels.
+        eval_loader = paddle.io.DataLoader(
+            self.fake_eval_dataset,
+            feed_list=[input_ids, token_type_ids, labels],
+            batch_size=32,
+            return_list=False)
+
+        # Evaluation goes through eval_dataloader; no eval callback is passed.
+        ac = AutoCompression(
+            model_dir='afqmc',
+            model_filename="inference.pdmodel",
+            params_filename="inference.pdiparams",
+            config=self.train_config,
+            save_dir="nlp_ac_output",
+            train_dataloader=train_loader,
+            eval_dataloader=eval_loader)
+        ac.compress()
+        # Clean up; not reached if compress() raises. The second command
+        # removes every path matching afqmc*, so the model is downloaded
+        # again on the next run.
+        os.system("rm -rf nlp_ac_output")
+        os.system("rm -rf afqmc*")
+
+
+# Run the test cases in this file when it is executed as a script.
+if __name__ == '__main__':
+    unittest.main()