Unverified commit 2131559d, authored by Bai Yifan, committed by GitHub

Remove slim from paddle framework (#25666)

* Remove slim from paddle framework
test=develop
Co-authored-by: wanghaoshuang <wanghaoshuang@baidu.com>
Parent: bca30316
@@ -25,7 +25,6 @@ from .quantize import *
from . import reader
from .reader import *
from . import slim
from .slim import *
from . import utils
from .utils import *
from . import extend_optimizer
@@ -43,7 +42,6 @@ __all__ += memory_usage_calc.__all__
__all__ += op_frequence.__all__
__all__ += quantize.__all__
__all__ += reader.__all__
__all__ += slim.__all__
__all__ += utils.__all__
__all__ += extend_optimizer.__all__
__all__ += ['mixed_precision']
......
@@ -11,6 +11,3 @@
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
from .core import *
__all__ = ['Compressor', ]
# Copyright (c) 2018 PaddlePaddle Authors. All Rights Reserve.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
from . import config
from .config import *
from . import compressor
from .compressor import *
from . import strategy
from .strategy import *
__all__ = config.__all__ + compressor.__all__ + strategy.__all__
# Copyright (c) 2018 PaddlePaddle Authors. All Rights Reserve.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
import inspect
import funcsigs
import yaml
from collections import OrderedDict
from ..prune import *
from ..quantization import *
from .strategy import *
from ..distillation import *
from ..searcher import *
from ..nas import *
__all__ = ['ConfigFactory']
"""This factory is used to create instances by loading and parsing configure file with yaml format.
"""
PLUGINS = ['pruners', 'quantizers', 'distillers', 'strategies', 'controllers']
class ConfigFactory(object):
def __init__(self, config):
"""Init a factory from configure file."""
self.instances = {}
self.compressor = {}
self.version = None
self._parse_config(config)
def instance(self, name):
"""
Get instance from factory.
"""
if name in self.instances:
return self.instances[name]
else:
return None
def _new_instance(self, name, attrs):
if name not in self.instances:
class_ = globals()[attrs['class']]
sig = funcsigs.signature(class_.__init__)
keys = [
param.name for param in sig.parameters.values()
if (param.kind == param.POSITIONAL_OR_KEYWORD)
][1:]
keys = set(attrs.keys()).intersection(set(keys))
args = {}
for key in keys:
value = attrs[key]
if isinstance(value, str) and value.lower() == 'none':
value = None
if isinstance(value, str) and value in self.instances:
value = self.instances[value]
if isinstance(value, list):
for i in range(len(value)):
if isinstance(value[i],
str) and value[i] in self.instances:
value[i] = self.instances[value[i]]
args[key] = value
self.instances[name] = class_(**args)
return self.instances.get(name)
def _parse_config(self, config):
assert config
with open(config, 'r') as config_file:
key_values = self._ordered_load(config_file)
for key in key_values:
# parse version
if key == 'version' and self.version is None:
self.version = int(key_values['version'])
assert self.version == int(key_values['version'])
# parse pruners
if key in PLUGINS:
instances = key_values[key]
for name in instances:
self._new_instance(name, instances[name])
if key == 'compressor':
self.compressor['strategies'] = []
self.compressor['epoch'] = key_values[key]['epoch']
if 'init_model' in key_values[key]:
self.compressor['init_model'] = key_values[key][
'init_model']
if 'checkpoint_path' in key_values[key]:
self.compressor['checkpoint_path'] = key_values[key][
'checkpoint_path']
if 'eval_epoch' in key_values[key]:
self.compressor['eval_epoch'] = key_values[key][
'eval_epoch']
if 'strategies' in key_values[key]:
for name in key_values[key]['strategies']:
strategy = self.instance(name)
self.compressor['strategies'].append(strategy)
if key == 'include':
for config_file in key_values[key]:
self._parse_config(config_file.strip())
def _ordered_load(self,
stream,
Loader=yaml.Loader,
object_pairs_hook=OrderedDict):
"""
See: https://stackoverflow.com/questions/5121931/in-python-how-can-you-load-yaml-mappings-as-ordereddicts
"""
class OrderedLoader(Loader):
pass
def construct_mapping(loader, node):
loader.flatten_mapping(node)
return object_pairs_hook(loader.construct_pairs(node))
OrderedLoader.add_constructor(
yaml.resolver.BaseResolver.DEFAULT_MAPPING_TAG, construct_mapping)
return yaml.load(stream, OrderedLoader)
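# Usage sketch (illustrative; 'compress.yaml' and the strategy name are
# hypothetical): a config file wires plugin sections named in PLUGINS,
# plus 'version', 'compressor' and 'include', e.g.
#
#   version: 1.0
#   strategies:
#     my_prune_strategy:
#       class: 'UniformPruneStrategy'
#       start_epoch: 0
#       end_epoch: 100
#   compressor:
#     epoch: 120
#     checkpoint_path: './checkpoints/'
#     strategies:
#       - my_prune_strategy
#
# factory = ConfigFactory('compress.yaml')
# strategy = factory.instance('my_prune_strategy')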
# Copyright (c) 2018 PaddlePaddle Authors. All Rights Reserve.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
__all__ = ['Strategy']
class Strategy(object):
"""
Base class for all strategies.
"""
def __init__(self, start_epoch=0, end_epoch=0):
"""
Args:
start_epoch: The first epoch to apply the strategy.
end_epoch: The last epoch to apply the strategy.
"""
self.start_epoch = start_epoch
self.end_epoch = end_epoch
def __getstate__(self):
d = {}
for key in self.__dict__:
if key not in ["start_epoch", "end_epoch"]:
d[key] = self.__dict__[key]
return d
def on_compression_begin(self, context):
pass
def on_epoch_begin(self, context):
pass
def on_epoch_end(self, context):
pass
def on_batch_begin(self, context):
pass
def on_batch_end(self, context):
pass
def on_compression_end(self, context):
pass
def restore_from_checkpoint(self, context):
pass
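# A minimal sketch (not shipped code) of a custom strategy: subclass
# Strategy and override only the callbacks you need; the compressor
# invokes them at the matching points of the training loop.
#
# class LoggingStrategy(Strategy):
#     def on_epoch_begin(self, context):
#         if self.start_epoch <= context.epoch_id < self.end_epoch:
#             print('epoch {} begins'.format(context.epoch_id))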
# Copyright (c) 2019 PaddlePaddle Authors. All Rights Reserve.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
from . import distiller
from .distiller import *
from . import distillation_strategy
from .distillation_strategy import *
__all__ = distiller.__all__
__all__ += distillation_strategy.__all__
# Copyright (c) 2019 PaddlePaddle Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
from ..core.strategy import Strategy
from ....framework import Program, Variable, program_guard
from ....log_helper import get_logger
from .... import Executor
import logging
__all__ = ['DistillationStrategy']
_logger = get_logger(
__name__, logging.INFO, fmt='%(asctime)s-%(levelname)s: %(message)s')
class DistillationStrategy(Strategy):
def __init__(self, distillers=None, start_epoch=0, end_epoch=0):
"""
Args:
distillers(list): A list of distillers used to combine the student graph and the teacher graph
by adding distillation losses.
start_epoch(int): The epoch at which to merge the student graph and the teacher graph for
distillation training. default: 0
end_epoch(int): The epoch at which to finish distillation training. default: 0
"""
super(DistillationStrategy, self).__init__(start_epoch, end_epoch)
self.distillers = distillers
def restore_from_checkpoint(self, context):
# load from checkpoint
if context.epoch_id > 0:
if context.epoch_id > self.start_epoch and context.epoch_id < self.end_epoch:
_logger.info('Restore DistillationStrategy')
self._create_distillation_graph(context)
_logger.info('Restore DistillationStrategy finish.')
def on_epoch_begin(self, context):
if self.start_epoch == context.epoch_id:
_logger.info('DistillationStrategy::on_epoch_begin.')
self._create_distillation_graph(context)
_logger.info('DistillationStrategy set optimize_graph.')
def _create_distillation_graph(self, context):
"""
step 1: Merge student graph and teacher graph into distillation graph.
step 2: Add loss into distillation graph by distillers.
step 3: Append backward ops and optimize ops into distillation graph for training.
"""
# step 1
teacher = context.teacher_graphs[0]
for var in teacher.program.list_vars():
var.stop_gradient = True
graph = context.train_graph.clone()
graph.merge(teacher)
if 'loss' in graph.out_nodes:
graph.out_nodes['student_loss'] = graph.out_nodes['loss']
# step 2
for distiller in self.distillers:
graph = distiller.distiller_loss(graph)
# step 3
startup_program = Program()
with program_guard(graph.program, startup_program):
context.distiller_optimizer._name = 'distillation_optimizer'
# The learning rate variable may be created in another program.
# Update information in the optimizer to make the learning rate
# variable accessible in the current program.
optimizer = context.distiller_optimizer
if isinstance(optimizer._learning_rate, Variable):
optimizer._learning_rate_map[
graph.program] = optimizer._learning_rate
optimizer.minimize(graph.var(graph.out_nodes['loss'])._var)
exe = Executor(context.place)
exe.run(startup_program, scope=context.scope)
# backup graph for fine-tune after distillation
context.put('distillation_backup_optimize_graph',
context.optimize_graph)
context.optimize_graph = graph
def on_epoch_end(self, context):
if context.epoch_id == (self.end_epoch - 1):
_logger.info('DistillationStrategy::on_epoch_end.')
# restore optimize_graph for fine-tune or other strategy in next stage.
context.optimize_graph = context.get(
'distillation_backup_optimize_graph')
_logger.info(
'DistillationStrategy set context.optimize_graph to None.')
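# Usage sketch (feature-map names are placeholders): distill for the
# first 30 epochs with an FSP loss, then fall back to normal training.
#
# distiller = FSPDistiller(
#     student_pairs=[('s_block_in', 's_block_out')],
#     teacher_pairs=[('t_block_in', 't_block_out')])
# strategy = DistillationStrategy(
#     distillers=[distiller], start_epoch=0, end_epoch=30)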
# Copyright (c) 2019 PaddlePaddle Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
from .... import layers
from .... import optimizer
from .... import Executor
from .... import Program
from .... import program_guard
from .... import regularizer
__all__ = ['FSPDistiller', 'L2Distiller', 'SoftLabelDistiller']
class L2Distiller(object):
"""
Combine two layers from the student net and the teacher net by an l2-loss,
and add the loss into the total loss used for distillation training.
"""
def __init__(self,
student_feature_map,
teacher_feature_map,
distillation_loss_weight=1):
"""
Args:
student_feature_map(str): The name of feature map from student network.
teacher_feature_map(str): The name of feature map from teacher network.
Its shape should be the same as that of the student feature map.
distillation_loss_weight(float): The weight of the l2-loss.
"""
self.student_feature_map = student_feature_map
self.teacher_feature_map = teacher_feature_map
self.distillation_loss_weight = distillation_loss_weight
def distiller_loss(self, graph):
"""
Modify graph inplace to add l2-loss.
Args:
graph(GraphWrapper): The graph to be modified.
Returns:
GraphWrapper: The modified graph.
"""
distiller_pass = L2DistillerPass(self.student_feature_map,
self.teacher_feature_map,
self.distillation_loss_weight)
dis_graph = distiller_pass.apply(graph)
return dis_graph
class L2DistillerPass(object):
"""
The pass used to add l2-loss.
"""
def __init__(self,
student_feature_map,
teacher_feature_map,
distillation_loss_weight=1):
"""
Args:
student_feature_map(str): The name of feature map from student network.
teacher_feature_map(str): The name of feature map from teacher network.
Its shape should be the same as that of the student feature map.
distillation_loss_weight(float): The weight of the l2-loss.
"""
self.student_feature_map = student_feature_map
self.teacher_feature_map = teacher_feature_map
self.distillation_loss_weight = distillation_loss_weight
def apply(self, graph):
ret_graph = graph
with program_guard(ret_graph.program):
student_feature_map = ret_graph.var(self.student_feature_map)._var
teacher_feature_map = ret_graph.var(self.teacher_feature_map)._var
l2loss = layers.reduce_mean(
layers.square(student_feature_map - teacher_feature_map))
distillation_loss = l2loss * self.distillation_loss_weight
student_loss = 0
if 'loss' in ret_graph.out_nodes:
student_loss = ret_graph.var(ret_graph.out_nodes['loss'])._var
loss = distillation_loss + student_loss
ret_graph.out_nodes['loss'] = loss.name
ret_graph.out_nodes[
'l2loss_' + self.student_feature_map + "_" +
self.teacher_feature_map] = distillation_loss.name
return ret_graph
class FSPDistiller(object):
"""
Combine layers from student net and teacher net by fsp-loss.
"""
def __init__(self, student_pairs, teacher_pairs,
distillation_loss_weight=1):
"""
Args:
student_pairs(list<tuple>): Each tuple, with two variable names, in student_pairs indicates
a section in student network. The variables in a tuple should
have the same feature map size.
teacher_pairs(list<tuple>): Each tuple, with two variable names, in teacher_pairs indicates
a section in teacher network. The variables in a tuple should
have the same feature map size. The variable named teacher_pairs[i][j]
should have the same channel number as the variable named
student_pairs[i][j].
distillation_loss_weight(float): The weight of the fsp-loss. default: 1.
"""
self.student_pairs = student_pairs
self.teacher_pairs = teacher_pairs
self.distillation_loss_weight = distillation_loss_weight
def distiller_loss(self, graph):
"""
Modify graph inplace to add fsp-loss.
Args:
graph(GraphWrapper): The graph to be modified.
Returns:
GraphWrapper: The modified graph.
"""
distiller_pass = FSPDistillerPass(self.student_pairs,
self.teacher_pairs,
self.distillation_loss_weight)
dis_graph = distiller_pass.apply(graph)
return dis_graph
class FSPDistillerPass(object):
'''
Combine layers from student net and teacher net by fsp-loss.
'''
def __init__(self, s_pairs, t_pairs, distillation_loss_weight=1):
"""
Args:
s_pairs(list<tuple>): Each tuple, with two variable names, in student_pairs indicates
a section in student network. The variables in a tuple should
have the same feature map size.
t_pairs(list<tuple>): Each tuple, with two variable names, in teacher_pairs indicates
a section in teacher network. The variables in a tuple should
have the same feature map size. The variable named teacher_pairs[i][j]
should have the same channel number as the variable named
student_pairs[i][j].
distillation_loss_weight(float): The weight of the fsp-loss. default: 1.
"""
self.s_pairs = s_pairs
self.t_pairs = t_pairs
self.distillation_loss_weight = distillation_loss_weight
def apply(self, graph):
ret_graph = graph
with program_guard(ret_graph.program):
losses = []
for s_pair, t_pair in zip(self.s_pairs, self.t_pairs):
s_pair_start = ret_graph.var(s_pair[0])._var
s_pair_end = ret_graph.var(s_pair[1])._var
s_fsp_matrix = self._fsp_matrix(s_pair_start, s_pair_end)
t_pair_start = ret_graph.var(t_pair[0])._var
t_pair_end = ret_graph.var(t_pair[1])._var
t_fsp_matrix = self._fsp_matrix(t_pair_start, t_pair_end)
l2_loss = layers.reduce_mean(
layers.square(s_fsp_matrix - t_fsp_matrix))
losses.append(l2_loss)
distillation_loss = layers.sum(
losses) * self.distillation_loss_weight
student_loss = 0
if 'loss' in ret_graph.out_nodes:
student_loss = ret_graph.var(ret_graph.out_nodes['loss'])._var
loss = distillation_loss + student_loss
ret_graph.out_nodes['loss'] = loss.name
ret_graph.out_nodes[
'fsp_distillation_loss'] = distillation_loss.name
return ret_graph
def _fsp_matrix(self, fea_map_0, fea_map_1):
return layers.fsp_matrix(fea_map_0, fea_map_1)
class SoftLabelDistiller(object):
"""
Combine two layers from the student net and the teacher net by a softmax_with_cross_entropy loss,
and add the loss into the total loss used for distillation training.
"""
def __init__(self,
student_feature_map=None,
teacher_feature_map=None,
student_temperature=1.0,
teacher_temperature=1.0,
distillation_loss_weight=1):
"""
Args:
student_feature_map(str): The name of feature map from student network.
teacher_feature_map(str): The name of feature map from teacher network.
Its shape should be the same as that of the student feature map.
student_temperature(float): Temperature used to divide student_feature_map before softmax_with_cross_entropy. default: 1.0
teacher_temperature(float): Temperature used to divide teacher_feature_map before softmax_with_cross_entropy. default: 1.0
distillation_loss_weight(float): The weight of the soft-label loss.
"""
self.student_feature_map = student_feature_map
self.teacher_feature_map = teacher_feature_map
self.distillation_loss_weight = distillation_loss_weight
self.student_temperature = student_temperature
self.teacher_temperature = teacher_temperature
def distiller_loss(self, graph):
"""
Modify graph inplace to add softmax_with_cross_entropy loss.
Args:
graph(GraphWrapper): The graph to be modified.
Returns:
GraphWrapper: The modified graph.
"""
distiller_pass = SoftLabelDistillerPass(
self.student_feature_map, self.teacher_feature_map,
self.student_temperature, self.teacher_temperature,
self.distillation_loss_weight)
dis_graph = distiller_pass.apply(graph)
return dis_graph
class SoftLabelDistillerPass(object):
def __init__(self,
student_feature_map,
teacher_feature_map,
student_temperature,
teacher_temperature,
distillation_loss_weight=1):
"""
Args:
student_feature_map(str): The name of feature map from student network.
teacher_feature_map(str): The name of feature map from teacher network.
Its shape should be the same as that of the student feature map.
student_temperature(float): Temperature used to divide student_feature_map before softmax_with_cross_entropy.
teacher_temperature(float): Temperature used to divide teacher_feature_map before softmax_with_cross_entropy.
distillation_loss_weight(float): The weight of the soft-label loss.
"""
self.student_feature_map = student_feature_map
self.teacher_feature_map = teacher_feature_map
self.student_temperature = student_temperature
self.teacher_temperature = teacher_temperature
self.distillation_loss_weight = distillation_loss_weight
def apply(self, graph):
ret_graph = graph
with program_guard(ret_graph.program):
student_feature_map = ret_graph.var(self.student_feature_map)._var
teacher_feature_map = ret_graph.var(self.teacher_feature_map)._var
s_fea = layers.softmax(student_feature_map /
self.student_temperature)
t_fea = layers.softmax(teacher_feature_map /
self.teacher_temperature)
t_fea.stop_gradient = True
ce_loss = layers.reduce_mean(
layers.cross_entropy(
s_fea, t_fea, soft_label=True))
distillation_loss = ce_loss * self.distillation_loss_weight
student_loss = 0
if 'loss' in ret_graph.out_nodes:
student_loss = ret_graph.var(ret_graph.out_nodes['loss'])._var
loss = distillation_loss + student_loss
ret_graph.out_nodes['loss'] = loss.name
ret_graph.out_nodes[
'soft_label_loss_' + self.student_feature_map + "_" +
self.teacher_feature_map] = distillation_loss.name
return ret_graph
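# Illustrative construction of the three distillers above (all names
# are placeholders); each rewrites graph.out_nodes['loss'] through
# distiller_loss(graph):
#
# l2 = L2Distiller('student_fc', 'teacher_fc')
# fsp = FSPDistiller([('s_in', 's_out')], [('t_in', 't_out')])
# soft = SoftLabelDistiller('student_fc', 'teacher_fc',
#                           student_temperature=1.0,
#                           teacher_temperature=2.0,
#                           distillation_loss_weight=0.5)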
# Copyright (c) 2018 PaddlePaddle Authors. All Rights Reserve.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
from . import executor
from .executor import *
from . import graph_wrapper
from .graph_wrapper import *
__all__ = executor.__all__
__all__ += graph_wrapper.__all__
# Copyright (c) 2018 PaddlePaddle Authors. All Rights Reserve.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
from ....compiler import CompiledProgram
from ....data_feeder import DataFeeder
from .... import executor
from .graph_wrapper import GraphWrapper
__all__ = ['SlimGraphExecutor']
class SlimGraphExecutor(object):
"""
Wrapper of executor used to run GraphWrapper.
"""
def __init__(self, place):
self.exe = executor.Executor(place)
self.place = place
def run(self, graph, scope, data=None):
"""
Run a graph with a batch of data.
Args:
graph(GraphWrapper): The graph to be executed.
scope(fluid.core.Scope): The scope to be used.
data(list<tuple>): A batch of data. Each tuple in this list is a sample.
It will feed the items of tuple to the in_nodes of graph.
Returns:
results(list): A list of results, in the order indicated by graph.out_nodes.
"""
assert isinstance(graph, GraphWrapper)
feed = None
if data is not None and isinstance(data[0], dict):
# return list = False
feed = data
elif data is not None:
feeder = DataFeeder(
feed_list=list(graph.in_nodes.values()),
place=self.place,
program=graph.program)
feed = feeder.feed(data)
fetch_list = list(graph.out_nodes.values())
program = graph.compiled_graph if graph.compiled_graph else graph.program
results = self.exe.run(program,
scope=scope,
fetch_list=fetch_list,
feed=feed)
return results
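# Usage sketch (assumes a built GraphWrapper `graph`, a batch from a
# reader, and the default scope; names are illustrative):
#
# import paddle.fluid as fluid
# exe = SlimGraphExecutor(fluid.CPUPlace())
# results = exe.run(graph, fluid.global_scope(), data=batch)
# # results follow the order of graph.out_nodes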
# Copyright (c) 2019 PaddlePaddle Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
from collections import OrderedDict
from .... import io
from .... import compiler
from ....framework import Program
from ....framework import program_guard
from ....framework import Parameter
from ....framework import Variable
from ....executor import Executor
import copy
from collections import Iterable
from ....io import save_inference_model, load_inference_model, save_persistables
import numpy as np
import pickle
import os
__all__ = ['GraphWrapper', 'VarWrapper', 'OpWrapper']
OPTIMIZER_OPS = [
'momentum',
'lars_momentum',
'adagrad',
'adam',
'adamax',
'dpsgd',
'decayed_adagrad',
'adadelta',
'rmsprop',
]
class VarWrapper(object):
def __init__(self, var, graph):
assert isinstance(var, Variable)
assert isinstance(graph, GraphWrapper)
self._var = var
self._graph = graph
def __eq__(self, v):
"""
Override this function to support the `in` syntax in Python.
"""
return self._var.name == v._var.name
def name(self):
"""
Get the name of the variable.
"""
return self._var.name
def shape(self):
"""
Get the shape of the variable.
"""
return self._var.shape
def set_shape(self, shape):
"""
Set the shape of the variable.
"""
self._var.desc.set_shape(shape)
def inputs(self):
"""
Get all the operators that use this variable as output.
Returns:
list<OpWrapper>: A list of operators.
"""
ops = []
for op in self._graph.ops():
if self in op.all_outputs():
ops.append(op)
return ops
def outputs(self):
"""
Get all the operators that use this variable as input.
Returns:
list<OpWrapper>: A list of operators.
"""
ops = []
for op in self._graph.ops():
if self in op.all_inputs():
ops.append(op)
return ops
class OpWrapper(object):
def __init__(self, op, graph):
assert isinstance(graph, GraphWrapper)
self._op = op
self._graph = graph
def __eq__(self, op):
"""
Override this function to support the `in` syntax in Python.
"""
return self.idx() == op.idx()
def all_inputs(self):
"""
Get all the input variables of this operator.
"""
return [
self._graph.var(var_name) for var_name in self._op.input_arg_names
]
def all_outputs(self):
"""
Get all the output variables of this operator.
"""
return [
self._graph.var(var_name) for var_name in self._op.output_arg_names
]
def idx(self):
"""
Get the id of this operator.
"""
return self._op.idx
def type(self):
"""
Get the type of this operator.
"""
return self._op.type
def is_bwd_op(self):
"""
Whether this operator is backward op.
"""
return self.type().endswith('_grad')
def is_opt_op(self):
"""
Whether this operator is optimizer op.
"""
return self.type() in OPTIMIZER_OPS
def inputs(self, name):
"""
Get all the variables by the input name.
"""
return [self._graph.var(var_name) for var_name in self._op.input(name)]
def outputs(self, name):
"""
Get all the variables by the output name.
"""
return [self._graph.var(var_name) for var_name in self._op.output(name)]
def set_attr(self, key, value):
"""
Set the value of attribute by attribute's name.
Args:
key(str): the attribute name.
value(bool|int|str|float|list): the value of the attribute.
"""
self._op._set_attr(key, value)
def attr(self, name):
"""
Get the attribute by name.
Args:
name(str): the attribute name.
Returns:
bool|int|str|float|list: The attribute value. The return value
can be any valid attribute type.
"""
return self._op.attr(name)
class GraphWrapper(object):
"""
It is a wrapper of framework.Program with some special functions
for the paddle slim framework.
"""
def __init__(self, program=None, in_nodes=[], out_nodes=[]):
"""
Args:
program(framework.Program): The program to be wrapped. A new Program is created if None.
in_nodes(dict): A dict to indicate the input nodes of the graph.
The key is user-defined and human-readable name.
The value is the name of Variable.
out_nodes(dict): A dict to indicate the output nodes of the graph.
The key is user-defined and human-readable name.
The value is the name of Variable.
"""
super(GraphWrapper, self).__init__()
self.program = Program() if program is None else program
self.persistables = {}
self.teacher_persistables = {}
for var in self.program.list_vars():
if var.persistable:
self.persistables[var.name] = var
self.compiled_graph = None
in_nodes = [] if in_nodes is None else in_nodes
out_nodes = [] if out_nodes is None else out_nodes
self.in_nodes = OrderedDict(in_nodes)
self.out_nodes = OrderedDict(out_nodes)
self._attrs = OrderedDict()
def all_parameters(self):
"""
Get all the parameters in this graph.
Returns:
list<VarWrapper>: A list of VarWrapper instances.
"""
params = []
for block in self.program.blocks:
for param in block.all_parameters():
params.append(VarWrapper(param, self))
return params
def is_parameter(self, var):
"""
Whether the given variable is parameter.
Args:
var(VarWrapper): The given variable.
"""
return isinstance(var._var, Parameter)
def is_persistable(self, var):
"""
Whether the given variable is persistable.
Args:
var(VarWrapper): The given variable.
"""
return var._var.persistable
def compile(self, for_parallel=True, for_test=False, mem_opt=False):
"""
Compile the program in this wrapper to a framework.CompiledProgram for the next run.
This function must be called if the program is modified.
Args:
for_parallel(bool): Whether to run the program in a data-parallel way. default: True.
for_test(bool): Whether the compiled program is used for test.
mem_opt(bool): Whether to enable the inplace and memory_optimize build strategies. default: False.
"""
target = self.program
if for_test:
loss = None
else:
loss = self.out_nodes['loss']
if for_parallel:
# disable memory optimize for stable training
build_strategy = compiler.BuildStrategy()
build_strategy.enable_inplace = mem_opt
build_strategy.memory_optimize = mem_opt
build_strategy.fuse_all_reduce_ops = False
# build_strategy.async_mode = False
self.compiled_graph = compiler.CompiledProgram(
target).with_data_parallel(
loss_name=loss, build_strategy=build_strategy)
else:
self.compiled_graph = compiler.CompiledProgram(target)
def ops(self):
"""
Return all operator nodes included in the graph as a list.
"""
ops = []
for block in self.program.blocks:
for op in block.ops:
ops.append(OpWrapper(op, self))
return ops
def vars(self):
"""
Get all the variables.
"""
return [VarWrapper(var, self) for var in self.program.list_vars()]
def var(self, name):
"""
Get the variable by variable name.
"""
return VarWrapper(self.program.global_block().var(name), self)
def clone(self, for_test=False):
"""
Clone a new graph from current graph.
Returns:
(GraphWrapper): The wrapper of a new graph.
"""
return GraphWrapper(
self.program.clone(for_test),
copy.deepcopy(self.in_nodes), copy.deepcopy(self.out_nodes))
def merge(self, graph):
"""
Merge a graph into current graph.
Args:
graph(GraphWrapper): The graph to be merged into the current graph.
"""
for var in graph.program.list_vars():
if var.persistable:
self.teacher_persistables[var.name] = var
new_var = self.program.global_block()._clone_variable(
var, force_persistable=False)
new_var.stop_gradient = var.stop_gradient
# TODO: parameters should be cloned
for op in graph.ops():
op = op._op
inputs = {}
outputs = {}
attrs = {}
for input_name in op.input_names:
inputs[input_name] = [
self.var(in_var_name)._var
for in_var_name in op.input(input_name)
]
for output_name in op.output_names:
outputs[output_name] = [
self.var(out_var_name)._var
for out_var_name in op.output(output_name)
]
for attr_name in op.attr_names:
attrs[attr_name] = op.attr(attr_name)
self.program.global_block().append_op(
type=op.type, inputs=inputs, outputs=outputs, attrs=attrs)
def program(self):
"""
Get the program in current wrapper.
"""
return self.program
def pre_ops(self, op):
"""
Get all the previous operators of target operator.
Args:
op(OpWrapper): Target operator.
Returns:
list<OpWrapper>: A list of operators.
"""
ops = []
for p in self.ops():
for in_var in op.all_inputs():
if in_var in p.all_outputs():
ops.append(p)
return ops
def next_ops(self, op):
"""
Get all the next operators of target operator.
Args:
op(OpWrapper): Target operator.
Returns:
list<OpWrapper>: A list of operators.
"""
ops = []
for p in self.ops():
for out_var in op.all_outputs():
if out_var in p.all_inputs():
ops.append(p)
return ops
def get_param_by_op(self, op):
"""
Get the parameters used by target operator.
"""
assert isinstance(op, OpWrapper)
params = []
for var in op.all_inputs():
if isinstance(var._var, Parameter):
params.append(var)
assert len(params) > 0
return params
def numel_params(self):
"""
Get the number of elements in all parameters.
"""
ret = 0
for param in self.all_parameters():
ret += np.product(param.shape())
return ret
def get_optimize_graph(self, optimizer, place, scope, no_grad_var_names=[]):
"""
Get a new graph for training by appending some backward operators and optimization operators.
Args:
optimizer: The optimizer used to generate training graph.
place: The place to run the graph.
scope: The scope used to run the graph. Some new variable will be added into this scope.
no_grad_var_names(list<str>): Names of variables that should be ignored while computing gradients. default: [].
Returns:
(GraphWrapper): The wrapper of new graph with backward ops and optimization ops.
"""
graph = self.clone()
startup_program = Program()
with program_guard(
main_program=graph.program, startup_program=startup_program):
target_name = None
if 'loss' in graph.out_nodes:
target_name = graph.out_nodes['loss']
elif 'cost' in graph.out_nodes:
target_name = graph.out_nodes['cost']
else:
return None
target = graph.var(target_name)._var
# The learning rate variable may be created in another program.
# Update information in the optimizer to make the learning rate
# variable accessible in the current program.
if isinstance(optimizer._learning_rate, Variable):
optimizer._learning_rate_map[
graph.program] = optimizer._learning_rate
optimizer.minimize(target, no_grad_set=no_grad_var_names)
exe = Executor(place)
exe.run(program=startup_program, scope=scope)
return graph
def flops(self, only_conv=False):
"""
Get the flops of current graph.
Args:
only_conv: Only calculating the conv layers. default: False.
Returns:
int: The flops of current graph.
"""
flops = 0
for op in self.ops():
if op.type() in ['conv2d', 'depthwise_conv2d']:
filter_shape = op.inputs("Filter")[0].shape()
input_shape = op.inputs("Input")[0].shape()
output_shape = op.outputs("Output")[0].shape()
c_out, c_in, k_h, k_w = filter_shape
_, _, h_out, w_out = output_shape
groups = op.attr("groups")
kernel_ops = k_h * k_w * (c_in / groups)
if len(op.inputs("Bias")) > 0:
with_bias = 1
else:
with_bias = 0
flops += 2 * h_out * w_out * c_out * (kernel_ops + with_bias)
elif op.type() == 'pool2d' and not only_conv:
input_shape = op.inputs("X")[0].shape()
output_shape = op.outputs("Out")[0].shape()
_, c_out, h_out, w_out = output_shape
k_size = op.attr("ksize")
flops += h_out * w_out * c_out * (k_size[0]**2)
elif op.type() == 'mul' and not only_conv:
x_shape = list(op.inputs("X")[0].shape())
y_shape = op.inputs("Y")[0].shape()
if x_shape[0] == -1:
x_shape[0] = 1
flops += 2 * x_shape[0] * x_shape[1] * y_shape[1]
elif op.type() in ['relu', 'sigmoid', 'batch_norm'
] and not only_conv:
input_shape = list(op.inputs("X")[0].shape())
if input_shape[0] == -1:
input_shape[0] = 1
flops += np.product(input_shape)
return flops
def save_model(self, path, exe):
"""
Save the network and parameters into files which can be loaded by the load_inference_model API.
Args:
path(str): The path to save the persistables.
exe(framework.Executor): The executor used to save the persistables.
"""
out_vars = [
self.var(var_name)._var for var_name in self.out_nodes.values()
]
in_vars = list(self.in_nodes.values())
assert (len(in_vars) > 0)
assert (len(out_vars) > 0)
io.save_inference_model(
path,
in_vars,
out_vars,
exe.exe,
model_filename="__model__",
params_filename="__params__",
main_program=self.program.clone(),
export_for_deployment=True)
def save_infer_model(self, path, exe, in_out, program_only=False):
"""
Save the network and parameters into files which can be loaded by the load_inference_model API.
Args:
path(str): The path to save the persistables.
exe(framework.Executor): The executor used to save the persistables.
in_out(tuple|list): in_out[0] is a list of input nodes' names
and in_out[1] is a list of output nodes' names.
program_only(bool): Whether to save program only.
"""
out_vars = [self.var(var_name)._var for var_name in in_out[1]]
in_vars = list(in_out[0])
assert (len(in_vars) > 0)
assert (len(out_vars) > 0)
io.save_inference_model(
path,
in_vars,
out_vars,
exe.exe,
model_filename="__model__.infer",
params_filename="__params__",
program_only=program_only,
main_program=self.program.clone(),
export_for_deployment=True)
def save_persistables(self, path, exe):
"""
Save all the persistable variables into file.
Args:
path(str): The path to save the persistables.
exe(framework.Executor): The executor used to save the persistables.
"""
# update persistables from program
for var in self.program.list_vars():
if var.persistable and var.name not in self.persistables:
self.persistables[var.name] = var
persistables = []
for var in self.persistables:
if 'reader' not in var and 'double_buffer' not in var and var not in self.teacher_persistables:
persistables.append(self.persistables[var])
io.save_vars(exe.exe, path, vars=persistables)
def load_persistables(self, path, exe):
"""
Load the persistable variables from file.
Args:
path(str): The path to load the persistables.
exe(framework.Executor): The executor used to load the persistables.
"""
def if_exist(var):
return os.path.exists(os.path.join(path, var.name))
persistables = []
for var in self.persistables:
if 'reader' not in var and 'double_buffer' not in var:
persistables.append(self.persistables[var])
io.load_vars(exe.exe, path, vars=persistables, predicate=if_exist)
def update_param_shape(self, scope):
"""
Update the shape of parameters in the graph according to tensors in scope.
It is used after loading pruned parameters from file.
"""
for param in self.all_parameters():
tensor_shape = np.array(scope.find_var(param.name()).get_tensor(
)).shape
param.set_shape(tensor_shape)
def infer_shape(self):
"""
Re-infer the shapes of the variables in the graph according to the current parameter shapes.
It is used after loading pruned parameters from file.
"""
for op in self.ops():
if op.type() != 'conditional_block':
op._op.desc.infer_shape(op._op.block.desc)
def update_groups_of_conv(self):
for op in self.ops():
if op.type() == 'depthwise_conv2d' or op.type(
) == 'depthwise_conv2d_grad':
op.set_attr('groups', op.inputs('Filter')[0].shape()[0])
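# Worked example for the conv2d branch of GraphWrapper.flops() above
# (numbers are illustrative): a 3x3 conv with c_in=64, c_out=128,
# groups=1, bias, and a 56x56 output map contributes
#
#   kernel_ops = 3 * 3 * (64 / 1) = 576
#   flops += 2 * 56 * 56 * 128 * (576 + 1) = 463,224,832
#
# i.e. roughly 0.46 GFLOPs for this single layer.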
# Copyright (c) 2019 PaddlePaddle Authors. All Rights Reserve.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
from . import light_nas_strategy
from .light_nas_strategy import *
from . import controller_server
from .controller_server import *
from . import search_agent
from .search_agent import *
from . import search_space
from .search_space import *
from . import lock
from .lock import *
__all__ = light_nas_strategy.__all__
__all__ += controller_server.__all__
__all__ += search_agent.__all__
__all__ += search_space.__all__
# Copyright (c) 2019 PaddlePaddle Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
import logging
import socket
from threading import Thread
from ....log_helper import get_logger
__all__ = ['ControllerServer']
_logger = get_logger(
__name__,
logging.INFO,
fmt='ControllerServer-%(asctime)s-%(levelname)s: %(message)s')
class ControllerServer(object):
"""
The controller wrapper with a socket server to handle the request of search agent.
"""
def __init__(self,
controller=None,
address=('', 0),
max_client_num=100,
search_steps=None,
key=None):
"""
Args:
controller(slim.searcher.Controller): The controller used to generate tokens.
address(tuple): The (ip, port) address that the server binds to. Default: ('', 0),
which means choosing the ip and port automatically.
max_client_num(int): The maximum number of clients connecting to current server simultaneously. Default: 100.
search_steps(int): The total steps of searching. None means never stopping. Default: None
key(str): The key used to identify legal messages from search agents. Default: None
"""
self._controller = controller
self._address = address
self._max_client_num = max_client_num
self._search_steps = search_steps
self._closed = False
self._port = address[1]
self._ip = address[0]
self._key = key
def start(self):
self._socket_server = socket.socket(socket.AF_INET, socket.SOCK_STREAM)
self._socket_server.bind(self._address)
self._socket_server.listen(self._max_client_num)
self._port = self._socket_server.getsockname()[1]
self._ip = self._socket_server.getsockname()[0]
_logger.info("listen on: [{}:{}]".format(self._ip, self._port))
thread = Thread(target=self.run)
thread.start()
return str(thread)
def close(self):
"""Close the server."""
self._closed = True
def port(self):
"""Get the port."""
return self._port
def ip(self):
"""Get the ip."""
return self._ip
def run(self):
_logger.info("Controller Server run...")
while ((self._search_steps is None) or
(self._controller._iter <
(self._search_steps))) and not self._closed:
conn, addr = self._socket_server.accept()
message = conn.recv(1024).decode()
if message.strip("\n") == "next_tokens":
tokens = self._controller.next_tokens()
tokens = ",".join([str(token) for token in tokens])
conn.send(tokens.encode())
else:
_logger.info("recv message from {}: [{}]".format(addr, message))
messages = message.strip('\n').split("\t")
if (len(messages) < 3) or (messages[0] != self._key):
_logger.info("recv noise from {}: [{}]".format(addr,
message))
continue
tokens = messages[1]
reward = messages[2]
tokens = [int(token) for token in tokens.split(",")]
self._controller.update(tokens, float(reward))
tokens = self._controller.next_tokens()
tokens = ",".join([str(token) for token in tokens])
conn.send(tokens.encode())
_logger.info("send message to {}: [{}]".format(addr, tokens))
conn.close()
self._socket_server.close()
_logger.info("server closed!")
# Copyright (c) 2019 PaddlePaddle Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
from ..core.strategy import Strategy
from ..graph import GraphWrapper
from .controller_server import ControllerServer
from .search_agent import SearchAgent
from ....executor import Executor
from ....log_helper import get_logger
import re
import logging
import functools
import socket
from .lock import lock, unlock
__all__ = ['LightNASStrategy']
_logger = get_logger(
__name__,
logging.INFO,
fmt='LightNASStrategy-%(asctime)s-%(levelname)s: %(message)s')
class LightNASStrategy(Strategy):
"""
Light-NAS search strategy.
"""
def __init__(self,
controller=None,
end_epoch=1000,
target_flops=629145600,
target_latency=0,
retrain_epoch=1,
metric_name='top1_acc',
server_ip=None,
server_port=0,
is_server=False,
max_client_num=100,
search_steps=None,
key="light-nas"):
"""
Args:
controller(searcher.Controller): The searching controller. Default: None.
end_epoch(int): The 'on_epoch_end' function will be called in end_epoch. Default: 1000
target_flops(int): The constraint of FLOPS.
target_latency(float): The constraint of latency.
retrain_epoch(int): The number of training epochs before evaluating structure generated by controller. Default: 1.
metric_name(str): The metric used to evaluate the model.
It should be one of keys in out_nodes of graph wrapper. Default: 'top1_acc'
server_ip(str): The ip that controller server listens on. None means getting the ip automatically. Default: None.
server_port(int): The port that controller server listens on. 0 means getting usable port automatically. Default: 0.
is_server(bool): Whether current host is controller server. Default: False.
max_client_num(int): The maximum number of clients that connect to controller server concurrently. Default: 100.
search_steps(int): The total steps of searching. Default: None.
key(str): The key used to identify legal agent for controller server. Default: "light-nas"
"""
self.start_epoch = 0
self.end_epoch = end_epoch
self._max_flops = target_flops
self._max_latency = target_latency
self._metric_name = metric_name
self._controller = controller
self._retrain_epoch = 0
self._server_ip = server_ip
self._server_port = server_port
self._is_server = is_server
self._retrain_epoch = retrain_epoch
self._search_steps = search_steps
self._max_client_num = max_client_num
self._max_try_times = 100
self._key = key
if self._server_ip is None:
self._server_ip = self._get_host_ip()
def _get_host_ip(self):
return socket.gethostbyname(socket.gethostname())
def on_compression_begin(self, context):
self._current_tokens = context.search_space.init_tokens()
self._controller.reset(context.search_space.range_table(),
self._current_tokens, None)
# create controller server
if self._is_server:
open("./slim_LightNASStrategy_controller_server.socket",
'a').close()
socket_file = open(
"./slim_LightNASStrategy_controller_server.socket", 'r+')
lock(socket_file)
tid = socket_file.readline()
if tid == '':
_logger.info("start controller server...")
self._server = ControllerServer(
controller=self._controller,
address=(self._server_ip, self._server_port),
max_client_num=self._max_client_num,
search_steps=self._search_steps,
key=self._key)
tid = self._server.start()
self._server_port = self._server.port()
socket_file.write(tid)
_logger.info("started controller server...")
unlock(socket_file)
socket_file.close()
_logger.info("self._server_ip: {}; self._server_port: {}".format(
self._server_ip, self._server_port))
# create client
self._search_agent = SearchAgent(
self._server_ip, self._server_port, key=self._key)
def __getstate__(self):
"""Socket can't be pickled."""
d = {}
for key in self.__dict__:
if key not in ["_search_agent", "_server"]:
d[key] = self.__dict__[key]
return d
def on_epoch_begin(self, context):
if context.epoch_id >= self.start_epoch and context.epoch_id <= self.end_epoch and (
self._retrain_epoch == 0 or
(context.epoch_id - self.start_epoch) % self._retrain_epoch == 0):
_logger.info("light nas strategy on_epoch_begin")
min_flops = -1
for _ in range(self._max_try_times):
startup_p, train_p, test_p, _, _, train_reader, test_reader = context.search_space.create_net(
self._current_tokens)
context.eval_graph.program = test_p
flops = context.eval_graph.flops()
if min_flops == -1:
min_flops = flops
min_tokens = self._current_tokens[:]
else:
if flops < min_flops:
min_tokens = self._current_tokens[:]
if self._max_latency > 0:
latency = context.search_space.get_model_latency(test_p)
_logger.info("try [{}] with latency {} flops {}".format(
self._current_tokens, latency, flops))
else:
_logger.info("try [{}] with flops {}".format(
self._current_tokens, flops))
if flops > self._max_flops or (self._max_latency > 0 and
latency > self._max_latency):
self._current_tokens = self._controller.next_tokens(
min_tokens)
else:
break
context.train_reader = train_reader
context.eval_reader = test_reader
exe = Executor(context.place)
exe.run(startup_p)
context.optimize_graph.program = train_p
context.optimize_graph.compile()
context.skip_training = (self._retrain_epoch == 0)
def on_epoch_end(self, context):
if context.epoch_id >= self.start_epoch and context.epoch_id < self.end_epoch and (
self._retrain_epoch == 0 or
(context.epoch_id - self.start_epoch + 1
) % self._retrain_epoch == 0):
self._current_reward = context.eval_results[self._metric_name][-1]
flops = context.eval_graph.flops()
if flops > self._max_flops:
self._current_reward = 0.0
if self._max_latency > 0:
test_p = context.search_space.create_net(self._current_tokens)[
2]
latency = context.search_space.get_model_latency(test_p)
if latency > self._max_latency:
self._current_reward = 0.0
_logger.info("reward: {}; latency: {}; flops: {}; tokens: {}".
format(self._current_reward, latency, flops,
self._current_tokens))
else:
_logger.info("reward: {}; flops: {}; tokens: {}".format(
self._current_reward, flops, self._current_tokens))
self._current_tokens = self._search_agent.update(
self._current_tokens, self._current_reward)
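# Usage sketch (hypothetical values; requires a Controller and a
# SearchSpace implementation on the compression context):
#
# strategy = LightNASStrategy(
#     controller=sa_controller,   # e.g. a simulated-annealing controller
#     end_epoch=500,
#     target_flops=629145600,     # FLOPS budget
#     retrain_epoch=1,
#     is_server=True,
#     key='light-nas')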
# Copyright (c) 2019 PaddlePaddle Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
import os
__all__ = ['lock', 'unlock']
if os.name == 'nt':
def lock(file):
raise NotImplementedError('Windows is not supported.')
def unlock(file):
raise NotImplementedError('Windows is not supported.')
elif os.name == 'posix':
from fcntl import flock, LOCK_EX, LOCK_UN
def lock(file):
"""Lock the file in local file system."""
flock(file.fileno(), LOCK_EX)
def unlock(file):
"""Unlock the file in local file system."""
flock(file.fileno(), LOCK_UN)
else:
raise RuntimeError("File Locker only supports NT and Posix platforms!")
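# Usage sketch: serialize access to a shared file across processes
# (posix only, per the guard above; the path is illustrative):
#
# with open('/tmp/slim.lock', 'a+') as f:
#     lock(f)
#     try:
#         pass  # critical section
#     finally:
#         unlock(f)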
# Copyright (c) 2019 PaddlePaddle Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
import logging
import socket
from ....log_helper import get_logger
__all__ = ['SearchAgent']
_logger = get_logger(
__name__, logging.INFO, fmt='%(asctime)s-%(levelname)s: %(message)s')
class SearchAgent(object):
"""
Search agent.
"""
def __init__(self, server_ip=None, server_port=None, key=None):
"""
Args:
server_ip(str): The ip that controller server listens on. None means getting the ip automatically. Default: None.
server_port(int): The port that controller server listens on. 0 means getting usable port automatically. Default: 0.
key(str): The key used to identify legal agent for controller server. Default: "light-nas"
"""
self.server_ip = server_ip
self.server_port = server_port
self.socket_client = socket.socket(socket.AF_INET, socket.SOCK_STREAM)
self._key = key
def update(self, tokens, reward):
"""
Update the controller according to latest tokens and reward.
Args:
tokens(list<int>): The tokens generated in last step.
reward(float): The reward of tokens.
"""
socket_client = socket.socket(socket.AF_INET, socket.SOCK_STREAM)
socket_client.connect((self.server_ip, self.server_port))
tokens = ",".join([str(token) for token in tokens])
socket_client.send("{}\t{}\t{}".format(self._key, tokens, reward)
.encode())
tokens = socket_client.recv(1024).decode()
tokens = [int(token) for token in tokens.strip("\n").split(",")]
return tokens
def next_tokens(self):
"""
Get next tokens.
"""
socket_client = socket.socket(socket.AF_INET, socket.SOCK_STREAM)
socket_client.connect((self.server_ip, self.server_port))
socket_client.send("next_tokens".encode())
tokens = socket_client.recv(1024).decode()
tokens = [int(token) for token in tokens.strip("\n").split(",")]
return tokens
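# Usage sketch (assumes a ControllerServer listening at the given
# address; values are illustrative):
#
# agent = SearchAgent('127.0.0.1', 8989, key='light-nas')
# tokens = agent.next_tokens()         # ask for a first candidate
# tokens = agent.update(tokens, 0.92)  # report the reward, get the next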
# Copyright (c) 2018 PaddlePaddle Authors. All Rights Reserve.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
"""The search space used to search neural architecture"""
__all__ = ['SearchSpace']
class SearchSpace(object):
"""Controller for Neural Architecture Search.
"""
def __init__(self, *args, **kwargs):
pass
def init_tokens(self):
"""Get init tokens in search space.
"""
raise NotImplementedError('Abstract method.')
def range_table(self):
"""Get range table of current search space.
"""
raise NotImplementedError('Abstract method.')
def create_net(self, tokens):
"""Create networks for training and evaluation according to tokens.
Args:
tokens(list<int>): The tokens which represent a network.
Return:
(tuple): startup_program, train_program, evaluation_program, train_metrics, test_metrics
"""
raise NotImplementedError('Abstract method.')
def get_model_latency(self, program):
"""Get model latency according to program.
Args:
program(Program): The program to get latency.
Return:
(float): model latency.
"""
raise NotImplementedError('Abstract method.')
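# A minimal concrete subclass sketch (purely illustrative) showing the
# contract between tokens and the range table:
#
# class TwoChoiceSpace(SearchSpace):
#     def init_tokens(self):
#         return [0, 0]          # start from the smallest candidate
#     def range_table(self):
#         return [2, 2]          # each token position takes values {0, 1}
#     def create_net(self, tokens):
#         raise NotImplementedError  # build the programs from tokens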
# Copyright (c) 2018 PaddlePaddle Authors. All Rights Reserve.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
from . import pruner
from .pruner import *
from . import prune_strategy
from .prune_strategy import *
from . import auto_prune_strategy
from .auto_prune_strategy import *
__all__ = pruner.__all__
__all__ += prune_strategy.__all__
__all__ += auto_prune_strategy.__all__
# Copyright (c) 2019 PaddlePaddle Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
from .prune_strategy import PruneStrategy
import re
import logging
import functools
import copy
from ....log_helper import get_logger
__all__ = ['AutoPruneStrategy']
_logger = get_logger(
__name__, logging.INFO, fmt='%(asctime)s-%(levelname)s: %(message)s')
class AutoPruneStrategy(PruneStrategy):
"""
Automatic pruning strategy.
"""
def __init__(self,
pruner=None,
controller=None,
start_epoch=0,
end_epoch=10,
min_ratio=0.5,
max_ratio=0.7,
metric_name='top1_acc',
pruned_params='conv.*_weights',
retrain_epoch=0,
uniform_range=None,
init_tokens=None):
"""
Args:
pruner(slim.Pruner): The pruner used to prune the parameters. Default: None.
controller(searcher.Controller): The searching controller. Default: None.
start_epoch(int): The 'on_epoch_begin' function will be called in start_epoch. Default: 0
end_epoch(int): The 'on_epoch_end' function will be called in end_epoch. Default: 10
min_ratio(float): The minimum pruned ratio. Default: 0.5
max_ratio(float): The maximum pruned ratio. Default: 0.7
metric_name(str): The metric used to evaluate the model.
It should be one of keys in out_nodes of graph wrapper. Default: 'top1_acc'
pruned_params(str): The pattern str to match the parameter names to be pruned. Default: 'conv.*_weights'
retrain_epoch(int): The training epochs in each searching step. Default: 0
            uniform_range(float): The upper bound of the pruned ratio for each position of the tokens generated by the controller, used to build a uniform range table. None means deriving the range table from the initial tokens. Default: None.
init_tokens(list<int>): The initial tokens. None means getting the initial tokens automatically. Default: None.
"""
super(AutoPruneStrategy, self).__init__(pruner, start_epoch, end_epoch,
0.0, metric_name, pruned_params)
self._max_ratio = max_ratio
self._min_ratio = min_ratio
self._controller = controller
self._metric_name = metric_name
self._pruned_param_names = []
self._retrain_epoch = retrain_epoch
self._uniform_range = uniform_range
self._init_tokens = init_tokens
self._current_tokens = None
def on_compression_begin(self, context):
"""
Prepare some information for searching strategy.
step 1: Find all the parameters to be pruned.
step 2: Get initial tokens and setup controller.
"""
for param in context.eval_graph.all_parameters():
if re.match(self.pruned_params, param.name()):
self._pruned_param_names.append(param.name())
if self._init_tokens is not None:
self._current_tokens = self._init_tokens
else:
self._current_tokens = self._get_init_tokens(context)
if self._uniform_range is not None:
            self._range_table = [int(round(self._uniform_range / 0.01))
                                 ] * len(self._pruned_param_names)
else:
self._range_table = copy.deepcopy(self._current_tokens)
_logger.info('init tokens: {}'.format(self._current_tokens))
_logger.info("range_table: {}".format(self._range_table))
constrain_func = functools.partial(
self._constrain_func, context=context)
self._controller.reset(self._range_table, self._current_tokens,
constrain_func)
def _constrain_func(self, tokens, context=None):
"""Check whether the tokens meet constraint."""
ori_flops = context.eval_graph.flops()
ratios = self._tokens_to_ratios(tokens)
params = self._pruned_param_names
param_shape_backup = {}
self._prune_parameters(
context.eval_graph,
context.scope,
params,
ratios,
context.place,
only_graph=True,
param_shape_backup=param_shape_backup)
context.eval_graph.update_groups_of_conv()
flops = context.eval_graph.flops()
for param in param_shape_backup.keys():
context.eval_graph.var(param).set_shape(param_shape_backup[param])
flops_ratio = (1 - float(flops) / ori_flops)
if flops_ratio >= self._min_ratio and flops_ratio <= self._max_ratio:
_logger.info("Success try [{}]; flops: -{}".format(tokens,
flops_ratio))
return True
else:
_logger.info("Failed try [{}]; flops: -{}".format(tokens,
flops_ratio))
return False
def _get_init_tokens(self, context):
"""Get initial tokens.
"""
ratios = self._get_uniform_ratios(context)
_logger.info('Get init ratios: {}'.format(
[round(r, 2) for r in ratios]))
return self._ratios_to_tokens(ratios)
def _ratios_to_tokens(self, ratios):
"""Convert pruned ratios to tokens.
"""
return [int(ratio / 0.01) for ratio in ratios]
def _tokens_to_ratios(self, tokens):
"""Convert tokens to pruned ratios.
"""
return [token * 0.01 for token in tokens]
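    # Worked example (comment only, not in the original diff): with the
    # 0.01 granularity above, ratios [0.5, 0.25] map to tokens [50, 25]
    # and back.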
def _get_uniform_ratios(self, context):
"""
Search a group of uniform ratios.
"""
min_ratio = 0.
max_ratio = 1.
target = (self._min_ratio + self._max_ratio) / 2
flops = context.eval_graph.flops()
model_size = context.eval_graph.numel_params()
ratios = None
while min_ratio < max_ratio:
ratio = (max_ratio + min_ratio) / 2
ratios = [ratio] * len(self._pruned_param_names)
param_shape_backup = {}
self._prune_parameters(
context.eval_graph,
context.scope,
self._pruned_param_names,
ratios,
context.place,
only_graph=True,
param_shape_backup=param_shape_backup)
pruned_flops = 1 - (float(context.eval_graph.flops()) / flops)
pruned_size = 1 - (float(context.eval_graph.numel_params()) /
model_size)
for param in param_shape_backup.keys():
context.eval_graph.var(param).set_shape(param_shape_backup[
param])
if abs(pruned_flops - target) < 1e-2:
break
if pruned_flops > target:
max_ratio = ratio
else:
min_ratio = ratio
_logger.info('Get ratios: {}'.format([round(r, 2) for r in ratios]))
return ratios
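    # Example (comment only): with min_ratio=0.5 and max_ratio=0.7 the
    # bisection above targets a 0.6 FLOPs reduction and stops once the
    # uniform pruned ratio is within 1e-2 of that target.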
def on_epoch_begin(self, context):
"""
        step 1: Get new tokens from the controller.
        step 2: Prune eval_graph and optimize_graph according to the tokens.
"""
if context.epoch_id >= self.start_epoch and context.epoch_id <= self.end_epoch and (
self._retrain_epoch == 0 or
(context.epoch_id - self.start_epoch) % self._retrain_epoch == 0):
_logger.info("on_epoch_begin")
params = self._pruned_param_names
ratios = self._tokens_to_ratios(self._current_tokens)
self._param_shape_backup = {}
self._param_backup = {}
self._prune_parameters(
context.optimize_graph,
context.scope,
params,
ratios,
context.place,
param_backup=self._param_backup,
param_shape_backup=self._param_shape_backup)
self._prune_graph(context.eval_graph, context.optimize_graph)
context.optimize_graph.update_groups_of_conv()
context.eval_graph.update_groups_of_conv()
context.optimize_graph.compile(
mem_opt=False) # to update the compiled program
context.skip_training = (self._retrain_epoch == 0)
def on_epoch_end(self, context):
"""
step 1: Get reward of current tokens and update controller.
step 2: Restore eval_graph and optimize_graph
"""
if context.epoch_id >= self.start_epoch and context.epoch_id < self.end_epoch and (
self._retrain_epoch == 0 or
(context.epoch_id - self.start_epoch + 1
) % self._retrain_epoch == 0):
_logger.info("on_epoch_end")
reward = context.eval_results[self._metric_name][-1]
self._controller.update(self._current_tokens, reward)
self._current_tokens = self._controller.next_tokens()
# restore pruned parameters
for param_name in self._param_backup.keys():
param_t = context.scope.find_var(param_name).get_tensor()
param_t.set(self._param_backup[param_name], context.place)
self._param_backup = {}
# restore shape of parameters
for param in self._param_shape_backup.keys():
context.optimize_graph.var(param).set_shape(
self._param_shape_backup[param])
self._param_shape_backup = {}
self._prune_graph(context.eval_graph, context.optimize_graph)
context.optimize_graph.update_groups_of_conv()
context.eval_graph.update_groups_of_conv()
context.optimize_graph.compile(
mem_opt=False) # to update the compiled program
elif context.epoch_id == self.end_epoch: # restore graph for final training
# restore pruned parameters
for param_name in self._param_backup.keys():
param_t = context.scope.find_var(param_name).get_tensor()
                param_t.set(self._param_backup[param_name], context.place)
# restore shape of parameters
for param in self._param_shape_backup.keys():
context.eval_graph.var(param).set_shape(
self._param_shape_backup[param])
context.optimize_graph.var(param).set_shape(
self._param_shape_backup[param])
context.optimize_graph.update_groups_of_conv()
context.eval_graph.update_groups_of_conv()
            params = self._pruned_param_names
            ratios = self._tokens_to_ratios(self._controller._best_tokens)
self._prune_parameters(context.optimize_graph, context.scope,
params, ratios, context.place)
self._prune_graph(context.eval_graph, context.optimize_graph)
context.optimize_graph.update_groups_of_conv()
context.eval_graph.update_groups_of_conv()
context.optimize_graph.compile(
mem_opt=True) # to update the compiled program
context.skip_training = False
# Copyright (c) 2018 PaddlePaddle Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
import numpy as np
import collections
from .... import layers
__all__ = ['Pruner', 'StructurePruner']
class Pruner(object):
"""
Base class of all pruners.
"""
def __init__(self):
pass
def prune(self, param):
pass
class StructurePruner(Pruner):
"""
    Pruner used to prune parameters by groups.
"""
def __init__(self, pruning_axis, criterions):
"""
Args:
pruning_axis(dict): The key is the name of parameter to be pruned,
'*' means all the parameters.
The value is the axis to be used. Given a parameter
with shape [3, 4], the result of pruning 50% on axis 1
is a parameter with shape [3, 2].
criterions(dict): The key is the name of parameter to be pruned,
'*' means all the parameters.
The value is the criterion used to sort groups for pruning.
It only supports 'l1_norm' currently.
"""
self.pruning_axis = pruning_axis
self.criterions = criterions
def cal_pruned_idx(self, name, param, ratio, axis=None):
"""
Calculate the index to be pruned on axis by given pruning ratio.
Args:
name(str): The name of parameter to be pruned.
param(np.array): The data of parameter to be pruned.
ratio(float): The ratio to be pruned.
axis(int): The axis to be used for pruning given parameter.
If it is None, the value in self.pruning_axis will be used.
default: None.
Returns:
list<int>: The indexes to be pruned on axis.
"""
criterion = self.criterions[
name] if name in self.criterions else self.criterions['*']
if axis is None:
            assert self.pruning_axis is not None, "pruning_axis should be set if axis is None."
axis = self.pruning_axis[
name] if name in self.pruning_axis else self.pruning_axis['*']
prune_num = int(round(param.shape[axis] * ratio))
reduce_dims = [i for i in range(len(param.shape)) if i != axis]
        if criterion == 'l1_norm':
            criterions = np.sum(np.abs(param), axis=tuple(reduce_dims))
        else:
            raise ValueError("unsupported criterion: {}".format(criterion))
        pruned_idx = criterions.argsort()[:prune_num]
        return pruned_idx
def prune_tensor(self, tensor, pruned_idx, pruned_axis, lazy=False):
"""
        Prune an array by indexes on the given axis.
Args:
tensor(numpy.array): The target array to be pruned.
pruned_idx(list<int>): The indexes to be pruned.
pruned_axis(int): The axis of given array to be pruned on.
lazy(bool): True means setting the pruned elements to zero.
False means remove the pruned elements from memory.
default: False.
Returns:
numpy.array: The pruned array.
"""
mask = np.zeros(tensor.shape[pruned_axis], dtype=bool)
mask[pruned_idx] = True
def func(data):
return data[~mask]
def lazy_func(data):
data[mask] = 0
return data
if lazy:
return np.apply_along_axis(lazy_func, pruned_axis, tensor)
else:
return np.apply_along_axis(func, pruned_axis, tensor)
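# A minimal usage sketch (not part of the original diff), exercising the
# StructurePruner above with plain numpy; all names below are illustrative.
if __name__ == '__main__':
    pruner = StructurePruner(pruning_axis={'*': 0},
                             criterions={'*': 'l1_norm'})
    # A fake conv weight with 4 output channels on axis 0.
    weight = np.arange(4 * 3 * 3 * 3, dtype='float32').reshape(4, 3, 3, 3)
    idx = pruner.cal_pruned_idx('conv1_weights', weight, ratio=0.5)
    pruned = pruner.prune_tensor(weight, idx, pruned_axis=0)
    print(idx)           # [0 1]: the two channels with the smallest L1 norm
    print(pruned.shape)  # (2, 3, 3, 3)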
......@@ -16,10 +16,6 @@ from __future__ import print_function
from . import quantization_pass
from .quantization_pass import *
from . import quantization_strategy
from .quantization_strategy import *
from . import mkldnn_post_training_strategy
from .mkldnn_post_training_strategy import *
from . import quant_int8_mkldnn_pass
from .quant_int8_mkldnn_pass import *
from . import quant2_int8_mkldnn_pass
......@@ -29,8 +25,7 @@ from .post_training_quantization import *
from . import imperative
from .imperative import *
__all__ = quantization_pass.__all__ + quantization_strategy.__all__
__all__ += mkldnn_post_training_strategy.__all__
__all__ = quantization_pass.__all__
__all__ += quant_int8_mkldnn_pass.__all__
__all__ += quant2_int8_mkldnn_pass.__all__
__all__ += post_training_quantization.__all__
......
# Copyright (c) 2019 PaddlePaddle Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
import os
import logging
import numpy as np
from .... import core
from ..core.strategy import Strategy
from ....log_helper import get_logger
__all__ = ['MKLDNNPostTrainingQuantStrategy']
_logger = get_logger(
__name__, logging.INFO, fmt='%(asctime)s-%(levelname)s: %(message)s')
class MKLDNNPostTrainingQuantStrategy(Strategy):
"""
    The MKL-DNN post-training quantization strategy.
"""
def __init__(self,
int8_model_save_path=None,
fp32_model_path=None,
cpu_math_library_num_threads=1):
"""
Args:
            int8_model_save_path(str): int8_model_save_path is used to save an int8 ProgramDesc
                        with fp32 weights, which is used for MKL-DNN int8 inference. For post-training quantization,
                        MKLDNNPostTrainingQuantStrategy currently only supports converting an fp32 ProgramDesc
                        with fp32 weights into an int8 ProgramDesc with fp32 weights. The saved
                        int8 ProgramDesc with fp32 weights can only be executed with MKL-DNN enabled.
                        None means the int8 ProgramDesc with fp32 weights is not saved. default: None.
            fp32_model_path(str): fp32_model_path is used to load the original fp32 ProgramDesc with fp32 weights,
                        and must not be None. default: None.
cpu_math_library_num_threads(int): The number of cpu math library threads which is used on
MKLDNNPostTrainingQuantStrategy. 1 means it only uses one cpu math library
thread. default: 1
"""
super(MKLDNNPostTrainingQuantStrategy, self).__init__(0, 0)
self.int8_model_save_path = int8_model_save_path
if fp32_model_path is None:
raise Exception("fp32_model_path is None")
self.fp32_model_path = fp32_model_path
self.cpu_math_library_num_threads = cpu_math_library_num_threads
def on_compression_begin(self, context):
"""
        Prepare the warm-up data and quantize the model.
"""
super(MKLDNNPostTrainingQuantStrategy,
self).on_compression_begin(context)
        _logger.info('MKLDNNPostTrainingQuantStrategy::on_compression_begin')
# Prepare the Analysis Config
infer_config = core.AnalysisConfig("AnalysisConfig")
infer_config.switch_ir_optim(True)
infer_config.disable_gpu()
infer_config.set_model(self.fp32_model_path)
infer_config.enable_mkldnn()
infer_config.set_cpu_math_library_num_threads(
self.cpu_math_library_num_threads)
# Prepare the data for calculating the quantization scales
warmup_reader = context.eval_reader()
        data = next(warmup_reader)
num_images = len(data)
image_data = [img.tolist() for (img, _) in data]
image_data = np.array(image_data).astype("float32").reshape(
[num_images, ] + list(data[0][0].shape))
image_data = image_data.ravel()
images = core.PaddleTensor(image_data, "x")
images.shape = [num_images, ] + list(data[0][0].shape)
label_data = [label for (_, label) in data]
labels = core.PaddleTensor(
np.array(label_data).astype("int64").reshape([num_images, 1]), "y")
warmup_data = [images, labels]
# Enable the INT8 Quantization
infer_config.enable_quantizer()
infer_config.quantizer_config().set_quant_data(warmup_data)
infer_config.quantizer_config().set_quant_batch_size(num_images)
# Run INT8 MKL-DNN Quantization
predictor = core.create_paddle_predictor(infer_config)
if self.int8_model_save_path:
if not os.path.exists(self.int8_model_save_path):
os.makedirs(self.int8_model_save_path)
predictor.SaveOptimModel(self.int8_model_save_path)
        _logger.info(
            'Finish MKLDNNPostTrainingQuantStrategy::on_compression_begin')
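# A hedged sketch (not part of the original diff) of the batch format the
# warm-up reader above is assumed to yield: calling context.eval_reader()
# returns an iterator whose next() gives one list of (image, label) pairs.
def _example_eval_reader():
    import numpy as np
    batch = [(np.random.rand(3, 224, 224).astype('float32'), 0)
             for _ in range(8)]
    yield batch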
# Copyright (c) 2019 PaddlePaddle Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
import logging
import sys
import numpy as np
from .... import Executor
from .... import io
from .... import core, scope_guard
from ....compiler import CompiledProgram
from ....compiler import BuildStrategy
from ....framework import IrGraph, Variable, Program
from ....log_helper import get_logger
from ..core.strategy import Strategy
from .quantization_pass import *
__all__ = ['QuantizationStrategy']
_logger = get_logger(
__name__, logging.INFO, fmt='%(asctime)s-%(levelname)s: %(message)s')
class QuantizationStrategy(Strategy):
"""
The strategy for Quantization.
"""
def __init__(self,
start_epoch=0,
end_epoch=0,
float_model_save_path=None,
mobile_model_save_path=None,
int8_model_save_path=None,
activation_bits=8,
weight_bits=8,
activation_quantize_type='abs_max',
weight_quantize_type='abs_max',
save_in_nodes=None,
save_out_nodes=None):
"""
Args:
start_epoch(int): The 'on_epoch_begin' function will be called in start_epoch. default: 0
end_epoch(int): The 'on_epoch_end' function will be called in end_epoch. default: 0
float_model_save_path(str): The path to save model with float weights.
None means it doesn't save float model. default: None.
mobile_model_save_path(str): The path to save model for paddle-mobile execution.
None means it doesn't save mobile model. default: None.
int8_model_save_path(str): The path to save model with int8_t weight.
None means it doesn't save int8 model. default: None.
activation_bits(int): quantization bit number for activation. default: 8.
weight_bits(int): quantization bit number for weights. The bias is not quantized.
default: 8.
activation_quantize_type(str): quantization type for activation,
now support 'abs_max', 'range_abs_max' and 'moving_average_abs_max'.
If use 'abs_max' mode, the quantization scale will be calculated
dynamically each step in both training and testing period. If use
'range_abs_max', a static quantization scale will be calculated
during training and used in inference.
weight_quantize_type (str): quantization type for weights, support 'abs_max' and 'channel_wise_abs_max'.
                'range_abs_max' is usually not used for weights, since weights are fixed once the model is well trained.
save_in_nodes(list<str>): A list of variable names used to prune graph
for saving inference model.
save_out_nodes(list<str>): A list of variable names used to prune graph
for saving inference model.
"""
super(QuantizationStrategy, self).__init__(start_epoch, end_epoch)
self.start_epoch = start_epoch
self.end_epoch = end_epoch
self.float_model_save_path = float_model_save_path
self.mobile_model_save_path = mobile_model_save_path
self.int8_model_save_path = int8_model_save_path
self.activation_bits = activation_bits
self.weight_bits = weight_bits
self.activation_quantize_type = activation_quantize_type
self.weight_quantize_type = weight_quantize_type
self.save_out_nodes = save_out_nodes
self.save_in_nodes = save_in_nodes
def restore_from_checkpoint(self, context):
"""
        Restore the graph when the compression task is initialized from a checkpoint.
"""
        # It was initialized from a checkpoint and has already passed the start epoch.
if context.epoch_id != 0 and context.epoch_id > self.start_epoch:
_logger.info("Restore quantization task from checkpoint")
self._modify_graph_for_quantization(context)
_logger.info("Finish restoring quantization task from checkpoint")
def _modify_graph_for_quantization(self, context):
"""
Insert fake_quantize_op and fake_dequantize_op before training and testing.
"""
train_ir_graph = IrGraph(
core.Graph(context.optimize_graph.program.clone().desc),
for_test=False)
test_ir_graph = IrGraph(
core.Graph(context.eval_graph.program.clone().desc), for_test=True)
transform_pass = QuantizationTransformPass(
scope=context.scope,
place=context.place,
weight_bits=self.weight_bits,
activation_bits=self.activation_bits,
activation_quantize_type=self.activation_quantize_type,
weight_quantize_type=self.weight_quantize_type)
transform_pass.apply(train_ir_graph)
transform_pass.apply(test_ir_graph)
# Put persistables created by transform_pass into context.optimize_graph.persistables
# for saving checkpoint.
program_persistables = set()
for var in context.optimize_graph.program.list_vars():
if var.persistable:
program_persistables.add(var.name)
program = Program()
for var_node in train_ir_graph.all_persistable_nodes():
if var_node.name() not in program_persistables:
var_desc = var_node.var()
var = program.global_block().create_var(
name=var_node.name(),
shape=var_desc.shape(),
dtype=var_desc.dtype(),
type=var_desc.type(),
lod_level=var_desc.lod_level())
context.optimize_graph.persistables[var.name] = var
build_strategy = BuildStrategy()
build_strategy.enable_inplace = False
build_strategy.memory_optimize = False
build_strategy.fuse_all_reduce_ops = False
# for quantization training
context.optimize_graph.compiled_graph = CompiledProgram(
train_ir_graph.graph).with_data_parallel(
loss_name=context.optimize_graph.out_nodes['loss'],
build_strategy=build_strategy)
context.eval_graph.program = test_ir_graph.to_program()
# for saving inference model after training
context.put('quantization_test_ir_graph_backup', test_ir_graph)
def on_epoch_begin(self, context):
"""
Insert fake_quantize_op and fake_dequantize_op before training and testing.
"""
super(QuantizationStrategy, self).on_epoch_begin(context)
if self.start_epoch == context.epoch_id:
_logger.info('QuantizationStrategy::on_epoch_begin')
self._modify_graph_for_quantization(context)
_logger.info('Finish QuantizationStrategy::on_epoch_begin')
def on_epoch_end(self, context):
"""
        Freeze the quantized graph and save inference models.
"""
        super(QuantizationStrategy, self).on_epoch_end(context)
if context.epoch_id == self.end_epoch:
_logger.info('QuantizationStrategy::on_epoch_end')
test_ir_graph = context.get('quantization_test_ir_graph_backup')
# freeze the graph after training
freeze_pass = QuantizationFreezePass(
scope=context.scope,
place=context.place,
weight_bits=self.weight_bits,
activation_bits=self.activation_bits,
weight_quantize_type=self.weight_quantize_type)
freeze_pass.apply(test_ir_graph)
# for other strategies
context.eval_graph.program = test_ir_graph.to_program()
            if self.save_out_nodes is None:
out_vars = [
context.eval_graph.var(var_name)._var
for var_name in context.eval_graph.out_nodes.values()
]
else:
out_vars = [
context.eval_graph.var(var_name)._var
for var_name in self.save_out_nodes
]
            if self.save_in_nodes is None:
in_vars = list(context.eval_graph.in_nodes.values())
else:
in_vars = self.save_in_nodes
# save float model
if self.float_model_save_path:
executor = Executor(context.place)
with scope_guard(context.scope):
io.save_inference_model(
self.float_model_save_path,
in_vars,
out_vars,
executor,
main_program=test_ir_graph.to_program(),
model_filename='model',
params_filename='weights',
export_for_deployment=True)
# save int8 model
if self.int8_model_save_path:
convert_int8_pass = ConvertToInt8Pass(
scope=context.scope, place=context.place)
convert_int8_pass.apply(test_ir_graph)
executor = Executor(context.place)
with scope_guard(context.scope):
io.save_inference_model(
self.int8_model_save_path,
in_vars,
out_vars,
executor,
main_program=test_ir_graph.to_program(),
model_filename='model',
params_filename='weights',
export_for_deployment=True)
# save mobile model
if self.mobile_model_save_path:
if not self.int8_model_save_path:
# convert the weights as int8_t type
convert_int8_pass = ConvertToInt8Pass(
scope=context.scope, place=context.place)
convert_int8_pass.apply(test_ir_graph)
# make some changes on the graph for the mobile inference
mobile_pass = TransformForMobilePass()
mobile_pass.apply(test_ir_graph)
executor = Executor(context.place)
with scope_guard(context.scope):
io.save_inference_model(
self.mobile_model_save_path,
in_vars,
out_vars,
executor,
main_program=test_ir_graph.to_program(),
model_filename='model',
params_filename='weights',
export_for_deployment=True)
_logger.info('Finish QuantizationStrategy::on_epoch_end')
# Copyright (c) 2019 PaddlePaddle Authors. All Rights Reserve.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
from . import controller
from .controller import *
__all__ = controller.__all__
# Copyright (c) 2019 PaddlePaddle Authors. All Rights Reserve.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
"""The controller used to search hyperparameters or neural architecture"""
import numpy as np
import copy
import math
import logging
from ....log_helper import get_logger
__all__ = ['EvolutionaryController', 'SAController']
_logger = get_logger(
__name__, logging.INFO, fmt='%(asctime)s-%(levelname)s: %(message)s')
class EvolutionaryController(object):
"""Abstract controller for all evolutionary searching method.
"""
def __init__(self, *args, **kwargs):
pass
def update(self, tokens, reward):
"""Update the status of controller according current tokens and reward.
Args:
tokens(list<int>): A solution of searching task.
            reward(float): The reward of the tokens.
"""
raise NotImplementedError('Abstract method.')
def reset(self, range_table, constrain_func=None):
"""Reset the controller.
Args:
range_table(list<int>): It is used to define the searching space of controller.
The tokens[i] generated by controller should be in [0, range_table[i]).
constrain_func(function): It is used to check whether tokens meet the constraint.
None means there is no constraint. Default: None.
"""
raise NotImplementedError('Abstract method.')
def next_tokens(self):
"""Generate new tokens.
"""
raise NotImplementedError('Abstract method.')
class SAController(EvolutionaryController):
"""Simulated annealing controller."""
def __init__(self,
range_table=None,
reduce_rate=0.85,
init_temperature=1024,
max_iter_number=300):
"""Initialize.
Args:
range_table(list<int>): Range table.
reduce_rate(float): The decay rate of temperature.
init_temperature(float): Init temperature.
max_iter_number(int): max iteration number.
"""
super(SAController, self).__init__()
self._range_table = range_table
self._reduce_rate = reduce_rate
self._init_temperature = init_temperature
self._max_iter_number = max_iter_number
self._reward = -1
self._tokens = None
self._max_reward = -1
self._best_tokens = None
self._iter = 0
def __getstate__(self):
d = {}
for key in self.__dict__:
if key != "_constrain_func":
d[key] = self.__dict__[key]
return d
def reset(self, range_table, init_tokens, constrain_func=None):
"""
Reset the status of current controller.
Args:
range_table(list<int>): The range of value in each position of tokens generated by current controller. The range of tokens[i] is [0, range_table[i]).
init_tokens(list<int>): The initial tokens.
constrain_func(function): The callback function used to check whether the tokens meet constraint. None means there is no constraint. Default: None.
"""
self._range_table = range_table
self._constrain_func = constrain_func
self._tokens = init_tokens
self._iter = 0
def update(self, tokens, reward):
"""
Update the controller according to latest tokens and reward.
Args:
tokens(list<int>): The tokens generated in last step.
reward(float): The reward of tokens.
"""
self._iter += 1
temperature = self._init_temperature * self._reduce_rate**self._iter
if (reward > self._reward) or (np.random.random() <= math.exp(
(reward - self._reward) / temperature)):
self._reward = reward
self._tokens = tokens
if reward > self._max_reward:
self._max_reward = reward
self._best_tokens = tokens
_logger.info("iter: {}; max_reward: {}; best_tokens: {}".format(
self._iter, self._max_reward, self._best_tokens))
_logger.info("current_reward: {}; current tokens: {}".format(
self._reward, self._tokens))
def next_tokens(self, control_token=None):
"""
Get next tokens.
"""
if control_token:
tokens = control_token[:]
else:
tokens = self._tokens
new_tokens = tokens[:]
index = int(len(self._range_table) * np.random.random())
new_tokens[index] = (
new_tokens[index] + np.random.randint(self._range_table[index] - 1)
+ 1) % self._range_table[index]
_logger.info("change index[{}] from {} to {}".format(index, tokens[
index], new_tokens[index]))
if self._constrain_func is None:
return new_tokens
for _ in range(self._max_iter_number):
if not self._constrain_func(new_tokens):
index = int(len(self._range_table) * np.random.random())
new_tokens = tokens[:]
new_tokens[index] = np.random.randint(self._range_table[index])
else:
break
return new_tokens
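# A hedged driver sketch (not part of the original diff) showing the
# reset / next_tokens / update loop that the strategies above run
# implicitly; the reward function here is a toy stand-in.
if __name__ == '__main__':
    controller = SAController(
        reduce_rate=0.85, init_temperature=1024, max_iter_number=300)
    controller.reset(range_table=[10] * 4, init_tokens=[5, 5, 5, 5])
    for _ in range(20):
        tokens = controller.next_tokens()
        # Toy reward: highest when every token equals 3.
        reward = 1.0 / (1.0 + sum(abs(t - 3) for t in tokens))
        controller.update(tokens, reward)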
......@@ -138,41 +138,6 @@ if(LINUX AND WITH_MKLDNN)
# Models should be already downloaded for INT8v2 unit tests
set(INT8_INSTALL_DIR "${INFERENCE_DEMO_INSTALL_DIR}/int8v2")
set(INT8_IC_TEST_FILE "test_mkldnn_int8_quantization_strategy.py")
set(INT8_IC_TEST_FILE_PATH "${CMAKE_CURRENT_SOURCE_DIR}/${INT8_IC_TEST_FILE}")
# googlenet int8
set(INT8_GOOGLENET_MODEL_DIR "${INT8_INSTALL_DIR}/googlenet")
inference_analysis_python_api_int8_test_custom_warmup_batch_size(test_slim_int8_googlenet ${INT8_GOOGLENET_MODEL_DIR} ${IMAGENET_DATA_PATH} ${INT8_IC_TEST_FILE_PATH} 10)
# mobilenet int8
set(INT8_MOBILENET_MODEL_DIR "${INT8_INSTALL_DIR}/mobilenetv1")
inference_analysis_python_api_int8_test(test_slim_int8_mobilenet ${INT8_MOBILENET_MODEL_DIR} ${IMAGENET_DATA_PATH} ${INT8_IC_TEST_FILE_PATH})
inference_analysis_python_api_int8_test_mkldnn(test_slim_int8_mobilenet_mkldnn ${INT8_MOBILENET_MODEL_DIR} ${IMAGENET_DATA_PATH} ${INT8_IC_TEST_FILE_PATH})
# temporarily adding WITH_SLIM_MKLDNN_FULL_TEST FLAG for QA testing the following UTs locally,
# since the following UTs cost too much time on CI test.
if (WITH_SLIM_MKLDNN_FULL_TEST)
# resnet50 int8
set(INT8_RESNET50_MODEL_DIR "${INT8_INSTALL_DIR}/resnet50")
inference_analysis_python_api_int8_test(test_slim_int8_resnet50 ${INT8_RESNET50_MODEL_DIR} ${IMAGENET_DATA_PATH} ${INT8_IC_TEST_FILE_PATH})
# mobilenetv2 int8
set(INT8_MOBILENETV2_MODEL_DIR "${INT8_INSTALL_DIR}/mobilenetv2")
inference_analysis_python_api_int8_test(test_slim_int8_mobilenetv2 ${INT8_MOBILENETV2_MODEL_DIR} ${IMAGENET_DATA_PATH} ${INT8_IC_TEST_FILE_PATH})
# resnet101 int8
set(INT8_RESNET101_MODEL_DIR "${INT8_INSTALL_DIR}/resnet101")
inference_analysis_python_api_int8_test(test_slim_int8_resnet101 ${INT8_RESNET101_MODEL_DIR} ${IMAGENET_DATA_PATH} ${INT8_IC_TEST_FILE_PATH})
# vgg16 int8
set(INT8_VGG16_MODEL_DIR "${INT8_INSTALL_DIR}/vgg16")
inference_analysis_python_api_int8_test(test_slim_int8_vgg16 ${INT8_VGG16_MODEL_DIR} ${IMAGENET_DATA_PATH} ${INT8_IC_TEST_FILE_PATH})
# vgg19 int8
set(INT8_VGG19_MODEL_DIR "${INT8_INSTALL_DIR}/vgg19")
inference_analysis_python_api_int8_test(test_slim_int8_vgg19 ${INT8_VGG19_MODEL_DIR} ${IMAGENET_DATA_PATH} ${INT8_IC_TEST_FILE_PATH})
endif()
#### QUANT & INT8 comparison python api tests
......
version: 1.0
pruners:
pruner_1:
class: 'StructurePruner'
pruning_axis:
'*': 0
criterions:
'*': 'l1_norm'
controllers:
sa_controller:
class: 'SAController'
reduce_rate: 0.9
init_temperature: 1024
max_iter_number: 300
strategies:
auto_pruning_strategy:
class: 'AutoPruneStrategy'
pruner: 'pruner_1'
controller: 'sa_controller'
start_epoch: 0
end_epoch: 2
max_ratio: 0.7
min_ratio: 0.5
pruned_params: '.*_sep_weights'
metric_name: 'acc_top5'
compressor:
epoch: 2
checkpoint_path: './checkpoints_auto_pruning/'
strategies:
- auto_pruning_strategy
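# Hedged usage note (not part of the original diff): a config like the one
# above was consumed through the slim Compressor; the exact call names are
# assumptions based on the removed API:
#   compressor = Compressor(place, scope, train_program, ...)
#   compressor.config('./auto_prune/compress.yaml')
#   compressor.run()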
version: 1.0
compressor:
epoch: 1
checkpoint_path: './checkpoints/'
#start_epoch: The 'on_epoch_begin' function will be called in start_epoch. default: 0.
#end_epoch: The 'on_epoch_end' function will be called in end_epoch. default: 10.
#delta_rate: The delta used to generate ratios when calculating sensitivities.
#target_ratio: The flops ratio to be pruned from current model.
#metric_name: The metric used to evaluate the model.
#pruned_params: The pattern str to match the parameter names to be pruned.
#sensitivities_file: The sensitivities file.
#num_steps: The number of pruning steps.
#eval_rate: The rate of sampled data used to calculate sensitivities.
version: 1.0
pruners:
pruner_1:
class: 'StructurePruner'
pruning_axis:
'*': 0
criterions:
'*': 'l1_norm'
strategies:
sensitive_pruning_strategy:
class: 'SensitivePruneStrategy'
pruner: 'pruner_1'
start_epoch: 0
delta_rate: 0.1
target_ratio: 0.3
num_steps: 1
eval_rate: 0.5
pruned_params: '.*_sep_weights'
sensitivities_file: 'mobilenet_acc_top1_sensitive.data'
metric_name: 'acc_top1'
compressor:
epoch: 120
checkpoint_path: './checkpoints/'
strategies:
- sensitive_pruning_strategy
#start_epoch(int): The epoch at which to merge the student graph and the teacher graph
#                  for distillation training. default: 0
#
#end_epoch(int): The epoch at which distillation training finishes. default: 0
#
#student_feature_map(str): The name of feature map from student network.
#
#teacher_feature_map(str): The name of feature map from teacher network.
#                          Its shape should be the same as that of the student network.
#
#student_pairs(list<tuple>): Each tuple, with two variable names, in student_pairs indicates
# a section in student network. The variables in a tuple should
# have the same feature map size.
#
#teacher_pairs(list<tuple>): Each tuple, with two variable names, in teacher_pairs indicates
#                            a section in teacher network. The variables in a tuple should
#                            have the same feature map size. The variable named teacher_pairs[i][j]
#                            should have the same channel number as the variable named
#                            student_pairs[i][j].
#
#distillation_loss_weight(float): The weight of the loss.
version: 1.0
distillers:
fsp_distiller:
class: 'FSPDistiller'
# teacher_pairs: [['teacher_depthwise_conv2d_1.tmp_0', 'teacher_conv2d_3.tmp_0']]
# student_pairs: [['student_depthwise_conv2d_1.tmp_0', 'student_conv2d_3.tmp_0']]
teacher_pairs: [['teacher_conv2_1_dw.tmp_0', 'teacher_conv1.tmp_0']]
student_pairs: [['student_conv2_1_dw.tmp_0', 'student_conv1.tmp_0']]
distillation_loss_weight: 1
l2_distiller:
class: 'L2Distiller'
teacher_feature_map: 'teacher.tmp_1'
student_feature_map: 'student.tmp_1'
distillation_loss_weight: 1
soft_label_distiller:
class: 'SoftLabelDistiller'
student_temperature: 1.0
teacher_temperature: 1.0
teacher_feature_map: 'teacher.tmp_2'
student_feature_map: 'student.tmp_2'
distillation_loss_weight: 0.001
strategies:
distillation_strategy:
class: 'DistillationStrategy'
distillers: ['fsp_distiller', 'l2_distiller', 'soft_label_distiller']
start_epoch: 0
end_epoch: 1
compressor:
epoch: 1
checkpoint_path: './distillation_checkpoints/'
strategies:
- distillation_strategy
#start_epoch: The 'on_epoch_begin' function will be called in start_epoch. default: 0.
#end_epoch: The 'on_epoch_end' function will be called in end_epoch. default: 10.
#delta_rate: The delta used to generate ratios when calculating sensitivities.
#target_ratio: The flops ratio to be pruned from current model.
#metric_name: The metric used to evaluate the model.
#pruned_params: The pattern str to match the parameter names to be pruned.
#sensitivities_file: The sensitivities file.
#num_steps: The number of pruning steps.
#eval_rate: The rate of sampled data used to calculate sensitivities.
version: 1.0
pruners:
pruner_1:
class: 'StructurePruner'
pruning_axis:
'*': 0
criterions:
'*': 'l1_norm'
strategies:
sensitive_pruning_strategy:
class: 'SensitivePruneStrategy'
pruner: 'pruner_1'
start_epoch: 1
delta_rate: 0.2
target_ratio: 0.08
num_steps: 1
eval_rate: 0.5
pruned_params: '_conv6_sep_weights'
sensitivities_file: 'mobilenet_acc_top1_sensitive.data'
metric_name: 'acc_top1'
compressor:
epoch: 2
checkpoint_path: './checkpoints_pruning/'
strategies:
- sensitive_pruning_strategy
version: 1.0
pruners:
pruner_1:
class: 'StructurePruner'
pruning_axis:
'*': 0
criterions:
'*': 'l1_norm'
strategies:
uniform_pruning_strategy:
class: 'UniformPruneStrategy'
pruner: 'pruner_1'
start_epoch: 0
target_ratio: 0.5
pruned_params: 'conv.*'
metric_name: 'acc_top1'
compressor:
epoch: 2
checkpoint_path: './checkpoints_uniform_restore_tmp/'
strategies:
- uniform_pruning_strategy
version: 1.0
pruners:
pruner_1:
class: 'StructurePruner'
pruning_axis:
'*': 0
criterions:
'*': 'l1_norm'
strategies:
uniform_pruning_strategy:
class: 'UniformPruneStrategy'
pruner: 'pruner_1'
start_epoch: 0
target_ratio: 0.5
pruned_params: 'conv.*'
metric_name: 'acc_top1'
compressor:
epoch: 1
checkpoint_path: './checkpoints_uniform_restore/'
strategies:
- uniform_pruning_strategy
version: 1.0
pruners:
pruner_1:
class: 'StructurePruner'
pruning_axis:
'*': 0
criterions:
'*': 'l1_norm'
strategies:
uniform_pruning_strategy:
class: 'UniformPruneStrategy'
pruner: 'pruner_1'
start_epoch: 0
target_ratio: 0.5
pruned_params: 'conv.*'
metric_name: 'acc_top1'
compressor:
epoch: 2
checkpoint_path: './checkpoints_uniform_restore/'
strategies:
- uniform_pruning_strategy
version: 1.0
controllers:
sa_controller:
class: 'SAController'
reduce_rate: 0.9
init_temperature: 1024
max_iter_number: 300
strategies:
light_nas_strategy:
class: 'LightNASStrategy'
controller: 'sa_controller'
target_flops: 629145600
target_latency: 1
end_epoch: 2
retrain_epoch: 1
metric_name: 'acc_top1'
is_server: 1
max_client_num: 100
search_steps: 2
compressor:
epoch: 2
strategies:
- light_nas_strategy
# Copyright (c) 2019 PaddlePaddle Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
from paddle.fluid.contrib.slim.nas import SearchSpace
from light_nasnet import LightNASNet
import paddle.fluid as fluid
import paddle
import json
import math
import random
IMAGENET1000 = 1281167  # number of images in the ImageNet-1k train set
total_images = IMAGENET1000
lr = 0.1
num_epochs = 1
batch_size = 256
lr_strategy = "cosine_decay"
l2_decay = 4e-5
momentum_rate = 0.9
image_shape = [1, 28, 28]
__all__ = ['LightNASSpace']
NAS_FILTER_SIZE = [[18, 24, 30], [24, 32, 40], [48, 64, 80], [72, 96, 120],
[120, 160, 192]]
NAS_LAYERS_NUMBER = [[1, 2, 3], [2, 3, 4], [3, 4, 5], [2, 3, 4], [2, 3, 4]]
NAS_KERNEL_SIZE = [3, 5]
NAS_FILTERS_MULTIPLIER = [3, 4, 5, 6]
NAS_SHORTCUT = [0, 1]
NAS_SE = [0, 1]
def get_bottleneck_params_list(var):
"""Get bottleneck_params_list from var.
Args:
var: list, variable list.
Returns:
list, bottleneck_params_list.
"""
params_list = [
1, 16, 1, 1, 3, 1, 0, \
6, 24, 2, 2, 3, 1, 0, \
6, 32, 3, 2, 3, 1, 0, \
6, 64, 4, 2, 3, 1, 0, \
6, 96, 3, 1, 3, 1, 0, \
6, 160, 3, 2, 3, 1, 0, \
6, 320, 1, 1, 3, 1, 0, \
]
for i in range(5):
params_list[i * 7 + 7] = NAS_FILTERS_MULTIPLIER[var[i * 6]]
params_list[i * 7 + 8] = NAS_FILTER_SIZE[i][var[i * 6 + 1]]
params_list[i * 7 + 9] = NAS_LAYERS_NUMBER[i][var[i * 6 + 2]]
params_list[i * 7 + 11] = NAS_KERNEL_SIZE[var[i * 6 + 3]]
params_list[i * 7 + 12] = NAS_SHORTCUT[var[i * 6 + 4]]
params_list[i * 7 + 13] = NAS_SE[var[i * 6 + 5]]
return params_list
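# Worked example (comment only, not in the original diff): for the first
# searched block, var[0:6] = [0, 1, 2, 0, 1, 0] rewrites the second row of
# params_list to expansion 3, 24 filters, 3 layers, stride kept at 2,
# kernel size 3, shortcut on, SE off.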
class LightNASSpace(SearchSpace):
def __init__(self):
super(LightNASSpace, self).__init__()
def init_tokens(self):
"""Get init tokens in search space.
"""
return [
0, 1, 2, 0, 1, 0, 0, 2, 1, 1, 1, 0, 3, 2, 0, 1, 1, 0, 3, 1, 0, 0, 1,
0, 3, 2, 2, 1, 1, 0
]
def range_table(self):
"""Get range table of current search space.
"""
        # Per block: [NAS_FILTERS_MULTIPLIER, NAS_FILTER_SIZE, NAS_LAYERS_NUMBER, NAS_KERNEL_SIZE, NAS_SHORTCUT, NAS_SE]
return [
4, 3, 3, 2, 2, 2, 4, 3, 3, 2, 2, 2, 4, 3, 3, 2, 2, 2, 4, 3, 3, 2, 2,
2, 4, 3, 3, 2, 2, 2
]
def get_model_latency(self, program):
"""Get model latency according to program.
Returns a random number since it's only for testing.
Args:
program(Program): The program to get latency.
Return:
(float): model latency.
"""
return random.randint(1, 2)
def create_net(self, tokens=None):
"""Create a network for training by tokens.
"""
if tokens is None:
tokens = self.init_tokens()
bottleneck_params_list = get_bottleneck_params_list(tokens)
startup_prog = fluid.Program()
train_prog = fluid.Program()
test_prog = fluid.Program()
train_py_reader, train_cost, train_acc1, train_acc5, global_lr = build_program(
is_train=True,
main_prog=train_prog,
startup_prog=startup_prog,
bottleneck_params_list=bottleneck_params_list)
test_py_reader, test_cost, test_acc1, test_acc5 = build_program(
is_train=False,
main_prog=test_prog,
startup_prog=startup_prog,
bottleneck_params_list=bottleneck_params_list)
test_prog = test_prog.clone(for_test=True)
        train_batch_size = batch_size // 1  # per-device batch size; single device here
test_batch_size = batch_size
train_reader = paddle.batch(
paddle.dataset.mnist.train(),
batch_size=train_batch_size,
drop_last=True)
test_reader = paddle.batch(
paddle.dataset.mnist.test(), batch_size=test_batch_size)
with fluid.program_guard(train_prog, startup_prog):
train_py_reader.decorate_paddle_reader(train_reader)
with fluid.program_guard(test_prog, startup_prog):
test_py_reader.decorate_paddle_reader(test_reader)
return startup_prog, train_prog, test_prog, (
train_cost, train_acc1, train_acc5,
global_lr), (test_cost, test_acc1,
test_acc5), train_py_reader, test_py_reader
def build_program(is_train,
main_prog,
startup_prog,
bottleneck_params_list=None):
with fluid.program_guard(main_prog, startup_prog):
py_reader = fluid.layers.py_reader(
capacity=16,
shapes=[[-1] + image_shape, [-1, 1]],
lod_levels=[0, 0],
dtypes=["float32", "int64"],
use_double_buffer=False)
with fluid.unique_name.guard():
image, label = fluid.layers.read_file(py_reader)
model = LightNASNet()
avg_cost, acc_top1, acc_top5 = net_config(
image,
label,
model,
class_dim=10,
bottleneck_params_list=bottleneck_params_list,
scale_loss=1.0)
avg_cost.persistable = True
acc_top1.persistable = True
acc_top5.persistable = True
if is_train:
params = model.params
params["total_images"] = total_images
params["lr"] = lr
params["num_epochs"] = num_epochs
params["learning_strategy"]["batch_size"] = batch_size
params["learning_strategy"]["name"] = lr_strategy
params["l2_decay"] = l2_decay
params["momentum_rate"] = momentum_rate
optimizer = optimizer_setting(params)
optimizer.minimize(avg_cost)
global_lr = optimizer._global_learning_rate()
if is_train:
return py_reader, avg_cost, acc_top1, acc_top5, global_lr
else:
return py_reader, avg_cost, acc_top1, acc_top5
def net_config(image,
label,
model,
class_dim=1000,
bottleneck_params_list=None,
scale_loss=1.0):
bottleneck_params_list = [
bottleneck_params_list[i:i + 7]
for i in range(0, len(bottleneck_params_list), 7)
]
out = model.net(input=image,
bottleneck_params_list=bottleneck_params_list,
class_dim=class_dim)
cost, pred = fluid.layers.softmax_with_cross_entropy(
out, label, return_softmax=True)
if scale_loss > 1:
avg_cost = fluid.layers.mean(x=cost) * float(scale_loss)
else:
avg_cost = fluid.layers.mean(x=cost)
acc_top1 = fluid.layers.accuracy(input=pred, label=label, k=1)
acc_top5 = fluid.layers.accuracy(input=pred, label=label, k=5)
return avg_cost, acc_top1, acc_top5
def optimizer_setting(params):
"""optimizer setting.
Args:
params: dict, params.
"""
ls = params["learning_strategy"]
l2_decay = params["l2_decay"]
momentum_rate = params["momentum_rate"]
if ls["name"] == "piecewise_decay":
if "total_images" not in params:
total_images = IMAGENET1000
else:
total_images = params["total_images"]
batch_size = ls["batch_size"]
step = int(total_images / batch_size + 1)
bd = [step * e for e in ls["epochs"]]
base_lr = params["lr"]
        lr = [base_lr * (0.1**i) for i in range(len(bd) + 1)]
optimizer = fluid.optimizer.Momentum(
learning_rate=fluid.layers.piecewise_decay(
boundaries=bd, values=lr),
momentum=momentum_rate,
regularization=fluid.regularizer.L2Decay(l2_decay))
elif ls["name"] == "cosine_decay":
if "total_images" not in params:
total_images = IMAGENET1000
else:
total_images = params["total_images"]
batch_size = ls["batch_size"]
step = int(total_images / batch_size + 1)
lr = params["lr"]
num_epochs = params["num_epochs"]
optimizer = fluid.optimizer.Momentum(
learning_rate=fluid.layers.cosine_decay(
learning_rate=lr, step_each_epoch=step, epochs=num_epochs),
momentum=momentum_rate,
regularization=fluid.regularizer.L2Decay(l2_decay))
elif ls["name"] == "cosine_warmup_decay":
if "total_images" not in params:
total_images = IMAGENET1000
else:
total_images = params["total_images"]
batch_size = ls["batch_size"]
l2_decay = params["l2_decay"]
momentum_rate = params["momentum_rate"]
step = int(math.ceil(float(total_images) / batch_size))
lr = params["lr"]
num_epochs = params["num_epochs"]
optimizer = fluid.optimizer.Momentum(
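            # NOTE: cosine_decay_with_warmup is not defined or imported in
            # this file; it is assumed to be provided by the caller's utilities.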
learning_rate=cosine_decay_with_warmup(
learning_rate=lr, step_each_epoch=step, epochs=num_epochs),
momentum=momentum_rate,
regularization=fluid.regularizer.L2Decay(l2_decay))
elif ls["name"] == "linear_decay":
if "total_images" not in params:
total_images = IMAGENET1000
else:
total_images = params["total_images"]
batch_size = ls["batch_size"]
num_epochs = params["num_epochs"]
start_lr = params["lr"]
end_lr = 0
total_step = int((total_images / batch_size) * num_epochs)
lr = fluid.layers.polynomial_decay(
start_lr, total_step, end_lr, power=1)
optimizer = fluid.optimizer.Momentum(
learning_rate=lr,
momentum=momentum_rate,
regularization=fluid.regularizer.L2Decay(l2_decay))
elif ls["name"] == "adam":
lr = params["lr"]
optimizer = fluid.optimizer.Adam(learning_rate=lr)
else:
lr = params["lr"]
optimizer = fluid.optimizer.Momentum(
learning_rate=lr,
momentum=momentum_rate,
regularization=fluid.regularizer.L2Decay(l2_decay))
return optimizer
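# Hedged example (not part of the original diff): resolving a piecewise_decay
# schedule with this helper; all values below are illustrative.
if __name__ == '__main__':
    example_params = {
        "lr": 0.1,
        "l2_decay": 4e-5,
        "momentum_rate": 0.9,
        "total_images": 1281167,
        "num_epochs": 120,
        "learning_strategy": {
            "name": "piecewise_decay",
            "batch_size": 256,
            "epochs": [30, 60, 90],
        },
    }
    opt = optimizer_setting(example_params)  # lr: 0.1 -> 0.01 -> 0.001 -> 1e-4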
#start_epoch(int): The epoch to insert quantization operators. default: 0
#
#end_epoch(int): The epoch to save inference model. default: 0
#
#float_model_save_path(str): The path to save model with float weights.
# None means it doesn't save float model. default: None.
#
#mobile_model_save_path(str): The path to save model for paddle-mobile execution.
# None means it doesn't save mobile model. default: None.
#
#int8_model_save_path(str): The path to save model with int8_t weight.
# None means it doesn't save int8 model. default: None.
#
#activation_bits(int): quantization bit number for activation. default: 8.
#
#weight_bits(int): quantization bit number for weights. The bias is not quantized.
# default: 8.
#
#activation_quantize_type(str): quantization type for activation,
# now support 'abs_max', 'range_abs_max' and 'moving_average_abs_max'.
# If use 'abs_max' mode, the quantization scale will be calculated
# dynamically each step in both training and testing period. If use
# 'range_abs_max', a static quantization scale will be calculated
# during training and used in inference.
#
#save_in_nodes(list<str>): A list of variable names used to prune graph
# for saving inference model.
#
#save_out_nodes(list<str>): A list of variable names used to prune graph
# for saving inference model.
version: 1.0
strategies:
quantization_strategy:
class: 'QuantizationStrategy'
start_epoch: 0
end_epoch: 0
float_model_save_path: './output/float'
mobile_model_save_path: './output/mobile'
int8_model_save_path: './output/int8'
weight_bits: 8
activation_bits: 8
weight_quantize_type: 'abs_max'
activation_quantize_type: 'abs_max'
save_in_nodes: ['image']
save_out_nodes: ['quan.tmp_2']
compressor:
epoch: 1
checkpoint_path: './checkpoints_quan/'
strategies:
- quantization_strategy
#start_epoch(int): The epoch to insert quantization operators. default: 0
#
#end_epoch(int): The epoch to save inference model. default: 0
#
#float_model_save_path(str): The path to save model with float weights.
# None means it doesn't save float model. default: None.
#
#mobile_model_save_path(str): The path to save model for paddle-mobile execution.
# None means it doesn't save mobile model. default: None.
#
#int8_model_save_path(str): The path to save model with int8_t weight.
# None means it doesn't save int8 model. default: None.
#
#activation_bits(int): quantization bit number for activation. default: 8.
#
#weight_bits(int): quantization bit number for weights. The bias is not quantized.
# default: 8.
#
#activation_quantize_type(str): quantization type for activation,
# now support 'abs_max', 'range_abs_max' and 'moving_average_abs_max'.
# If use 'abs_max' mode, the quantization scale will be calculated
# dynamically each step in both training and testing period. If use
# 'range_abs_max', a static quantization scale will be calculated
# during training and used in inference.
#
#save_in_nodes(list<str>): A list of variable names used to prune graph
# for saving inference model.
#
#save_out_nodes(list<str>): A list of variable names used to prune graph
# for saving inference model.
version: 1.0
strategies:
quantization_strategy:
class: 'QuantizationStrategy'
start_epoch: 0
end_epoch: 0
float_model_save_path: './output/float'
mobile_model_save_path: './output/mobile'
int8_model_save_path: './output/int8'
weight_bits: 8
activation_bits: 8
weight_quantize_type: 'abs_max'
activation_quantize_type: 'abs_max'
save_in_nodes: ['image']
save_out_nodes: ['quan.tmp_2']
compressor:
epoch: 2
checkpoint_path: './checkpoints_quan/'
strategies:
- quantization_strategy
......@@ -166,14 +166,8 @@ packages=['paddle',
'paddle.fluid.contrib.quantize',
'paddle.fluid.contrib.reader',
'paddle.fluid.contrib.slim',
'paddle.fluid.contrib.slim.core',
'paddle.fluid.contrib.slim.graph',
'paddle.fluid.contrib.slim.prune',
'paddle.fluid.contrib.slim.quantization',
'paddle.fluid.contrib.slim.quantization.imperative',
'paddle.fluid.contrib.slim.distillation',
'paddle.fluid.contrib.slim.nas',
'paddle.fluid.contrib.slim.searcher',
'paddle.fluid.contrib.utils',
'paddle.fluid.contrib.extend_optimizer',
'paddle.fluid.contrib.mixed_precision',
......