Commit 783b823a authored by chenzomi

add mindspore hub for downloading ckpt files

add mindspore.hub and change model_zoo
Parent e62137f7
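For context, this is roughly how the new API is meant to be called once the module ships as mindspore.hub (a minimal sketch; the LeNet5 import path, constructor arguments, and version string are placeholders based on the model_zoo layout referenced elsewhere in this commit, not something this commit defines):

    import mindspore.hub as hub
    from model_zoo.official.cv.lenet.src.lenet import LeNet5  # hypothetical model zoo import

    net = LeNet5(num_class=10)  # any mindspore.nn.Cell works
    # Downloads the matching checkpoint into the local cache and loads it into net in place.
    hub.load_weights(net, network_name='lenet',
                     **{'device_target': 'ascend', 'dataset': 'cifar10', 'version': '0.5.0'})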
# Copyright 2020 Huawei Technologies Co., Ltd
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# ============================================================================
"""
hub for loading models:
Users can load pre-trained models using mindspore.hub.load() API.
"""
import os
import re
import shutil
import tarfile
import hashlib
from urllib.request import urlretrieve
from urllib.error import HTTPError, URLError
import requests
from bs4 import BeautifulSoup
import mindspore
import mindspore.nn as nn
from mindspore import log as logger
from mindspore.train.serialization import load_checkpoint, load_param_into_net

DOWNLOAD_BASIC_URL = "http://download.mindspore.cn/model_zoo"
OFFICIAL_NAME = "official"
DEFAULT_CACHE_DIR = '~/.cache'
MODEL_TARGET_CV = ['alexnet', 'fasterrcnn', 'googlenet',
                   'lenet', 'resnet', 'ssd', 'vgg', 'yolo']
MODEL_TARGET_NLP = ['bert', 'mass', 'transformer']


def _packing_targz(output_filename, savepath="./"):
    """
    Packing the given savepath into output_filename as a tar.gz archive.
    """
    try:
        with tarfile.open(output_filename, "w:gz") as tar:
            tar.add(savepath, arcname=os.path.basename(savepath))
    except Exception as e:
        raise OSError("Cannot tar file {} for - {}".format(output_filename, e))


def _unpacking_targz(input_filename, savepath="./"):
    """
    Unpacking the input_filename archive into savepath.
    """
    try:
        with tarfile.open(input_filename) as tar:
            tar.extractall(path=savepath)
    except Exception as e:
        raise OSError("Cannot untar file {} for - {}".format(input_filename, e))


def _remove_path_if_exists(path):
    if os.path.exists(path):
        if os.path.isfile(path):
            os.remove(path)
        else:
            shutil.rmtree(path)


def _create_path_if_not_exists(path):
    """Create directory `path` if needed; replace it if a plain file occupies the name."""
    if os.path.isfile(path):
        os.remove(path)
    if not os.path.isdir(path):
        os.makedirs(path)


def _get_weights_file(url, hash_md5=None, savepath='./'):
    """
    Download the checkpoint tarball from the given url and unpack it.

    Args:
        url (string): url of the checkpoint tar.gz file.
        hash_md5 (string): expected md5 of the checkpoint file.
        savepath (string): directory the checkpoint is downloaded and unpacked into.

    Returns:
        string, path of the directory the checkpoint archive was unpacked into.
    """
    def reporthook(blocknum, blocksize, totalsize):
        """Print a simple progress bar while downloading."""
        percent = min(blocknum * blocksize * 100.0 / totalsize, 100.0)
        bar = int(percent / 100 * 70) * '#'
        show_str = ('[%%-%ds]' % 70) % bar
        print("\rDownloading:", show_str, " %5.1f%%" % percent, end="")

    def md5sum(file_name, hash_md5):
        """Check whether the md5 of file_name matches hash_md5."""
        md5 = hashlib.md5()
        with open(file_name, 'rb') as fp:
            md5.update(fp.read())
        return md5.hexdigest() == hash_md5

    _create_path_if_not_exists(savepath)
    ckpt_name = os.path.basename(url.split("/")[-1])
    file_path = os.path.join(savepath, ckpt_name)
    # the tarball is expected to unpack into a directory named after itself
    # (mirroring how _packing_targz builds the archive)
    extract_path = file_path[:-7] if file_path.endswith(".tar.gz") else file_path

    # identify whether the file already exists
    if os.path.isfile(file_path):
        if hash_md5 and md5sum(file_path, hash_md5):
            print('File already exists!')
            return extract_path
        # stale download: remove the tarball and its extracted directory
        _remove_path_if_exists(extract_path)
        _remove_path_if_exists(file_path)

    # download the checkpoint file
    print('Downloading data from url {}'.format(url))
    try:
        urlretrieve(url, file_path, reporthook=reporthook)
    except HTTPError as e:
        raise Exception(e.code, e.msg, url)
    except URLError as e:
        raise Exception(e.errno, e.reason, url)
    print('\nDownload finished!')

    # untar file_path into savepath
    _unpacking_targz(file_path, savepath)

    # report the size of the downloaded tarball in MB
    filesize = os.path.getsize(file_path)
    print('File size = %.2f Mb' % (filesize / 1024 / 1024))
    return extract_path
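
# Illustration only (not shipped by this commit): _get_weights_file is normally
# driven by load_weights() below, but a direct call would look roughly like the
# following, where the url is a hypothetical placeholder that merely follows the
# naming scheme used in load_weights():
#
#   ckpt_dir = _get_weights_file(
#       DOWNLOAD_BASIC_URL + "/official/cv/lenet_ascend_0.5.0_cifar10_official.tar.gz",
#       hash_md5=None,
#       savepath=os.path.expanduser(DEFAULT_CACHE_DIR))
#   # ckpt_dir is then expected to contain lenet.ckpt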


def _get_url_paths(url, ext='.tar.gz'):
    """Return the urls of all files under `url` whose names end with `ext`."""
    response = requests.get(url)
    response.raise_for_status()
    soup = BeautifulSoup(response.text, 'html.parser')
    parent = [url + node.get('href') for node in soup.find_all('a')
              if node.get('href').endswith(ext)]
    return parent


def _get_file_from_url(base_url, base_name):
    """Return the first file url under base_url whose name starts with base_name."""
    idx = 0
    urls = _get_url_paths(base_url)
    files = [url.split('/')[-1] for url in urls]
    for i, name in enumerate(files):
        # a simple prefix match is intended here
        if name.startswith(base_name):
            idx = i
            break
    return urls[idx]


def load_weights(network, network_name=None, force_reload=True, **kwargs):
    r"""
    Load pretrained weights from the MindSpore model zoo into the given network.

    Args:
        network (Cell): Cell network.
        network_name (string, optional): Network name. If None, it is read from the
            `network_name` attribute of `network`. Default: None.
        force_reload (bool, optional): Whether to force a fresh download unconditionally. Default: True.
        **kwargs (optional): The corresponding kwargs for downloading the model.

            - device_target (string, optional): Runtime device target. Default: 'ascend'.
            - dataset (string, optional): Dataset the network was trained on. Default: 'imagenet'.
            - version (string, optional): MindSpore version of the checkpoint. Default: current version.

    Examples:
        >>> mindspore.hub.load_weights(network, network_name='lenet',
        ...                            **{'device_target': 'ascend', 'dataset': 'cifar10', 'version': 'beta0.5'})
    """
    if not isinstance(network, nn.Cell):
        logger.error("Failed to combine the net and the parameters.")
        msg = "Argument network should be a Cell, but got {}.".format(type(network))
        raise TypeError(msg)

    if network_name is None:
        if hasattr(network, 'network_name'):
            network_name = network.network_name
        else:
            msg = "Should input network name, but got None."
            raise TypeError(msg)

    device_target = kwargs.get('device_target', 'ascend')
    dataset = kwargs.get('dataset', 'imagenet')
    version = kwargs.get('version', mindspore.version.__version__)

    if network_name.split("_")[0] in MODEL_TARGET_CV:
        model_type = "cv"
    elif network_name.split("_")[0] in MODEL_TARGET_NLP:
        model_type = "nlp"
    else:
        raise ValueError("Unsupported network name: {}.".format(network_name))

    download_base_url = "/".join([DOWNLOAD_BASIC_URL, OFFICIAL_NAME, model_type])
    download_file_name = "_".join([network_name, device_target, version, dataset, OFFICIAL_NAME])
    download_url = _get_file_from_url(download_base_url, download_file_name)

    if force_reload:
        ckpt_path = _get_weights_file(download_url, None, os.path.expanduser(DEFAULT_CACHE_DIR))
    else:
        raise ValueError("Loading without force_reload is not supported yet.")

    ckpt_file = os.path.join(ckpt_path, network_name + ".ckpt")
    param_dict = load_checkpoint(ckpt_file)
    load_param_into_net(network, param_dict)
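Since load_weights() falls back to a `network_name` attribute when the argument is omitted, a model zoo network could opt in as sketched below; the class is hypothetical and no network in this commit actually sets the attribute:

    import mindspore.nn as nn

    class TinyNet(nn.Cell):
        """Toy network used only to illustrate attribute-based name lookup."""
        def __init__(self, num_class=10):
            super(TinyNet, self).__init__()
            self.network_name = 'lenet'  # read by load_weights(net) when network_name is None
            self.flatten = nn.Flatten()
            self.fc = nn.Dense(32 * 32 * 3, num_class)

        def construct(self, x):
            return self.fc(self.flatten(x))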
@@ -880,6 +880,8 @@ class DepthwiseConv2d(Cell):
        self.dilation = dilation
        self.group = group
        self.has_bias = has_bias
        self.weight_init = weight_init
        self.bias_init = bias_init
        self.conv = P.DepthwiseConv2dNative(channel_multiplier=1,
                                            kernel_size=self.kernel_size,
                                            pad_mode=self.pad_mode,
......
@@ -48,10 +48,16 @@ class LossMonitor(Callback):
        self.lr_init = lr_init

    def epoch_begin(self, run_context):
        """
        epoch begin
        """
        self.losses = []
        self.epoch_time = time.time()

    def epoch_end(self, run_context):
        """
        epoch end
        """
        cb_params = run_context.original_args()
        epoch_mseconds = (time.time() - self.epoch_time) * 1000
        per_step_mseconds = epoch_mseconds / cb_params.batch_num
@@ -62,9 +68,15 @@ class LossMonitor(Callback):
        print("*" * 60)

    def step_begin(self, run_context):
        """
        step begin
        """
        self.step_time = time.time()

    def step_end(self, run_context):
        """
        step end
        """
        cb_params = run_context.original_args()
        step_mseconds = (time.time() - self.step_time) * 1000
        step_loss = cb_params.net_outputs
......
@@ -20,7 +20,7 @@ import mindspore.context as context
from mindspore import Tensor
from mindspore import nn
from mindspore.train.quant import quant as qat
-from model_zoo.mobilenetv2_quant.src.mobilenetV2 import mobilenetV2
+from model_zoo.official.cv.mobilenetv2_quant.src.mobilenetV2 import mobilenetV2
context.set_context(mode=context.GRAPH_MODE, device_target="GPU")
......