remove create module code and update demo script

5eade5ce · wuzewu · 7bdce56e · 5eade5ce · 5eade5ce · 5eade5ce
49 changed file
--- a/demo/image-classification/README.md
+++ b/demo/image-classification/README.md
-# PaddleHub图像分类迁移
+# PaddleHub 图像分类
-## 关于图像分类
+## 关于
-https://github.com/PaddlePaddle/models/tree/develop/fluid/PaddleCV/image_classification
-## 创建Module
+本示例将展示如何使用PaddleHub Finetune API以及[图像分类](https://github.com/PaddlePaddle/models/tree/develop/fluid/PaddleCV/image_classification)预训练模型完成分类任务。
-本目录包含了创建一个基于ImageNet 2012数据集预训练的图像分类模型(ResNet/MobileNet)的Module的脚本。
-通过以下脚本来一键创建一个ResNet50 Module
+## 准备工作
+在运行本目录的脚本前，需要先安装1.3.0版本以上的PaddlePaddle（如果您本地已经安装了符合条件的PaddlePaddle版本，那么可以跳过`准备工作`这一步）。
+如果您的机器支持GPU，我们建议下载GPU版本的PaddlePaddle，使用GPU进行训练和预测的效率都比使用CPU要高。
 ```shell
-sh create_module.sh
+# 安装GPU版本的PaddlePaddle
+$ pip install --upgrade paddlepaddle-gpu
 ```
-NOTE:
-* 如果进行下面示例的脚本或者代码，请确保执行上述脚本
+如果您的机器不支持GPU，可以通过下面的命令来安装CPU版本的PaddlePaddle
-* 关于创建Module的API和细节，请查看`create_module.py`
-## 使用Module预测
-该Module创建完成后，可以通过命令行或者python API两种方式进行预测
-### 命令行方式
-`infer.sh`给出了使用命令行调用Module预测的示例脚本
-通过以下命令试验下效果
 ```shell
-sh infer.sh
+# 安装CPU版本的PaddlePaddle
+$ pip install --upgrade paddlepaddle
 ```
-### 通过python API
-`infer_by_code.py`给出了使用python API调用Module预测的示例代码
+在安装过程中如果遇到问题，您可以到[Paddle官方网站](http://www.paddlepaddle.org/)上查看解决方案。
-通过以下命令试验下效果
+## 开始Finetune
+在完成安装PaddlePaddle与PaddleHub后，通过执行脚本`sh run_classifier.sh`即可开始使用进行finetune。
+脚本支持的参数如下：
 ```shell
-python infer_by_code.py
+--batch_size: 批处理大小，请结合显存情况进行调整，若出现显存不足，请适当调低这一参数。默认为16
+--num_epoch: finetune迭代的轮数。默认为1
+--module: 使用哪个Module作为finetune的特征提取器，脚本支持{resnet50/resnet101/resnet152/mobilenet/nasnet/pnasnet}等模型。默认为resnet50
+--checkpoint_dir: 模型保存路径，PaddleHub会自动保存验证集上表现最好的模型。默认为paddlehub_finetune_ckpt
+--dataset: 使用什么数据集进行finetune, 脚本支持分别是{flowers/dogcat}。默认为flowers
+--use_gpu: 使用使用GPU进行训练，如果机器支持GPU且安装了GPU版本的PaddlePaddle，我们建议您打开这个开关。默认关闭
 ```
-## 对预训练模型进行Finetune
+## 进行预测
-通过以下命令进行Finetune
+当完成finetune后，finetune过程在验证集上表现最优的模型会被保存在`${CHECKPOINT_DIR}/best_model`目录下，其中`${CHECKPOINT_DIR}`目录为finetune时所选择的保存checkpoint的目录。
+我们使用该模型来进行预测。执行脚本`sh predict.sh`即可开始使用进行预测。
+脚本支持的参数如下：
 ```shell
-sh finetune.sh
+--module: 使用哪个Module作为finetune的特征提取器，脚本支持{resnet50/resnet101/resnet152/mobilenet/nasnet/pnasnet}等模型。默认为resnet50
+--checkpoint_dir: 模型保存路径，PaddleHub会自动保存验证集上表现最好的模型。默认为paddlehub_finetune_ckpt
+--dataset: 使用什么数据集进行finetune, 脚本支持分别是{flowers/dogcat}。默认为flowers
+--use_gpu: 使用使用GPU进行训练，如果本机支持GPU且安装了GPU版本的PaddlePaddle，我们建议您打开这个开关。默认关闭
 ```
-更多关于Finetune的资料，请查看[基于PaddleHub的迁移学习](https://github.com/PaddlePaddle/PaddleHub/blob/develop/docs/transfer_learning_turtorial.md)
+`注意`：进行预测时，所选择的module，checkpoint_dir，dataset必须和finetune所用的一样
--- a/demo/image-classification/img_classifier.py
+++ b/demo/image-classification/img_classifier.py
@@ -7,12 +7,12 @@ import numpy as np
 # yapf: disable
 parser = argparse.ArgumentParser(__doc__)
-parser.add_argument("--target",         type=str,   default="finetune",                 help="Number of epoches for fine-tuning.")
+parser.add_argument("--num_epoch",      type=int,   default=1,                          help="Number of epoches for fine-tuning.")
-parser.add_argument("--num_epoch",      type=int,   default=3,                          help="Number of epoches for fine-tuning.")
+parser.add_argument("--use_gpu",        type=bool,  default=False,                      help="Whether use GPU for fine-tuning.")
-parser.add_argument("--use_gpu",        type=bool,  default=False,                      help="Whether use GPU for finetuning or predict")
+parser.add_argument("--checkpoint_dir", type=str,   default="paddlehub_finetune_ckpt",  help="Path to save log data.")
-parser.add_argument("--checkpoint_dir", type=str,   default="paddlehub_finetune_ckpt",  help="Path to training data.")
 parser.add_argument("--batch_size",     type=int,   default=16,                         help="Total examples' number in batch for training.")
-parser.add_argument("--module",         type=str,   default="resnet50",                 help="Total examples' number in batch for training.")
+parser.add_argument("--module",         type=str,   default="resnet50",                 help="Module used as feature extractor.")
+parser.add_argument("--dataset",        type=str,   default="flowers",                  help="Dataset to finetune.")
 # yapf: enable.
 module_map = {
@@ -25,33 +25,25 @@ module_map = {
 }
-def get_reader(module, dataset=None):
+def finetune(args):
-    return hub.reader.ImageClassificationReader(
+    module = hub.Module(name=args.module)
+    input_dict, output_dict, program = module.context(trainable=True)
+    dataset = hub.dataset.Flowers()
+    data_reader = hub.reader.ImageClassificationReader(
        image_width=module.get_expected_image_width(),
        image_height=module.get_expected_image_height(),
        images_mean=module.get_pretrained_images_mean(),
        images_std=module.get_pretrained_images_std(),
        dataset=dataset)
+    feature_map = output_dict["feature_map"]
+    task = hub.create_img_cls_task(
+        feature=feature_map, num_classes=dataset.num_labels)
-def get_task(module, num_classes):
-    input_dict, output_dict, program = module.context(trainable=True)
-    with fluid.program_guard(program):
-        img = input_dict["image"]
-        feature_map = output_dict["feature_map"]
-        task = hub.create_img_cls_task(
-            feature=feature_map, num_classes=num_classes)
-    return task
-def finetune(args):
-    module = hub.Module(name=args.module)
-    input_dict, output_dict, program = module.context(trainable=True)
-    dataset = hub.dataset.Flowers()
-    data_reader = get_reader(module, dataset)
-    task = get_task(module, dataset.num_labels)
    img = input_dict["image"]
    feed_list = [img.name, task.variable('label').name]
    config = hub.RunConfig(
        use_cuda=args.use_gpu,
        num_epoch=args.num_epoch,
@@ -64,54 +56,6 @@ def finetune(args):
        task, feed_list=feed_list, data_reader=data_reader, config=config)
-def predict(args):
-    module = hub.Module(name=args.module)
-    input_dict, output_dict, program = module.context(trainable=True)
-    data_reader = get_reader(module)
-    task = get_task(module, 5)
-    img = input_dict["image"]
-    feed_list = [img.name]
-    label_map = {
-        0: "roses",
-        1: "tulips",
-        2: "daisy",
-        3: "sunflowers",
-        4: "dandelion"
-    }
-    with fluid.program_guard(task.inference_program()):
-        place = fluid.CUDAPlace(0) if args.use_gpu else fluid.CPUPlace()
-        exe = fluid.Executor(place)
-        pretrained_model_dir = os.path.join(args.checkpoint_dir, "best_model")
-        if not os.path.exists(pretrained_model_dir):
-            hub.logger.error(
-                "pretrained model dir %s didn't exist" % pretrained_model_dir)
-            exit(1)
-        fluid.io.load_persistables(exe, pretrained_model_dir)
-        feeder = fluid.DataFeeder(feed_list=feed_list, place=place)
-        data = ["test/test_img_roses.jpg", "test/test_img_daisy.jpg"]
-        predict_reader = data_reader.data_generator(
-            phase="predict", batch_size=1, data=data)
-        for index, batch in enumerate(predict_reader()):
-            result, = exe.run(
-                feed=feeder.feed(batch), fetch_list=[task.variable('probs')])
-            predict_result = label_map[np.argsort(result[0])[::-1][0]]
-            print("input %i is %s, and the predict result is %s" %
-                  (index, data[index], predict_result))
-def main(args):
-    if args.target == "finetune":
-        finetune(args)
-    elif args.target == "predict":
-        predict(args)
-    else:
-        hub.logger.error("target should in %s" % ["finetune", "predict"])
-        exit(1)
 if __name__ == "__main__":
    args = parser.parse_args()
    if not args.module in module_map:
@@ -119,4 +63,4 @@ if __name__ == "__main__":
        exit(1)
    args.module = module_map[args.module]
-    main(args)
+    finetune(args)
--- a/demo/image-classification/predict.py
+++ b/demo/image-classification/predict.py
+import argparse
+import os
+import paddle.fluid as fluid
+import paddlehub as hub
+import numpy as np
+# yapf: disable
+parser = argparse.ArgumentParser(__doc__)
+parser.add_argument("--use_gpu",        type=bool,  default=False,                      help="Whether use GPU for predict.")
+parser.add_argument("--checkpoint_dir", type=str,   default="paddlehub_finetune_ckpt",  help="Path to save log data.")
+parser.add_argument("--module",         type=str,   default="resnet50",                 help="Module used as a feature extractor.")
+parser.add_argument("--dataset",        type=str,   default="flowers",                  help="Dataset to finetune.")
+# yapf: enable.
+module_map = {
+    "resnet50": "resnet_v2_50_imagenet",
+    "resnet101": "resnet_v2_101_imagenet",
+    "resnet152": "resnet_v2_152_imagenet",
+    "mobilenet": "mobilenet_v2_imagenet",
+    "nasnet": "nasnet_imagenet",
+    "pnasnet": "pnasnet_imagenet"
+}
+def predict(args):
+    if args.dataset == "dogcat":
+        dataset = hub.dataset.DogCat()
+    elif args.dataset == "flowers":
+        dataset = hub.dataset.Flowers()
+    label_map = dataset.label_dict()
+    num_labels = len(label_map)
+    module = hub.Module(name=args.module)
+    input_dict, output_dict, program = module.context()
+    data_reader = hub.reader.ImageClassificationReader(
+        image_width=module.get_expected_image_width(),
+        image_height=module.get_expected_image_height(),
+        images_mean=module.get_pretrained_images_mean(),
+        images_std=module.get_pretrained_images_std(),
+        dataset=None)
+    img = input_dict["image"]
+    feature_map = output_dict["feature_map"]
+    task = hub.create_img_cls_task(feature=feature_map, num_classes=num_labels)
+    img = input_dict["image"]
+    feed_list = [img.name]
+    with fluid.program_guard(task.inference_program()):
+        place = fluid.CUDAPlace(0) if args.use_gpu else fluid.CPUPlace()
+        exe = fluid.Executor(place)
+        pretrained_model_dir = os.path.join(args.checkpoint_dir, "best_model")
+        if not os.path.exists(pretrained_model_dir):
+            hub.logger.error(
+                "pretrained model dir %s didn't exist" % pretrained_model_dir)
+            exit(1)
+        fluid.io.load_persistables(exe, pretrained_model_dir)
+        feeder = fluid.DataFeeder(feed_list=feed_list, place=place)
+        data = ["test/test_img_roses.jpg", "test/test_img_daisy.jpg"]
+        predict_reader = data_reader.data_generator(
+            phase="predict", batch_size=1, data=data)
+        for index, batch in enumerate(predict_reader()):
+            result, = exe.run(
+                feed=feeder.feed(batch), fetch_list=[task.variable('probs')])
+            predict_result = label_map[np.argsort(result[0])[::-1][0]]
+            print("input %i is %s, and the predict result is %s" %
+                  (index, data[index], predict_result))
+if __name__ == "__main__":
+    args = parser.parse_args()
+    if not args.module in module_map:
+        hub.logger.error("module should in %s" % module_map.keys())
+        exit(1)
+    args.module = module_map[args.module]
+    predict(args)
--- a/demo/image-classification/run_classifier.sh
+++ b/demo/image-classification/run_classifier.sh
@@ -28,4 +28,4 @@ done
 export CUDA_VISIBLE_DEVICES=${cuda_visible_devices}
-python -u img_classifier.py --target finetune --use_gpu ${use_gpu} --batch_size ${batch_size} --checkpoint_dir ${checkpoint_dir} --num_epoch ${num_epoch} --module ${module}
+python -u img_classifier.py --use_gpu ${use_gpu} --batch_size ${batch_size} --checkpoint_dir ${checkpoint_dir} --num_epoch ${num_epoch} --module ${module}
--- a/demo/image-classification/run_predict.sh
+++ b/demo/image-classification/run_predict.sh
@@ -22,4 +22,4 @@ done
 export CUDA_VISIBLE_DEVICES=${cuda_visible_devices}
-python -u img_classifier.py --target predict --use_gpu ${use_gpu} --checkpoint_dir ${checkpoint_dir} --module ${module}
+python -u predict.py --use_gpu ${use_gpu} --checkpoint_dir ${checkpoint_dir} --module ${module}
--- a/demo/lac/README.md
+++ b/demo/lac/README.md
-## 关于LAC
+# LAC
-https://github.com/baidu/lac
-## 创建Module
+## 关于
-本目录包含了创建一个基于LAC预训练模型的Module的脚本。
-通过以下脚本来一键创建一个LAC Module
+本示例展示如何使用LAC Module进行预测。
+LAC是中文词法分析模型，可以用于进行中文句子的分词/词性标注/命名实体识别等功能，关于模型的训练细节，请查看[LAC](https://github.com/baidu/lac)
+## 准备工作
+在运行本目录的脚本前，需要先安装1.3.0版本以上的PaddlePaddle（如果您本地已经安装了符合条件的PaddlePaddle版本，那么可以跳过`准备工作`这一步）。
+如果您的机器支持GPU，我们建议下载GPU版本的PaddlePaddle，使用GPU进行训练和预测的效率都比使用CPU要高。
 ```shell
-sh create_module.sh
+# 安装GPU版本的PaddlePaddle
+$ pip install --upgrade paddlepaddle-gpu
 ```
-NOTE:
-* 如果进行下面示例的脚本或者代码，请确保执行上述脚本
-* 关于创建Module的API和细节，请查看`create_module.py`
-## 使用Module预测
+如果您的机器不支持GPU，可以通过下面的命令来安装CPU版本的PaddlePaddle
-该Module创建完成后，可以通过命令行或者python API两种方式进行预测
-### 命令行方式
+```shell
+# 安装CPU版本的PaddlePaddle
+$ pip install --upgrade paddlepaddle
+```
+在安装过程中如果遇到问题，您可以到[Paddle官方网站](http://www.paddlepaddle.org/)上查看解决方案。
+## 命令行方式预测
 `infer.sh`给出了使用命令行调用Module预测的示例脚本
 通过以下命令试验下效果
 ```shell
-sh infer.sh
+$ sh infer.sh
 ```
-### 通过python API
+## 通过python API预测
 `infer_by_code.py`给出了使用python API调用Module预测的示例代码
 通过以下命令试验下效果
 ```shell
 python infer_by_code.py
 ```
--- a/demo/lac/create_module.py
+++ b/demo/lac/create_module.py
-import numpy as np
-import paddle
-import paddle.fluid as fluid
-import reader
-import paddlehub as hub
-import processor
-import os
-from network import lex_net
-def create_module():
-    word_dict_path = "resources/word.dic"
-    label_dict_path = "resources/tag.dic"
-    word_rep_dict_path = "resources/q2b.dic"
-    pretrained_model = "resources/model"
-    word2id_dict = reader.load_reverse_dict(word_dict_path)
-    label2id_dict = reader.load_reverse_dict(label_dict_path)
-    word_rep_dict = reader.load_dict(word_rep_dict_path)
-    word_dict_len = max(map(int, word2id_dict.values())) + 1
-    label_dict_len = max(map(int, label2id_dict.values())) + 1
-    avg_cost, crf_decode, word, target = lex_net(word_dict_len, label_dict_len)
-    place = fluid.CPUPlace()
-    exe = fluid.Executor(place)
-    exe.run(fluid.default_startup_program())
-    # load the lac pretrained model
-    def if_exist(var):
-        return os.path.exists(os.path.join(pretrained_model, var.name))
-    fluid.io.load_vars(exe, pretrained_model, predicate=if_exist)
-    # assets
-    assets = [word_dict_path, label_dict_path, word_rep_dict_path]
-    # create a module and save as lac.hub_module
-    sign = hub.create_signature(
-        name="lexical_analysis",
-        inputs=[word],
-        outputs=[crf_decode],
-        for_predict=True)
-    hub.create_module(
-        sign_arr=[sign],
-        module_dir="lac.hub_module",
-        exe=exe,
-        module_info="resources/module_info.yml",
-        processor=processor.Processor,
-        assets=assets)
-if __name__ == "__main__":
-    create_module()
--- a/demo/lac/create_module.sh
+++ b/demo/lac/create_module.sh
-#!/bin/bash
-set -o nounset
-set -o errexit
-script_path=$(cd `dirname $0`; pwd)
-module_path=lac.hub_module
-if [ -d $script_path/$module_path ]
-then
-    echo "$module_path already existed!"
-    exit 0
-fi
-cd $script_path/resources/
-if [ ! -d senta_model ]
-then
-    sh download.sh
-fi
-cd $script_path/
-python create_module.py
-echo "Successfully create $module_path"
--- a/demo/lac/infer.sh
+++ b/demo/lac/infer.sh
-python ../../paddlehub/commands/hub.py run lac.hub_module/ --signature lexical_analysis --config resources/test/test.yml  --input_file resources/test/test.txt
+python ../../paddlehub/commands/hub.py run lac --input_file test/test.txt
--- a/demo/lac/infer_by_code.py
+++ b/demo/lac/infer_by_code.py
@@ -4,7 +4,7 @@ import paddlehub as hub
 def infer_with_input_text():
    # get lac module
-    lac = hub.Module(module_dir="lac.hub_module")
+    lac = hub.Module(name="lac")
    test_text = ["今天是个好日子", "天气预报说今天要下雨", "下一班地铁马上就要到了"]
@@ -24,14 +24,14 @@ def infer_with_input_text():
 def infer_with_input_file():
    # get lac module
-    lac = hub.Module(module_dir="lac.hub_module")
+    lac = hub.Module(name="lac")
    # get the input keys for signature 'lexical_analysis'
    data_format = lac.processor.data_format(sign_name='lexical_analysis')
    key = list(data_format.keys())[0]
    # parse input file
-    test_file = os.path.join("resources", "test", "test.txt")
+    test_file = os.path.join("test", "test.txt")
    test_text = hub.io.parser.txt_parser.parse(test_file)
    # set input dict

--- a/demo/lac/network.py
+++ b/demo/lac/network.py
-import sys
-import os
-import math
-import paddle.fluid as fluid
-from paddle.fluid.initializer import NormalInitializer
-def lex_net(word_dict_len, label_dict_len):
-    """
-    define the lexical analysis network structure
-    """
-    word_emb_dim = 128
-    grnn_hidden_dim = 256
-    emb_lr = 5
-    crf_lr = 0.2
-    bigru_num = 2
-    init_bound = 0.1
-    IS_SPARSE = True
-    def _bigru_layer(input_feature):
-        """
-        define the bidirectional gru layer
-        """
-        pre_gru = fluid.layers.fc(
-            input=input_feature,
-            size=grnn_hidden_dim * 3,
-            param_attr=fluid.ParamAttr(
-                initializer=fluid.initializer.Uniform(
-                    low=-init_bound, high=init_bound),
-                regularizer=fluid.regularizer.L2DecayRegularizer(
-                    regularization_coeff=1e-4)))
-        gru = fluid.layers.dynamic_gru(
-            input=pre_gru,
-            size=grnn_hidden_dim,
-            param_attr=fluid.ParamAttr(
-                initializer=fluid.initializer.Uniform(
-                    low=-init_bound, high=init_bound),
-                regularizer=fluid.regularizer.L2DecayRegularizer(
-                    regularization_coeff=1e-4)))
-        pre_gru_r = fluid.layers.fc(
-            input=input_feature,
-            size=grnn_hidden_dim * 3,
-            param_attr=fluid.ParamAttr(
-                initializer=fluid.initializer.Uniform(
-                    low=-init_bound, high=init_bound),
-                regularizer=fluid.regularizer.L2DecayRegularizer(
-                    regularization_coeff=1e-4)))
-        gru_r = fluid.layers.dynamic_gru(
-            input=pre_gru_r,
-            size=grnn_hidden_dim,
-            is_reverse=True,
-            param_attr=fluid.ParamAttr(
-                initializer=fluid.initializer.Uniform(
-                    low=-init_bound, high=init_bound),
-                regularizer=fluid.regularizer.L2DecayRegularizer(
-                    regularization_coeff=1e-4)))
-        bi_merge = fluid.layers.concat(input=[gru, gru_r], axis=1)
-        return bi_merge
-    def _net_conf(word, target):
-        """
-        Configure the network
-        """
-        word_embedding = fluid.layers.embedding(
-            input=word,
-            size=[word_dict_len, word_emb_dim],
-            dtype='float32',
-            is_sparse=IS_SPARSE,
-            param_attr=fluid.ParamAttr(
-                learning_rate=emb_lr,
-                name="word_emb",
-                initializer=fluid.initializer.Uniform(
-                    low=-init_bound, high=init_bound)))
-        input_feature = word_embedding
-        for i in range(bigru_num):
-            bigru_output = _bigru_layer(input_feature)
-            input_feature = bigru_output
-        emission = fluid.layers.fc(
-            size=label_dict_len,
-            input=bigru_output,
-            param_attr=fluid.ParamAttr(
-                initializer=fluid.initializer.Uniform(
-                    low=-init_bound, high=init_bound),
-                regularizer=fluid.regularizer.L2DecayRegularizer(
-                    regularization_coeff=1e-4)))
-        crf_cost = fluid.layers.linear_chain_crf(
-            input=emission,
-            label=target,
-            param_attr=fluid.ParamAttr(name='crfw', learning_rate=crf_lr))
-        crf_decode = fluid.layers.crf_decoding(
-            input=emission, param_attr=fluid.ParamAttr(name='crfw'))
-        avg_cost = fluid.layers.mean(x=crf_cost)
-        return avg_cost, crf_decode
-    word = fluid.layers.data(name='word', shape=[1], dtype='int64', lod_level=1)
-    target = fluid.layers.data(
-        name="target", shape=[1], dtype='int64', lod_level=1)
-    avg_cost, crf_decode = _net_conf(word, target)
-    return avg_cost, crf_decode, word, target
--- a/demo/lac/processor.py
+++ b/demo/lac/processor.py
-import paddle
-import paddle.fluid as fluid
-import paddlehub as hub
-import numpy as np
-import os
-import io
-from paddlehub import BaseProcessor
-class Processor(BaseProcessor):
-    def __init__(self, module):
-        self.module = module
-        assets_path = self.module.helper.assets_path()
-        word_dict_path = os.path.join(assets_path, "word.dic")
-        label_dict_path = os.path.join(assets_path, "tag.dic")
-        word_rep_dict_path = os.path.join(assets_path, "q2b.dic")
-        self.id2word_dict = self.load_dict(word_dict_path)
-        self.word2id_dict = self.load_reverse_dict(word_dict_path)
-        self.id2label_dict = self.load_dict(label_dict_path)
-        self.label2id_dict = self.load_reverse_dict(label_dict_path)
-        self.q2b_dict = self.load_dict(word_rep_dict_path)
-    def load_dict(self, dict_path):
-        result_dict = {}
-        for line in io.open(dict_path, "r", encoding='utf8'):
-            terms = line.strip("\n").split("\t")
-            if len(terms) != 2:
-                continue
-            result_dict[terms[0]] = terms[1]
-        return result_dict
-    def load_reverse_dict(self, dict_path):
-        result_dict = {}
-        for line in io.open(dict_path, "r", encoding='utf8'):
-            terms = line.strip("\n").split("\t")
-            if len(terms) != 2:
-                continue
-            result_dict[terms[1]] = terms[0]
-        return result_dict
-    def preprocess(self, sign_name, data_dict):
-        result = {'text': []}
-        for sentence in data_dict['text']:
-            result_i = {}
-            result_i['origin'] = sentence
-            line = sentence.strip()
-            word_idx = []
-            for word in line:
-                if ord(word) < 0x20:
-                    word = ' '
-                if word in self.q2b_dict:
-                    word = self.q2b_dict[word]
-                if word in self.word2id_dict:
-                    word_idx.append(int(self.word2id_dict[word]))
-                else:
-                    word_idx.append(int(self.word2id_dict["OOV"]))
-            result_i['attach'] = line
-            result_i['processed'] = [x for x in word_idx]
-            result['text'].append(result_i)
-        return result
-    def postprocess(self, sign_name, data_out, data_info, **kwargs):
-        if sign_name == "lexical_analysis":
-            result = []
-            crf_decode = data_out[0]
-            lod_info = (crf_decode.lod())[0]
-            np_data = np.array(crf_decode)
-            for index in range(len(lod_info) - 1):
-                seg_result = {"word": [], "tag": []}
-                word_index = 0
-                outstr = ""
-                offset = 0
-                cur_full_word = ""
-                cur_full_tag = ""
-                words = data_info['text'][index]['attach']
-                for tag_index in range(lod_info[index], lod_info[index + 1]):
-                    cur_word = words[word_index]
-                    cur_tag = self.id2label_dict[str(np_data[tag_index][0])]
-                    if cur_tag.endswith("-B") or cur_tag.endswith("O"):
-                        if len(cur_full_word) != 0:
-                            seg_result['word'].append(cur_full_word)
-                            seg_result['tag'].append(cur_full_tag)
-                        cur_full_word = cur_word
-                        cur_full_tag = self.get_real_tag(cur_tag)
-                    else:
-                        cur_full_word += cur_word
-                    word_index += 1
-                seg_result['word'].append(cur_full_word)
-                seg_result['tag'].append(cur_full_tag)
-                result.append(seg_result)
-            return result
-    def get_real_tag(self, origin_tag):
-        if origin_tag == "O":
-            return "O"
-        return origin_tag[0:len(origin_tag) - 2]
-    def data_format(self, sign_name):
-        if sign_name == "lexical_analysis":
-            return {
-                "text": {
-                    "type": hub.DataType.TEXT,
-                    "feed_key": self.module.signatures[sign_name].inputs[0].name
-                }
-            }
-        return None
--- a/demo/lac/reader.py
+++ b/demo/lac/reader.py
-"""
-The file_reader converts raw corpus to input.
-"""
-import os
-import __future__
-import io
-def file_reader(file_dir,
-                word2id_dict,
-                label2id_dict,
-                word_replace_dict,
-                filename_feature=""):
-    """
-    define the reader to read files in file_dir
-    """
-    word_dict_len = max(map(int, word2id_dict.values())) + 1
-    label_dict_len = max(map(int, label2id_dict.values())) + 1
-    def reader():
-        """
-        the data generator
-        """
-        index = 0
-        for root, dirs, files in os.walk(file_dir):
-            for filename in files:
-                if not filename.startswith(filename_feature):
-                    continue
-                for line in io.open(
-                        os.path.join(root, filename), 'r', encoding='utf8'):
-                    index += 1
-                    bad_line = False
-                    line = line.strip("\n")
-                    if len(line) == 0:
-                        continue
-                    seg_tag = line.rfind("\t")
-                    word_part = line[0:seg_tag]
-                    label_part = line[seg_tag + 1:]
-                    word_idx = []
-                    words = word_part
-                    for word in words:
-                        if ord(word) < 0x20:
-                            word = ' '
-                        if word in word_replace_dict:
-                            word = word_replace_dict[word]
-                        if word in word2id_dict:
-                            word_idx.append(int(word2id_dict[word]))
-                        else:
-                            word_idx.append(int(word2id_dict["OOV"]))
-                    target_idx = []
-                    labels = label_part.strip().split(" ")
-                    for label in labels:
-                        if label in label2id_dict:
-                            target_idx.append(int(label2id_dict[label]))
-                        else:
-                            target_idx.append(int(label2id_dict["O"]))
-                    if len(word_idx) != len(target_idx):
-                        continue
-                    yield word_idx, target_idx
-    return reader
-def test_reader(file_dir,
-                word2id_dict,
-                label2id_dict,
-                word_replace_dict,
-                filename_feature=""):
-    """
-    define the reader to read test files in file_dir
-    """
-    word_dict_len = max(map(int, word2id_dict.values())) + 1
-    label_dict_len = max(map(int, label2id_dict.values())) + 1
-    def reader():
-        """
-        the data generator
-        """
-        index = 0
-        for root, dirs, files in os.walk(file_dir):
-            for filename in files:
-                if not filename.startswith(filename_feature):
-                    continue
-                for line in io.open(
-                        os.path.join(root, filename), 'r', encoding='utf8'):
-                    index += 1
-                    bad_line = False
-                    line = line.strip("\n")
-                    if len(line) == 0:
-                        continue
-                    seg_tag = line.rfind("\t")
-                    if seg_tag == -1:
-                        seg_tag = len(line)
-                    word_part = line[0:seg_tag]
-                    label_part = line[seg_tag + 1:]
-                    word_idx = []
-                    words = word_part
-                    for word in words:
-                        if ord(word) < 0x20:
-                            word = ' '
-                        if word in word_replace_dict:
-                            word = word_replace_dict[word]
-                        if word in word2id_dict:
-                            word_idx.append(int(word2id_dict[word]))
-                        else:
-                            word_idx.append(int(word2id_dict["OOV"]))
-                    yield word_idx, words
-    return reader
-def load_dict(dict_path):
-    """
-    Load a dict. The first column is the key and the second column is the value.
-    """
-    result_dict = {}
-    for line in io.open(dict_path, "r", encoding='utf8'):
-        terms = line.strip("\n").split("\t")
-        if len(terms) != 2:
-            continue
-        result_dict[terms[0]] = terms[1]
-    return result_dict
-def load_reverse_dict(dict_path):
-    """
-    Load a dict. The first column is the value and the second column is the key.
-    """
-    result_dict = {}
-    for line in io.open(dict_path, "r", encoding='utf8'):
-        terms = line.strip("\n").split("\t")
-        if len(terms) != 2:
-            continue
-        result_dict[terms[1]] = terms[0]
-    return result_dict
--- a/demo/lac/resources/customization.dic
+++ b/demo/lac/resources/customization.dic
--- a/demo/lac/resources/download.sh
+++ b/demo/lac/resources/download.sh
-#!/bin/bash
-set -o nounset
-set -o errexit
-script_path=$(cd `dirname $0`; pwd)
-cd $script_path
-wget --no-check-certificate https://paddlehub.bj.bcebos.com/paddle_model/lac.tar.gz
-tar xvzf lac.tar.gz
-rm lac.tar.gz
--- a/demo/lac/resources/module_info.yml
+++ b/demo/lac/resources/module_info.yml
-name: lac
-type: nlp/lexical_analysis
-author: paddlepaddle
-author_email: paddle-dev@baidu.com
-summary: "'Lexical Analysis of Chinese', which abbreviated as LAC, is a model used to process lexical analysis. People can use LAC to process Chinese text segmentation, part-of-speech tagging and named entity recognition"
-version: 1.0.0
--- a/demo/lac/resources/q2b.dic
+++ b/demo/lac/resources/q2b.dic
-、	,
-。	.
-—	-
-～	~
-‖	|
-…	.
-‘	'
-’	'
-“	"
-”	"
-〔	(
-〕	)
-〈	<
-〉	>
-「	'
-」	'
-『	"
-』	"
-〖	[
-〗	]
-【	[
-】	]
-∶	:
-＄	$
-！	!
-＂	"
-＃	#
-％	%
-＆	&
-＇	'
-（	(
-）	)
-＊	*
-＋	+
-，	,
-－	-
-．	.
-／	/
-０	0
-１	1
-２	2
-３	3
-４	4
-５	5
-６	6
-７	7
-８	8
-９	9
-：	:
-；	;
-＜	<
-＝	=
-＞	>
-？	?
-＠	@
-Ａ	a
-Ｂ	b
-Ｃ	c
-Ｄ	d
-Ｅ	e
-Ｆ	f
-Ｇ	g
-Ｈ	h
-Ｉ	i
-Ｊ	j
-Ｋ	k
-Ｌ	l
-Ｍ	m
-Ｎ	n
-Ｏ	o
-Ｐ	p
-Ｑ	q
-Ｒ	r
-Ｓ	s
-Ｔ	t
-Ｕ	u
-Ｖ	v
-Ｗ	w
-Ｘ	x
-Ｙ	y
-Ｚ	z
-［	[
-＼	\
-］	]
-＾	^
-＿	_
-｀	`
-ａ	a
-ｂ	b
-ｃ	c
-ｄ	d
-ｅ	e
-ｆ	f
-ｇ	g
-ｈ	h
-ｉ	i
-ｊ	j
-ｋ	k
-ｌ	l
-ｍ	m
-ｎ	n
-ｏ	o
-ｐ	p
-ｑ	q
-ｒ	r
-ｓ	s
-ｔ	t
-ｕ	u
-ｖ	v
-ｗ	w
-ｘ	x
-ｙ	y
-ｚ	z
-｛	{
-｜	|
-｝	}
-￣	~
-〝	"
-〞	"
-﹐	,
-﹑	,
-﹒	.
-﹔	;
-﹕	:
-﹖	?
-﹗	!
-﹙	(
-﹚	)
-﹛	{
-﹜	{
-﹝	[
-﹞	]
-﹟	#
-﹠	&
-﹡	*
-﹢	+
-﹣	-
-﹤	<
-﹥	>
-﹦	=
-﹨	\
-﹩	$
-﹪	%
-﹫	@
- 	,
-A	a
-B	b
-C	c
-D	d
-E	e
-F	f
-G	g
-H	h
-I	i
-J	j
-K	k
-L	l
-M	m
-N	n
-O	o
-P	p
-Q	q
-R	r
-S	s
-T	t
-U	u
-V	v
-W	w
-X	x
-Y	y
-Z	z
--- a/demo/lac/resources/strong_punc.dic
+++ b/demo/lac/resources/strong_punc.dic
-!
-。
-！
-;
-；
--- a/demo/lac/resources/tag.dic
+++ b/demo/lac/resources/tag.dic
-0	a-B
-1	a-I
-2	ad-B
-3	ad-I
-4	an-B
-5	an-I
-6	c-B
-7	c-I
-8	d-B
-9	d-I
-10	f-B
-11	f-I
-12	m-B
-13	m-I
-14	n-B
-15	n-I
-16	nr-B
-17	nr-I
-18	ns-B
-19	ns-I
-20	nt-B
-21	nt-I
-22	nw-B
-23	nw-I
-24	nz-B
-25	nz-I
-26	p-B
-27	p-I
-28	q-B
-29	q-I
-30	r-B
-31	r-I
-32	s-B
-33	s-I
-34	t-B
-35	t-I
-36	u-B
-37	u-I
-38	v-B
-39	v-I
-40	vd-B
-41	vd-I
-42	vn-B
-43	vn-I
-44	w-B
-45	w-I
-46	xc-B
-47	xc-I
-48	PER-B
-49	PER-I
-50	LOC-B
-51	LOC-I
-52	ORG-B
-53	ORG-I
-54	TIME-B
-55	TIME-I
-56	O
--- a/demo/lac/resources/word.dic
+++ b/demo/lac/resources/word.dic
--- a/demo/lac/resources/test/test.txt
+++ b/demo/lac/resources/test/test.txt
--- a/demo/lac/resources/test/test.yml
+++ b/demo/lac/resources/test/test.yml
--- a/demo/senta/README.md
+++ b/demo/senta/README.md
-## 关于Senta
+# senta
-https://github.com/baidu/Senta
+## 关于
+本示例展示如何使用senta Module进行预测。
+senta是中文情感分析模型，可以用于进行中文句子的情感分析，输出结果为`{正向/中性/负向}`中的一个，关于模型的训练细节，请查看[senta](https://github.com/baidu/senta)
+## 准备工作
+在运行本目录的脚本前，需要先安装1.3.0版本以上的PaddlePaddle（如果您本地已经安装了符合条件的PaddlePaddle版本，那么可以跳过`准备工作`这一步）。
+如果您的机器支持GPU，我们建议下载GPU版本的PaddlePaddle，使用GPU进行训练和预测的效率都比使用CPU要高。
+```shell
+# 安装GPU版本的PaddlePaddle
+$ pip install --upgrade paddlepaddle-gpu
+```
+如果您的机器不支持GPU，可以通过下面的命令来安装CPU版本的PaddlePaddle
-## 创建Module
-本目录包含了创建一个基于senta预训练模型的Module的脚本。
-通过以下脚本来一键创建一个senta Module
 ```shell
-$ sh create_module.sh
+# 安装CPU版本的PaddlePaddle
+$ pip install --upgrade paddlepaddle
 ```
-NOTE:
-* 如果进行下面示例的脚本或者代码，请确保执行上述脚本
-* 关于创建Module的API和细节，请查看`create_module.py`
-## 使用Module预测
+在安装过程中如果遇到问题，您可以到[Paddle官方网站](http://www.paddlepaddle.org/)上查看解决方案。
-该Module创建完成后，可以通过命令行或者python API两种方式进行预测
-### 命令行方式
+## 命令行方式预测
 `infer.sh`给出了使用命令行调用Module预测的示例脚本
 通过以下命令试验下效果
 ```shell
 $ sh infer.sh
 ```
-### 通过python API
+## 通过python API预测
 `infer_by_code.py`给出了使用python API调用Module预测的示例代码
 通过以下命令试验下效果
 ```shell
-$ python infer_by_code.py
+python infer_by_code.py
 ```
--- a/demo/senta/create_module.py
+++ b/demo/senta/create_module.py
-import io
-import paddle.fluid as fluid
-import processor
-import numpy as np
-import nets
-import paddlehub as hub
-def load_vocab(file_path):
-    """
-    load the given vocabulary
-    """
-    vocab = {}
-    with io.open(file_path, 'r', encoding='utf8') as f:
-        wid = 0
-        for line in f:
-            line = line.rstrip()
-            parts = line.split('\t')
-            vocab[parts[0]] = int(parts[1])
-    vocab["<unk>"] = len(vocab)
-    return vocab
-def create_module():
-    network = nets.bilstm_net
-    # word seq data
-    data = fluid.layers.data(
-        name="words", shape=[1], dtype="int64", lod_level=1)
-    # label data
-    label = fluid.layers.data(name="label", shape=[1], dtype="int64")
-    word_dict_path = "./resources/train.vocab"
-    word_dict = load_vocab(word_dict_path)
-    cost, acc, pred = network(data, label, len(word_dict) + 1)
-    place = fluid.CPUPlace()
-    exe = fluid.Executor(place)
-    model_path = "./resources/senta_model"
-    fluid.io.load_inference_model(model_path, exe)
-    # assets
-    assets = [word_dict_path]
-    # create a module
-    sign = hub.create_signature(
-        name="sentiment_classify",
-        inputs=[data],
-        outputs=[pred],
-        for_predict=True)
-    hub.create_module(
-        sign_arr=[sign],
-        module_dir="senta.hub_module",
-        exe=exe,
-        module_info="resources/module_info.yml",
-        processor=processor.Processor,
-        assets=assets)
-if __name__ == "__main__":
-    create_module()
--- a/demo/senta/create_module.sh
+++ b/demo/senta/create_module.sh
-#!/bin/bash
-set -o nounset
-set -o errexit
-script_path=$(cd `dirname $0`; pwd)
-module_path=senta.hub_module
-if [ -d $script_path/$module_path ]
-then
-    echo "$module_path already existed!"
-    exit 0
-fi
-cd $script_path/resources/
-if [ ! -d senta_model ]
-then
-    sh download.sh
-fi
-cd $script_path/
-python create_module.py
-echo "Successfully create $module_path"
--- a/demo/senta/infer.sh
+++ b/demo/senta/infer.sh
-python ../../paddlehub/commands/hub.py run senta.hub_module/ --signature sentiment_classify --config resources/test/test.yml  --input_file resources/test/test.txt
+python ../../paddlehub/commands/hub.py run senta --input_file test/test.txt
--- a/demo/senta/infer_by_code.py
+++ b/demo/senta/infer_by_code.py
@@ -4,7 +4,7 @@ import paddlehub as hub
 def infer_with_input_text():
    # get senta module
-    senta = hub.Module(module_dir="senta.hub_module")
+    senta = hub.Module(name="senta")
    test_text = ["这家餐厅很好吃", "这部电影真的很差劲"]
@@ -24,14 +24,14 @@ def infer_with_input_text():
 def infer_with_input_file():
    # get senta module
-    senta = hub.Module(module_dir="senta.hub_module")
+    senta = hub.Module(name="senta")
    # get the input keys for signature 'sentiment_classify'
    data_format = senta.processor.data_format(sign_name='sentiment_classify')
    key = list(data_format.keys())[0]
    # parse input file
-    test_file = os.path.join("resources", "test", "test.txt")
+    test_file = os.path.join("test", "test.txt")
    test_text = hub.io.parser.txt_parser.parse(test_file)
    # set input dict

--- a/demo/senta/nets.py
+++ b/demo/senta/nets.py
-import paddle.fluid as fluid
-def bilstm_net(data,
-               label,
-               dict_dim,
-               emb_dim=128,
-               hid_dim=128,
-               hid_dim2=96,
-               class_dim=2,
-               emb_lr=30.0):
-    """
-    Bi-Lstm net
-    """
-    # embedding layer
-    emb = fluid.layers.embedding(
-        input=data,
-        size=[dict_dim, emb_dim],
-        param_attr=fluid.ParamAttr(learning_rate=emb_lr))
-    # bi-lstm layer
-    fc0 = fluid.layers.fc(input=emb, size=hid_dim * 4)
-    rfc0 = fluid.layers.fc(input=emb, size=hid_dim * 4)
-    lstm_h, c = fluid.layers.dynamic_lstm(
-        input=fc0, size=hid_dim * 4, is_reverse=False)
-    rlstm_h, c = fluid.layers.dynamic_lstm(
-        input=rfc0, size=hid_dim * 4, is_reverse=True)
-    # extract last layer
-    lstm_last = fluid.layers.sequence_last_step(input=lstm_h)
-    rlstm_last = fluid.layers.sequence_last_step(input=rlstm_h)
-    lstm_last_tanh = fluid.layers.tanh(lstm_last)
-    rlstm_last_tanh = fluid.layers.tanh(rlstm_last)
-    # concat layer
-    lstm_concat = fluid.layers.concat(input=[lstm_last, rlstm_last], axis=1)
-    # full connect layer
-    fc1 = fluid.layers.fc(input=lstm_concat, size=hid_dim2, act='tanh')
-    # softmax layer
-    prediction = fluid.layers.fc(input=fc1, size=class_dim, act='softmax')
-    cost = fluid.layers.cross_entropy(input=prediction, label=label)
-    avg_cost = fluid.layers.mean(x=cost)
-    acc = fluid.layers.accuracy(input=prediction, label=label)
-    return avg_cost, acc, prediction
--- a/demo/senta/processor.py
+++ b/demo/senta/processor.py
-import os
-import io
-import paddle
-import paddle.fluid as fluid
-import numpy as np
-import paddlehub as hub
-def load_vocab(file_path):
-    """
-    load the given vocabulary
-    """
-    vocab = {}
-    with io.open(file_path, 'r', encoding='utf8') as f:
-        wid = 0
-        for line in f:
-            line = line.rstrip()
-            parts = line.split('\t')
-            vocab[parts[0]] = int(parts[1])
-    vocab["<unk>"] = len(vocab)
-    return vocab
-def get_predict_label(pos_prob):
-    neg_prob = 1 - pos_prob
-    # threshold should be (1, 0.5)
-    neu_threshold = 0.55
-    if neg_prob > neu_threshold:
-        label, key = 0, "负面"
-    elif pos_prob > neu_threshold:
-        label, key = 2, "正面"
-    else:
-        label, key = 1, "中性"
-    return label, key
-class Processor(hub.BaseProcessor):
-    def __init__(self, module):
-        self.module = module
-        assets_path = self.module.helper.assets_path()
-        word_dict_path = os.path.join(assets_path, "train.vocab")
-        self.word_dict = load_vocab(word_dict_path)
-        path = hub.default_module_manager.search_module("lac")
-        if path:
-            self.lac = hub.Module(module_dir=path)
-        else:
-            result, _, path = hub.default_module_manager.install_module("lac")
-            assert path, "can't found necessary module lac"
-            self.lac = hub.Module(module_dir=path)
-    def preprocess(self, sign_name, data_dict):
-        result = {'text': []}
-        processed = self.lac.lexical_analysis(data=data_dict)
-        unk_id = len(self.word_dict)
-        for index, data in enumerate(processed):
-            result_i = {'processed': []}
-            result_i['origin'] = data_dict['text'][index]
-            for word in data['word']:
-                if word in self.word_dict:
-                    _index = self.word_dict[word]
-                else:
-                    _index = unk_id
-                result_i['processed'].append(_index)
-            result['text'].append(result_i)
-        return result
-    def postprocess(self, sign_name, data_out, data_info, **kwargs):
-        if sign_name == "sentiment_classify":
-            result = []
-            pred = fluid.executor.as_numpy(data_out)
-            for index in range(len(data_info['text'])):
-                result_i = {}
-                result_i['text'] = data_info['text'][index]['origin']
-                label, key = get_predict_label(pred[0][index, 1])
-                result_i['sentiment_label'] = label
-                result_i['sentiment_key'] = key
-                result.append(result_i)
-            return result
-    def data_format(self, sign_name):
-        if sign_name == "sentiment_classify":
-            return {
-                "text": {
-                    "type": hub.DataType.TEXT,
-                    "feed_key": self.module.signatures[sign_name].inputs[0].name
-                }
-            }
-        return None
--- a/demo/senta/resources/download.sh
+++ b/demo/senta/resources/download.sh
-#!/bin/bash
-set -o nounset
-set -o errexit
-script_path=$(cd `dirname $0`; pwd)
-cd $script_path
-wget --no-check-certificate https://paddlehub.bj.bcebos.com/paddle_model/senta.tar.gz
-wget --no-check-certificate https://paddlehub.bj.bcebos.com/paddle_model/train.vocab
-tar xvzf senta.tar.gz
-rm senta.tar.gz
--- a/demo/senta/resources/module_info.yml
+++ b/demo/senta/resources/module_info.yml
-name: senta
-type: nlp/sentiment_analysis
-author: paddlepaddle
-author_email: paddle-dev@baidu.com
-summary: "Senta is a model used to analyse sentiment tendency of Chinese sentences. We divide sentiment tendencies into three levels, score 2 means positive, score 1 means neuter, and score 0 means negative"
-version: 1.0.0
--- a/demo/senta/resources/test/test.txt
+++ b/demo/senta/resources/test/test.txt
--- a/demo/senta/resources/test/test.yml
+++ b/demo/senta/resources/test/test.yml
--- a/demo/ssd/README.md
+++ b/demo/ssd/README.md
-## 关于SSD
+# SSD
-https://github.com/PaddlePaddle/models/tree/develop/fluid/PaddleCV/object_detection
-## 创建Module
+## 关于
-本目录包含了创建一个基于POSCAL VOC数据集预训练的SSD模型的Module的脚本。
-通过以下脚本来一键创建一个SSD Module
+本示例展示如何使用SSD Module进行预测。
+SSD是一个目标检测模型，可以检测出图片中的实物的类别和位置，PaddleHub发布的SSD模型通过pascalvoc数据集训练，支持20个数据类别的检测，关于模型的训练细节，请查看[SSD](https://github.com/PaddlePaddle/models/tree/develop/PaddleCV/object_detection)
+## 准备工作
+在运行本目录的脚本前，需要先安装1.3.0版本以上的PaddlePaddle（如果您本地已经安装了符合条件的PaddlePaddle版本，那么可以跳过`准备工作`这一步）。
+如果您的机器支持GPU，我们建议下载GPU版本的PaddlePaddle，使用GPU进行训练和预测的效率都比使用CPU要高。
 ```shell
-sh create_module.sh
+# 安装GPU版本的PaddlePaddle
+$ pip install --upgrade paddlepaddle-gpu
 ```
-NOTE:
-* 如果进行下面示例的脚本或者代码，请确保执行上述脚本
-* 关于创建Module的API和细节，请查看`create_module.py`
-## 使用Module预测
+如果您的机器不支持GPU，可以通过下面的命令来安装CPU版本的PaddlePaddle
-该Module创建完成后，可以通过命令行或者python API两种方式进行预测
-### 命令行方式
+```shell
+# 安装CPU版本的PaddlePaddle
+$ pip install --upgrade paddlepaddle
+```
+在安装过程中如果遇到问题，您可以到[Paddle官方网站](http://www.paddlepaddle.org/)上查看解决方案。
+## 命令行方式预测
 `infer.sh`给出了使用命令行调用Module预测的示例脚本
 通过以下命令试验下效果
 ```shell
-sh infer.sh
+$ sh infer.sh
 ```
-### 通过python API
+## 通过python API预测
 `infer_by_code.py`给出了使用python API调用Module预测的示例代码
 通过以下命令试验下效果
 ```shell
 python infer_by_code.py
 ```
--- a/demo/ssd/create_module.py
+++ b/demo/ssd/create_module.py
-import os
-import numpy as np
-import processor
-import paddlehub as hub
-import paddle
-import paddle.fluid as fluid
-from mobilenet_ssd import mobile_net
-def build_program():
-    image_shape = [3, 300, 300]
-    class_num = 21
-    image = fluid.layers.data(dtype="float32", shape=image_shape, name="image")
-    gt_box = fluid.layers.data(
-        dtype="float32", shape=[4], name="gtbox", lod_level=1)
-    gt_label = fluid.layers.data(
-        dtype="int32", shape=[1], name="label", lod_level=1)
-    difficult = fluid.layers.data(
-        dtype="int32", shape=[1], name="difficult", lod_level=1)
-    with fluid.unique_name.guard():
-        locs, confs, box, box_var = mobile_net(class_num, image, image_shape)
-        nmsed_out = fluid.layers.detection_output(
-            locs, confs, box, box_var, nms_threshold=0.45)
-    return image, nmsed_out
-def create_module():
-    image, nmsed_out = build_program()
-    place = fluid.CPUPlace()
-    exe = fluid.Executor(place)
-    exe.run(fluid.default_startup_program())
-    pretrained_model = "resources/ssd_mobilenet_v1_pascalvoc"
-    def if_exist(var):
-        return os.path.exists(os.path.join(pretrained_model, var.name))
-    fluid.io.load_vars(exe, pretrained_model, predicate=if_exist)
-    assets = ["resources/label_list.txt"]
-    sign = hub.create_signature(
-        "object_detection",
-        inputs=[image],
-        outputs=[nmsed_out],
-        for_predict=True)
-    hub.create_module(
-        sign_arr=[sign],
-        module_dir="ssd_mobilenet_v1_pascal.hub_module",
-        module_info="resources/module_info.yml",
-        exe=exe,
-        processor=processor.Processor,
-        assets=assets)
-if __name__ == '__main__':
-    create_module()
--- a/demo/ssd/create_module.sh
+++ b/demo/ssd/create_module.sh
-#!/bin/bash
-set -o nounset
-set -o errexit
-script_path=$(cd `dirname $0`; pwd)
-module_path=ssd_mobilenet_v1_pascal.hub_module
-if [ -d $script_path/$module_path ]
-then
-    echo "$module_path already existed!"
-    exit 0
-fi
-cd $script_path/resources/
-if [ ! -d ssd_mobilenet_v1_pascalvoc ]
-then
-    sh download.sh
-fi
-cd $script_path/
-python create_module.py
-echo "Successfully create $module_path"
--- a/demo/ssd/infer.sh
+++ b/demo/ssd/infer.sh
-python ../../paddlehub/commands/hub.py run ssd_mobilenet_v1_pascal.hub_module/ --signature object_detection --config resources/test/test.yml  --input_file resources/test/test.txt
+python ../../paddlehub/commands/hub.py run ssd_mobilenet_v1_pascal --input_file test/test.txt
--- a/demo/ssd/infer_by_code.py
+++ b/demo/ssd/infer_by_code.py
@@ -2,11 +2,11 @@ import os
 import paddlehub as hub
-def infer_with_input_text():
+def infer_with_input_path():
    # get ssd module
-    ssd = hub.Module(module_dir="ssd_mobilenet_v1_pascal.hub_module")
+    ssd = hub.Module(name="ssd_mobilenet_v1_pascal")
-    test_img_path = os.path.join("resources", "test", "test_img_bird.jpg")
+    test_img_path = os.path.join("test", "test_img_bird.jpg")
    # get the input keys for signature 'object_detection'
    data_format = ssd.processor.data_format(sign_name='object_detection')
@@ -23,14 +23,14 @@ def infer_with_input_text():
 def infer_with_input_file():
    # get ssd module
-    ssd = hub.Module(module_dir="ssd_mobilenet_v1_pascal.hub_module")
+    ssd = hub.Module(name="ssd_mobilenet_v1_pascal")
    # get the input keys for signature 'object_detection'
    data_format = ssd.processor.data_format(sign_name='object_detection')
    key = list(data_format.keys())[0]
    # parse input file
-    test_file = os.path.join("resources", "test", "test.txt")
+    test_file = os.path.join("test", "test.txt")
    test_images = hub.io.parser.txt_parser.parse(test_file)
    # set input dict

--- a/demo/ssd/mobilenet_ssd.py
+++ b/demo/ssd/mobilenet_ssd.py
-import paddle.fluid as fluid
-from paddle.fluid.initializer import MSRA
-from paddle.fluid.param_attr import ParamAttr
-def conv_bn(input,
-            filter_size,
-            num_filters,
-            stride,
-            padding,
-            channels=None,
-            num_groups=1,
-            act='relu',
-            use_cudnn=True):
-    parameter_attr = ParamAttr(learning_rate=0.1, initializer=MSRA())
-    conv = fluid.layers.conv2d(
-        input=input,
-        num_filters=num_filters,
-        filter_size=filter_size,
-        stride=stride,
-        padding=padding,
-        groups=num_groups,
-        act=None,
-        use_cudnn=use_cudnn,
-        param_attr=parameter_attr,
-        bias_attr=False)
-    return fluid.layers.batch_norm(input=conv, act=act)
-def depthwise_separable(input, num_filters1, num_filters2, num_groups, stride,
-                        scale):
-    depthwise_conv = conv_bn(
-        input=input,
-        filter_size=3,
-        num_filters=int(num_filters1 * scale),
-        stride=stride,
-        padding=1,
-        num_groups=int(num_groups * scale),
-        use_cudnn=False)
-    pointwise_conv = conv_bn(
-        input=depthwise_conv,
-        filter_size=1,
-        num_filters=int(num_filters2 * scale),
-        stride=1,
-        padding=0)
-    return pointwise_conv
-def extra_block(input, num_filters1, num_filters2, num_groups, stride, scale):
-    # 1x1 conv
-    pointwise_conv = conv_bn(
-        input=input,
-        filter_size=1,
-        num_filters=int(num_filters1 * scale),
-        stride=1,
-        num_groups=int(num_groups * scale),
-        padding=0)
-    # 3x3 conv
-    normal_conv = conv_bn(
-        input=pointwise_conv,
-        filter_size=3,
-        num_filters=int(num_filters2 * scale),
-        stride=2,
-        num_groups=int(num_groups * scale),
-        padding=1)
-    return normal_conv
-def mobile_net(num_classes, img, img_shape, scale=1.0):
-    # 300x300
-    tmp = conv_bn(img, 3, int(32 * scale), 2, 1, 3)
-    # 150x150
-    tmp = depthwise_separable(tmp, 32, 64, 32, 1, scale)
-    tmp = depthwise_separable(tmp, 64, 128, 64, 2, scale)
-    # 75x75
-    tmp = depthwise_separable(tmp, 128, 128, 128, 1, scale)
-    tmp = depthwise_separable(tmp, 128, 256, 128, 2, scale)
-    # 38x38
-    tmp = depthwise_separable(tmp, 256, 256, 256, 1, scale)
-    tmp = depthwise_separable(tmp, 256, 512, 256, 2, scale)
-    # 19x19
-    for i in range(5):
-        tmp = depthwise_separable(tmp, 512, 512, 512, 1, scale)
-    module11 = tmp
-    tmp = depthwise_separable(tmp, 512, 1024, 512, 2, scale)
-    # 10x10
-    module13 = depthwise_separable(tmp, 1024, 1024, 1024, 1, scale)
-    module14 = extra_block(module13, 256, 512, 1, 2, scale)
-    # 5x5
-    module15 = extra_block(module14, 128, 256, 1, 2, scale)
-    # 3x3
-    module16 = extra_block(module15, 128, 256, 1, 2, scale)
-    # 2x2
-    module17 = extra_block(module16, 64, 128, 1, 2, scale)
-    mbox_locs, mbox_confs, box, box_var = fluid.layers.multi_box_head(
-        inputs=[module11, module13, module14, module15, module16, module17],
-        image=img,
-        num_classes=num_classes,
-        min_ratio=20,
-        max_ratio=90,
-        min_sizes=[60.0, 105.0, 150.0, 195.0, 240.0, 285.0],
-        max_sizes=[[], 150.0, 195.0, 240.0, 285.0, 300.0],
-        aspect_ratios=[[2.], [2., 3.], [2., 3.], [2., 3.], [2., 3.], [2., 3.]],
-        base_size=img_shape[2],
-        offset=0.5,
-        flip=True)
-    return mbox_locs, mbox_confs, box, box_var
--- a/demo/ssd/processor.py
+++ b/demo/ssd/processor.py
-import paddle
-import paddlehub as hub
-import numpy as np
-import os
-from paddlehub import BaseProcessor
-from PIL import Image
-from PIL import ImageDraw
-from PIL import ImageFont
-def clip_bbox(bbox):
-    xmin = max(min(bbox[0], 1.), 0.)
-    ymin = max(min(bbox[1], 1.), 0.)
-    xmax = max(min(bbox[2], 1.), 0.)
-    ymax = max(min(bbox[3], 1.), 0.)
-    return xmin, ymin, xmax, ymax
-def draw_bounding_box_on_image(image_path, data_list, save_path):
-    image = Image.open(image_path)
-    draw = ImageDraw.Draw(image)
-    for data in data_list:
-        left, right, top, bottom = data['left'], data['right'], data[
-            'top'], data['bottom']
-        draw.line([(left, top), (left, bottom), (right, bottom), (right, top),
-                   (left, top)],
-                  width=4,
-                  fill='red')
-        if image.mode == 'RGB':
-            draw.text((left, top), data['label'], (255, 255, 0))
-    image_name = os.path.split(image_path)[-1]
-    if not os.path.exists(save_path):
-        os.mkdir(save_path)
-    save_path = os.path.join(save_path, image_name)
-    print("image with bbox drawed saved as {}".format(
-        os.path.abspath(save_path)))
-    image.save(save_path)
-class Processor(BaseProcessor):
-    def __init__(self, module):
-        self.module = module
-        label_list_file = os.path.join(self.module.helper.assets_path(),
-                                       "label_list.txt")
-        with open(label_list_file, "r") as file:
-            content = file.read()
-        self.label_list = content.split("\n")
-        self.confs_threshold = 0.5
-    def preprocess(self, sign_name, data_dict):
-        def process_image(img):
-            if img.mode == 'L':
-                img = im.convert('RGB')
-            im_width, im_height = img.size
-            img = img.resize((300, 300), Image.ANTIALIAS)
-            img = np.array(img)
-            # HWC to CHW
-            if len(img.shape) == 3:
-                img = np.swapaxes(img, 1, 2)
-                img = np.swapaxes(img, 1, 0)
-            # RBG to BGR
-            img = img[[2, 1, 0], :, :]
-            img = img.astype('float32')
-            mean_value = [127.5, 127.5, 127.5]
-            mean_value = np.array(mean_value)[:, np.newaxis, np.newaxis].astype(
-                'float32')
-            img -= mean_value
-            img = img * 0.007843
-            return img
-        result = {'image': []}
-        for path in data_dict['image']:
-            img = Image.open(path)
-            im_width, im_height = img.size
-            result_i = {}
-            result_i['path'] = path
-            result_i['width'] = im_width
-            result_i['height'] = im_height
-            result_i['processed'] = process_image(img)
-            result['image'].append(result_i)
-        return result
-    def postprocess(self, sign_name, data_out, data_info, **kwargs):
-        if sign_name == "object_detection":
-            lod_tensor = data_out[0]
-            lod = lod_tensor.lod()[0]
-            results = np.array(data_out[0])
-            output = []
-            for index in range(len(lod) - 1):
-                result_i = results[lod[index]:lod[index + 1]]
-                output_i = {
-                    'path': data_info['image'][index]['path'],
-                    'data': []
-                }
-                for dt in result_i:
-                    if dt[1] < self.confs_threshold:
-                        continue
-                    dt_i = {}
-                    category_id = dt[0]
-                    bbox = dt[2:]
-                    xmin, ymin, xmax, ymax = clip_bbox(dt[2:])
-                    (left, right, top,
-                     bottom) = (xmin * data_info['image'][index]['width'],
-                                xmax * data_info['image'][index]['width'],
-                                ymin * data_info['image'][index]['height'],
-                                ymax * data_info['image'][index]['height'])
-                    dt_i['left'] = left
-                    dt_i['right'] = right
-                    dt_i['top'] = top
-                    dt_i['bottom'] = bottom
-                    dt_i['label'] = self.label_list[int(category_id)]
-                    output_i['data'].append(dt_i)
-                draw_bounding_box_on_image(
-                    output_i['path'], output_i['data'], save_path="test_result")
-                output.append(output_i)
-            return output
-    def data_format(self, sign_name):
-        if sign_name == "object_detection":
-            return {
-                "image": {
-                    'type': hub.DataType.IMAGE,
-                    'feed_key': self.module.signatures[sign_name].inputs[0].name
-                }
-            }
-        return None
--- a/demo/ssd/resources/download.sh
+++ b/demo/ssd/resources/download.sh
-#!/bin/bash
-set -o nounset
-set -o errexit
-script_path=$(cd `dirname $0`; pwd)
-cd $script_path
-wget --no-check-certificate https://paddlehub.bj.bcebos.com/paddle_model/ssd_mobilenet_v1_pascalvoc.tar.gz
-tar xvzf ssd_mobilenet_v1_pascalvoc.tar.gz
-rm ssd_mobilenet_v1_pascalvoc.tar.gz
--- a/demo/ssd/resources/label_list.txt
+++ b/demo/ssd/resources/label_list.txt
-background
-aeroplane
-bicycle
-bird
-boat
-bottle
-bus
-car
-cat
-chair
-cow
-diningtable
-dog
-horse
-motorbike
-person
-pottedplant
-sheep
-sofa
-train
-tvmonitor
--- a/demo/ssd/resources/module_info.yml
+++ b/demo/ssd/resources/module_info.yml
-name: ssd_mobilenet_v1_pascalvoc
-type: CV/object-detection
-author: paddlepaddle
-author_email: paddle-dev@baidu.com
-summary: "SSD(Single Shot MultiBox Detector) is a object detection model use to detect target category and location in a image picture. This model is trained with PASCAL VOC dataset, and therefore provides 20 categories of recognition capability, which mentioned below : aeroplane,bicycle,bird,boat,bottle,bus,car,cat,chair,cow,diningtable,dog,horse,motorbike,person,pottedplant,sheep,sofa,train,tvmonitor"
-version: 1.0.0
--- a/demo/ssd/resources/test/test.txt
+++ b/demo/ssd/resources/test/test.txt
-./resources/test/test_img_sheep.jpg
-./resources/test/test_img_cat.jpg
-./resources/test/test_img_bird.jpg
--- a/demo/ssd/test/test.txt
+++ b/demo/ssd/test/test.txt
+test/test_img_sheep.jpg
+test/test_img_cat.jpg
+test/test_img_bird.jpg
--- a/demo/ssd/resources/test/test.yml
+++ b/demo/ssd/resources/test/test.yml
--- a/demo/ssd/resources/test/test_img_bird.jpg
+++ b/demo/ssd/resources/test/test_img_bird.jpg
--- a/demo/ssd/resources/test/test_img_cat.jpg
+++ b/demo/ssd/resources/test/test_img_cat.jpg
--- a/demo/ssd/resources/test/test_img_sheep.jpg
+++ b/demo/ssd/resources/test/test_img_sheep.jpg