module.py 4.8 KB
Newer Older
文幕地方's avatar
文幕地方 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14
# Copyright (c) 2022 PaddlePaddle Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

D
dyning 已提交
15 16 17 18 19
from __future__ import absolute_import
from __future__ import division
from __future__ import print_function

import os
W
WenmuZhou 已提交
20 21
import sys
sys.path.insert(0, ".")
D
dyning 已提交
22

L
littletomatodonkey 已提交
23
import copy
文幕地方's avatar
文幕地方 已提交
24
import paddlehub
D
dyning 已提交
25 26 27 28 29 30
from paddlehub.common.logger import logger
from paddlehub.module.module import moduleinfo, runnable, serving
import cv2
import numpy as np
import paddlehub as hub

D
dyning 已提交
31
from tools.infer.utility import base64_to_cv2
D
dyning 已提交
32
from tools.infer.predict_det import TextDetector
L
littletomatodonkey 已提交
33
from tools.infer.utility import parse_args
L
LDOUBLEV 已提交
34
from deploy.hubserving.ocr_system.params import read_params
D
dyning 已提交
35 36 37 38 39 40 41 42


@moduleinfo(
    name="ocr_det",
    version="1.0.0",
    summary="ocr detection service",
    author="paddle-dev",
    author_email="paddle-dev@baidu.com",
    type="cv/text_detection")
class OCRDet(hub.Module):
    """
    PaddleHub module that wraps ``TextDetector`` and exposes text detection
    both as a Python API (``predict``) and as a serving endpoint
    (``serving_method``).
    """

    def _initialize(self, use_gpu=False, enable_mkldnn=False):
        """
        Build the detector configuration and create the text detector.

        Args:
            use_gpu (bool): Whether to run on GPU. When True, the environment
                variable CUDA_VISIBLE_DEVICES must be set and its first
                character must be a digit.
            enable_mkldnn (bool): Value stored on the config as
                ``enable_mkldnn``.
        Raises:
            RuntimeError: If ``use_gpu`` is True and CUDA_VISIBLE_DEVICES is
                unset, empty, or does not start with a digit.
        """
        cfg = self.merge_configs()

        cfg.use_gpu = use_gpu
        if use_gpu:
            # Only the lookup and the digit check can legitimately fail, so
            # only those are guarded: KeyError (variable unset), IndexError
            # (empty value) and ValueError (first character is not a digit).
            try:
                _places = os.environ["CUDA_VISIBLE_DEVICES"]
                int(_places[0])
            except (KeyError, IndexError, ValueError):
                raise RuntimeError(
                    "Environment Variable CUDA_VISIBLE_DEVICES is not set correctly. If you wanna use gpu, please set CUDA_VISIBLE_DEVICES via export CUDA_VISIBLE_DEVICES=cuda_device_id."
                )
            print("use gpu: ", use_gpu)
            print("CUDA_VISIBLE_DEVICES: ", _places)
            # NOTE(review): unit of gpu_mem is defined by the inference
            # config, presumably MB -- confirm against tools.infer.utility.
            cfg.gpu_mem = 8000
        cfg.ir_optim = True
        cfg.enable_mkldnn = enable_mkldnn

        self.text_detector = TextDetector(cfg)

    def merge_configs(self, ):
        """
        Create the default config from ``parse_args()`` and overlay every
        attribute returned by ``read_params()`` on top of it.

        ``sys.argv`` is temporarily cut down to the program name so that
        ``parse_args()`` does not see the arguments of the hosting process;
        it is restored afterwards, even if building the config fails.

        Returns:
            The merged config object produced by ``parse_args()``.
        """
        # default cfg
        backup_argv = copy.deepcopy(sys.argv)
        sys.argv = sys.argv[:1]
        try:
            cfg = parse_args()

            update_cfg_map = vars(read_params())
            for key, value in update_cfg_map.items():
                setattr(cfg, key, value)
        finally:
            # Always hand the original command line back to the process.
            sys.argv = backup_argv
        return cfg

    def read_images(self, paths=[]):
        """
        Load images from disk with ``cv2.imread``.

        Args:
            paths (list[str]): Paths of the image files to load.
        Returns:
            list: The successfully loaded images. Files that ``cv2.imread``
                cannot decode are logged and skipped.
        Raises:
            AssertionError: If a path does not point to an existing file.
        """
        images = []
        for img_path in paths:
            assert os.path.isfile(
                img_path), "The {} isn't a valid file.".format(img_path)
            img = cv2.imread(img_path)
            if img is None:
                logger.info("error in loading image:{}".format(img_path))
                continue
            images.append(img)
        return images

    def predict(self, images=[], paths=[]):
        """
        Get the text boxes in the given images.

        Exactly one of ``images`` and ``paths`` must be a non-empty list.

        Args:
            images (list(numpy.ndarray)): Image data to run detection on.
                Use this or ``paths``, not both.
            paths (list[str]): Paths of the images to load and run detection
                on. Use this or ``images``, not both.
        Returns:
            res (list): One entry per input image, in order. Each entry is a
                list of dicts of the form ``{'text_region': box}``, where
                ``box`` is the detected box converted to nested lists of
                ints. An image that is None yields an empty list.
        Raises:
            TypeError: If both or neither of ``images`` / ``paths`` are
                given, or the given one is not a list.
            AssertionError: If no image is left to predict (for example when
                none of ``paths`` could be decoded).
        """

        if images != [] and isinstance(images, list) and paths == []:
            predicted_data = images
        elif images == [] and isinstance(paths, list) and paths != []:
            predicted_data = self.read_images(paths)
        else:
            raise TypeError("The input data is inconsistent with expectations.")

        assert predicted_data != [], "There is not any image to be predicted. Please check the input data."

        all_results = []
        for img in predicted_data:
            if img is None:
                logger.info("error in loading image")
                # Keep the output aligned with the input: one entry per image.
                all_results.append([])
                continue
            dt_boxes, elapse = self.text_detector(img)
            logger.info("Predict time : {}".format(elapse))

            # Builtin ``int`` replaces the ``np.int`` alias, which was
            # removed in NumPy 1.24; the resulting dtype is the same.
            all_results.append([{
                'text_region': box.astype(int).tolist()
            } for box in dt_boxes])
        return all_results

    @serving
    def serving_method(self, images, **kwargs):
        """
        Run as a service.

        Args:
            images (list): Encoded images; each one is decoded with
                ``base64_to_cv2`` before prediction.
            **kwargs: Forwarded unchanged to ``predict``.
        Returns:
            list: The value returned by ``predict`` for the decoded images.
        """
        images_decode = [base64_to_cv2(image) for image in images]
        results = self.predict(images_decode, **kwargs)
        return results

W
WenmuZhou 已提交
139

D
dyning 已提交
140 141
if __name__ == '__main__':
    # Manual smoke run: build the module with its default (CPU) settings,
    # detect text in two sample images and print the raw result.
    detector = OCRDet()
    detector._initialize()
    sample_paths = ['./doc/imgs/11.jpg', './doc/imgs/12.jpg']
    print(detector.predict(paths=sample_paths))