__init__.py 4.0 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11 12 13
# Copyright (c) 2020 PaddlePaddle Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
W
WenmuZhou 已提交
14

D
dyning 已提交
15
import copy
littletomatodonkey's avatar
littletomatodonkey 已提交
16 17
import importlib

18 19 20
from paddle.jit import to_static
from paddle.static import InputSpec

littletomatodonkey's avatar
littletomatodonkey 已提交
21 22
from .base_model import BaseModel
from .distillation_model import DistillationModel
D
dyning 已提交
23

24
# Public API: the names exported by a star-import of this module.
__all__ = ["build_model", "apply_to_static"]
D
dyning 已提交
25

littletomatodonkey's avatar
littletomatodonkey 已提交
26

D
dyning 已提交
27 28
def build_model(config):
    """Instantiate the model architecture described by ``config``.

    Args:
        config: Mapping with the architecture settings. An optional
            ``"name"`` entry selects the class to build; the class is looked
            up as an attribute of this module. The mapping is deep-copied
            first, so the caller's object is never modified.

    Returns:
        ``BaseModel(config)`` when ``config`` has no ``"name"`` key;
        otherwise an instance of the named class, constructed from the
        copied config with the ``"name"`` entry removed.

    Raises:
        AttributeError: If ``"name"`` is not an attribute of this module.
    """
    config = copy.deepcopy(config)
    if "name" not in config:
        return BaseModel(config)

    # Pop the selector so the class receives only its own settings.
    name = config.pop("name")
    module = importlib.import_module(__name__)
    return getattr(module, name)(config)
36 37 38 39 40


def apply_to_static(model, config, logger):
    """Convert ``model`` with ``to_static`` when the config requests it.

    Args:
        model: Model to convert.
        config: Full configuration mapping. Reads ``Global.to_static``,
            ``Global.d2s_train_image_shape``, ``Architecture.algorithm``
            (plus ``Architecture.Models`` for ``"Distillation"``) and, for
            the algorithms that need it, ``Global.max_text_length``.
        logger: Object with an ``info`` method; receives one message listing
            the input specs that were applied.

    Returns:
        ``model`` unchanged unless ``Global.to_static`` is exactly ``True``;
        otherwise the value returned by ``to_static(model, input_spec=...)``.

    Raises:
        AssertionError: If ``d2s_train_image_shape`` is missing from
            ``Global`` or the algorithm is not in the supported list.
    """
    global_cfg = config["Global"]
    # Only the literal ``True`` enables conversion; other truthy values don't.
    if global_cfg.get("to_static", False) is not True:
        return model

    assert "d2s_train_image_shape" in global_cfg, (
        "d2s_train_image_shape must be assigned for static training mode...")

    supported_list = ["DB", "SVTR_LCNet", "TableMaster", "LayoutXLM", "SLANet"]
    arch_cfg = config["Architecture"]
    if arch_cfg["algorithm"] == "Distillation":
        # For distillation, the first listed sub-model decides the algorithm.
        algo = list(arch_cfg["Models"].values())[0]["algorithm"]
    else:
        algo = arch_cfg["algorithm"]
    assert algo in supported_list, (
        f"algorithms that supports static training must be in "
        f"{supported_list} but got {algo}")

    # ``list(...)`` lets the shape be given as either a list or a tuple.
    image_shape = [None] + list(global_cfg["d2s_train_image_shape"])
    specs = [InputSpec(image_shape, dtype="float32")]

    # Extra specs are appended as ONE nested list, so ``specs`` ends up with
    # two top-level entries: the image spec and the list of remaining specs.
    # NOTE(review): presumably this mirrors the model's forward signature
    # (image, extra data) -- confirm against the model definitions.
    if algo == "SVTR_LCNet":
        max_len = global_cfg["max_text_length"]
        specs.append([
            InputSpec([None, max_len], dtype="int64"),
            InputSpec([None, max_len], dtype="int64"),
            InputSpec([None], dtype="int64"),
            InputSpec([None], dtype="float64"),
        ])
    elif algo == "TableMaster":
        max_len = global_cfg["max_text_length"]
        specs.append([
            InputSpec([None, max_len], dtype="int64"),
            InputSpec([None, max_len, 4], dtype="float32"),
            InputSpec([None, max_len, 1], dtype="float32"),
            InputSpec([None, 6], dtype="float32"),
        ])
    elif algo == "LayoutXLM":
        # Replaces the image-only spec entirely: a single nested list of
        # fixed-size inputs is passed instead.
        specs = [[
            InputSpec(shape=[None, 512], dtype="int64"),  # input_ids
            InputSpec(shape=[None, 512, 4], dtype="int64"),  # bbox
            InputSpec(shape=[None, 512], dtype="int64"),  # attention_mask
            InputSpec(shape=[None, 512], dtype="int64"),  # token_type_ids
            InputSpec(shape=[None, 3, 224, 224], dtype="float32"),  # image
            InputSpec(shape=[None, 512], dtype="int64"),  # label
        ]]
    elif algo == "SLANet":
        # Sequence dimension is max_text_length + 2 for this algorithm.
        seq_len = global_cfg["max_text_length"] + 2
        specs.append([
            InputSpec([None, seq_len], dtype="int64"),
            InputSpec([None, seq_len, 4], dtype="float32"),
            InputSpec([None, seq_len, 1], dtype="float32"),
            InputSpec([None, 6], dtype="float64"),
        ])
    # "DB" needs nothing beyond the image spec.

    model = to_static(model, input_spec=specs)
    logger.info("Successfully to apply @to_static with specs: {}".format(specs))
    return model