# Copyright (c) 2021 PaddlePaddle Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

from trt_layer_auto_scan_test import TrtLayerAutoScanTest
from program_config import TensorConfig, ProgramConfig
import numpy as np
import paddle.inference as paddle_infer
from functools import partial
from typing import Any, Dict, List
import unittest


class TrtConvertGeluTest(TrtLayerAutoScanTest):
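    """Auto-scan test for the TensorRT converter of the Paddle gelu op."""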

    def is_program_valid(self, program_config: ProgramConfig) -> bool:
        return True

    def sample_program_configs(self):

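        # Produce an all-ones float32 input whose rank matches the requested dims.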
        def generate_input1(dims, attrs: List[Dict[str, Any]]):
            if dims == 1:
                return np.ones([32]).astype(np.float32)
            elif dims == 2:
                return np.ones([3, 32]).astype(np.float32)
            elif dims == 3:
                return np.ones([3, 32, 32]).astype(np.float32)
            else:
                return np.ones([1, 3, 32, 32]).astype(np.float32)

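        # Sweep every input rank and both settings of the approximate attribute.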
        for dims in [1, 2, 3, 4]:
            for approximate in [True, False]:
                self.dims = dims
                dics = [{"approximate": approximate}]

                ops_config = [{
                    "op_type": "gelu",
                    "op_inputs": {
                        "X": ["input_data"]
                    },
                    "op_outputs": {
                        "Out": ["output_data"]
                    },
                    "op_attrs": dics[0]
                }]
                ops = self.generate_op_config(ops_config)

                program_config = ProgramConfig(
                    ops=ops,
                    weights={},
                    inputs={
                        "input_data":
                        TensorConfig(
                            data_gen=partial(generate_input1, dims, dics))
                    },
                    outputs=["output_data"])

                yield program_config

    def sample_predictor_configs(
            self, program_config) -> (paddle_infer.Config, List[int], float):

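        # Configure the min/opt/max TensorRT shape profile to match the rank under test.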
        def generate_dynamic_shape(attrs):
            if self.dims == 1:
                self.dynamic_shape.min_input_shape = {"input_data": [1]}
                self.dynamic_shape.max_input_shape = {"input_data": [64]}
                self.dynamic_shape.opt_input_shape = {"input_data": [32]}
            elif self.dims == 2:
                self.dynamic_shape.min_input_shape = {"input_data": [1, 16]}
                self.dynamic_shape.max_input_shape = {"input_data": [4, 32]}
                self.dynamic_shape.opt_input_shape = {"input_data": [3, 32]}
            elif self.dims == 3:
                self.dynamic_shape.min_input_shape = {"input_data": [1, 16, 16]}
                self.dynamic_shape.max_input_shape = {"input_data": [4, 32, 32]}
                self.dynamic_shape.opt_input_shape = {"input_data": [3, 32, 32]}
            else:
                self.dynamic_shape.min_input_shape = {
                    "input_data": [1, 3, 16, 16]
                }
                self.dynamic_shape.max_input_shape = {
                    "input_data": [4, 3, 32, 32]
                }
                self.dynamic_shape.opt_input_shape = {
                    "input_data": [1, 3, 32, 32]
                }

        def clear_dynamic_shape():
            self.dynamic_shape.min_input_shape = {}
            self.dynamic_shape.max_input_shape = {}
            self.dynamic_shape.opt_input_shape = {}

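        # Expected op counts for each configuration: (ops converted into a TRT
        # engine, ops left running on Paddle).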
        def generate_trt_nodes_num(attrs, dynamic_shape):
            valid_version = (7, 0, 0)
            compile_version = paddle_infer.get_trt_compile_version()
            runtime_version = paddle_infer.get_trt_runtime_version()
            self.assertEqual(compile_version, runtime_version)
            # Rank-1 inputs are not converted; they stay on the native Paddle op.
            if self.dims == 1:
                return 0, 3
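            # approximate=True gelu needs TensorRT >= 7.0; on older versions
            # only the exact (approximate=False) form is converted.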
            if compile_version >= valid_version:
                return 1, 2
            else:
                if attrs[0]["approximate"]:
                    return 0, 3
                else:
                    return 1, 2

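        # Gather every op's attributes so the expected node count can inspect them.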
        attrs = [op.attrs for op in program_config.ops]

        # for static_shape
        clear_dynamic_shape()
        self.trt_param.precision = paddle_infer.PrecisionType.Float32
        yield self.create_inference_config(), generate_trt_nodes_num(
            attrs, False), 1e-5
        self.trt_param.precision = paddle_infer.PrecisionType.Half
        yield self.create_inference_config(), generate_trt_nodes_num(
            attrs, False), 1e-5

        # for dynamic_shape
        generate_dynamic_shape(attrs)
        self.trt_param.precision = paddle_infer.PrecisionType.Float32
        yield self.create_inference_config(), generate_trt_nodes_num(
            attrs, True), 1e-5
        self.trt_param.precision = paddle_infer.PrecisionType.Half
        yield self.create_inference_config(), generate_trt_nodes_num(
            attrs, True), 1e-5

    def test(self):
        self.run_test()


if __name__ == "__main__":
    unittest.main()