get_phi_kernel_info.py 11.0 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19
#!/bin/python

# Copyright (c) 2022 PaddlePaddle Authors. All Rights Reserved.
# 
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
# 
#     http://www.apache.org/licenses/LICENSE-2.0
# 
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

import argparse
import json
import yaml
W
Wilber 已提交
20
from typing import List, Dict, Any
21 22 23


def parse_args():
    """Parse the command-line options of this generator script.

    Returns:
        argparse.Namespace with the attributes ``paddle_root_path``,
        ``kernel_info_file``, ``infermeta_wrap_file``, ``attr_info_file``
        and ``generate_file``.
    """
    # The text describes the tool, so it belongs in ``description``; the
    # first positional parameter of ArgumentParser is ``prog``.
    parser = argparse.ArgumentParser(
        description="gather phi kernel and infermeta info")
    parser.add_argument(
        "--paddle_root_path",
        type=str,
        required=True,
        help="root path of paddle src[WORK_PATH/Paddle].")
    parser.add_argument(
        "--kernel_info_file",
        type=str,
        required=True,
        help="kernel info file generated by get_phi_kernel_function.sh.")
    parser.add_argument(
        "--infermeta_wrap_file",
        type=str,
        required=True,
        help="inferMeta wrap info file.")
    parser.add_argument(
        "--attr_info_file", type=str, required=True, help="attr info file.")
    # Optional on purpose: argparse never applies ``default`` to an option
    # that is marked as required, so the default below was unreachable.
    parser.add_argument(
        "--generate_file",
        type=str,
        default="../paddle/infrt/kernel/phi/infershaped/infershaped_kernel_launchers.cc",
        help="generated file.")
    return parser.parse_args()


def get_api_yaml_info(file_path):
    """Load the api.yaml description found under a Paddle source tree.

    Args:
        file_path: root directory of the Paddle sources; the file read is
            ``<file_path>/python/paddle/utils/code_gen/api.yaml``.

    Returns:
        The Python object produced by parsing that YAML document.
    """
    yaml_path = file_path + "/python/paddle/utils/code_gen/api.yaml"
    # Context manager so the handle is closed even when reading fails.
    with open(yaml_path, "r") as f:
        cont = f.read()
    # NOTE(review): FullLoader is kept as-is; prefer yaml.safe_load if this
    # file could ever come from an untrusted source.
    return yaml.load(cont, Loader=yaml.FullLoader)


def get_kernel_info(file_path):
    """Read kernel records from a text file, collapsing consecutive duplicates.

    Blank lines are ignored. When two consecutive non-blank lines share the
    same first two whitespace-separated fields, only the later line is kept.

    Args:
        file_path: path of the kernel info text file.

    Returns:
        List of the retained lines, stripped of surrounding whitespace.
    """
    ret = []
    prev = []
    # Context manager so the handle is always closed.
    with open(file_path, "r") as f:
        for line in f:
            stripped = line.strip()
            info = stripped.split()
            if not info:
                continue
            # Slices instead of indexing: a line with a single field no
            # longer raises IndexError, and the initial empty ``prev`` can
            # never match a non-empty record.
            if prev[:2] == info[:2]:
                ret.pop()
            ret.append(stripped)
            prev = info
    return ret


def get_infermeta_info(file_path):
    """Return the non-blank lines of a text file.

    Args:
        file_path: path of the file to read.

    Returns:
        List of lines with surrounding whitespace removed; lines that are
        empty after stripping are omitted.
    """
    # Context manager so the handle is always closed.
    with open(file_path, "r") as f:
        stripped_lines = (line.strip() for line in f)
        return [line for line in stripped_lines if line]
84 85


W
Wilber 已提交
86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102
def get_attr_info(file_path):
    """Parse the kernel attribute info file.

    A line made of two space-separated fields, such as::

        phi_gpu.argsort.float64.any $axisBool$descending

    maps the first field to the list of ``$``-prefixed names in the second
    (``['axisBool', 'descending']`` here). Any other non-blank line maps its
    first field to ``None``.

    Args:
        file_path: path of the attribute info file.

    Returns:
        Dict from kernel name to a list of attribute names, or to ``None``.
    """
    ret = {}
    with open(file_path, 'r') as f:
        for line in f:
            line = line.strip()
            if not line:
                # Blank lines used to be stored under the key ''.
                continue
            datas = line.split(' ')
            if len(datas) == 2:
                # The text before the first '$' is empty, hence the [1:].
                ret[datas[0]] = datas[1].split('$')[1:]
            else:
                ret[datas[0]] = None
    return ret


103
def merge(infer_meta_data, kernel_data, wrap_data):
    """Attach an infer-meta function name to every kernel record.

    Args:
        infer_meta_data: iterable of api descriptions; only entries that have
            both a "kernel" and an "infer_meta" key are used, mapping
            ``entry["kernel"]["func"]`` to ``entry["infer_meta"]["func"]``.
        kernel_data: iterable of kernel record strings; the first
            whitespace-separated field is the lookup key.
        wrap_data: iterable of strings whose first field is a key and whose
            second field is the infer-meta name to use for it.

    Returns:
        One token list per kernel record: the record's fields followed by
        the name from ``wrap_data`` if present, else the name from
        ``infer_meta_data``, else the literal "unknown".
    """
    api_infer_meta = {
        api["kernel"]["func"]: api["infer_meta"]["func"]
        for api in infer_meta_data
        if "kernel" in api and "infer_meta" in api
    }
    wrapped_infer_meta = {
        fields[0]: fields[1]
        for fields in (entry.split() for entry in wrap_data)
    }

    merged = []
    for record in kernel_data:
        name = record.split()[0]
        # Wrapped infer-meta functions take precedence over api.yaml ones.
        infer_meta = wrapped_infer_meta.get(
            name, api_infer_meta.get(name, "unknown"))
        merged.append((record + " " + infer_meta).split())
    return merged


W
Wilber 已提交
126
def gen_warn_info():
    """Return the two-line C++ comment banner placed at the top of the output."""
    # NOTE(review): confirm the script path named in the banner still
    # matches the actual name/location of this generator.
    banner_lines = (
        "// Generated by tools/infrt/gen_phi_kernel_register.py for infrt.",
        "// DO NOT edit or include it within paddle.",
    )
    return "\n".join(banner_lines) + "\n"


def gen_include_headers():
    """Return the ``#include`` section of the generated C++ file.

    The text starts with an empty line and has one ``#include "..."``
    directive per line, each terminated by a newline.
    """
    headers = (
        "paddle/infrt/kernel/phi/infershaped/infershaped_kernel_launchers.h",
        "paddle/infrt/kernel/phi/infershaped/phi_kernel_launcher.h",
        "paddle/phi/backends/all_context.h",
        "paddle/phi/include/kernels.h",
        "paddle/phi/include/infermeta.h",
        "paddle/phi/infermeta/generated.h",
    )
    return "\n" + "".join(f'#include "{header}"\n' for header in headers)


def gen_namespace():
    """Return the (opening, closing) C++ text for ``infrt::kernel``.

    Returns:
        A 2-tuple: the text that opens both namespaces, and the text that
        closes them in reverse order.
    """
    opening = "\nnamespace infrt {\nnamespace kernel {\n\n"
    closing = "\n\n}  // namespace kernel\n}  // namespace infrt\n"
    return opening, closing


def gen_context(val):
    """Translate a backend tag into its C++ context type and IR prefix.

    Args:
        val: backend tag; "CPU" and "GPU" are recognised.

    Returns:
        ``(cpp_context_type, ir_prefix)``; a pair of empty strings for any
        other tag (no exception is raised). XPU is not handled yet.
    """
    known_contexts = {
        "CPU": ("::phi::CPUContext", "phi_cpu"),
        "GPU": ("::phi::GPUContext", "phi_gpu"),
    }
    return known_contexts.get(val, ("", ""))
W
Wilber 已提交
165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180


def gen_layout(val):
    """Translate a layout tag into its IR name.

    Args:
        val: layout tag; only "ALL_LAYOUT" is supported.

    Returns:
        The string 'any'.

    Raises:
        Exception: for every tag other than "ALL_LAYOUT".
    """
    # TODO(wilber): now only process ALL_LAYOUT
    if val != "ALL_LAYOUT":
        raise Exception(f"Unknown layout type {val}")
    return 'any'


def gen_kernel_func(val, ctx_name, dtype_name):
    """Build the C++ address-of expression for a phi kernel function.

    Args:
        val: kernel function name, optionally already carrying template
            arguments in angle brackets.
        ctx_name: C++ context type, used only when ``val`` has no template
            arguments.
        dtype_name: C++ data type, used only when ``val`` has no template
            arguments.

    Returns:
        ``&::phi::<val><dtype_name, ctx_name>`` when ``val`` has no template
        arguments; ``&::phi::<val>`` unchanged when its template arguments
        already contain ``::phi::``; otherwise the function name followed by
        its template arguments prefixed with ``::phi::``.
    """
    prefix = "&::phi::"
    if '<' not in val or '>' not in val:
        return "".join((prefix, val, "<", dtype_name, ", ", ctx_name, ">"))

    open_pos = val.index('<')
    close_pos = val.index('>')
    template_args = val[open_pos + 1:close_pos]
    if '::phi::' in template_args:
        return prefix + val
    return "".join((prefix, val[:open_pos], "<::phi::", template_args, ">"))
W
Wilber 已提交
187 188 189 190 191 192


# Registered dtype spelling -> (IR dtype name, C++ type name).
_DTYPE_NAMES = {
    "float": ("float32", "float"),
    "double": ("float64", "double"),
    "float16": ("float16", "paddle::experimental::float16"),
    "bfloat16": ("bf16", "paddle::experimental::bfloat16"),
    "bool": ("bool", "bool"),
    "int8_t": ("int8", "int8_t"),
    "uint8_t": ("uint8", "uint8_t"),
    "int16_t": ("int16", "int16_t"),
    "int": ("int32", "int32_t"),
    "int32_t": ("int32", "int32_t"),
    "int64_t": ("int64", "int64_t"),
    "complex<float>": ("complex64", "paddle::experimental::complex64"),
    "complex64": ("complex64", "paddle::experimental::complex64"),
    "complex<double>": ("complex128", "paddle::experimental::complex128"),
    "complex128": ("complex128", "paddle::experimental::complex128"),
    "pstring": ("pstring", "paddle::experimental::pstring"),
    "ALL_DTYPE": ("all", "all"),
}


def gen_dtype(vals: List[str]):
    """Translate registered dtype spellings into IR and C++ type names.

    Args:
        vals: dtype spellings taken from a kernel record.

    Returns:
        ``(ir_dtypes, origin_dtypes)``: two lists of equal length holding,
        for each recognised entry in order, its IR name and its C++ type.
        Entries containing "VA_ARGS" are skipped.

    Raises:
        Exception: for an unrecognised entry that does not contain "VA_ARGS".
    """
    ir_dtypes, origin_dtypes = [], []
    for val in vals:
        names = _DTYPE_NAMES.get(val)
        if names is None:
            if "VA_ARGS" in val:
                continue
            raise Exception(f"Unknown data type {val}")
        ir_name, origin_name = names
        ir_dtypes.append(ir_name)
        origin_dtypes.append(origin_name)
    return ir_dtypes, origin_dtypes


W
Wilber 已提交
241 242 243 244
# Note: currently only CPUContext and GPUContext are processed.


def gen_register_code_info(item: List[str], attr_data: Dict[str, List[str]]):
    """Generate the C++ registration statements for one kernel record.

    Args:
        item: kernel record, e.g. ['add', 'CPU', 'ALL_LAYOUT', 'AddKernel',
            'float', 'double', '...'(variadic types), 'ElementwiseInferMeta'].
            Index 1 is the backend, index 2 the layout, index 3 the kernel
            function, the last entry the infer-meta function (or "unknown"),
            and everything between index 4 and the last entry is a dtype.
            The list is not modified.
        attr_data: e.g. {'phi_cpu.arg_min.float32.any': ['axisBool',
            'keepdimsBool', 'flatten', 'dtype']}. A missing key or a ``None``
            value means the kernel is registered without attributes.

    Returns:
        C++ source text with one ``registry->AddKernel(...)`` or
        ``registry->AddKernelWithAttrs(...)`` statement per dtype. The empty
        string when the backend is not supported or the infer-meta function
        is "unknown".

    Raises:
        Exception: propagated from gen_layout / gen_dtype for an unknown
            layout or data type.
    """
    ctx_name, ir_ctx_name = gen_context(item[1])
    if ctx_name == "":
        return ""
    # Keep the converted layout in a local instead of writing it back into
    # ``item``: mutating the caller's record made a second call on the same
    # record fail with "Unknown layout type any".
    layout = gen_layout(item[2])
    ir_dtypes, origin_dtypes = gen_dtype(item[4:-1])
    infer_shape_func = "&::phi::" + item[-1]

    if item[-1] == "unknown":
        # TODO(wilber): handle the unknown inferShape func.
        return ""

    # Indentation of the continuation lines in the emitted C++ (kept exactly
    # as the generator has always produced it).
    pad = " " * 34
    chunks = []
    for ir_dtype, origin_dtype in zip(ir_dtypes, origin_dtypes):
        kernel_func = gen_kernel_func(item[3], ctx_name, origin_dtype)
        ir_name = '.'.join(
            [ir_ctx_name, item[0].lower(), ir_dtype, layout.lower()])
        # Template instantiation shared by both registration flavours.
        launcher = (f"\n    &KernelLauncherFunc<decltype({kernel_func}),\n"
                    f"{pad}{kernel_func},\n"
                    f"{pad}decltype({infer_shape_func}),\n"
                    f"{pad}{infer_shape_func}>")
        attrs = attr_data.get(ir_name)
        if attrs is not None:
            attr_names = ', '.join('"' + a + '"' for a in attrs)
            chunks.append(f'\nregistry->AddKernelWithAttrs("{ir_name}",' +
                          launcher + f",\n    {{{attr_names}}});\n")
        else:
            chunks.append(f'\nregistry->AddKernel("{ir_name}",' + launcher +
                          ");\n")
    return "".join(chunks)


def _gen_backend_register_code(resources, attr_data, backend):
    """Concatenate the registration code of every record targeting ``backend``."""
    chunks = []
    for item in resources:
        # The records are polluted by C++ macro line continuations: strip
        # the '\' characters and drop tokens that consisted of nothing else.
        tokens = [v.strip('\\') for v in item]
        tokens = [t for t in tokens if t]
        if tokens[1] != backend:
            continue
        # Generate from the cleaned tokens; the raw record used to be passed
        # on here, which made the clean-up above ineffective.
        chunks.append(gen_register_code_info(tokens, attr_data))
    return "".join(chunks)


def gen_register_info(resources: List[List[str]],
                      attr_data: Dict[str, List[str]]):
    """Generate the C++ ``RegisterInferShapeLaunchers`` function definition.

    Args:
        resources: [['add', 'CPU', 'ALL_LAYOUT', 'AddKernel', 'float',
            'double', '...'(variadic types), 'ElementwiseInferMeta'], ...]
        attr_data: {'phi_cpu.arg_min.float32.any': ['axisBool',
            'keepdimsBool', 'flatten', 'dtype']}

    Returns:
        The function's source text: CPU kernel registrations first, then the
        GPU kernel registrations wrapped in ``#ifdef INFRT_WITH_GPU``.
    """
    cpu_code = _gen_backend_register_code(resources, attr_data, "CPU")
    gpu_code = _gen_backend_register_code(resources, attr_data, "GPU")
    # Every generated statement ends with a newline, but with no GPU kernel
    # at all "#endif" would be glued onto the "#ifdef" line.
    if not gpu_code.endswith("\n"):
        gpu_code += "\n"

    return "".join([
        "void RegisterInferShapeLaunchers(host_context::KernelRegistry* registry) {",
        cpu_code,
        "\n#ifdef INFRT_WITH_GPU",
        gpu_code,
        "#endif // INFRT_WITH_GPU",
        "\n}",
    ])


330
def gen_phi_kernel_register_code(resources: List[List[str]],
                                 attr_data: Dict[str, List[str]],
                                 src_file_path: str):
    """Write the generated C++ kernel-registration source file.

    The file consists of the warning banner, the include section, the
    namespace opening, the registration function and the namespace closing,
    in that order.

    Args:
        resources: kernel records, forwarded to gen_register_info.
        attr_data: kernel attribute table, forwarded to gen_register_info.
        src_file_path: path of the file to (over)write.
    """
    namespace_open, namespace_close = gen_namespace()
    # Build all the text before touching the file, so that a failure during
    # generation does not leave a truncated output behind.
    sections = [
        gen_warn_info(),
        gen_include_headers(),
        namespace_open,
        gen_register_info(resources, attr_data),
        namespace_close,
    ]
    # Context manager so the handle is closed even if a write fails.
    with open(src_file_path, 'w') as source_file:
        source_file.writelines(sections)


343 344 345 346
if __name__ == "__main__":
    # Script entry point: read the four inputs, merge the kernel records
    # with their infer-meta functions, then write the C++ source file.
    cli = parse_args()
    api_entries = get_api_yaml_info(cli.paddle_root_path)
    kernel_lines = get_kernel_info(cli.kernel_info_file)
    wrap_lines = get_infermeta_info(cli.infermeta_wrap_file)
    attr_table = get_attr_info(cli.attr_info_file)
    gen_phi_kernel_register_code(
        merge(api_entries, kernel_lines, wrap_lines), attr_table,
        cli.generate_file)