#pragma once #include "paddle_lite_factory_helper.h" USE_LITE_KERNEL(relu, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(leaky_relu, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(relu_clipped, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(prelu, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(sigmoid, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(tanh, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(swish, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(relu6, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(log, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(exp, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(floor, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(hard_sigmoid, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(rsqrt, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(prior_box, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(affine_channel, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(logical_xor, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(logical_and, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(logical_or, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(logical_not, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(roi_align, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(scale, kFPGA, kFP16, kNHWC, def); USE_LITE_KERNEL(generate_proposals, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(reduce_mean, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(crop, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(range, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(scale, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(axpy, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(beam_search, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(mul, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(norm, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(power, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(calib, kARM, kInt8, kNCHW, fp32_to_int8); USE_LITE_KERNEL(calib, kARM, kInt8, kNCHW, int8_to_fp32); USE_LITE_KERNEL(calib_once, kARM, kInt8, kNCHW, fp32_to_int8); USE_LITE_KERNEL(calib_once, kARM, kInt8, kNCHW, int8_to_fp32); USE_LITE_KERNEL(negative, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(bilinear_interp, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(nearest_interp, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(box_coder, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(less_than, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(equal, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(not_equal, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(less_equal, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(greater_than, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(greater_equal, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(multiclass_nms, kFPGA, kFP16, kNHWC, def); USE_LITE_KERNEL(lod_reset, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(box_clip, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(density_prior_box, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(decode_bboxes, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(squeeze, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(squeeze2, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(gru, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(increment, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(layout, kFPGA, kAny, kNHWC, hwc_to_chw_fpga_fp16); USE_LITE_KERNEL(layout, kFPGA, kAny, kNHWC, hwc_to_chw_arm_float); USE_LITE_KERNEL(layout, kFPGA, kAny, kNHWC, chw_to_hwc_fpga_fp16); USE_LITE_KERNEL(layout_once, kFPGA, kAny, kNHWC, hwc_to_chw_fpga_fp16); USE_LITE_KERNEL(layout_once, kFPGA, kAny, kNHWC, chw_to_hwc_fpga_fp16); USE_LITE_KERNEL(elementwise_add, kFPGA, kFP16, kNHWC, def); USE_LITE_KERNEL(fusion_elementwise_add_activation, kFPGA, kFP16, kNHWC, def); USE_LITE_KERNEL(elementwise_mul, kFPGA, kFP16, kNHWC, def); USE_LITE_KERNEL(is_empty, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(shape, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(split, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(calib, kFPGA, kFP16, kNHWC, fp32_to_fp16_fpga); USE_LITE_KERNEL(calib, kFPGA, kFP16, kNHWC, fp16_to_fp32_fpga); USE_LITE_KERNEL(calib_once, kFPGA, kFP16, kNHWC, fp32_to_fp16_fpga); USE_LITE_KERNEL(calib_once, kFPGA, kFP16, kNHWC, fp16_to_fp32_fpga); USE_LITE_KERNEL(sequence_expand, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(expand, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(gather, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(im2sequence, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(reduce_max, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(density_prior_box, kFPGA, kFP16, kNHWC, def); USE_LITE_KERNEL(feed, kFPGA, kFP16, kNHWC, def); USE_LITE_KERNEL(lookup_table, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(lookup_table_v2, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(reshape, kHost, kAny, kAny, def); USE_LITE_KERNEL(reshape2, kHost, kAny, kAny, def); USE_LITE_KERNEL(flatten, kHost, kAny, kAny, def); USE_LITE_KERNEL(flatten2, kHost, kAny, kAny, def); USE_LITE_KERNEL(conv2d_transpose, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(unsqueeze, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(unsqueeze2, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(softmax, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(layer_norm, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(assign, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(dropout, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(pool2d, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(yolo_box, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(sequence_softmax, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(stack, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(norm, kFPGA, kFP16, kNHWC, def); USE_LITE_KERNEL(transpose, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(transpose2, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(layout, kARM, kFloat, kNCHW, nchw2nhwc); USE_LITE_KERNEL(layout, kARM, kFloat, kNCHW, nhwc2nchw); USE_LITE_KERNEL(layout, kARM, kInt8, kNCHW, int8_nchw2nhwc); USE_LITE_KERNEL(layout, kARM, kInt8, kNCHW, int8_nhwc2nchw); USE_LITE_KERNEL(layout_once, kARM, kFloat, kNCHW, nchw2nhwc); USE_LITE_KERNEL(layout_once, kARM, kFloat, kNCHW, nhwc2nchw); USE_LITE_KERNEL(layout_once, kARM, kInt8, kNCHW, int8_nchw2nhwc); USE_LITE_KERNEL(layout_once, kARM, kInt8, kNCHW, int8_nhwc2nchw); USE_LITE_KERNEL(elementwise_add, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(fusion_elementwise_add_activation, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(elementwise_sub, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(fusion_elementwise_sub_activation, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(elementwise_mul, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(fusion_elementwise_mul_activation, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(elementwise_max, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(fusion_elementwise_max_activation, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(elementwise_div, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(fusion_elementwise_div_activation, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(fetch, kFPGA, kFP16, kNHWC, def); USE_LITE_KERNEL(fill_constant, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(fill_constant_batch_size_like, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(while, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(batch_norm, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(io_copy, kFPGA, kAny, kAny, host_to_device); USE_LITE_KERNEL(io_copy, kFPGA, kAny, kAny, device_to_host); USE_LITE_KERNEL(io_copy_once, kFPGA, kAny, kAny, host_to_device_once); USE_LITE_KERNEL(io_copy_once, kFPGA, kAny, kAny, device_to_host_once); USE_LITE_KERNEL(arg_max, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(conv2d, kFPGA, kFP16, kNHWC, def); USE_LITE_KERNEL(beam_search_decode, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(assign_value, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(gru, kFPGA, kFP16, kNHWC, def); USE_LITE_KERNEL(cast, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(conv2d, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(depthwise_conv2d, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(conv2d, kARM, kInt8, kNCHW, int8_out); USE_LITE_KERNEL(conv2d, kARM, kInt8, kNCHW, fp32_out); USE_LITE_KERNEL(depthwise_conv2d, kARM, kInt8, kNCHW, int8_out); USE_LITE_KERNEL(depthwise_conv2d, kARM, kInt8, kNCHW, fp32_out); USE_LITE_KERNEL(write_to_array, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(anchor_generator, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(dropout, kFPGA, kFP16, kNHWC, def); USE_LITE_KERNEL(pad2d, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(fc, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(fc, kARM, kInt8, kNCHW, int8out); USE_LITE_KERNEL(fc, kARM, kInt8, kNCHW, fp32out); USE_LITE_KERNEL(lrn, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(pool2d, kFPGA, kFP16, kNHWC, def); USE_LITE_KERNEL(read_from_array, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(matmul, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(fetch, kHost, kAny, kAny, def); USE_LITE_KERNEL(slice, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(concat, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(shuffle_channel, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(top_k, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(sequence_pool, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(feed, kHost, kAny, kAny, def); USE_LITE_KERNEL(gru_unit, kARM, kFloat, kNCHW, def); USE_LITE_KERNEL(fc, kFPGA, kFP16, kNHWC, def);