CMakeLists.txt 3.3 KB
Newer Older
Y
Yan Chunwei 已提交
1
# Sources of the TensorRT op converters. Everything collected in CONVERT_FILES
# is compiled into the tensorrt_converter library further down in this file.
# Keep one file per line so that additions show up cleanly in diffs.
list(
  APPEND
  CONVERT_FILES
  matrix_multiply_op.cc
  bmm_op.cc
  conv2d_op.cc
  pool2d_op.cc
  elementwise_op.cc
  batch_norm_op.cc
  activation_op.cc
  unary_op.cc
  softmax_op.cc
  concat_op.cc
  dropout_op.cc
  group_norm_op.cc
  pad3d_op.cc
  pad_op.cc
  split_op.cc
  square_op.cc
  prelu_op.cc
  leaky_relu_op.cc
  gelu_op.cc
  layer_norm_op.cc
  multihead_matmul_op.cc
  multihead_matmul_roformer_op.cc
  flash_multihead_matmul_op.cc
  cross_multihead_matmul_op.cc
  qk_multihead_matmul_op.cc
  grid_sampler_op.cc
  shuffle_channel_op.cc
  fill_any_like_op.cc
  where_op.cc
  bitwise_not_op.cc
  one_hot_op.cc
  swish_op.cc
  silu_op.cc
  instance_norm_op.cc
  stack_op.cc
  transpose_op.cc
  flatten_op.cc
  flatten_contiguous_range_op.cc
  skip_layernorm.cc
  scale_op.cc
  slice_op.cc
  hard_sigmoid_op.cc
  hard_swish_op.cc
  clip_op.cc
  gather_op.cc
  index_select_op.cc
  anchor_generator_op.cc
  yolo_box_op.cc
  yolo_box_head_op.cc
  arg_max_op.cc
  arg_min_op.cc
  roi_align_op.cc
  affine_channel_op.cc
  multiclass_nms_op.cc
  multiclass_nms3_op.cc
  nearest_interp_op.cc
  reshape_op.cc
  reduce_op.cc
  gather_nd_op.cc
  tile_op.cc
  conv3d_op.cc
  mish_op.cc
  nearest_interp_v2_op.cc
  bilinear_interp_v2_op.cc
  pool3d_op.cc
  deformable_conv_op.cc
  strided_slice_op.cc
  preln_skip_layernorm.cc
  roll_op.cc
  transformer_input_convert_op.cc
  cast_op.cc
  remove_padding_op.cc
  equal_op.cc
  recover_padding_op.cc
  preln_residual_bias.cc
  c_allreduce_op.cc
  top_k_op.cc
  range_op.cc
  squeeze2_op.cc
  unsqueeze2_op.cc
  rnn_op.cc
  fill_constant_batch_size_like_op.cc
  sum_op.cc
  shape_op.cc
  fill_constant_op.cc
  fused_token_prune_op.cc
  celu_op.cc
  layernorm_shift_partition_op.cc
  reverse_roll_op.cc
  tanhshrink_op.cc
  take_along_axis_op.cc
  logsigmoid_op.cc
  preln_layernorm_shift_partition_op.cc
  trans_layernorm_op.cc
  merge_layernorm_op.cc
  skip_merge_layernorm_op.cc
  generic_and_custom_plugin_creater.cc
  lookup_table_op.cc
  elementwiseadd_transpose_op.cc
  skip_groupnorm_act_op.cc
  preln_groupnorm_act_op.cc
  expand_v2_op.cc
  cumsum_op.cc
  temporal_shift_op.cc)
109

110
# These converters are only built against TensorRT 7 or newer.
# The variable is named directly (no ${...}) so that an unset or empty
# TENSORRT_MAJOR_VERSION makes the condition false instead of producing a
# malformed if() expression.
if(TENSORRT_MAJOR_VERSION GREATER_EQUAL 7)
  list(APPEND CONVERT_FILES emb_eltwise_layernorm.cc
       preln_emb_eltwise_layernorm.cc)
endif()

115 116 117 118
# The sparse converters are built only when cuSPARSELt was found and the
# TensorRT major version is at least 8.
# TENSORRT_MAJOR_VERSION is referenced by name so that an unset or empty value
# yields "false" rather than a malformed if() expression.
if(CUSPARSELT_FOUND AND TENSORRT_MAJOR_VERSION GREATER_EQUAL 8)
  list(APPEND CONVERT_FILES sparse_fc_op.cc sparse_multihead_matmul_op.cc)
endif()

X
xjmxyt 已提交
119 120 121 122 123
# set_value_op.cc is built for TensorRT 8.2 and newer.
# Major and minor are compared as a version pair: testing "major >= 8 AND
# minor >= 2" would wrongly reject releases such as 9.0 or 10.0, whose minor
# number is below 2. Variables are referenced by name so that unset values make
# the condition false instead of producing a malformed if() expression.
if(TENSORRT_MAJOR_VERSION GREATER 8
   OR (TENSORRT_MAJOR_VERSION EQUAL 8 AND TENSORRT_MINOR_VERSION GREATER_EQUAL
                                          2))
  list(APPEND CONVERT_FILES set_value_op.cc)
endif()

124 125
# Library holding every converter source collected in CONVERT_FILES above.
nv_library(
  tensorrt_converter
  SRCS ${CONVERT_FILES}
  DEPS tensorrt_engine
       tensorrt_plugin
       operator
       scope
       framework_proto
       tensorrt_op_teller
       op_registry)
134

135 136 137 138 139
# Test binary for the op converters, built from test_op_converter.cc and
# linked against the converter library and the TensorRT engine.
nv_test(
  test_op_converter
  SRCS test_op_converter.cc
  DEPS paddle_framework
       ${GLOB_OPERATOR_DEPS}
       tensorrt_engine
       tensorrt_converter)
140

W
weishengying 已提交
141 142 143
# Test binary for the custom plugin creator, built from
# test_custom_plugin_creater.cc and linked against the converter library.
nv_test(
  test_custom_plugin_creater
  SRCS test_custom_plugin_creater.cc
  DEPS paddle_framework tensorrt_converter op_meta_info custom_operator
       init_phi)
W
weishengying 已提交
146

147 148 149 150 151
if(WIN32 AND WITH_ONNXRUNTIME)
  # On Windows, copy onnxruntime for the C++ test. The test is only built in
  # CI, so the Windows generator is assumed to be Ninja.
  copy_onnx(test_op_converter)
endif()