CMakeLists.txt 9.2 KB
Newer Older
W
Wu Yi 已提交
1
include(operators)
D
dzhwinter 已提交
2

W
Wu Yi 已提交
3 4 5
# Reset state left over from a previous configure run: drop the cached
# GLOB_OP_LIB and OP_LIBRARY entries. The generated pybind file is rewritten
# from scratch by the file(WRITE ...) call that follows.
unset(GLOB_OP_LIB CACHE)
unset(OP_LIBRARY CACHE)
6 7 8 9
# Registration lines are accumulated in a temporary header (pybind.h.tmp).
# Its path is stored as an INTERNAL cache entry; pybind_file_final is the
# path of the real pybind.h. Both are handed to copy_if_different() on the
# last line of this file.
set(pybind_file
    "${PADDLE_BINARY_DIR}/paddle/fluid/pybind/pybind.h.tmp"
    CACHE INTERNAL "pybind.h file")
set(pybind_file_final "${PADDLE_BINARY_DIR}/paddle/fluid/pybind/pybind.h")
# Start the temporary header over with only the "generated file" banner.
file(WRITE "${pybind_file}"
     "// Generated by the paddle/fluid/operators/CMakeLists.txt.  DO NOT EDIT!\n\n")

Q
qijun 已提交
10
add_subdirectory(math)
11
add_subdirectory(eigen)
W
Wu Yi 已提交
12 13 14 15 16 17 18 19
# Operator families that are always added, one subdirectory each.
# The order matches the original sequence of add_subdirectory() calls.
foreach(op_family
        controlflow
        detection
        elementwise
        fused
        metrics
        optimizers
        reduce_ops
        sequence_ops)
    add_subdirectory(${op_family})
endforeach()
T
tensor-tang 已提交
20
add_subdirectory(jit)
L
lidanqing 已提交
21 22 23
if(WITH_MKLDNN)
    add_subdirectory(mkldnn)
endif()
Q
QI JUN 已提交
24

T
tangwei12 已提交
25

T
typhoonzero 已提交
26
if(WITH_DISTRIBUTE)
27
    add_subdirectory(collective)
W
Wu Yi 已提交
28
endif()
29

T
tangwei12 已提交
30 31 32 33
if (WITH_PSCORE)
    add_subdirectory(pscore)
endif()

34 35
add_subdirectory(amp)

W
wopeizl 已提交
36
add_subdirectory(reader)
T
typhoonzero 已提交
37

W
Wu Yi 已提交
38 39
if (NOT WIN32)
    add_subdirectory(nccl)
S
sneaxiy 已提交
40 41
endif()

42
if (WITH_GPU AND TENSORRT_FOUND)
W
Wu Yi 已提交
43
    add_subdirectory(tensorrt)
44
endif()
45

D
denglin-github 已提交
46 47 48 49
if (WITH_DLNNE)
    add_subdirectory(dlnne)
endif()

石晓伟 已提交
50 51 52 53
if (WITH_LITE)
    add_subdirectory(lite)
endif()

W
Wilber 已提交
54
SET(OP_HEADER_DEPS xxhash executor)
石晓伟 已提交
55

56
if (WITH_GPU)
57 58 59
    # CUDA compilers older than 11.0 get `cub` as an extra header dependency.
    # VERSION_LESS compares dotted versions component by component; plain LESS
    # is a numeric comparison and is not meant for strings such as "10.2.89".
    # Passing the variable name (instead of expanding ${...}) also keeps the
    # condition well-formed if the version string happens to be empty.
    if (CMAKE_CUDA_COMPILER_VERSION VERSION_LESS 11.0)
        list(APPEND OP_HEADER_DEPS cub)
    endif()
60 61
endif()

62 63 64 65
if (WITH_POCKETFFT)
    # Add pocketfft to the header dependencies shared by the operators.
    list(APPEND OP_HEADER_DEPS pocketfft)
endif()

66

A
Aurelius84 已提交
67
SET(OP_MKL_DEPS "")
68
if (NOT WITH_MKL OR NOT WITH_AVX)
A
Aurelius84 已提交
69 70 71
    SET(OP_MKL_DEPS ${OP_MKL_DEPS} match_matrix_tensor_op)
    SET(OP_MKL_DEPS ${OP_MKL_DEPS} var_conv_2d_op)
endif()
72
if(WITH_COVERAGE OR WIN32 OR WITH_NV_JETSON)
A
Aurelius84 已提交
73
    SET(OP_MKL_DEPS ${OP_MKL_DEPS} pyramid_hash_op)
K
Kevin 已提交
74 75
endif()

76 77 78 79 80
if(WITH_UNITY_BUILD)
    # Load Unity Build rules for operators in paddle/fluid/operators.
    include(unity_build_rule.cmake)
endif()

81
register_operators(EXCLUDES py_layer_op py_func_op warpctc_op dgc_op sparse_attention_op lstm_op run_program_op eye_op recurrent_op
82
        sync_batch_norm_op spectral_op ${OP_MKL_DEPS} DEPS ${OP_HEADER_DEPS})
武毅 已提交
83

T
tangwei12 已提交
84
op_library(run_program_op SRCS run_program_op.cc run_program_op.cu.cc DEPS executor_cache ${OP_HEADER_DEPS})
85

86 87
if (WITH_GPU OR WITH_ROCM)
    if(WITH_ROCM)
88
        op_library(warpctc_op DEPS dynload_warpctc sequence_padding sequence_scale SRCS warpctc_op.cc warpctc_op.cu)
Q
qingqing01 已提交
89
    # warpctc_op needs cuDNN 7 or above
90
    elseif(${CUDNN_MAJOR_VERSION} VERSION_LESS 7)
91
        op_library(warpctc_op DEPS dynload_warpctc sequence_padding sequence_scale SRCS warpctc_op.cc warpctc_op.cu)
W
Wu Yi 已提交
92 93
    else()
        op_library(warpctc_op DEPS dynload_warpctc sequence_padding sequence_scale)
W
Wu Yi 已提交
94
    endif()
95 96
    op_library(sync_batch_norm_op)
    file(APPEND ${pybind_file} "USE_CUDA_ONLY_OP(sync_batch_norm);\n")
97
    if ((NOT WIN32) AND (NOT WITH_ROCM) AND (NOT PADDLE_WITH_ARM) AND (NOT ${CMAKE_CUDA_COMPILER_VERSION} VERSION_LESS 11.2) )
98 99 100
        op_library(sparse_attention_op)
        file(APPEND ${pybind_file} "USE_CUDA_ONLY_OP(sparse_attention);\n")
    endif()
W
Wu Yi 已提交
101 102
else()
    op_library(warpctc_op DEPS dynload_warpctc sequence_padding sequence_scale)
W
Wu Yi 已提交
103
endif()
T
tangwei12 已提交
104

105

106
if (WITH_GPU AND (NOT WITH_ROCM))
107 108 109 110 111 112
    # GPU build of spectral_op: both the .cc and .cu sources are compiled.
    # With oneMKL available the op also depends on dynload_mklrt and sees the
    # MKL include directory.
    if (MKL_FOUND AND WITH_ONEMKL)
        op_library(spectral_op
            SRCS spectral_op.cc spectral_op.cu
            DEPS dynload_cuda dynload_mklrt ${OP_HEADER_DEPS})
        target_include_directories(spectral_op PRIVATE ${MKL_INCLUDE})
    else()
        op_library(spectral_op
            SRCS spectral_op.cc spectral_op.cu
            DEPS dynload_cuda ${OP_HEADER_DEPS})
    endif()
113
else()
114 115 116 117 118 119
    # Non-GPU build of spectral_op: only spectral_op.cc is compiled.
    # With oneMKL available the op also depends on dynload_mklrt and sees the
    # MKL include directory.
    if (MKL_FOUND AND WITH_ONEMKL)
        op_library(spectral_op
            SRCS spectral_op.cc
            DEPS dynload_mklrt ${OP_HEADER_DEPS})
        target_include_directories(spectral_op PRIVATE ${MKL_INCLUDE})
    else()
        op_library(spectral_op
            SRCS spectral_op.cc
            DEPS ${OP_HEADER_DEPS})
    endif()
120 121
endif()

T
tangwei12 已提交
122 123 124
# These three ops are listed under EXCLUDES in the register_operators() call
# in this file, so they are declared by hand here.
op_library(lstm_op DEPS ${OP_HEADER_DEPS} lstm_compute)
foreach(header_deps_only_op eye_op recurrent_op)
    op_library(${header_deps_only_op} DEPS ${OP_HEADER_DEPS})
endforeach()
125

126
set(COMMON_OP_DEPS ${OP_HEADER_DEPS})
127

G
gongweibao 已提交
128
if (WITH_DGC)
129 130 131 132 133
    op_library(dgc_op DEPS dgc)
    file(APPEND ${pybind_file} "USE_CUDA_ONLY_OP(dgc);\n")
    set(COMMON_OP_DEPS ${COMMON_OP_DEPS} dgc)
endif()

134
cc_library(common_infer_shape_functions SRCS common_infer_shape_functions.cc DEPS operator)
A
Aurelius84 已提交
135

136
set(COMMON_OP_DEPS ${COMMON_OP_DEPS} selected_rows_functor selected_rows lapack_function
Y
yaoxuefeng 已提交
137
lod_tensor maxouting unpooling pooling lod_rank_table context_project
138
sequence_pooling segment_pooling executor device_memory_aligment generator)
P
peizhilin 已提交
139
set(COMMON_OP_DEPS ${COMMON_OP_DEPS} dynload_warpctc)
X
xuezhong 已提交
140
set(COMMON_OP_DEPS ${COMMON_OP_DEPS} sequence_padding sequence_scale cos_sim_functor memory jit_kernel_helper concat_and_split cross_entropy softmax vol2col im2col sampler sample_prob tree2col)
W
Weilong Wu 已提交
141
set(COMMON_OP_DEPS ${COMMON_OP_DEPS} sequence2batch lstm_compute matrix_bit_code gru_compute activation_functions beam_search fc matrix_inverse matrix_solve)
Y
yaoxuefeng 已提交
142
set(COMMON_OP_DEPS ${COMMON_OP_DEPS} box_wrapper boost ps_gpu_wrapper)
143
set(COMMON_OP_DEPS ${COMMON_OP_DEPS} common_infer_shape_functions)
144
set(COMMON_OP_DEPS ${COMMON_OP_DEPS} eigen_function)
145
if (WITH_GPU OR WITH_ROCM)
146
  set(COMMON_OP_DEPS ${COMMON_OP_DEPS} depthwise_conv prelu bert_encoder_functor)
W
Wu Yi 已提交
147
endif()
148
set(COMMON_OP_DEPS ${COMMON_OP_DEPS} device_memory_aligment)
149
set(COMMON_OP_DEPS ${COMMON_OP_DEPS} layer)
H
Huihuang Zheng 已提交
150
set(COMMON_OP_DEPS ${COMMON_OP_DEPS} tensor_formatter)
151
set(COMMON_OP_DEPS ${COMMON_OP_DEPS} op_version_registry)
152 153 154
if (WITH_ASCEND)
  # Ascend builds add ascend_wrapper to the common operator dependencies.
  list(APPEND COMMON_OP_DEPS ascend_wrapper)
endif()
155

156
if (WITH_ASCEND_CL)
157
  cc_test(assign_op_npu_test SRCS assign_op_npu_test.cc DEPS assign_op)
158 159 160 161
  cc_library(npu_op_runner SRCS npu_op_runner.cc DEPS operator npu_info)
  set(COMMON_OP_DEPS ${COMMON_OP_DEPS} npu_op_runner)
endif()

W
Wu Yi 已提交
162 163 164 165 166 167 168 169
# FIXME(typhoonzero): these operator deps may not be needed.
# op_library(lod_tensor_to_array_op DEPS lod_rank_table_op)
# op_library(array_to_lod_tensor_op DEPS lod_rank_table_op)
# op_library(unsqueeze_op DEPS reshape_op)
# op_library(squeeze_op DEPS reshape_op)
# op_library(flatten_op DEPS reshape_op)
# op_library(unstack_op DEPS stack_op)
# op_library(tensor_array_to_tensor_op DEPS concat_op)
B
baiyf 已提交
170

W
Wu Yi 已提交
171 172
# Fold the common operator dependencies into OPERATOR_DEPS, then publish the
# combined list through the cache as GLOB_OPERATOR_DEPS.
list(APPEND OPERATOR_DEPS ${COMMON_OP_DEPS})
set(GLOB_OPERATOR_DEPS
    ${OPERATOR_DEPS}
    CACHE INTERNAL "Global Op dependencies")
L
Luo Tao 已提交
173

174
cc_test(test_common_infer_shape_functions SRCS test_common_infer_shape_functions.cc DEPS common_infer_shape_functions ${COMMON_OP_DEPS} activation_op elementwise_add_op softmax_op softmax)
175
cc_test(gather_test SRCS gather_test.cc DEPS tensor)
176
cc_test(assign_op_test SRCS assign_op_test.cc DEPS assign_op)
Y
Yu Yang 已提交
177
cc_test(scatter_test SRCS scatter_test.cc DEPS tensor math_function)
Q
Qiao Longfei 已提交
178
cc_test(beam_search_decode_op_test SRCS beam_search_decode_op_test.cc DEPS lod_tensor)
Y
Yi Wang 已提交
179
cc_test(strided_memcpy_test SRCS strided_memcpy_test.cc DEPS tensor memory)
Y
Yu Yang 已提交
180
cc_test(save_load_op_test SRCS save_load_op_test.cc DEPS save_op load_op)
181
cc_test(save_load_combine_op_test SRCS save_load_combine_op_test.cc DEPS save_combine_op load_combine_op)
Z
Zeng Jinle 已提交
182
if (WITH_GPU)
183
    nv_test(dropout_op_test SRCS dropout_op_test.cc DEPS dropout_op tensor generator)
Z
Zeng Jinle 已提交
184
    nv_test(test_leaky_relu_grad_grad_functor SRCS test_leaky_relu_grad_grad_functor.cc test_leaky_relu_grad_grad_functor.cu DEPS tensor device_context eigen3)
185
    nv_test(feed_forward_test SRCS feed_forward_test.cu DEPS elementwise_add_op matmul_op tensor generator)
186 187 188
elseif(WITH_ROCM)
    hip_test(dropout_op_test SRCS dropout_op_test.cc DEPS dropout_op tensor generator)
    hip_test(test_leaky_relu_grad_grad_functor SRCS test_leaky_relu_grad_grad_functor.cc test_leaky_relu_grad_grad_functor.cu DEPS tensor device_context eigen3)
Z
Zeng Jinle 已提交
189 190 191
else()
    cc_test(test_leaky_relu_grad_grad_functor SRCS test_leaky_relu_grad_grad_functor.cc DEPS tensor device_context eigen3)
endif()
192

H
Huihuang Zheng 已提交
193
cc_library(tensor_formatter SRCS tensor_formatter.cc DEPS ${OP_HEADER_DEPS})
S
sneaxiy 已提交
194 195
if (WITH_PYTHON)
  cc_library(py_func_op SRCS py_func_op.cc DEPS op_registry python pybind)
196
  cc_library(py_layer_op SRCS py_layer_op.cc DEPS op_registry python pybind)
S
sneaxiy 已提交
197 198
endif()

199 200
if (WITH_ASCEND_CL)
  cc_test(range_op_npu_test SRCS range_op_npu_test.cc DEPS op_registry range_op scope device_context enforce executor)
201
  cc_test(expand_op_npu_test SRCS expand_op_npu_test.cc DEPS op_registry expand_op eigen_function scope device_context enforce executor compare_op)
202 203
endif()

W
Wu Yi 已提交
204
set(GLOB_OP_LIB ${OP_LIBRARY} CACHE INTERNAL "Global OP library")
205
add_subdirectory(benchmark)
206 207

cc_test(op_debug_string_test SRCS op_debug_string_test.cc DEPS elementwise_add_op)
208 209 210 211
if (WITH_ASCEND_CL)
    # transpose_op test, registered only when WITH_ASCEND_CL is enabled.
    cc_test(transpose_op_npu_test
        SRCS transpose_op_npu_test.cc
        DEPS op_registry transpose_op scope device_context enforce executor)
endif()

212 213 214

if(WITH_MKLDNN)
include(mkldnn/inplace_op_tests.cmake)
215
include(mkldnn/caching_tests.cmake)
J
Jacek Czaja 已提交
216
include(mkldnn/nhwc_op_tests.cmake)
217
endif()
218 219 220 221 222

if(WITH_UNITY_BUILD)
    # When operators are compiled with Unity Build, `register_operators`
    # causes the unity library to lose some symbols, so the required link
    # dependencies must be declared explicitly here.
T
tangwei12 已提交
223
    target_link_libraries(paddle_operators_unity ${OP_HEADER_DEPS} ${COMMON_OP_DEPS})
224
endif()
225 226 227 228

if(WITH_ASCEND_CL)
    # gelu_op test, registered only when WITH_ASCEND_CL is enabled.
    cc_test(gelu_op_npu_test
        SRCS gelu_op_npu_test.cc
        DEPS op_registry gelu_op scope device_context enforce executor)
endif()
B
Baibaifan 已提交
229 230 231 232

if (WITH_GPU OR WITH_ASCEND_CL)
    # copy_cross_scope_op test, registered for GPU or Ascend CL builds.
    cc_test(copy_cross_scope_test
        SRCS copy_cross_scope_test.cc
        DEPS op_registry copy_cross_scope_op scope device_context enforce executor)
endif()
233 234

copy_if_different(${pybind_file} ${pybind_file_final})