CMakeLists.txt 6.4 KB
Newer Older
W
Wu Yi 已提交
1
include(operators)
D
dzhwinter 已提交
2

3 4
add_subdirectory(generator)

W
Wilber 已提交
5
# solve "math constants not defined" problems caused by the order of inclusion
6 7 8
# of <cmath> and the definition of macro _USE_MATH_DEFINES
add_definitions(-D_USE_MATH_DEFINES)

W
Wu Yi 已提交
9 10 11
# On every (re)configure, drop the cached OP_LIBRARY and GLOB_OP_LIB entries
# first; the pybind file content is rewritten further below.
unset(OP_LIBRARY CACHE)
unset(GLOB_OP_LIB CACHE)
12
# Scratch copy of the generated header (pybind.h.tmp in the binary tree),
# stored as an INTERNAL cache entry.
set(pybind_file ${PADDLE_BINARY_DIR}/paddle/fluid/pybind/pybind.h.tmp CACHE INTERNAL "pybind.h file")
13
# Path of the pybind.h.prune file in the binary tree, stored as an INTERNAL
# cache entry. NOTE(review): presumably written by prune_pybind_h() - confirm.
set(pybind_file_prune ${PADDLE_BINARY_DIR}/paddle/fluid/pybind/pybind.h.prune CACHE INTERNAL "pybind.h file")
14
# Final location of the generated pybind.h; unlike the two paths above this is
# a normal (non-cache) variable.
set(pybind_file_final ${PADDLE_BINARY_DIR}/paddle/fluid/pybind/pybind.h)
15
# Start the temporary pybind header from scratch: file(WRITE) overwrites any
# previous content with the include line and the "DO NOT EDIT" banner.
file(WRITE ${pybind_file} "#include \"paddle/phi/core/kernel_registry.h\" // Generated by the paddle/fluid/operators/CMakeLists.txt.  DO NOT EDIT!\n\n")
16

Q
qijun 已提交
17
add_subdirectory(math)
W
Wu Yi 已提交
18 19 20 21 22 23 24 25
# Descend into each of the listed subdirectories, in exactly this order.
foreach(operator_subdir
        controlflow
        detection
        elementwise
        fused
        metrics
        optimizers
        reduce_ops
        sequence_ops)
  add_subdirectory(${operator_subdir})
endforeach()
S
Steffy-zxf 已提交
26
add_subdirectory(string)
L
levi131 已提交
27
add_subdirectory(prim_ops)
Q
QI JUN 已提交
28

T
tangwei12 已提交
29

T
typhoonzero 已提交
30
if(WITH_DISTRIBUTE)
31
    add_subdirectory(collective)
W
Wu Yi 已提交
32
endif()
33

T
tangwei12 已提交
34 35 36 37
# The pscore subdirectory is only configured when WITH_PSCORE is enabled.
if(WITH_PSCORE)
  add_subdirectory(pscore)
endif()

38 39
add_subdirectory(amp)

W
wopeizl 已提交
40
add_subdirectory(reader)
T
typhoonzero 已提交
41

W
Wu Yi 已提交
42 43
if (NOT WIN32)
    add_subdirectory(nccl)
S
sneaxiy 已提交
44 45
endif()

46
if (WITH_GPU AND TENSORRT_FOUND)
W
Wu Yi 已提交
47
    add_subdirectory(tensorrt)
48
endif()
49

D
denglin-github 已提交
50 51 52 53
# The dlnne subdirectory is only configured when WITH_DLNNE is enabled.
if(WITH_DLNNE)
  add_subdirectory(dlnne)
endif()

石晓伟 已提交
54 55 56 57
# The lite subdirectory is only configured when WITH_LITE is enabled.
if(WITH_LITE)
  add_subdirectory(lite)
endif()

58 59 60 61
# The cinn subdirectory is only configured when WITH_CINN is enabled.
if(WITH_CINN)
  add_subdirectory(cinn)
endif()

A
Allen Guo 已提交
62 63 64 65
# The ipu subdirectory is only configured when WITH_IPU is enabled.
if(WITH_IPU)
  add_subdirectory(ipu)
endif()

W
Wilber 已提交
66
SET(OP_HEADER_DEPS xxhash executor)
石晓伟 已提交
67

68
if (WITH_GPU)
69 70 71
    # Add cub to the operator header deps only when the CUDA compiler is older
    # than 11.0. The comparison uses VERSION_LESS so the dotted version string
    # is compared component-wise rather than as a real number, and both
    # operands are quoted so an empty version cannot produce a malformed if().
    if ("${CMAKE_CUDA_COMPILER_VERSION}" VERSION_LESS "11.0")
        set(OP_HEADER_DEPS ${OP_HEADER_DEPS} cub)
    endif()
72 73
endif()

74 75 76 77
# pocketfft joins the shared operator header deps when WITH_POCKETFFT is on.
if(WITH_POCKETFFT)
  list(APPEND OP_HEADER_DEPS pocketfft)
endif()

78

A
Aurelius84 已提交
79
SET(OP_MKL_DEPS "")
80
if (NOT WITH_MKL OR NOT WITH_AVX)
A
Aurelius84 已提交
81 82 83
    # Both ops go into OP_MKL_DEPS, which is expanded inside the EXCLUDES list
    # of the register_operators() call further down.
    list(APPEND OP_MKL_DEPS
         match_matrix_tensor_op
         var_conv_2d_op)
endif()
84
if(WITH_COVERAGE OR WIN32 OR WITH_NV_JETSON)
A
Aurelius84 已提交
85
    SET(OP_MKL_DEPS ${OP_MKL_DEPS} pyramid_hash_op)
K
Kevin 已提交
86 87
endif()

88 89 90 91 92
if(WITH_UNITY_BUILD)
  # Unity builds need the grouping rules for the operators located in
  # paddle/fluid/operators; pull them in from unity_build_rule.cmake.
  include(unity_build_rule.cmake)
endif()

93
# Extend the shared operator header deps with the phi / prim related targets.
list(APPEND OP_HEADER_DEPS
     phi
     phi_utils
     static_prim_api
     get_expected_kernel_func)
94

95
register_operators(EXCLUDES py_func_op dgc_op generated_op1 generated_op2 generated_op3 generated_op4 load_combine_op lstm_op run_program_op quantize_linear_op
R
risemeup1 已提交
96
        recurrent_op save_combine_op sparse_attention_op sync_batch_norm_op activation_op ${OP_MKL_DEPS} DEPS ${OP_HEADER_DEPS} processgroup_comm_utils)
武毅 已提交
97

98
op_library(generated_op UNITY SRCS generated_op1.cc generated_op2.cc generated_op3.cc generated_op4.cc DEPS ${OP_HEADER_DEPS})
99
op_library(run_program_op DEPS executor_cache ${OP_HEADER_DEPS})
100
target_link_libraries(run_program_op cuda_graph_with_memory_pool)
101
op_library(quantize_linear_op DEPS phi)
102
op_library(save_combine_op DEPS string_array phi)
S
Steffy-zxf 已提交
103
op_library(load_combine_op DEPS string_array)
104

105 106 107 108
# The .cu kernel of class_center_sample_op is registered for GPU and ROCm
# builds only.
if(WITH_GPU OR WITH_ROCM)
  register_cu_kernel(
    class_center_sample_op
    SRCS class_center_sample_op.cu
    DEPS ${OP_HEADER_DEPS})
endif()

109 110 111 112
# The MKLDNN kernel of layer_norm_op is registered only when WITH_MKLDNN is on.
if(WITH_MKLDNN)
  register_mkldnn_kernel(
    layer_norm_op
    SRCS layer_norm_mkldnn_op.cc
    DEPS ${OP_HEADER_DEPS})
endif()

H
huangjiyi 已提交
113 114 115 116 117 118 119 120
# activation_op always compiles activation_op.cc. GPU/ROCm builds add the .kps
# and soft_relu .cu sources, XPU_KP builds add only the .kps source.
set(activation_op_srcs activation_op.cc)
if(WITH_GPU OR WITH_ROCM)
  list(APPEND activation_op_srcs activation_op.kps soft_relu_op.cu)
elseif(WITH_XPU_KP)
  list(APPEND activation_op_srcs activation_op.kps)
endif()
op_library(activation_op SRCS ${activation_op_srcs} DEPS ${OP_HEADER_DEPS})
unset(activation_op_srcs)

121
if (WITH_GPU OR WITH_ROCM)
R
risemeup1 已提交
122
    op_library(sync_batch_norm_op DEPS processgroup_comm_utils)
123
    if ((NOT WIN32) AND (NOT WITH_ROCM) AND (NOT PADDLE_WITH_ARM) AND (NOT ${CMAKE_CUDA_COMPILER_VERSION} VERSION_LESS 11.3) )
R
risemeup1 已提交
124
        op_library(sparse_attention_op DEPS processgroup_comm_utils)
125
    endif()
W
Wu Yi 已提交
126
endif()
T
tangwei12 已提交
127

128
op_library(lstm_op DEPS ${OP_HEADER_DEPS})
R
risemeup1 已提交
129 130 131 132 133 134
# recurrent_op lists `executor` explicitly ahead of the shared header deps on
# ROCm builds; every other build passes the shared header deps only.
if(NOT WITH_ROCM)
  op_library(recurrent_op
             DEPS ${OP_HEADER_DEPS})
else()
  op_library(recurrent_op
             DEPS executor ${OP_HEADER_DEPS})
endif()

135

136
set(COMMON_OP_DEPS ${OP_HEADER_DEPS})
137

G
gongweibao 已提交
138
if (WITH_DGC)
139 140 141 142
    # Build dgc_op against dgc and make dgc part of the common operator deps.
    op_library(dgc_op
               DEPS dgc)
    list(APPEND COMMON_OP_DEPS dgc)
endif()

143
cc_library(common_infer_shape_functions SRCS common_infer_shape_functions.cc DEPS operator)
144
cc_library(ops_extra_info SRCS ops_extra_info.cc DEPS attribute phi)
A
Aurelius84 已提交
145

146 147 148
# Append phi and the tensor/executor related targets to the common operator
# deps, keeping the original order.
list(APPEND COMMON_OP_DEPS
     phi
     selected_rows_utils
     lod_tensor
     unpooling
     lod_rank_table
     context_project
     executor
     static_prim_api)
149
set(COMMON_OP_DEPS ${COMMON_OP_DEPS} dynload_warpctc static_prim_api static_utils static_global_utils prim_utils)
150 151
# Further targets appended to the common operator deps, in the original order.
list(APPEND COMMON_OP_DEPS
     cos_sim_functor
     memory
     concat_and_split
     sampler
     sample_prob
     tree2col
     beam_search)
R
Ruibiao Chen 已提交
152
set(COMMON_OP_DEPS ${COMMON_OP_DEPS} box_wrapper ps_gpu_wrapper)
153
set(COMMON_OP_DEPS ${COMMON_OP_DEPS} common_infer_shape_functions)
154 155 156 157
# processgroup_comm_utils is always a common dep; process_group_nccl is added
# on top of it for NCCL or RCCL builds.
list(APPEND COMMON_OP_DEPS processgroup_comm_utils)
if(WITH_NCCL OR WITH_RCCL)
  list(APPEND COMMON_OP_DEPS process_group_nccl)
endif()
158
if (WITH_GPU OR WITH_ROCM)
159
  set(COMMON_OP_DEPS ${COMMON_OP_DEPS} depthwise_conv prelu bert_encoder_functor)
W
Wu Yi 已提交
160
endif()
161 162 163
# XPU builds add xpulib to the common operator deps.
if(WITH_XPU)
  list(APPEND COMMON_OP_DEPS xpulib)
endif()
164
set(COMMON_OP_DEPS ${COMMON_OP_DEPS} layer)
165
set(COMMON_OP_DEPS ${COMMON_OP_DEPS} op_version_registry)
张春乔 已提交
166

167

W
Wu Yi 已提交
168 169 170 171 172 173
# FIXME(typhoonzero): these operator deps may not be needed.
# op_library(unsqueeze_op DEPS reshape_op)
# op_library(squeeze_op DEPS reshape_op)
# op_library(flatten_op DEPS reshape_op)
# op_library(unstack_op DEPS stack_op)
# op_library(tensor_array_to_tensor_op DEPS concat_op)
B
baiyf 已提交
174

W
Wu Yi 已提交
175 176
# Fold the common operator deps collected above into OPERATOR_DEPS, then
# publish the combined list as the INTERNAL cache entry GLOB_OPERATOR_DEPS so
# it remains available outside this directory scope.
set(OPERATOR_DEPS ${OPERATOR_DEPS} ${COMMON_OP_DEPS})
set(GLOB_OPERATOR_DEPS ${OPERATOR_DEPS} CACHE INTERNAL "Global Op dependencies")
L
Luo Tao 已提交
177

S
sneaxiy 已提交
178 179 180 181
# py_func_op is built as a plain cc_library, and only when WITH_PYTHON is on.
if(WITH_PYTHON)
  cc_library(
    py_func_op
    SRCS py_func_op.cc
    DEPS op_registry python pybind)
endif()

W
Wu Yi 已提交
182
set(GLOB_OP_LIB ${OP_LIBRARY} CACHE INTERNAL "Global OP library")
183

184 185 186 187
if(WITH_UNITY_BUILD)
    # When operators are compiled with Unity Build, `register_operator` causes
    # the unity library to lose some symbols, so the link dependencies must be
    # specified explicitly here.
T
tangwei12 已提交
188
    target_link_libraries(paddle_operators_unity ${OP_HEADER_DEPS} ${COMMON_OP_DEPS})
189
endif()
190

191
# Hand the temporary header and the final pybind.h path to copy_if_different().
# NOTE(review): presumably the copy is skipped when the content is unchanged,
# as the helper's name suggests - confirm against its definition.
copy_if_different(${pybind_file} ${pybind_file_final})
192 193

if (WITH_CUSTOM_DEVICE)
194
cc_library(custom_device_common_op_registry SRCS custom_device_common_op_registry.cc DEPS operator phi type_info)
195
endif()
196 197 198 199

# Call prune_pybind_h() only when OP_LIST is non-empty.
# NOTE(review): OP_LIST is presumably a user-supplied list of ops to keep -
# confirm where it is defined.
if(NOT "${OP_LIST}" STREQUAL "")
prune_pybind_h()
endif()