CMakeLists.txt 12.2 KB
Newer Older
L
Luo Tao 已提交
1
# GENERAL_OPS: names of every "*_op.cc" file in this directory, with the
# "_mkldnn" infix and the ".cc" extension stripped and duplicates removed, so
# that an MKLDNN variant collapses onto the name of its base operator.
file(GLOB GENERAL_OPS
     RELATIVE "${CMAKE_CURRENT_SOURCE_DIR}"
     "*_op.cc")
string(REPLACE "_mkldnn" "" GENERAL_OPS "${GENERAL_OPS}")
string(REPLACE ".cc" "" GENERAL_OPS "${GENERAL_OPS}")
list(REMOVE_DUPLICATES GENERAL_OPS)

# DEPS_OPS: operators that are declared explicitly further down (op_library
# prepends every target that is given DEPS); they are removed from
# GENERAL_OPS before the generic registration loop runs.
set(DEPS_OPS "")

# Start the generated pybind header from scratch on every configure run;
# op_library() appends one registration line per operator to it.
set(pybind_file "${PADDLE_BINARY_DIR}/paddle/fluid/pybind/pybind.h")
file(WRITE "${pybind_file}"
     "// Generated by the paddle/fluid/operator/CMakeLists.txt.  DO NOT EDIT!\n\n")
Y
Yu Yang 已提交
8 9 10 11
# op_library(<target> [SRCS <src>...] [DEPS <dep>...])
#
# Creates the library for one operator. The interface mirrors cc_library, but
# the sources are split by flavour (CPU / CUDA / cuDNN / HIP / MIOpen / MKLDNN),
# the common operator dependencies are linked in, and a registration line is
# appended to the generated pybind header (${pybind_file}).
#
# Arguments:
#   TARGET  Name of the library; by convention "<name>_op".
#   SRCS    Optional explicit source list. When omitted, sources are discovered
#           next to this file from the target name (<target>.cc, .cu.cc, .cu,
#           .hip.cu, and the *_cudnn_op / *_miopen_op / *_mkldnn_op variants).
#   DEPS    Optional extra link dependencies.
#
# Side effects in the caller's scope:
#   OP_LIBRARY  gets TARGET prepended.
#   DEPS_OPS    gets TARGET prepended when DEPS is non-empty.
#
# Fails with FATAL_ERROR when a source in SRCS has an unsupported extension or
# when no plain .cc source was found.
function(op_library TARGET)
    set(OP_LIBRARY ${TARGET} ${OP_LIBRARY} PARENT_SCOPE)

    # One bucket per source flavour; all start out empty.
    set(cc_srcs)
    set(cu_srcs)
    set(hip_cu_srcs)
    set(miopen_hip_cc_srcs)
    set(cu_cc_srcs)
    set(cudnn_cu_cc_srcs)
    set(CUDNN_FILE)
    set(mkldnn_cc_srcs)
    set(MKLDNN_FILE)
    set(op_common_deps operator op_registry math_function)
    set(options "")
    set(oneValueArgs "")
    set(multiValueArgs SRCS DEPS)
    # pybind_flag becomes 1 once the operator's registration has been decided
    # (or must be skipped), so that later stages do not register it again.
    set(pybind_flag 0)
    cmake_parse_arguments(op_library "${options}" "${oneValueArgs}"
            "${multiValueArgs}" ${ARGN})

    list(LENGTH op_library_SRCS op_library_SRCS_len)
    if (${op_library_SRCS_len} EQUAL 0)
        # No SRCS given: discover the sources from the target name.
        if (EXISTS ${CMAKE_CURRENT_SOURCE_DIR}/${TARGET}.cc)
            list(APPEND cc_srcs ${TARGET}.cc)
        endif()
        if (EXISTS ${CMAKE_CURRENT_SOURCE_DIR}/${TARGET}.cu.cc)
            list(APPEND cu_cc_srcs ${TARGET}.cu.cc)
        endif()
        if (EXISTS ${CMAKE_CURRENT_SOURCE_DIR}/${TARGET}.cu)
            list(APPEND cu_srcs ${TARGET}.cu)
        endif()
        if (EXISTS ${CMAKE_CURRENT_SOURCE_DIR}/${TARGET}.hip.cu)
            list(APPEND hip_cu_srcs ${TARGET}.hip.cu)
        endif()
        # Only the trailing "_op" is rewritten; a plain string(REPLACE) would
        # also rewrite an "_op" that happens to occur inside the name.
        string(REGEX REPLACE "_op$" "_cudnn_op" CUDNN_FILE "${TARGET}")
        if (EXISTS ${CMAKE_CURRENT_SOURCE_DIR}/${CUDNN_FILE}.cu.cc)
            list(APPEND cudnn_cu_cc_srcs ${CUDNN_FILE}.cu.cc)
        endif()
        if(WITH_AMD_GPU)
            string(REGEX REPLACE "_op$" "_miopen_op" MIOPEN_FILE "${TARGET}")
            if (EXISTS ${CMAKE_CURRENT_SOURCE_DIR}/${MIOPEN_FILE}.hip.cc)
                list(APPEND miopen_hip_cc_srcs ${MIOPEN_FILE}.hip.cc)
            endif()
        endif()
        if(WITH_MKLDNN)
            string(REGEX REPLACE "_op$" "_mkldnn_op" MKLDNN_FILE "${TARGET}")
            if (EXISTS ${CMAKE_CURRENT_SOURCE_DIR}/${MKLDNN_FILE}.cc)
                list(APPEND mkldnn_cc_srcs ${MKLDNN_FILE}.cc)
            endif()
        endif()
    else()
        # Explicit SRCS: classify each file by its suffix. The order matters,
        # the most specific suffixes have to be tested first. Dots are escaped
        # so that they match a literal '.' only.
        foreach(src ${op_library_SRCS})
            if ("${src}" MATCHES ".*\\.hip\\.cu$")
                list(APPEND hip_cu_srcs ${src})
            elseif ("${src}" MATCHES ".*\\.cu$")
                list(APPEND cu_srcs ${src})
            elseif("${src}" MATCHES ".*_cudnn_op\\.cu\\.cc$")
                list(APPEND cudnn_cu_cc_srcs ${src})
            elseif(WITH_AMD_GPU AND "${src}" MATCHES ".*_miopen_op\\.hip\\.cc$")
                list(APPEND miopen_hip_cc_srcs ${src})
            elseif(WITH_MKLDNN AND "${src}" MATCHES ".*_mkldnn_op\\.cc$")
                list(APPEND mkldnn_cc_srcs ${src})
            elseif("${src}" MATCHES ".*\\.cu\\.cc$")
                list(APPEND cu_cc_srcs ${src})
            elseif("${src}" MATCHES ".*\\.cc$")
                list(APPEND cc_srcs ${src})
            else()
                message(FATAL_ERROR "${TARGET} Source file ${src} should only be .cc or .cu")
            endif()
        endforeach()
    endif()

    list(LENGTH cc_srcs cc_srcs_len)
    if (${cc_srcs_len} EQUAL 0)
        message(FATAL_ERROR "The op library ${TARGET} should contains at least one .cc file")
    endif()

    # Operators with explicit dependencies are reported to the caller so they
    # can be excluded from the generic registration loop.
    list(LENGTH op_library_DEPS op_library_DEPS_len)
    if (${op_library_DEPS_len} GREATER 0)
        set(DEPS_OPS ${TARGET} ${DEPS_OPS} PARENT_SCOPE)
    endif()

    if (WITH_GPU)
        nv_library(${TARGET} SRCS ${cc_srcs} ${cu_cc_srcs} ${cudnn_cu_cc_srcs} ${mkldnn_cc_srcs} ${cu_srcs} DEPS ${op_library_DEPS}
                ${op_common_deps})
    elseif (WITH_AMD_GPU)
        hip_library(${TARGET} SRCS ${cc_srcs} ${hip_cu_srcs} ${miopen_hip_cc_srcs} ${mkldnn_cc_srcs} DEPS ${op_library_DEPS}
                ${op_common_deps})
    else()
        cc_library(${TARGET} SRCS ${cc_srcs} ${mkldnn_cc_srcs} DEPS ${op_library_DEPS}
            ${op_common_deps})
    endif()

    # Define operators that don't need pybind here. Only the USE_NO_KERNEL_OP,
    # USE_CPU_ONLY_OP and USE_OP stages below honour this flag; the
    # USE_OP_DEVICE_KERNEL stages do not check it.
    foreach(manual_pybind_op "compare_op" "logical_op" "nccl_op" "tensor_array_read_write_op")
        if ("${TARGET}" STREQUAL "${manual_pybind_op}")
            set(pybind_flag 1)
        endif()
    endforeach()

    # The registration of USE_OP, please refer to paddle/fluid/framework/op_registry.h.
    # Note that it's enough to just adding one operator to pybind in a *_op.cc file.
    # And for detail pybind information, please see generated paddle/fluid/pybind/pybind.h.
    #
    # From here on TARGET no longer names the library; it is rewritten to the
    # operator name that is written into the pybind header.
    file(READ ${CMAKE_CURRENT_SOURCE_DIR}/${TARGET}.cc TARGET_CONTENT)
    # multi_register is non-empty only when the file contains at least two
    # REGISTER_OPERATOR( calls; in that case the name of the first one is used.
    string(REGEX MATCH "REGISTER_OPERATOR\\(.*REGISTER_OPERATOR\\(" multi_register "${TARGET_CONTENT}")
    string(REGEX MATCH "REGISTER_OPERATOR\\([a-z0-9_]*," one_register "${multi_register}")
    if ("${one_register}" STREQUAL "")
        # Fall back to the file name without its "_op" suffix.
        string(REGEX REPLACE "_op$" "" TARGET "${TARGET}")
    else ()
        string(REPLACE "REGISTER_OPERATOR(" "" TARGET "${one_register}")
        string(REPLACE "," "" TARGET "${TARGET}")
    endif()

    # pybind USE_NO_KERNEL_OP
    # HACK: if REGISTER_OP_CPU_KERNEL presents the operator must have kernel
    string(REGEX MATCH "REGISTER_OP_CPU_KERNEL" regex_result "${TARGET_CONTENT}")
    string(REGEX REPLACE "_op$" "" TARGET "${TARGET}")
    if (${pybind_flag} EQUAL 0 AND regex_result STREQUAL "")
        file(APPEND ${pybind_file} "USE_NO_KERNEL_OP(${TARGET});\n")
        set(pybind_flag 1)
    endif()

    # pybind USE_CPU_ONLY_OP: chosen when none of the device/MKLDNN source
    # buckets tested below holds a file.
    list(LENGTH cu_srcs cu_srcs_len)
    list(LENGTH cu_cc_srcs cu_cc_srcs_len)
    list(LENGTH mkldnn_cc_srcs mkldnn_cc_srcs_len)
    list(LENGTH hip_cu_srcs hip_cu_srcs_len)
    list(LENGTH miopen_hip_cc_srcs miopen_hip_cc_srcs_len)
    if (${pybind_flag} EQUAL 0 AND ${mkldnn_cc_srcs_len} EQUAL 0 AND ${cu_srcs_len} EQUAL 0 AND ${cu_cc_srcs_len} EQUAL 0 AND
        ${hip_cu_srcs_len} EQUAL 0 AND ${miopen_hip_cc_srcs_len} EQUAL 0)
        file(APPEND ${pybind_file} "USE_CPU_ONLY_OP(${TARGET});\n")
        set(pybind_flag 1)
    endif()

    # pybind USE_OP_DEVICE_KERNEL for CUDNN
    list(LENGTH cudnn_cu_cc_srcs cudnn_cu_cc_srcs_len)
    if (WITH_GPU AND ${cudnn_cu_cc_srcs_len} GREATER 0)
        file(APPEND ${pybind_file} "USE_OP_DEVICE_KERNEL(${TARGET}, CUDNN);\n")
    endif()

    # pybind USE_OP_DEVICE_KERNEL for MIOPEN
    if (WITH_AMD_GPU AND ${miopen_hip_cc_srcs_len} GREATER 0)
        file(APPEND ${pybind_file} "USE_OP_DEVICE_KERNEL(${TARGET}, MIOPEN);\n")
    endif()

    # pybind USE_OP_DEVICE_KERNEL for MKLDNN
    if (WITH_MKLDNN AND ${mkldnn_cc_srcs_len} GREATER 0)
        # Append first implemented MKLDNN activation operator.
        # MKLDNN_FILE is empty when the sources were passed through SRCS, so
        # the expansion must be quoted to keep the condition well-formed.
        if ("${MKLDNN_FILE}" STREQUAL "activation_mkldnn_op")
            file(APPEND ${pybind_file} "USE_OP_DEVICE_KERNEL(relu, MKLDNN);\n")
        else()
            file(APPEND ${pybind_file} "USE_OP_DEVICE_KERNEL(${TARGET}, MKLDNN);\n")
        endif()
    endif()

    # pybind USE_OP
    if (${pybind_flag} EQUAL 0)
        # NOTE(*): activation use macro to regist the kernels, set use_op manually.
        if("${TARGET}" STREQUAL "activation")
            file(APPEND ${pybind_file} "USE_OP(relu);\n")
        else()
            file(APPEND ${pybind_file} "USE_OP(${TARGET});\n")
        endif()
    endif()
endfunction()

Q
qijun 已提交
175
add_subdirectory(math)
add_subdirectory(nccl)

# nccl_op is only built for GPU builds. Otherwise it is added to DEPS_OPS,
# which keeps it out of the generic GENERAL_OPS registration loop.
if(NOT WITH_GPU)
    list(APPEND DEPS_OPS nccl_op)
else()
    op_library(nccl_op DEPS nccl_common)
    # nccl_op is on op_library's manual-pybind list, so it is registered here.
    file(APPEND "${pybind_file}" "USE_CUDA_ONLY_OP(ncclAllReduce);\n")
endif()
Q
QI JUN 已提交
184

185
add_subdirectory(detail)

# Distributed-training operators. Without WITH_DISTRIBUTE they are not built;
# they are added to DEPS_OPS instead so the generic GENERAL_OPS loop skips them.
if(NOT WITH_DISTRIBUTE)
    list(APPEND DEPS_OPS
         send_op
         prefetch_op
         recv_op
         listen_and_serv_op
         send_vars_op
         send_barrier_op)
else()
    set(DISTRIBUTE_DEPS sendrecvop_grpc grpc++_unsecure grpc_unsecure gpr cares zlib protobuf)
    set(DISTRIBUTE_COMPILE_FLAGS "-Wno-non-virtual-dtor -Wno-error=non-virtual-dtor -Wno-error=delete-non-virtual-dtor")

    # Every distributed operator gets the same dependencies, and its .cc file
    # is compiled with the relaxed warning flags above.
    foreach(dist_op
            send_op
            prefetch_op
            recv_op
            listen_and_serv_op
            send_vars_op
            send_barrier_op)
        op_library(${dist_op} DEPS ${DISTRIBUTE_DEPS})
        set_source_files_properties(${dist_op}.cc PROPERTIES COMPILE_FLAGS "${DISTRIBUTE_COMPILE_FLAGS}")
    endforeach()

    set_source_files_properties(send_recv_op_test.cc PROPERTIES COMPILE_FLAGS "${DISTRIBUTE_COMPILE_FLAGS}")
    cc_test(test_send_recv
            SRCS send_recv_op_test.cc
            DEPS prefetch_op send_op listen_and_serv_op sum_op executor)
endif()

207 208
# Operators that need extra link dependencies. Each call with DEPS also puts
# the operator on DEPS_OPS (see op_library), so the declaration order below
# determines the order of OP_LIBRARY, DEPS_OPS and the generated pybind lines.

# Loss / softmax
op_library(cross_entropy_op              DEPS cross_entropy)
op_library(softmax_with_cross_entropy_op DEPS cross_entropy softmax)
op_library(softmax_op                    DEPS softmax)
op_library(sequence_softmax_op           DEPS softmax)

# Selected-rows based ops, printing, pooling
op_library(sum_op             DEPS selected_rows_functor)
op_library(sgd_op             DEPS selected_rows_functor)
op_library(print_op           DEPS lod_tensor)
op_library(adagrad_op         DEPS selected_rows_functor)
op_library(maxout_op          DEPS maxouting)
op_library(unpool_op          DEPS unpooling)
op_library(pool_op            DEPS pooling)
op_library(pool_with_index_op DEPS pooling)

# LoD / sequence / recurrent ops
op_library(lod_rank_table_op      DEPS lod_rank_table)
op_library(lod_tensor_to_array_op DEPS lod_rank_table_op)
op_library(array_to_lod_tensor_op DEPS lod_rank_table_op)
op_library(max_sequence_len_op    DEPS lod_rank_table)
op_library(sequence_conv_op       DEPS context_project)
op_library(sequence_pool_op       DEPS sequence_pooling)
op_library(lstm_op                DEPS sequence2batch lstm_compute)
op_library(lstmp_op               DEPS sequence2batch lstm_compute)
op_library(gru_op                 DEPS sequence2batch gru_compute)
op_library(recurrent_op           DEPS executor)
op_library(warpctc_op             DEPS dynload_warpctc sequence_padding sequence_scale)
op_library(cos_sim_op             DEPS cos_sim_functor)
op_library(parallel_do_op         DEPS executor)
op_library(ckpt_save_op           DEPS lod_tensor)

# Convolution: depthwise_conv is only linked for GPU builds.
if (NOT WITH_GPU)
    op_library(conv_op DEPS vol2col im2col)
else()
    op_library(conv_op DEPS vol2col depthwise_conv im2col)
endif()
op_library(conv_transpose_op DEPS vol2col im2col)

# FIXME(typhoonzero): save/load depends lodtensor serialization functions
op_library(save_op         DEPS lod_tensor)
op_library(load_op         DEPS lod_tensor)
op_library(save_combine_op DEPS lod_tensor)
op_library(load_combine_op DEPS lod_tensor)
op_library(concat_op       DEPS concat)

# FIXME(thuan): Move CSP operators to paddle/fluid/framework/operators/concurrency
add_subdirectory(concurrency)
op_library(channel_send_op DEPS concurrency)
op_library(channel_recv_op DEPS concurrency)

253
# Everything that was declared explicitly above (or deliberately excluded) is
# on DEPS_OPS; what is left in GENERAL_OPS is registered generically below.
list(REMOVE_ITEM GENERAL_OPS ${DEPS_OPS})

# The fully connected layer is deleted when the WITH_MKLDNN flag is OFF
# Because the fully connected layer has only one MKLDNN's operator
if(NOT WITH_MKLDNN)
    list(REMOVE_ITEM GENERAL_OPS fc_op)
endif()

# Remaining operators need neither SRCS nor DEPS; op_library discovers their
# sources from the target name.
foreach(general_op ${GENERAL_OPS})
    op_library(${general_op})
endforeach()

# Registrations written by hand; compare_op, logical_op and
# tensor_array_read_write_op are on op_library's manual-pybind list.
file(APPEND "${pybind_file}"
     "USE_OP(less_than);\nUSE_OP(logical_and);\nUSE_NO_KERNEL_OP(read_from_array);\n")
266

Y
FIX CI  
Yu Yang 已提交
267 268 269 270
add_subdirectory(reader)

# Prepend every entry of READER_LIBRARY to OP_LIBRARY, one at a time.
# NOTE(review): READER_LIBRARY is presumably exported by the reader
# subdirectory - confirm against reader/CMakeLists.txt.
foreach(reader_lib ${READER_LIBRARY})
    set(OP_LIBRARY ${reader_lib} ${OP_LIBRARY})
endforeach()

# Publish the complete operator library list through an internal cache entry.
set(GLOB_OP_LIB ${OP_LIBRARY} CACHE INTERNAL "Global OP library")

274 275
# Unit tests for helpers and operators in this directory.
cc_test(gather_test
        SRCS gather_test.cc
        DEPS tensor)
cc_test(scatter_test
        SRCS scatter_test.cc
        DEPS tensor)
cc_test(beam_search_decode_op_test
        SRCS beam_search_decode_op_test.cc
        DEPS lod_tensor)
cc_test(beam_search_op_test
        SRCS beam_search_op_test.cc
        DEPS lod_tensor beam_search_op)
cc_test(strided_memcpy_test
        SRCS strided_memcpy_test.cc
        DEPS tensor memory)
cc_test(save_load_op_test
        SRCS save_load_op_test.cc
        DEPS save_op load_op)
cc_test(save_load_combine_op_test
        SRCS save_load_combine_op_test.cc
        DEPS save_combine_op load_combine_op)
cc_test(ckpt_save_op_test
        SRCS ckpt_save_op_test.cc
        DEPS ckpt_save_op)

# Tests declared through nv_test.
nv_test(nccl_op_test
        SRCS nccl_op_test.cu.cc
        DEPS nccl_op gpu_info device_context)
nv_test(dropout_op_test
        SRCS dropout_op_test.cc
        DEPS dropout_op tensor)