CMakeLists.txt 25.1 KB
Newer Older
D
dongdaxiang 已提交
1

H
heqiaozhi 已提交
2 3
# Windows treats a symbolic file as a regular file, which differs from Unix.
# We create a hidden file and compile it instead of the original source file.
D
dzhwinter 已提交
4 5
# windows_symbolic(<TARGET> SRCS <file>... [PATH <subdir>])
#
# For each entry in SRCS, takes the file name without directory or extension
# (<name>), requires both <name>.cc and <name>.cu to exist under
# ${CMAKE_CURRENT_SOURCE_DIR}/<PATH>, and arranges for <name>.cc to be copied
# to the hidden file .<name>.cu in that same directory. A custom target named
# <TARGET> (built as part of ALL) depends on the hidden file, so callers can
# order their own targets after it with add_dependencies().
#
# NOTE(review): add_custom_target(${TARGET}) is issued once per SRCS entry, so
# passing more than one source would define the same target twice; every call
# visible in this file passes exactly one source.
function(windows_symbolic TARGET)
  # Define all three keyword lists locally so that an `options` variable in
  # the caller's scope cannot leak into the argument parsing.
  set(options "")
  set(oneValueArgs "")
  set(multiValueArgs SRCS PATH)
  cmake_parse_arguments(windows_symbolic "${options}" "${oneValueArgs}" "${multiValueArgs}" ${ARGN})
  set(final_path ${CMAKE_CURRENT_SOURCE_DIR}/${windows_symbolic_PATH})
  foreach(src ${windows_symbolic_SRCS})
    # Reduce the entry to its bare name; both extensions are re-attached below.
    get_filename_component(src ${src} NAME_WE)
    if (NOT EXISTS ${final_path}/${src}.cc OR NOT EXISTS ${final_path}/${src}.cu)
        # FATAL_ERROR is the message() mode that stops configuration.
        message(FATAL_ERROR "${src}.cc and ${src}.cu must exist, and ${src}.cu must be symbolic file.")
    endif()

    # Produce the hidden .cu file from the .cc file at generate time ...
    file(GENERATE OUTPUT ${final_path}/.${src}.cu INPUT ${final_path}/${src}.cc)

    # ... and declare a build rule that refreshes it when the contents differ.
    add_custom_command(OUTPUT ${final_path}/.${src}.cu
            COMMAND ${CMAKE_COMMAND} -E copy_if_different "${final_path}/${src}.cc" "${final_path}/.${src}.cu"
            COMMENT "create hidden file of ${src}.cu")
    add_custom_target(${TARGET} ALL DEPENDS ${final_path}/.${src}.cu)
  endforeach()
endfunction()

X
start  
Xin Pan 已提交
24
add_subdirectory(ir)
D
dzhwinter 已提交
25
add_subdirectory(details)
D
dongdaxiang 已提交
26
add_subdirectory(fleet)
27
add_subdirectory(io)
28
add_subdirectory(new_executor)
29 30 31
if (WITH_CINN)
  add_subdirectory(paddle2cinn)
endif()
H
heqiaozhi 已提交
32
#ddim lib
33
proto_library(framework_proto SRCS framework.proto)
34
proto_library(pass_desc_proto SRCS pass_desc.proto DEPS framework_proto)
35

36
proto_library(op_def_proto SRCS op_def.proto DEPS framework_proto)
37
cc_library(op_def_api SRCS op_def_api.cc DEPS op_def_proto boost)
38

39 40 41 42 43 44 45 46 47 48 49 50
# Assemble ${CMAKE_CURRENT_BINARY_DIR}/op_def.pbtxt at configure time: a C++
# fragment declaring `op_def_map`, with one entry per *.pbtxt file found in
# paddle/fluid/operators/compat. The key is the file name without extension
# and the value is the file's contents wrapped in a raw string literal.
set(op_def_output ${CMAKE_CURRENT_BINARY_DIR}/op_def.pbtxt)
file(GLOB OP_DEF_FILES ${PADDLE_SOURCE_DIR}/paddle/fluid/operators/compat/*.pbtxt)

# Opening of the anonymous namespace and of the map initializer.
file(WRITE ${op_def_output}
  "namespace { \n"
  "const std::unordered_map<std::string, std::string> op_def_map =  { \n")

foreach(OP_DEF_FILE ${OP_DEF_FILES})
  get_filename_component(OP_NAME ${OP_DEF_FILE} NAME_WE)
  file(READ ${OP_DEF_FILE} OP_DEF_CONTENT)
  file(APPEND ${op_def_output}
    "{\"${OP_NAME}\",R\"(${OP_DEF_CONTENT})\"},\n")
endforeach()

# Trailing empty entry, then close the initializer and the namespace.
file(APPEND ${op_def_output} "{\"\",\"\"}};\n}")

T
Thunderbrook 已提交
51
proto_library(heter_service_proto SRCS heter_service.proto)
D
dongdaxiang 已提交
52
proto_library(data_feed_proto SRCS data_feed.proto)
H
hutuxian 已提交
53 54
proto_library(trainer_desc_proto SRCS trainer_desc.proto DEPS framework_proto
  data_feed_proto)
55

S
Steffy-zxf 已提交
56 57
cc_library(string_array SRCS string_array.cc DEPS utf8proc)

Y
yuyang18 已提交
58
cc_library(data_type SRCS data_type.cc DEPS framework_proto ddim device_context)
D
dzhwinter 已提交
59
cc_test(data_type_test SRCS data_type_test.cc DEPS data_type place tensor)
60
if(WITH_GPU)
D
dzhwinter 已提交
61 62
  if (WIN32)
    windows_symbolic(tensor_util SRCS tensor_util.cu)
63
    nv_library(tensor SRCS tensor.cc .tensor_util.cu DEPS place memory data_type device_context dense_tensor)
D
dzhwinter 已提交
64 65
    add_dependencies(tensor tensor_util)
  else()
66
    nv_library(tensor SRCS tensor.cc tensor_util.cu DEPS place memory data_type device_context profiler dense_tensor)
D
dzhwinter 已提交
67
  endif(WIN32)
68
elseif(WITH_ROCM)
69
  hip_library(tensor SRCS tensor.cc tensor_util.cu DEPS place memory data_type device_context profiler dense_tensor)
Y
Yang Yu 已提交
70
else()
71
  cc_library(tensor SRCS tensor.cc tensor_util.cc DEPS place memory data_type device_context profiler dense_tensor)
72
endif()
D
dzhwinter 已提交
73

Y
Yu Yang 已提交
74
cc_test(tensor_test SRCS tensor_test.cc DEPS tensor)
75
if(WITH_GPU)
6
633WHU 已提交
76
  nv_test(tensor_util_test SRCS tensor_util_test.cc tensor_util_test.cu DEPS tensor dlpack_tensor)
77 78
elseif(WITH_ROCM)
  hip_test(tensor_util_test SRCS tensor_util_test.cc tensor_util_test.cu DEPS tensor dlpack_tensor)
Y
Yang Yu 已提交
79
else()
6
633WHU 已提交
80
  cc_test(tensor_util_test SRCS tensor_util_test.cc DEPS tensor dlpack_tensor)
Y
Yang Yu 已提交
81
endif()
D
dzhwinter 已提交
82

83 84
cc_test(copy_same_tensor_test SRCS copy_same_tensor_test.cc DEPS tensor)

Y
Update  
Yi Wang 已提交
85
cc_test(eigen_test SRCS eigen_test.cc DEPS tensor)
86
cc_library(mixed_vector SRCS mixed_vector.cc DEPS device_context place memory)
L
liaogang 已提交
87

88
if(WITH_GPU)
89
  nv_test(mixed_vector_test SRCS mixed_vector_test.cc mixed_vector_test.cu DEPS mixed_vector place memory device_context tensor)
90
elseif(WITH_ROCM)
91
  hip_test(mixed_vector_test SRCS mixed_vector_test.cc mixed_vector_test.cu DEPS mixed_vector place memory device_context tensor)
92
else()
93
  cc_test(mixed_vector_test SRCS mixed_vector_test.cc DEPS mixed_vector place memory device_context tensor)
94
endif()
95
cc_library(lod_tensor SRCS lod_tensor.cc DEPS ddim mixed_vector place tensor framework_proto version)
D
dzhwinter 已提交
96

97
cc_test(lod_tensor_test SRCS lod_tensor_test.cc DEPS lod_utils lod_tensor memory)
98 99 100 101 102 103

if(WITH_GPU)
  nv_test(lod_tensor_gpu_test SRCS lod_tensor_test.cu DEPS lod_tensor)
elseif(WITH_ROCM)
  hip_test(lod_tensor_gpu_test SRCS lod_tensor_test.cu DEPS lod_tensor)
endif()
104

S
sneaxiy 已提交
105
cc_library(garbage_collector SRCS garbage_collector.cc DEPS device_context memory gflags glog)
S
sneaxiy 已提交
106

F
fengjiayi 已提交
107
cc_library(reader SRCS reader.cc DEPS lod_tensor ddim)
Y
yuyang18 已提交
108
cc_test(reader_test SRCS reader_test.cc DEPS reader)
F
fengjiayi 已提交
109

Y
Yi Wang 已提交
110
cc_library(threadpool SRCS threadpool.cc DEPS enforce)
Y
Yang Yu 已提交
111 112
cc_test(threadpool_test SRCS threadpool_test.cc DEPS threadpool)

113
cc_library(var_type_traits SRCS var_type_traits.cc DEPS lod_tensor selected_rows_utils framework_proto scope)
S
sneaxiy 已提交
114
if (WITH_GPU)
S
sneaxiy 已提交
115
  target_link_libraries(var_type_traits dynload_cuda)
S
sneaxiy 已提交
116 117 118
endif()
cc_test(var_type_traits_test SRCS var_type_traits_test.cc DEPS var_type_traits)

T
Thunderbrook 已提交
119 120
# Choose the brpc-related libraries for parameter-server builds:
#   * WITH_PSLIB_BRPC selects pslib_brpc;
#   * otherwise brpc, ssl and crypto are used unless WITH_HETERPS is set;
#   * without WITH_PSLIB / WITH_PSCORE the list stays empty.
set(BRPC_DEPS "")
if(WITH_PSLIB OR WITH_PSCORE)
    if(WITH_PSLIB_BRPC)
        set(BRPC_DEPS pslib_brpc)
    elseif(NOT WITH_HETERPS)
        set(BRPC_DEPS brpc ssl crypto)
    endif()
endif()


129
cc_library(scope SRCS scope.cc DEPS glog threadpool xxhash var_type_traits)
T
Thunderbrook 已提交
130
cc_library(device_worker SRCS device_worker.cc DEPS trainer_desc_proto lod_tensor scope ${BRPC_DEPS})
H
hutuxian 已提交
131
cc_test(device_worker_test SRCS device_worker_test.cc DEPS device_worker)
132

S
sneaxiy 已提交
133
cc_library(scope_pool SRCS scope_pool.cc DEPS scope)
Y
Yi Wang 已提交
134
cc_test(scope_test SRCS scope_test.cc DEPS scope)
S
sneaxiy 已提交
135
cc_test(variable_test SRCS variable_test.cc DEPS tensor var_type_traits)
L
liaogang 已提交
136

137
cc_library(data_device_transform SRCS data_device_transform.cc DEPS tensor)
138 139
if(WITH_GPU)
  nv_test(data_device_transform_test SRCS data_device_transform_test.cu
S
sneaxiy 已提交
140
        DEPS operator op_registry device_context math_function scope)
141 142 143 144
elseif(WITH_ROCM)
  hip_test(data_device_transform_test SRCS data_device_transform_test.cu
        DEPS operator op_registry device_context math_function scope)
endif()
145

146
if(WITH_GPU)
D
dzhwinter 已提交
147
  if (WIN32)
H
heqiaozhi 已提交
148 149
# Windows treats a symbolic file as a regular file, which differs from Unix.
# We create a hidden file and compile it instead of the original source file.
D
dzhwinter 已提交
150 151 152 153 154 155
      windows_symbolic(hidden_file SRCS data_type_transform.cu)
      nv_library(data_type_transform SRCS .data_type_transform.cu DEPS tensor)
      add_dependencies(data_type_transform hidden_file)
  else()
      nv_library(data_type_transform SRCS data_type_transform.cu DEPS tensor)
  endif(WIN32)
156
  nv_test(data_type_transform_test SRCS data_type_transform_test.cc data_type_transform_test.cu DEPS data_type_transform)
157 158 159
elseif(WITH_ROCM)
  hip_library(data_type_transform SRCS data_type_transform.cu DEPS tensor)
  hip_test(data_type_transform_test SRCS data_type_transform_test.cc data_type_transform_test.cu DEPS data_type_transform)
160 161 162 163
else()
  cc_library(data_type_transform SRCS data_type_transform.cc DEPS tensor)
  cc_test(data_type_transform_test SRCS data_type_transform_test.cc DEPS data_type_transform)
endif()
164

165
cc_library(data_layout_transform SRCS data_layout_transform.cc DEPS tensor math_function)
166
cc_test(data_layout_transform_test SRCS data_layout_transform_test.cc DEPS data_layout_transform)
167

168
cc_library(data_transform SRCS data_transform.cc DEPS math_function tensor
169
        framework_proto selected_rows_utils data_device_transform data_type_transform data_layout_transform)
Q
Qiao Longfei 已提交
170

171
cc_library(attribute SRCS attribute.cc DEPS framework_proto boost enforce)
172
cc_test(attribute_test SRCS attribute_test.cc DEPS attribute framework_proto proto_desc)
173 174
cc_test(program_desc_test SRCS program_desc_test.cc DEPS proto_desc
device_context)
175

176 177 178
cc_library(op_version_proto SRCS op_version_proto.cc DEPS framework_proto boost)

cc_library(op_version_registry SRCS op_version_registry.cc DEPS op_version_proto framework_proto boost)
179 180
cc_test(op_version_registry_test SRCS op_version_registry_test.cc DEPS op_version_registry)

R
reyoung 已提交
181
cc_library(op_proto_maker SRCS op_proto_maker.cc DEPS framework_proto attribute glog)
182
cc_test(op_proto_maker_test SRCS op_proto_maker_test.cc DEPS op_proto_maker)
183
cc_library(no_need_buffer_vars_inference SRCS no_need_buffer_vars_inference.cc DEPS attribute device_context)
184
cc_library(op_info SRCS op_info.cc DEPS attribute framework_proto no_need_buffer_vars_inference)
T
tensor-tang 已提交
185
cc_library(shape_inference SRCS shape_inference.cc DEPS ddim attribute device_context)
D
dzhwinter 已提交
186

187 188
cc_test(no_need_buffer_vars_inference_test SRCS no_need_buffer_vars_inference_test.cc DEPS no_need_buffer_vars_inference layer)

S
superjomn 已提交
189
cc_library(transfer_scope_cache SRCS transfer_scope_cache.cc DEPS scope framework_proto device_context)
190 191 192

cc_library(unused_var_check SRCS unused_var_check.cc DEPS glog no_need_buffer_vars_inference)

193 194 195
cc_library(op_kernel_type SRCS op_kernel_type.cc DEPS device_context place)

# phi_utils has one fixed set of dependencies; XPU builds additionally link
# xpu_op_list, appended after the common ones.
set(phi_utils_deps lod_tensor selected_rows_utils place phi var_type_traits phi_api_utils op_info)
if(WITH_XPU)
  list(APPEND phi_utils_deps xpu_op_list)
endif()
cc_library(phi_utils SRCS phi_utils.cc DEPS ${phi_utils_deps})

Q
QingshuChen 已提交
201 202
# Dependencies of the operator library shared by every configuration.
set(operator_deps
    op_info device_context tensor scope glog trainer_desc_proto data_feed_proto
    shape_inference data_transform lod_tensor profiler transfer_scope_cache op_kernel_type op_call_stack unused_var_check nan_inf_utils
    phi phi_utils kernel_factory infershape_utils op_utils)
if(WITH_XPU)
  # XPU builds list xpu_op_list first, ahead of the common dependencies.
  list(INSERT operator_deps 0 xpu_op_list)
endif()
cc_library(operator SRCS operator.cc DEPS ${operator_deps})
D
dzhwinter 已提交
210

211
cc_test(operator_test SRCS operator_test.cc DEPS operator op_registry device_context)
212
cc_test(operator_exception_test SRCS operator_exception_test.cc DEPS operator op_registry device_context)
X
version  
Xin Pan 已提交
213 214

cc_library(version SRCS version.cc)
X
Xin Pan 已提交
215 216
cc_test(version_test SRCS version_test.cc DEPS version)

217
cc_library(proto_desc SRCS var_desc.cc op_desc.cc block_desc.cc program_desc.cc process_mesh_desc.cc DEPS attribute shape_inference op_info operator glog version)
B
baojun-nervana 已提交
218

219
cc_library(op_registry SRCS op_registry.cc DEPS op_proto_maker op_info operator glog proto_desc)
D
dongdaxiang 已提交
220

221
cc_library(op_call_stack SRCS op_call_stack.cc DEPS op_proto_maker enforce)
222
cc_test(op_call_stack_test SRCS op_call_stack_test.cc DEPS op_call_stack)
223

224
cc_library(program_processing SRCS program_processing.cc DEPS boost proto_desc)
225 226
cc_test(program_processing_test SRCS program_processing_test.cc DEPS proto_desc program_processing)

227 228 229 230 231
if(WITH_GPU)
  nv_test(op_registry_test SRCS op_registry_test.cc DEPS op_registry)
elseif(WITH_ROCM)
  hip_test(op_registry_test SRCS op_registry_test.cc DEPS op_registry)
endif()
232

233 234 235
if(WITH_PYTHON)
  py_proto_compile(framework_py_proto SRCS framework.proto data_feed.proto)
  py_proto_compile(trainer_py_proto SRCS trainer_desc.proto data_feed.proto)
236
  py_proto_compile(distributed_strategy_py_proto SRCS distributed_strategy.proto)
237
  py_proto_compile(pass_desc_py_proto SRCS pass_desc.proto)
Z
ziyoujiyi 已提交
238
  py_proto_compile(ps_py_proto SRCS ps.proto)
H
heqiaozhi 已提交
239
  # Generate an empty __init__.py to make framework_py_proto a valid Python module.
1
123malin 已提交
241 242 243 244
  add_custom_target(fleet_proto_init ALL  
    COMMAND ${CMAKE_COMMAND} -E make_directory ${PADDLE_BINARY_DIR}/python/paddle/distributed/fleet/proto
    COMMAND ${CMAKE_COMMAND} -E touch ${PADDLE_BINARY_DIR}/python/paddle/distributed/fleet/proto/__init__.py 
  )
245
  add_custom_target(framework_py_proto_init ALL COMMAND ${CMAKE_COMMAND} -E touch __init__.py)
Z
ziyoujiyi 已提交
246
  add_dependencies(framework_py_proto framework_py_proto_init trainer_py_proto distributed_strategy_py_proto fleet_proto_init pass_desc_py_proto ps_py_proto)
247 248
  if (NOT WIN32)
    add_custom_command(TARGET framework_py_proto POST_BUILD
P
peizhilin 已提交
249 250
      COMMAND ${CMAKE_COMMAND} -E make_directory ${PADDLE_BINARY_DIR}/python/paddle/fluid/proto
      COMMAND cp *.py ${PADDLE_BINARY_DIR}/python/paddle/fluid/proto/
251
      COMMAND cp distributed_strategy_*.py ${PADDLE_BINARY_DIR}/python/paddle/distributed/fleet/proto
Z
ziyoujiyi 已提交
252
      COMMAND cp ps_pb2.py ${PADDLE_BINARY_DIR}/python/paddle/distributed/fleet/proto
P
peizhilin 已提交
253 254
      COMMENT "Copy generated python proto into directory paddle/fluid/proto."
      WORKING_DIRECTORY ${CMAKE_CURRENT_BINARY_DIR})
A
Aganlengzi 已提交
255
    add_custom_target(fleet_executor_proto_init ALL DEPENDS fleet_proto_init fleet_executor_desc_py_proto
L
LiYuRio 已提交
256 257
      COMMAND cp ${PADDLE_BINARY_DIR}/paddle/fluid/distributed/fleet_executor/fleet_executor_*.py ${PADDLE_BINARY_DIR}/python/paddle/distributed/fleet/proto
      COMMENT "Copy generated python proto into directory paddle/distributed/fleet/proto.")
258 259
  else(NOT WIN32)
    string(REPLACE "/" "\\" proto_dstpath "${PADDLE_BINARY_DIR}/python/paddle/fluid/proto/")
260
    string(REPLACE "/" "\\" fleet_proto_dstpath "${PADDLE_BINARY_DIR}/python/paddle/distributed/fleet/proto/")
261
    # After framework_py_proto is built, copy the generated Python protobuf
    # modules out of the current binary directory: every *.py goes to
    # python/paddle/fluid/proto, while ps_pb2.py and distributed_strategy_*.py
    # also go to python/paddle/distributed/fleet/proto. The destination paths
    # use backslashes because they are handed to the Windows `copy` command.
    # One COMMENT describes both copy destinations.
    add_custom_command(TARGET framework_py_proto POST_BUILD
      COMMAND ${CMAKE_COMMAND} -E make_directory ${PADDLE_BINARY_DIR}/python/paddle/fluid/proto
      COMMAND copy /Y *.py ${proto_dstpath}
      COMMAND copy /Y ps_pb2.py ${fleet_proto_dstpath}
      COMMAND copy /Y distributed_strategy_*.py ${fleet_proto_dstpath}
      COMMENT "Copy generated python proto into directories paddle/fluid/proto and paddle/distributed/fleet/proto."
      WORKING_DIRECTORY ${CMAKE_CURRENT_BINARY_DIR})
269 270
  endif(NOT WIN32)
endif()
271

1
123malin 已提交
272 273 274 275 276 277
# With WITH_PSCORE, add an always-built target that copies the generated
# index_dataset_*.py modules from the index_dataset binary directory into
# python/paddle/distributed/fleet/proto, after fleet_proto_init and
# index_dataset_py_proto have been built.
# NOTE(review): fleet_proto_init is only created inside the if(WITH_PYTHON)
# block of this file, and `cp` is a Unix command - confirm WITH_PSCORE is only
# enabled together with WITH_PYTHON on non-Windows hosts.
if (WITH_PSCORE)
  add_custom_target(index_dataset_proto_init ALL DEPENDS fleet_proto_init index_dataset_py_proto
    COMMAND cp ${PADDLE_BINARY_DIR}/paddle/fluid/distributed/index_dataset/index_dataset_*.py ${PADDLE_BINARY_DIR}/python/paddle/distributed/fleet/proto
    COMMENT "Copy generated python proto into directory paddle/distributed/fleet/proto.")
endif(WITH_PSCORE)

Y
Yu Yang 已提交
278
cc_library(lod_rank_table SRCS lod_rank_table.cc DEPS lod_tensor)
Y
Yan Chunwei 已提交
279

280
cc_library(feed_fetch_method SRCS feed_fetch_method.cc DEPS lod_tensor scope glog)
W
Wang Guibao 已提交
281
cc_library(variable_helper SRCS variable_helper.cc DEPS lod_tensor)
282

W
wenbin 已提交
283 284 285
# naive_executor always links the common dependencies below; when TensorRT
# was found, tensorrt_engine_op is appended after them.
set(naive_executor_deps
    op_registry denormal device_context scope framework_proto glog lod_rank_table
    feed_fetch_method graph_to_program_pass variable_helper)
if(TENSORRT_FOUND)
  list(APPEND naive_executor_deps tensorrt_engine_op)
endif()
cc_library(naive_executor SRCS naive_executor.cc DEPS ${naive_executor_deps})
288

289
cc_library(executor_gc_helper SRCS executor_gc_helper.cc DEPS scope proto_desc operator garbage_collector op_registry while_op_helper recurrent_op_helper conditional_block_op_helper)
290
if(WITH_DISTRIBUTE)
T
Thunderbrook 已提交
291 292 293 294
  if(WITH_PSLIB)
    # executor library for builds with both WITH_DISTRIBUTE and WITH_PSLIB.
    # The final dependency is ${BRPC_DEPS}, the list this file fills in for
    # WITH_PSLIB / WITH_PSCORE builds. The singular spelling BRPC_DEP is not
    # set anywhere in the visible part of this file, so it expanded to
    # nothing and dropped the brpc libraries.
    cc_library(executor SRCS executor.cc multi_trainer.cc pipeline_trainer.cc dataset_factory.cc
    dist_multi_trainer.cc trainer_factory.cc trainer.cc data_feed_factory.cc
    heterxpu_trainer.cc
    data_feed.cc device_worker.cc hogwild_worker.cc hetercpu_worker.cc ps_gpu_worker.cc
    ps_gpu_trainer.cc downpour_worker.cc downpour_worker_opt.cc
    pull_dense_worker.cc section_worker.cc device_worker_factory.cc data_set.cc DEPS op_registry
    device_context scope framework_proto trainer_desc_proto glog fs shell
    fleet_wrapper heter_wrapper ps_gpu_wrapper box_wrapper metrics lodtensor_printer
    lod_rank_table feed_fetch_method collective_helper ${GLOB_DISTRIBUTE_DEPS}
    graph_to_program_pass variable_helper data_feed_proto timer monitor
    heter_service_proto fleet_executor ${BRPC_DEPS})
T
Thunderbrook 已提交
303
    set(DISTRIBUTE_COMPILE_FLAGS "-Wno-non-virtual-dtor -Wno-error=non-virtual-dtor -Wno-error=delete-non-virtual-dtor")
T
Thunderbrook 已提交
304 305 306 307
    if (CMAKE_CXX_COMPILER_VERSION VERSION_GREATER 7.0)
        set(DISTRIBUTE_COMPILE_FLAGS
                "${DISTRIBUTE_COMPILE_FLAGS} -faligned-new")
    endif()
T
Thunderbrook 已提交
308
    set_source_files_properties(executor.cc PROPERTIES COMPILE_FLAGS ${DISTRIBUTE_COMPILE_FLAGS})
T
Thunderbrook 已提交
309 310 311
    set_source_files_properties(device_worker.cc PROPERTIES COMPILE_FLAGS ${DISTRIBUTE_COMPILE_FLAGS})
    set_source_files_properties(hetercpu_worker.cc PROPERTIES COMPILE_FLAGS ${DISTRIBUTE_COMPILE_FLAGS})
    set_source_files_properties(heterxpu_trainer.cc PROPERTIES COMPILE_FLAGS ${DISTRIBUTE_COMPILE_FLAGS})
T
tangwei12 已提交
312
  elseif(WITH_PSCORE)
T
Thunderbrook 已提交
313
    cc_library(executor SRCS executor.cc multi_trainer.cc pipeline_trainer.cc dataset_factory.cc
T
tangwei12 已提交
314
            dist_multi_trainer.cc trainer_factory.cc trainer.cc data_feed_factory.cc
315
            heterxpu_trainer.cc heter_pipeline_trainer.cc
T
tangwei12 已提交
316
            data_feed.cc device_worker.cc hogwild_worker.cc hetercpu_worker.cc
T
Thunderbrook 已提交
317
            downpour_worker.cc downpour_worker_opt.cc
318
            pull_dense_worker.cc section_worker.cc heter_section_worker.cc device_worker_factory.cc data_set.cc DEPS op_registry
T
tangwei12 已提交
319
            device_context scope framework_proto data_feed_proto heter_service_proto trainer_desc_proto glog
W
wangzhen38 已提交
320
            index_sampler index_wrapper sampler index_dataset_proto
321
            lod_rank_table fs shell fleet_wrapper heter_wrapper box_wrapper metrics lodtensor_printer feed_fetch_method
322
            graph_to_program_pass variable_helper timer monitor heter_service_proto fleet heter_server brpc fleet_executor)
T
Thunderbrook 已提交
323
    set(DISTRIBUTE_COMPILE_FLAGS "-Wno-non-virtual-dtor -Wno-error=non-virtual-dtor -Wno-error=delete-non-virtual-dtor")
324 325 326 327
    if (CMAKE_CXX_COMPILER_VERSION VERSION_GREATER 7.0)
        set(DISTRIBUTE_COMPILE_FLAGS
                "${DISTRIBUTE_COMPILE_FLAGS} -faligned-new")
    endif()
T
Thunderbrook 已提交
328
    set_source_files_properties(executor.cc PROPERTIES COMPILE_FLAGS ${DISTRIBUTE_COMPILE_FLAGS})
329
    set_source_files_properties(device_worker.cc PROPERTIES COMPILE_FLAGS ${DISTRIBUTE_COMPILE_FLAGS})
T
tangwei12 已提交
330 331
    set_source_files_properties(multi_trainer.cc PROPERTIES COMPILE_FLAGS ${DISTRIBUTE_COMPILE_FLAGS})
    set_source_files_properties(hogwild_worker.cc PROPERTIES COMPILE_FLAGS ${DISTRIBUTE_COMPILE_FLAGS})
332 333
    set_source_files_properties(heter_section_worker.cc PROPERTIES COMPILE_FLAGS ${DISTRIBUTE_COMPILE_FLAGS})
    set_source_files_properties(heter_pipeline_trainer.cc PROPERTIES COMPILE_FLAGS ${DISTRIBUTE_COMPILE_FLAGS})
T
tangwei12 已提交
334 335 336 337 338
  else()
    cc_library(executor SRCS executor.cc multi_trainer.cc pipeline_trainer.cc dataset_factory.cc
            dist_multi_trainer.cc trainer_factory.cc trainer.cc data_feed_factory.cc
            heterxpu_trainer.cc
            data_feed.cc device_worker.cc hogwild_worker.cc hetercpu_worker.cc ps_gpu_worker.cc
T
Thunderbrook 已提交
339
            ps_gpu_trainer.cc downpour_worker.cc downpour_worker_opt.cc
T
tangwei12 已提交
340 341
            pull_dense_worker.cc section_worker.cc device_worker_factory.cc data_set.cc DEPS op_registry
            device_context scope framework_proto data_feed_proto heter_service_proto trainer_desc_proto glog
342
            lod_rank_table fs shell fleet_wrapper heter_wrapper ps_gpu_wrapper box_wrapper metrics lodtensor_printer feed_fetch_method
L
LiYuRio 已提交
343
            graph_to_program_pass variable_helper timer monitor fleet_executor)
T
Thunderbrook 已提交
344
  endif()
T
Thunderbrook 已提交
345
elseif(WITH_PSLIB)
T
Thunderbrook 已提交
346 347 348 349 350 351 352 353 354
  set(DISTRIBUTE_COMPILE_FLAGS "-Wno-non-virtual-dtor -Wno-error=non-virtual-dtor -Wno-error=delete-non-virtual-dtor")
  if (CMAKE_CXX_COMPILER_VERSION VERSION_GREATER 7.0)
      set(DISTRIBUTE_COMPILE_FLAGS
              "${DISTRIBUTE_COMPILE_FLAGS} -faligned-new")
  endif()
  set_source_files_properties(executor.cc PROPERTIES COMPILE_FLAGS ${DISTRIBUTE_COMPILE_FLAGS})
  set_source_files_properties(device_worker.cc PROPERTIES COMPILE_FLAGS ${DISTRIBUTE_COMPILE_FLAGS})
  set_source_files_properties(hetercpu_worker.cc PROPERTIES COMPILE_FLAGS ${DISTRIBUTE_COMPILE_FLAGS})
  set_source_files_properties(heterxpu_trainer.cc PROPERTIES COMPILE_FLAGS ${DISTRIBUTE_COMPILE_FLAGS})
T
Thunderbrook 已提交
355 356 357
  # executor library for WITH_PSLIB builds that do not enable WITH_DISTRIBUTE.
  # The final dependency is ${BRPC_DEPS}, the list this file fills in for
  # WITH_PSLIB / WITH_PSCORE builds. The singular spelling BRPC_DEP is not
  # set anywhere in the visible part of this file, so it expanded to nothing
  # and dropped the brpc libraries.
  cc_library(executor SRCS executor.cc multi_trainer.cc pipeline_trainer.cc dataset_factory.cc
  dist_multi_trainer.cc trainer_factory.cc trainer.cc data_feed_factory.cc
  heterxpu_trainer.cc
  data_feed.cc device_worker.cc hogwild_worker.cc hetercpu_worker.cc ps_gpu_worker.cc
  ps_gpu_trainer.cc downpour_worker.cc downpour_worker_opt.cc
  pull_dense_worker.cc section_worker.cc device_worker_factory.cc data_set.cc DEPS op_registry
  device_context scope framework_proto data_feed_proto heter_service_proto trainer_desc_proto glog
  lod_rank_table fs shell fleet_wrapper heter_wrapper ps_gpu_wrapper box_wrapper lodtensor_printer feed_fetch_method
  graph_to_program_pass variable_helper timer monitor fleet_executor ${BRPC_DEPS})
W
Wu Yi 已提交
364
else()
H
hutuxian 已提交
365
  cc_library(executor SRCS executor.cc multi_trainer.cc pipeline_trainer.cc dataset_factory.cc
366
  dist_multi_trainer.cc trainer_factory.cc trainer.cc data_feed_factory.cc
T
Thunderbrook 已提交
367
  heterxpu_trainer.cc
T
Thunderbrook 已提交
368
  data_feed.cc device_worker.cc hogwild_worker.cc hetercpu_worker.cc ps_gpu_worker.cc
T
Thunderbrook 已提交
369
  ps_gpu_trainer.cc downpour_worker.cc downpour_worker_opt.cc
H
hutuxian 已提交
370
  pull_dense_worker.cc section_worker.cc device_worker_factory.cc data_set.cc DEPS op_registry
T
Thunderbrook 已提交
371
  device_context scope framework_proto data_feed_proto heter_service_proto trainer_desc_proto glog
T
Thunderbrook 已提交
372
  lod_rank_table fs shell fleet_wrapper heter_wrapper ps_gpu_wrapper box_wrapper lodtensor_printer feed_fetch_method
L
LiYuRio 已提交
373
  graph_to_program_pass variable_helper timer monitor fleet_executor)
W
Wu Yi 已提交
374
endif()
B
baojun-nervana 已提交
375

Z
Zeng Jinle 已提交
376
target_link_libraries(executor while_op_helper executor_gc_helper recurrent_op_helper conditional_block_op_helper)
S
sneaxiy 已提交
377

378
cc_library(parallel_executor SRCS parallel_executor.cc DEPS
Q
can run  
Qiao Longfei 已提交
379
        threaded_ssa_graph_executor scope_buffered_ssa_graph_executor parallel_ssa_graph_executor async_ssa_graph_executor
380
        graph build_strategy bind_threaded_ssa_graph_executor collective_helper
381
        fast_threaded_ssa_graph_executor variable_helper)
Q
qijun 已提交
382

383
cc_library(executor_cache SRCS executor_cache.cc DEPS parallel_executor)
T
Thunderbrook 已提交
384 385 386
if(WITH_PSCORE)
    get_property(RPC_DEPS GLOBAL PROPERTY RPC_DEPS)
    cc_test(dist_multi_trainer_test SRCS dist_multi_trainer_test.cc DEPS
Y
yaoxuefeng 已提交
387
        conditional_block_op executor gloo_wrapper ${RPC_DEPS})
388
    cc_test(heter_pipeline_trainer_test SRCS heter_pipeline_trainer_test.cc DEPS
Z
zmx 已提交
389
           conditional_block_op scale_op heter_listen_and_serv_op executor heter_server gloo_wrapper eigen_function ${RPC_DEPS})
T
Thunderbrook 已提交
390 391
else()
    cc_test(dist_multi_trainer_test SRCS dist_multi_trainer_test.cc DEPS
Y
yaoxuefeng 已提交
392
        conditional_block_op executor gloo_wrapper)
T
Thunderbrook 已提交
393
endif()
H
Huihuang Zheng 已提交
394
cc_library(prune SRCS prune.cc DEPS framework_proto boost)
Y
Yang Yang 已提交
395
cc_test(prune_test SRCS prune_test.cc DEPS op_info prune recurrent_op device_context)
Y
Yu Yang 已提交
396 397
cc_test(var_type_inference_test SRCS var_type_inference_test.cc DEPS op_registry
        proto_desc)
398
cc_library(selected_rows_utils SRCS selected_rows_utils.cc DEPS selected_rows)
399
cc_test(selected_rows_utils_test SRCS selected_rows_utils_test.cc DEPS selected_rows_utils)
D
dzhwinter 已提交
400

X
Xin Pan 已提交
401
cc_test(op_kernel_type_test SRCS op_kernel_type_test.cc DEPS place device_context framework_proto op_kernel_type)
Y
Yang Yu 已提交
402
cc_test(cow_ptr_tests SRCS details/cow_ptr_test.cc)
M
minqiyang 已提交
403

C
chengduo 已提交
404
cc_test(tuple_test SRCS tuple_test.cc )
405

Z
Zeng Jinle 已提交
406 407
cc_test(inlined_vector_test SRCS inlined_vector_test.cc)

S
sneaxiy 已提交
408 409
cc_library(dlpack_tensor SRCS dlpack_tensor.cc DEPS tensor dlpack)
cc_test(dlpack_tensor_test SRCS dlpack_tensor_test.cc DEPS dlpack_tensor glog)
Y
Yan Chunwei 已提交
410

411
cc_library(op_compatible_info SRCS op_compatible_info.cc DEPS string_helper proto_desc)
412
cc_test(op_compatible_info_test SRCS op_compatible_info_test.cc DEPS op_compatible_info proto_desc string_helper glog)
H
hong 已提交
413

414
cc_library(save_load_util SRCS save_load_util.cc DEPS tensor scope layer)
H
hong 已提交
415
cc_test(save_load_util_test SRCS save_load_util_test.cc DEPS save_load_util tensor scope layer)
Y
yaoxuefeng 已提交
416
cc_library(generator SRCS generator.cc DEPS enforce place)
H
hong 已提交
417

418
cc_library(infershape_utils SRCS infershape_utils.cc DEPS lod_tensor selected_rows_utils attribute place phi var_type_traits phi phi_api_utils op_info shape_inference)
419
cc_test(infershape_utils_test SRCS infershape_utils_test.cc DEPS infershape_utils infermeta_utils meta_tensor)
420

Y
Yan Chunwei 已提交
421 422 423
# Capture the name of the branch currently checked out in the source tree.
execute_process(
  COMMAND git rev-parse --abbrev-ref HEAD
  WORKING_DIRECTORY ${CMAKE_SOURCE_DIR}
  OUTPUT_VARIABLE PADDLE_BRANCH
  OUTPUT_STRIP_TRAILING_WHITESPACE)

# Capture the abbreviated hash of the most recent commit on that branch.
execute_process(
  COMMAND git log -1 --format=%h
  WORKING_DIRECTORY ${CMAKE_SOURCE_DIR}
  OUTPUT_VARIABLE PADDLE_COMMIT
  OUTPUT_STRIP_TRAILING_WHITESPACE)

# Report both values in the configure log.
message(STATUS "commit: ${PADDLE_COMMIT}")
message(STATUS "branch: ${PADDLE_BRANCH}")

# Instantiate commit.h from the commit.h.in template.
configure_file(commit.h.in commit.h)
441

442 443
cc_library(custom_operator SRCS custom_operator.cc DEPS tensor attribute framework_proto op_registry operator dynamic_loader string_helper phi_tensor op_meta_info phi_api)
cc_library(custom_kernel SRCS custom_kernel.cc DEPS op_registry phi_custom_kernel phi_tensor_raw)
H
hong 已提交
444 445 446
#cc_binary(test_executor SRCS test_executor.cc DEPS executor op_registry ${GLOB_OP_LIB} ${GLOB_OPERATOR_DEPS} )
#cc_binary(new_executor SRCS new_exec_test.cc DEPS operator op_registry executor ${GLOB_OP_LIB} ${GLOB_OPERATOR_DEPS} profiler)

447
set(FLUID_FRAMEWORK_MODULES proto_desc memory lod_tensor executor data_feed_proto layer dynamic_loader custom_operator custom_kernel)
448

449
cc_library(paddle_framework DEPS ${FLUID_FRAMEWORK_MODULES})
450

451 452
if(WITH_TESTING AND TEST selected_rows_utils_test)
  set_tests_properties(selected_rows_utils_test PROPERTIES TIMEOUT 120)
Y
YUNSHEN XIE 已提交
453
endif()
Z
Zeng Jinle 已提交
454 455

cc_test(scope_guard_test SRCS scope_guard_test.cc)
456
cc_test(phi_utils_test SRCS phi_utils_test.cc DEPS phi_utils)
457 458 459 460 461 462

# fluid_convert_utils depends on data_type and place; GPU and ROCm builds
# additionally link gpu_info.
set(fluid_convert_utils_deps data_type place)
if(WITH_GPU OR WITH_ROCM)
  list(APPEND fluid_convert_utils_deps gpu_info)
endif()
cc_library(fluid_convert_utils SRCS convert_utils.cc DEPS ${fluid_convert_utils_deps})
463
cc_test(convert_utils_test SRCS convert_utils_test.cc DEPS fluid_convert_utils)