CMakeLists.txt 21.0 KB
Newer Older
D
dongdaxiang 已提交
1

H
heqiaozhi 已提交
2 3
# windows_symbolic(<target> SRCS <file>... [PATH <subdir>])
#
# Windows treats a symbolic link as a regular file, which differs from Unix.
# Instead of compiling the symlinked `<name>.cu`, a hidden `.<name>.cu` file is
# created from `<name>.cc` and that hidden file is compiled.
#
# Arguments:
#   TARGET - name of the custom target that produces the hidden file.
#   SRCS   - source files; only the base name (without extension) is used.
#   PATH   - optional directory, relative to CMAKE_CURRENT_SOURCE_DIR, that
#            contains the sources.
#
# Note: the custom target is created inside the loop, so pass a single SRCS
# entry per call (a second entry would try to re-create the same target).
function(windows_symbolic TARGET)
  # Define every keyword group explicitly so that an `options` variable from
  # the caller's scope cannot leak into the argument parsing.
  set(options "")
  set(oneValueArgs "")
  set(multiValueArgs SRCS PATH)
  cmake_parse_arguments(windows_symbolic "${options}" "${oneValueArgs}" "${multiValueArgs}" ${ARGN})
  set(final_path ${CMAKE_CURRENT_SOURCE_DIR}/${windows_symbolic_PATH})
  foreach(src ${windows_symbolic_SRCS})
    get_filename_component(src ${src} NAME_WE)
    if (NOT EXISTS ${final_path}/${src}.cc OR NOT EXISTS ${final_path}/${src}.cu)
      # FATAL_ERROR is the message mode that actually stops configuration.
      message(FATAL_ERROR "${src}.cc and ${src}.cu must exist, and ${src}.cu must be symbolic file.")
    endif()

    file(GENERATE OUTPUT ${final_path}/.${src}.cu INPUT ${final_path}/${src}.cc)

    add_custom_command(OUTPUT ${final_path}/.${src}.cu
            COMMAND ${CMAKE_COMMAND} -E copy_if_different "${final_path}/${src}.cc" "${final_path}/.${src}.cu"
            COMMENT "create hidden file of ${src}.cu")
    add_custom_target(${TARGET} ALL DEPENDS .${src}.cu)
  endforeach()
endfunction()

X
start  
Xin Pan 已提交
24
# Nested build directories.
add_subdirectory(ir)
add_subdirectory(details)
add_subdirectory(fleet)
add_subdirectory(io)

# Protobuf libraries.
proto_library(framework_proto SRCS framework.proto)
proto_library(heter_service_proto SRCS heter_service.proto)
proto_library(data_feed_proto SRCS data_feed.proto)
proto_library(trainer_desc_proto
  SRCS trainer_desc.proto
  DEPS framework_proto data_feed_proto)

# ddim lib
cc_library(ddim
  SRCS ddim.cc
  DEPS eigen3 boost enforce)
cc_test(ddim_test
  SRCS ddim_test.cc
  DEPS ddim)
# dim_test is a .cu source, so it is only registered for CUDA / ROCm builds.
if(WITH_GPU)
  nv_test(dim_test
    SRCS dim_test.cu
    DEPS ddim)
elseif(WITH_ROCM)
  hip_test(dim_test
    SRCS dim_test.cu
    DEPS ddim)
endif()
S
sneaxiy 已提交
42
cc_test(unroll_array_ops_test SRCS unroll_array_ops_test.cc)

cc_library(data_type
  SRCS data_type.cc
  DEPS framework_proto ddim device_context)
cc_test(data_type_test
  SRCS data_type_test.cc
  DEPS data_type place tensor)

# tensor library: the utility source is tensor_util.cu for CUDA / ROCm builds
# and tensor_util.cc otherwise.
if(WITH_GPU)
  if(WIN32)
    # Compile the hidden copy `.tensor_util.cu` created by windows_symbolic.
    windows_symbolic(tensor_util SRCS tensor_util.cu)
    nv_library(tensor
      SRCS tensor.cc .tensor_util.cu
      DEPS place memory data_type device_context)
    add_dependencies(tensor tensor_util)
  else()
    nv_library(tensor
      SRCS tensor.cc tensor_util.cu
      DEPS place memory data_type device_context profiler)
  endif()
elseif(WITH_ROCM)
  hip_library(tensor
    SRCS tensor.cc tensor_util.cu
    DEPS place memory data_type device_context profiler)
else()
  cc_library(tensor
    SRCS tensor.cc tensor_util.cc
    DEPS place memory data_type device_context profiler)
endif()
D
dzhwinter 已提交
58

Y
Yu Yang 已提交
59
cc_test(tensor_test
  SRCS tensor_test.cc
  DEPS tensor)

# tensor_util_test adds the .cu test source for CUDA / ROCm builds.
if(WITH_GPU)
  nv_test(tensor_util_test
    SRCS tensor_util_test.cc tensor_util_test.cu
    DEPS tensor dlpack_tensor)
elseif(WITH_ROCM)
  hip_test(tensor_util_test
    SRCS tensor_util_test.cc tensor_util_test.cu
    DEPS tensor dlpack_tensor)
else()
  cc_test(tensor_util_test
    SRCS tensor_util_test.cc
    DEPS tensor dlpack_tensor)
endif()

cc_test(copy_same_tensor_test
  SRCS copy_same_tensor_test.cc
  DEPS tensor)

cc_test(eigen_test
  SRCS eigen_test.cc
  DEPS tensor)

# mixed_vector_test adds the .cu test source for CUDA / ROCm builds.
if(WITH_GPU)
  nv_test(mixed_vector_test
    SRCS mixed_vector_test.cc mixed_vector_test.cu
    DEPS place memory device_context tensor)
elseif(WITH_ROCM)
  hip_test(mixed_vector_test
    SRCS mixed_vector_test.cc mixed_vector_test.cu
    DEPS place memory device_context tensor)
else()
  cc_test(mixed_vector_test
    SRCS mixed_vector_test.cc
    DEPS place memory device_context tensor)
endif()
79
cc_library(lod_tensor
  SRCS lod_tensor.cc
  DEPS ddim place tensor framework_proto version)
cc_test(lod_tensor_test
  SRCS lod_tensor_test.cc
  DEPS lod_tensor memory)

# The .cu variant of the lod_tensor test is registered for CUDA / ROCm only.
if(WITH_GPU)
  nv_test(lod_tensor_gpu_test
    SRCS lod_tensor_test.cu
    DEPS lod_tensor)
elseif(WITH_ROCM)
  hip_test(lod_tensor_gpu_test
    SRCS lod_tensor_test.cu
    DEPS lod_tensor)
endif()

cc_library(garbage_collector
  SRCS garbage_collector.cc
  DEPS device_context memory gflags glog)

cc_library(reader
  SRCS reader.cc
  DEPS lod_tensor ddim)
cc_test(reader_test
  SRCS reader_test.cc
  DEPS reader)

cc_library(threadpool
  SRCS threadpool.cc
  DEPS enforce)
cc_test(threadpool_test
  SRCS threadpool_test.cc
  DEPS threadpool)

97
# var_type_traits library. The source is named with its explicit extension
# rather than relying on CMake guessing it (deprecated by policy CMP0115).
cc_library(var_type_traits SRCS var_type_traits.cc DEPS lod_tensor selected_rows framework_proto)
if (WITH_GPU)
  # CUDA builds additionally link dynload_cuda.
  target_link_libraries(var_type_traits dynload_cuda)
endif()
cc_test(var_type_traits_test SRCS var_type_traits_test.cc DEPS var_type_traits)

103
cc_library(scope
  SRCS scope.cc
  DEPS glog threadpool xxhash var_type_traits)
cc_library(device_worker
  SRCS device_worker.cc
  DEPS trainer_desc_proto lod_tensor scope)
cc_test(device_worker_test
  SRCS device_worker_test.cc
  DEPS device_worker)

cc_library(scope_pool
  SRCS scope_pool.cc
  DEPS scope)
cc_test(scope_test
  SRCS scope_test.cc
  DEPS scope)
cc_test(variable_test
  SRCS variable_test.cc
  DEPS tensor var_type_traits)

cc_library(data_device_transform
  SRCS data_device_transform.cc
  DEPS tensor)
# The test source is a .cu file, so it is only registered for CUDA / ROCm.
if(WITH_GPU)
  nv_test(data_device_transform_test
    SRCS data_device_transform_test.cu
    DEPS operator op_registry device_context math_function scope)
elseif(WITH_ROCM)
  hip_test(data_device_transform_test
    SRCS data_device_transform_test.cu
    DEPS operator op_registry device_context math_function scope)
endif()
119

120
# data_type_transform: .cu source for CUDA / ROCm builds, .cc otherwise.
if(WITH_GPU)
  if(WIN32)
    # Windows treats a symbolic link as a regular file, unlike Unix, so a
    # hidden copy of the source is created and compiled instead.
    windows_symbolic(hidden_file SRCS data_type_transform.cu)
    nv_library(data_type_transform
      SRCS .data_type_transform.cu
      DEPS tensor)
    add_dependencies(data_type_transform hidden_file)
  else()
    nv_library(data_type_transform
      SRCS data_type_transform.cu
      DEPS tensor)
  endif()
  nv_test(data_type_transform_test
    SRCS data_type_transform_test.cc data_type_transform_test.cu
    DEPS data_type_transform)
elseif(WITH_ROCM)
  hip_library(data_type_transform
    SRCS data_type_transform.cu
    DEPS tensor)
  hip_test(data_type_transform_test
    SRCS data_type_transform_test.cc data_type_transform_test.cu
    DEPS data_type_transform)
else()
  cc_library(data_type_transform
    SRCS data_type_transform.cc
    DEPS tensor)
  cc_test(data_type_transform_test
    SRCS data_type_transform_test.cc
    DEPS data_type_transform)
endif()

cc_library(data_layout_transform
  SRCS data_layout_transform.cc
  DEPS tensor math_function)
cc_test(data_layout_transform_test
  SRCS data_layout_transform_test.cc
  DEPS data_layout_transform)

# data_transform depends on the device, type and layout transform libraries.
cc_library(data_transform
  SRCS data_transform.cc
  DEPS math_function tensor framework_proto selected_rows
       data_device_transform data_type_transform data_layout_transform)
Q
Qiao Longfei 已提交
144

145
cc_library(attribute
  SRCS attribute.cc
  DEPS framework_proto boost enforce)
cc_test(program_desc_test
  SRCS program_desc_test.cc
  DEPS proto_desc device_context)

cc_library(op_version_proto
  SRCS op_version_proto.cc
  DEPS framework_proto boost)

cc_library(op_version_registry
  SRCS op_version_registry.cc
  DEPS op_version_proto framework_proto boost)
cc_test(op_version_registry_test
  SRCS op_version_registry_test.cc
  DEPS op_version_registry)

cc_library(op_proto_maker
  SRCS op_proto_maker.cc
  DEPS framework_proto attribute glog)
cc_test(op_proto_maker_test
  SRCS op_proto_maker_test.cc
  DEPS op_proto_maker)
cc_library(no_need_buffer_vars_inference
  SRCS no_need_buffer_vars_inference.cc
  DEPS attribute device_context)
cc_library(op_info
  SRCS op_info.cc
  DEPS attribute framework_proto no_need_buffer_vars_inference)
cc_library(shape_inference
  SRCS shape_inference.cc
  DEPS ddim attribute device_context)

cc_test(no_need_buffer_vars_inference_test
  SRCS no_need_buffer_vars_inference_test.cc
  DEPS no_need_buffer_vars_inference layer)

cc_library(transfer_scope_cache
  SRCS transfer_scope_cache.cc
  DEPS scope framework_proto device_context)
cc_library(op_kernel_type
  SRCS op_kernel_type.cc
  DEPS device_context place)

cc_library(unused_var_check
  SRCS unused_var_check.cc
  DEPS glog no_need_buffer_vars_inference)

cc_library(operator
  SRCS operator.cc
  DEPS op_info device_context tensor scope glog trainer_desc_proto data_feed_proto
       shape_inference data_transform lod_tensor profiler transfer_scope_cache
       op_kernel_type op_call_stack unused_var_check nan_inf_utils)

cc_test(operator_test
  SRCS operator_test.cc
  DEPS operator op_registry device_context)
cc_test(operator_exception_test
  SRCS operator_exception_test.cc
  DEPS operator op_registry device_context)
X
version  
Xin Pan 已提交
172 173

cc_library(version SRCS version.cc)
cc_test(version_test
  SRCS version_test.cc
  DEPS version)

cc_library(proto_desc
  SRCS var_desc.cc op_desc.cc block_desc.cc program_desc.cc
  DEPS shape_inference op_info operator glog version)

cc_library(op_registry
  SRCS op_registry.cc
  DEPS op_proto_maker op_info operator glog proto_desc)

cc_library(op_call_stack
  SRCS op_call_stack.cc
  DEPS op_proto_maker enforce)
cc_test(op_call_stack_test
  SRCS op_call_stack_test.cc
  DEPS op_call_stack)
# NOTE(review): op_registry_test is only registered for CUDA / ROCm builds
# even though its source is a .cc file - confirm a CPU-only build is meant to
# skip it.
if(WITH_GPU)
  nv_test(op_registry_test
    SRCS op_registry_test.cc
    DEPS op_registry)
elseif(WITH_ROCM)
  hip_test(op_registry_test
    SRCS op_registry_test.cc
    DEPS op_registry)
endif()
187

188 189 190
# Python protobuf modules: compile the .proto files to python and, after
# framework_py_proto is built, copy the generated *.py files into the python
# package directories under PADDLE_BINARY_DIR.
if(WITH_PYTHON)
  py_proto_compile(framework_py_proto SRCS framework.proto data_feed.proto)
  py_proto_compile(trainer_py_proto SRCS trainer_desc.proto data_feed.proto)
  py_proto_compile(distributed_strategy_py_proto SRCS distributed_strategy.proto)
  # Generate an empty __init__.py to make framework_py_proto a valid python module.
  add_custom_target(framework_py_proto_init ALL COMMAND ${CMAKE_COMMAND} -E touch __init__.py)
  add_dependencies(framework_py_proto framework_py_proto_init trainer_py_proto distributed_strategy_py_proto)
  if (NOT WIN32)
    add_custom_command(TARGET framework_py_proto POST_BUILD
      COMMAND ${CMAKE_COMMAND} -E make_directory ${PADDLE_BINARY_DIR}/python/paddle/fluid/proto
      COMMAND ${CMAKE_COMMAND} -E make_directory ${PADDLE_BINARY_DIR}/python/paddle/distributed/fleet/proto
      COMMAND ${CMAKE_COMMAND} -E touch ${PADDLE_BINARY_DIR}/python/paddle/distributed/fleet/proto/__init__.py
      COMMAND cp *.py ${PADDLE_BINARY_DIR}/python/paddle/fluid/proto/
      COMMAND cp distributed_strategy_*.py ${PADDLE_BINARY_DIR}/python/paddle/distributed/fleet/proto
      COMMENT "Copy generated python proto into directory paddle/fluid/proto."
      WORKING_DIRECTORY ${CMAKE_CURRENT_BINARY_DIR})
  else()
    # The Windows `copy` command needs backslash-separated destination paths.
    string(REPLACE "/" "\\" proto_dstpath "${PADDLE_BINARY_DIR}/python/paddle/fluid/proto/")
    string(REPLACE "/" "\\" fleet_proto_dstpath "${PADDLE_BINARY_DIR}/python/paddle/distributed/fleet/proto/")
    # add_custom_command accepts a single COMMENT, so both destinations are
    # named in one message instead of passing the keyword twice.
    add_custom_command(TARGET framework_py_proto POST_BUILD
      COMMAND ${CMAKE_COMMAND} -E make_directory ${PADDLE_BINARY_DIR}/python/paddle/fluid/proto
      COMMAND ${CMAKE_COMMAND} -E make_directory ${PADDLE_BINARY_DIR}/python/paddle/distributed/fleet/proto
      COMMAND ${CMAKE_COMMAND} -E touch ${PADDLE_BINARY_DIR}/python/paddle/distributed/fleet/proto/__init__.py
      COMMAND copy /Y *.py ${proto_dstpath}
      COMMAND copy /Y distributed_strategy_*.py ${fleet_proto_dstpath}
      COMMENT "Copy generated python proto into directory paddle/fluid/proto and paddle/distributed/fleet/proto."
      WORKING_DIRECTORY ${CMAKE_CURRENT_BINARY_DIR})
  endif()
endif()
219

Y
Yu Yang 已提交
220
cc_library(lod_rank_table
  SRCS lod_rank_table.cc
  DEPS lod_tensor)

cc_library(feed_fetch_method
  SRCS feed_fetch_method.cc
  DEPS lod_tensor scope glog)
cc_library(variable_helper
  SRCS variable_helper.cc
  DEPS lod_tensor)

cc_library(naive_executor
  SRCS naive_executor.cc
  DEPS op_registry denormal device_context scope framework_proto glog
       lod_rank_table feed_fetch_method graph_to_program_pass variable_helper)

cc_library(executor_gc_helper
  SRCS executor_gc_helper.cc
  DEPS scope proto_desc operator garbage_collector)
228
# executor library. The source and dependency lists vary with
# WITH_DISTRIBUTE / WITH_PSLIB / WITH_PSCORE; the order of every list is kept
# exactly as configured for each combination.
if(WITH_DISTRIBUTE)
  if(WITH_PSLIB)
    cc_library(executor
      SRCS
        executor.cc multi_trainer.cc pipeline_trainer.cc dataset_factory.cc
        dist_multi_trainer.cc trainer_factory.cc trainer.cc data_feed_factory.cc
        heterxpu_trainer.cc
        data_feed.cc device_worker.cc hogwild_worker.cc hetercpu_worker.cc ps_gpu_worker.cc
        heterbox_worker.cc heterbox_trainer.cc ps_gpu_trainer.cc downpour_worker.cc downpour_worker_opt.cc
        pull_dense_worker.cc section_worker.cc device_worker_factory.cc data_set.cc
      DEPS
        op_registry
        device_context scope framework_proto trainer_desc_proto glog fs shell
        fleet_wrapper heter_wrapper ps_gpu_wrapper box_wrapper lodtensor_printer
        lod_rank_table feed_fetch_method collective_helper ${GLOB_DISTRIBUTE_DEPS}
        graph_to_program_pass variable_helper data_feed_proto timer monitor
        heter_service_proto pslib_brpc)
    # Extra warning flags applied to executor.cc for this configuration.
    set(DISTRIBUTE_COMPILE_FLAGS "-Wno-non-virtual-dtor -Wno-error=non-virtual-dtor -Wno-error=delete-non-virtual-dtor")
    set_source_files_properties(executor.cc PROPERTIES COMPILE_FLAGS ${DISTRIBUTE_COMPILE_FLAGS})
  elseif(WITH_PSCORE)
    # This variant lists neither ps_gpu_worker.cc / ps_gpu_trainer.cc nor
    # ps_gpu_wrapper.
    cc_library(executor
      SRCS
        executor.cc multi_trainer.cc pipeline_trainer.cc dataset_factory.cc
        dist_multi_trainer.cc trainer_factory.cc trainer.cc data_feed_factory.cc
        heterxpu_trainer.cc
        data_feed.cc device_worker.cc hogwild_worker.cc hetercpu_worker.cc
        heterbox_worker.cc heterbox_trainer.cc downpour_worker.cc downpour_worker_opt.cc
        pull_dense_worker.cc section_worker.cc device_worker_factory.cc data_set.cc
      DEPS
        op_registry
        device_context scope framework_proto data_feed_proto heter_service_proto trainer_desc_proto glog
        lod_rank_table fs shell fleet_wrapper heter_wrapper box_wrapper lodtensor_printer feed_fetch_method
        graph_to_program_pass variable_helper timer monitor heter_service_proto fleet)
    # Extra warning flags applied to three sources for this configuration.
    set(DISTRIBUTE_COMPILE_FLAGS "-Wno-non-virtual-dtor -Wno-error=non-virtual-dtor -Wno-error=delete-non-virtual-dtor")
    set_source_files_properties(executor.cc PROPERTIES COMPILE_FLAGS ${DISTRIBUTE_COMPILE_FLAGS})
    set_source_files_properties(multi_trainer.cc PROPERTIES COMPILE_FLAGS ${DISTRIBUTE_COMPILE_FLAGS})
    set_source_files_properties(hogwild_worker.cc PROPERTIES COMPILE_FLAGS ${DISTRIBUTE_COMPILE_FLAGS})
  else()
    cc_library(executor
      SRCS
        executor.cc multi_trainer.cc pipeline_trainer.cc dataset_factory.cc
        dist_multi_trainer.cc trainer_factory.cc trainer.cc data_feed_factory.cc
        heterxpu_trainer.cc
        data_feed.cc device_worker.cc hogwild_worker.cc hetercpu_worker.cc ps_gpu_worker.cc
        heterbox_worker.cc heterbox_trainer.cc ps_gpu_trainer.cc downpour_worker.cc downpour_worker_opt.cc
        pull_dense_worker.cc section_worker.cc device_worker_factory.cc data_set.cc
      DEPS
        op_registry
        device_context scope framework_proto data_feed_proto heter_service_proto trainer_desc_proto glog
        lod_rank_table fs shell fleet_wrapper heter_wrapper ps_gpu_wrapper box_wrapper lodtensor_printer feed_fetch_method
        graph_to_program_pass variable_helper timer monitor)
  endif()
elseif(WITH_PSLIB)
  cc_library(executor
    SRCS
      executor.cc multi_trainer.cc pipeline_trainer.cc dataset_factory.cc
      dist_multi_trainer.cc trainer_factory.cc trainer.cc data_feed_factory.cc
      heterxpu_trainer.cc
      data_feed.cc device_worker.cc hogwild_worker.cc hetercpu_worker.cc ps_gpu_worker.cc
      heterbox_worker.cc heterbox_trainer.cc ps_gpu_trainer.cc downpour_worker.cc downpour_worker_opt.cc
      pull_dense_worker.cc section_worker.cc device_worker_factory.cc data_set.cc
    DEPS
      op_registry
      device_context scope framework_proto data_feed_proto heter_service_proto trainer_desc_proto glog
      lod_rank_table fs shell fleet_wrapper heter_wrapper ps_gpu_wrapper box_wrapper lodtensor_printer feed_fetch_method
      graph_to_program_pass variable_helper timer monitor pslib_brpc)
else()
  cc_library(executor
    SRCS
      executor.cc multi_trainer.cc pipeline_trainer.cc dataset_factory.cc
      dist_multi_trainer.cc trainer_factory.cc trainer.cc data_feed_factory.cc
      heterxpu_trainer.cc
      data_feed.cc device_worker.cc hogwild_worker.cc hetercpu_worker.cc ps_gpu_worker.cc
      heterbox_worker.cc heterbox_trainer.cc ps_gpu_trainer.cc downpour_worker.cc downpour_worker_opt.cc
      pull_dense_worker.cc section_worker.cc device_worker_factory.cc data_set.cc
    DEPS
      op_registry
      device_context scope framework_proto data_feed_proto heter_service_proto trainer_desc_proto glog
      lod_rank_table fs shell fleet_wrapper heter_wrapper ps_gpu_wrapper box_wrapper lodtensor_printer feed_fetch_method
      graph_to_program_pass variable_helper timer monitor)
endif()

# Helper libraries linked into executor in every configuration.
target_link_libraries(executor
  while_op_helper
  executor_gc_helper
  recurrent_op_helper
  conditional_block_op_helper)
S
sneaxiy 已提交
291

292
cc_library(parallel_executor
  SRCS parallel_executor.cc
  DEPS threaded_ssa_graph_executor scope_buffered_ssa_graph_executor
       parallel_ssa_graph_executor async_ssa_graph_executor
       graph build_strategy bind_threaded_ssa_graph_executor collective_helper
       fast_threaded_ssa_graph_executor variable_helper)

cc_library(executor_cache
  SRCS executor_cache.cc
  DEPS executor)
cc_test(dist_multi_trainer_test
  SRCS dist_multi_trainer_test.cc
  DEPS conditional_block_op executor)
cc_library(prune
  SRCS prune.cc
  DEPS framework_proto boost)
cc_test(prune_test
  SRCS prune_test.cc
  DEPS op_info prune recurrent_op device_context)
cc_test(var_type_inference_test
  SRCS var_type_inference_test.cc
  DEPS op_registry proto_desc)
cc_library(selected_rows
  SRCS selected_rows.cc
  DEPS tensor)
cc_test(selected_rows_test
  SRCS selected_rows_test.cc
  DEPS selected_rows)
D
dzhwinter 已提交
306

X
Xin Pan 已提交
307
cc_test(op_kernel_type_test
  SRCS op_kernel_type_test.cc
  DEPS place device_context framework_proto op_kernel_type)
cc_test(cow_ptr_tests SRCS details/cow_ptr_test.cc)

cc_test(tuple_test SRCS tuple_test.cc)

cc_test(inlined_vector_test SRCS inlined_vector_test.cc)

# rw_lock_test is not registered on Windows.
if(NOT WIN32)
  cc_test(rw_lock_test SRCS rw_lock_test.cc)
endif()

cc_library(dlpack_tensor
  SRCS dlpack_tensor.cc
  DEPS tensor dlpack)
cc_test(dlpack_tensor_test
  SRCS dlpack_tensor_test.cc
  DEPS dlpack_tensor glog)
Y
Yan Chunwei 已提交
320

321
# Sources are listed with their explicit .cc extension instead of relying on
# CMake guessing it (deprecated by policy CMP0115).
cc_library(op_compatible_info SRCS op_compatible_info.cc DEPS string_helper proto_desc)
cc_test(op_compatible_info_test SRCS op_compatible_info_test.cc DEPS op_compatible_info proto_desc string_helper glog)

cc_library(save_load_util SRCS save_load_util.cc DEPS tensor scope layer)
cc_test(save_load_util_test SRCS save_load_util_test.cc DEPS save_load_util tensor scope layer)
cc_library(generator SRCS generator.cc DEPS enforce place)
H
hong 已提交
327

Y
Yan Chunwei 已提交
328 329 330
# Name of the branch currently checked out, stored in PADDLE_BRANCH.
execute_process(
  COMMAND git rev-parse --abbrev-ref HEAD
  WORKING_DIRECTORY ${CMAKE_SOURCE_DIR}
  OUTPUT_VARIABLE PADDLE_BRANCH
  OUTPUT_STRIP_TRAILING_WHITESPACE
)

# Abbreviated hash of the most recent commit, stored in PADDLE_COMMIT.
execute_process(
  COMMAND git log -1 --format=%h
  WORKING_DIRECTORY ${CMAKE_SOURCE_DIR}
  OUTPUT_VARIABLE PADDLE_COMMIT
  OUTPUT_STRIP_TRAILING_WHITESPACE
)

message(STATUS "commit: ${PADDLE_COMMIT}")
message(STATUS "branch: ${PADDLE_BRANCH}")

# Generate commit.h from the commit.h.in template.
configure_file(commit.h.in commit.h)
348

349 350 351 352 353
# Custom op support: add the data-type related header directories to the
# include path so that the underlying file locations are not exposed.
include_directories(
  ${PADDLE_SOURCE_DIR}/paddle/fluid/platform
  ${CMAKE_CURRENT_SOURCE_DIR}/../extension/include)

cc_library(custom_tensor
  SRCS ../extension/src/ext_tensor.cc
  DEPS lod_tensor memory enforce)
cc_library(op_meta_info
  SRCS ../extension/src/ext_op_meta_info.cc
  DEPS custom_tensor)
cc_library(custom_operator
  SRCS custom_operator.cc
  DEPS tensor attribute framework_proto op_registry operator dynamic_loader
       string_helper custom_tensor op_meta_info)
cc_test(custom_tensor_test
  SRCS custom_tensor_test.cc
  DEPS custom_tensor glog)

# Modules bundled into the paddle_framework library.
set(FLUID_FRAMEWORK_MODULES
  proto_desc memory lod_tensor executor data_feed_proto layer dynamic_loader custom_operator)

cc_library(paddle_framework DEPS ${FLUID_FRAMEWORK_MODULES})

# Give selected_rows_test a 120 second timeout when the test is registered.
if(WITH_TESTING AND TEST selected_rows_test)
  set_tests_properties(selected_rows_test PROPERTIES TIMEOUT 120)
endif()
366

367
##### 2.0 New custom op extension mechanism related #####

# `layer` must be among the dependencies; without it linking fails with:
# undefined symbol: _ZN6paddle10imperative7VarBase9name_set_
set(PADDLE_CUSTOM_OP_MODULES custom_tensor op_meta_info custom_operator layer)

# Sources of the shared library; the list is also exported to the parent scope.
set(PADDLE_CUSTOM_OP_SRCS
  ${CMAKE_CURRENT_SOURCE_DIR}/custom_operator.cc
  ${CMAKE_CURRENT_SOURCE_DIR}/../extension/src/ext_tensor.cc
  ${CMAKE_CURRENT_SOURCE_DIR}/../extension/src/ext_op_meta_info.cc
  ${CMAKE_SOURCE_DIR}/paddle/fluid/imperative/layer.cc)
set(PADDLE_CUSTOM_OP_SRCS ${PADDLE_CUSTOM_OP_SRCS} PARENT_SCOPE)

cc_library(paddle_custom_op_shared SHARED
  SRCS ${PADDLE_CUSTOM_OP_SRCS}
  DEPS ${PADDLE_CUSTOM_OP_MODULES})

# The artifact is named paddle_custom_op and also links the modules recorded
# in the OS_DEPENDENCY_MODULES global property.
get_property(os_dependency_modules GLOBAL PROPERTY OS_DEPENDENCY_MODULES)
set_target_properties(paddle_custom_op_shared PROPERTIES OUTPUT_NAME paddle_custom_op)
target_link_libraries(paddle_custom_op_shared ${os_dependency_modules})

# Record the location of the built library in internal cache variables.
if(LINUX)
  set(PADDLE_CUSTOM_OP_SHARED_LIB
    ${PADDLE_BINARY_DIR}/paddle/fluid/framework/libpaddle_custom_op.so
    CACHE INTERNAL "Paddle custom op lib")
endif()

if(WIN32)
  # Every generator except Ninja gets a ${CMAKE_BUILD_TYPE} sub-directory.
  set(paddle_custom_op_lib_path ${CMAKE_CURRENT_BINARY_DIR})
  if(NOT "${CMAKE_GENERATOR}" STREQUAL "Ninja")
    set(paddle_custom_op_lib_path ${CMAKE_CURRENT_BINARY_DIR}/${CMAKE_BUILD_TYPE})
  endif()
  set(PADDLE_CUSTOM_OP_IMPORT_LIB
    ${paddle_custom_op_lib_path}/paddle_custom_op.lib
    CACHE INTERNAL "Paddle custom op import lib")
  set(PADDLE_CUSTOM_OP_SHARED_LIB
    ${paddle_custom_op_lib_path}/paddle_custom_op.dll
    CACHE INTERNAL "Paddle custom op dll")
endif()

if(APPLE)
  # NOTE(review): unlike the Linux path this one has no `lib` prefix - confirm
  # it matches the file name actually produced on macOS.
  set(PADDLE_CUSTOM_OP_SHARED_LIB
    ${PADDLE_BINARY_DIR}/paddle/fluid/framework/paddle_custom_op.dylib
    CACHE INTERNAL "Paddle custom op lib")
endif()