Skip to content
体验新版
项目
组织
正在加载...
登录
切换导航
打开侧边栏
PaddlePaddle
Paddle-Lite
提交
9343782b
P
Paddle-Lite
项目概览
PaddlePaddle
/
Paddle-Lite
通知
338
Star
4
Fork
1
代码
文件
提交
分支
Tags
贡献者
分支图
Diff
Issue
271
列表
看板
标记
里程碑
合并请求
78
Wiki
0
Wiki
分析
仓库
DevOps
项目成员
Pages
P
Paddle-Lite
项目概览
项目概览
详情
发布
仓库
仓库
文件
提交
分支
标签
贡献者
分支图
比较
Issue
271
Issue
271
列表
看板
标记
里程碑
合并请求
78
合并请求
78
Pages
分析
分析
仓库分析
DevOps
Wiki
0
Wiki
成员
成员
收起侧边栏
关闭侧边栏
动态
分支图
创建新Issue
提交
Issue看板
未验证
提交
9343782b
编写于
1月 17, 2020
作者:
石
石晓伟
提交者:
GitHub
1月 17, 2020
浏览文件
操作
浏览文件
下载
电子邮件补丁
差异文件
support dynamic cuda libs, test=develop (#2780)
上级
9611e046
变更
6
隐藏空白更改
内联
并排
Showing
6 changed file
with
58 addition
and
32 deletion
+58
-32
CMakeLists.txt
CMakeLists.txt
+1
-1
cmake/cuda.cmake
cmake/cuda.cmake
+35
-17
cmake/cudnn.cmake
cmake/cudnn.cmake
+8
-2
lite/api/CMakeLists.txt
lite/api/CMakeLists.txt
+9
-9
lite/backends/cuda/CMakeLists.txt
lite/backends/cuda/CMakeLists.txt
+3
-3
lite/core/lite.map
lite/core/lite.map
+2
-0
未找到文件。
CMakeLists.txt
浏览文件 @
9343782b
...
@@ -75,7 +75,7 @@ lite_option(LITE_BUILD_EXTRA "Enable extra algorithm support in Lite, both kerne
...
@@ -75,7 +75,7 @@ lite_option(LITE_BUILD_EXTRA "Enable extra algorithm support in Lite, both kerne
lite_option
(
LITE_BUILD_TAILOR
"Enable tailoring library according to model"
OFF
)
lite_option
(
LITE_BUILD_TAILOR
"Enable tailoring library according to model"
OFF
)
# cv build options
# cv build options
lite_option
(
LITE_WITH_CV
"Enable build cv image in lite"
OFF
)
lite_option
(
LITE_WITH_CV
"Enable build cv image in lite"
OFF
)
lite_option
(
LITE_WITH_STATIC_CUDA
"Statically link cuda libraries."
ON
)
# TODO(Superjomn) Remove WITH_ANAKIN option if not needed latter.
# TODO(Superjomn) Remove WITH_ANAKIN option if not needed latter.
if
(
ANDROID OR IOS OR ARMLINUX
)
if
(
ANDROID OR IOS OR ARMLINUX
)
...
...
cmake/cuda.cmake
浏览文件 @
9343782b
...
@@ -174,27 +174,45 @@ if(NOT WITH_DSO)
...
@@ -174,27 +174,45 @@ if(NOT WITH_DSO)
endif
(
WIN32
)
endif
(
WIN32
)
endif
(
NOT WITH_DSO
)
endif
(
NOT WITH_DSO
)
function
(
add_cuda_static_lib alias cuda_lib_paths file_name
)
function
(
add_cuda_lib TARGET_NAME
)
unset
(
ABS_PATH CACHE
)
set
(
options STATIC SHARED
)
find_library
(
ABS_PATH NAMES
${
file_name
}
PATHS
${${
cuda_lib_paths
}}
NO_DEFAULT_PATH
)
set
(
oneValueArgs
"NAME"
)
add_library
(
${
alias
}
STATIC IMPORTED GLOBAL
)
set
(
multiValueArgs
"PATHS"
)
set_property
(
TARGET
${
alias
}
PROPERTY IMPORTED_LOCATION
${
ABS_PATH
}
)
cmake_parse_arguments
(
add_cuda_lib
"
${
options
}
"
"
${
oneValueArgs
}
"
"
${
multiValueArgs
}
"
${
ARGN
}
)
set
(
CUDA_STATIC_MODULES
${
CUDA_STATIC_MODULES
}
${
alias
}
PARENT_SCOPE
)
unset
(
ABS_PATH CACHE
)
if
(
NOT ABS_PATH
)
if
(
NOT add_cuda_lib_PATHS
)
message
(
FATAL_ERROR
"Can not find CUDA static library:
${
file_name
}
"
)
set
(
add_cuda_lib_PATHS CUDNN_CHECK_LIBRARY_DIRS
)
endif
()
endif
()
find_library
(
ABS_PATH NAMES
${
add_cuda_lib_NAME
}
PATHS
${${
add_cuda_lib_PATHS
}}
NO_DEFAULT_PATH
)
add_library
(
${
TARGET_NAME
}
SHARED IMPORTED GLOBAL
)
set_property
(
TARGET
${
TARGET_NAME
}
PROPERTY IMPORTED_LOCATION
${
ABS_PATH
}
)
set
(
CUDA_MODULES
${
CUDA_MODULES
}
${
TARGET_NAME
}
PARENT_SCOPE
)
if
(
NOT ABS_PATH
)
message
(
FATAL_ERROR
"Can not find CUDA library:
${
add_cuda_lib_NAME
}
"
)
endif
()
endfunction
()
endfunction
()
add_cuda_static_lib
(
cudart_static CUDNN_CHECK_LIBRARY_DIRS libcudart_static.a
)
if
(
LITE_WITH_STATIC_CUDA
)
add_cuda_static_lib
(
cublas_static CUDNN_CHECK_LIBRARY_DIRS libcublas_static.a
)
message
(
STATUS
"Static link CUDA toolkit."
)
add_cuda_static_lib
(
curand_static CUDNN_CHECK_LIBRARY_DIRS libcurand_static.a
)
add_cuda_lib
(
cudart_static STATIC NAME libcudart_static.a
)
add_cuda_static_lib
(
culibos_static CUDNN_CHECK_LIBRARY_DIRS libculibos.a
)
add_cuda_lib
(
cublas_static STATIC NAME libcublas_static.a
)
if
(
NOT
${
CUDA_VERSION
}
LESS 10.1
)
add_cuda_lib
(
curand_static STATIC NAME libcurand_static.a
)
add_cuda_static_lib
(
cublasLt_static CUDNN_CHECK_LIBRARY_DIRS libcublasLt_static.a
)
add_cuda_lib
(
culibos_static STATIC NAME libculibos.a
)
if
(
NOT
${
CUDA_VERSION
}
LESS 10.1
)
add_cuda_lib
(
cublasLt_static STATIC NAME libcublasLt_static.a
)
endif
()
set_property
(
GLOBAL PROPERTY CUDA_MODULES cudnn_static
${
CUDA_MODULES
}
)
else
()
message
(
STATUS
"Dynamic Link CUDA toolkit."
)
add_cuda_lib
(
cudart SHARED NAME libcudart.so
)
add_cuda_lib
(
cublas SHARED NAME libcublas.so
)
add_cuda_lib
(
curand SHARED NAME libcurand.so
)
if
(
NOT
${
CUDA_VERSION
}
LESS 10.1
)
add_cuda_lib
(
cublasLt SHARED NAME libcublasLt.so
)
endif
()
set_property
(
GLOBAL PROPERTY CUDA_MODULES cudnn
${
CUDA_MODULES
}
)
endif
()
endif
()
set_property
(
GLOBAL PROPERTY CUDA_STATIC_MODULES cudnn_static
${
CUDA_STATIC_MODULES
}
)
# setting nvcc arch flags
# setting nvcc arch flags
select_nvcc_arch_flags
(
NVCC_FLAGS_EXTRA
)
select_nvcc_arch_flags
(
NVCC_FLAGS_EXTRA
)
list
(
APPEND CUDA_NVCC_FLAGS
${
NVCC_FLAGS_EXTRA
}
)
list
(
APPEND CUDA_NVCC_FLAGS
${
NVCC_FLAGS_EXTRA
}
)
...
...
cmake/cudnn.cmake
浏览文件 @
9343782b
...
@@ -69,9 +69,15 @@ if(CUDNN_FOUND)
...
@@ -69,9 +69,15 @@ if(CUDNN_FOUND)
file
(
READ
${
CUDNN_INCLUDE_DIR
}
/cudnn.h CUDNN_VERSION_FILE_CONTENTS
)
file
(
READ
${
CUDNN_INCLUDE_DIR
}
/cudnn.h CUDNN_VERSION_FILE_CONTENTS
)
get_filename_component
(
CUDNN_LIB_PATH
${
CUDNN_LIBRARY
}
DIRECTORY
)
get_filename_component
(
CUDNN_LIB_PATH
${
CUDNN_LIBRARY
}
DIRECTORY
)
add_library
(
cudnn_static STATIC IMPORTED GLOBAL
)
if
(
LITE_WITH_STATIC_CUDA
)
set_property
(
TARGET cudnn_static PROPERTY IMPORTED_LOCATION
add_library
(
cudnn_static STATIC IMPORTED GLOBAL
)
set_property
(
TARGET cudnn_static PROPERTY IMPORTED_LOCATION
"
${
CUDNN_LIB_PATH
}
/libcudnn_static.a"
)
"
${
CUDNN_LIB_PATH
}
/libcudnn_static.a"
)
else
()
add_library
(
cudnn SHARED IMPORTED GLOBAL
)
set_property
(
TARGET cudnn PROPERTY IMPORTED_LOCATION
"
${
CUDNN_LIB_PATH
}
/libcudnn.so"
)
endif
(
LITE_WITH_STATIC_CUDA
)
string
(
REGEX MATCH
"define CUDNN_VERSION +([0-9]+)"
string
(
REGEX MATCH
"define CUDNN_VERSION +([0-9]+)"
CUDNN_VERSION
"
${
CUDNN_VERSION_FILE_CONTENTS
}
"
)
CUDNN_VERSION
"
${
CUDNN_VERSION_FILE_CONTENTS
}
"
)
...
...
lite/api/CMakeLists.txt
浏览文件 @
9343782b
...
@@ -35,13 +35,12 @@ if ((NOT LITE_ON_TINY_PUBLISH) AND (LITE_WITH_CUDA OR LITE_WITH_X86 OR ARM_TARGE
...
@@ -35,13 +35,12 @@ if ((NOT LITE_ON_TINY_PUBLISH) AND (LITE_WITH_CUDA OR LITE_WITH_X86 OR ARM_TARGE
NPU_DEPS
${
npu_kernels
}
)
NPU_DEPS
${
npu_kernels
}
)
target_link_libraries
(
paddle_light_api_shared
${
light_lib_DEPS
}
${
arm_kernels
}
${
npu_kernels
}
)
target_link_libraries
(
paddle_light_api_shared
${
light_lib_DEPS
}
${
arm_kernels
}
${
npu_kernels
}
)
set
(
LINK_MAP_FILE
"
${
PADDLE_SOURCE_DIR
}
/lite/core/lite.map"
)
if
(
LITE_WITH_NPU
)
set
(
LINK_FLAGS
"-Wl,--version-script
${
LINK_MAP_FILE
}
"
)
# Strips the symbols of our protobuf functions to fix the conflicts during
add_custom_command
(
OUTPUT
${
LINK_MAP_FILE
}
COMMAND ...
)
# loading HIAI builder libs (libhiai_ir.so and libhiai_ir_build.so)
add_custom_target
(
custom_linker_map DEPENDS
${
LINK_MAP_FILE
}
)
set
(
LINK_FLAGS
"-Wl,--version-script
${
PADDLE_SOURCE_DIR
}
/lite/core/lite.map"
)
set_target_properties
(
paddle_full_api_shared PROPERTIES LINK_FLAGS
${
LINK_FLAGS
}
)
set_target_properties
(
paddle_light_api_shared PROPERTIES LINK_FLAGS
"
${
LINK_FLAGS
}
"
)
add_dependencies
(
paddle_full_api_shared custom_linker_map
)
endif
()
else
()
else
()
if
((
ARM_TARGET_OS STREQUAL
"android"
)
OR
(
ARM_TARGET_OS STREQUAL
"armlinux"
))
if
((
ARM_TARGET_OS STREQUAL
"android"
)
OR
(
ARM_TARGET_OS STREQUAL
"armlinux"
))
add_library
(
paddle_light_api_shared SHARED
""
)
add_library
(
paddle_light_api_shared SHARED
""
)
...
@@ -106,7 +105,7 @@ endif()
...
@@ -106,7 +105,7 @@ endif()
set
(
light_api_deps
set
(
light_api_deps
scope target_wrapper_host model_parser program
)
scope target_wrapper_host model_parser program
)
if
(
LITE_WITH_CUDA
)
if
(
LITE_WITH_CUDA
)
get_property
(
cuda_
static_deps GLOBAL PROPERTY CUDA_STATIC
_MODULES
)
get_property
(
cuda_
deps GLOBAL PROPERTY CUDA
_MODULES
)
set
(
light_api_deps
${
light_api_deps
}
target_wrapper_cuda
)
set
(
light_api_deps
${
light_api_deps
}
target_wrapper_cuda
)
endif
()
endif
()
lite_cc_library
(
light_api SRCS light_api.cc
lite_cc_library
(
light_api SRCS light_api.cc
...
@@ -258,9 +257,10 @@ if (NOT LITE_ON_TINY_PUBLISH)
...
@@ -258,9 +257,10 @@ if (NOT LITE_ON_TINY_PUBLISH)
FPGA_DEPS
${
fpga_kernels
}
)
FPGA_DEPS
${
fpga_kernels
}
)
# The final inference library for just MobileConfig.
# The final inference library for just MobileConfig.
bundle_static_library
(
paddle_api_full paddle_api_full_bundled bundle_full_api
)
bundle_static_library
(
paddle_api_full paddle_api_full_bundled bundle_full_api
)
target_link_libraries
(
paddle_api_full
${
cuda_deps
}
)
get_property
(
fluid_modules GLOBAL PROPERTY FLUID_MODULES
)
get_property
(
fluid_modules GLOBAL PROPERTY FLUID_MODULES
)
cc_library
(
api_full_static SRCS DEPS paddle_api_full cxx_api paddle_api light_api
${
cxx_api_deps
}
${
ops
}
${
host_kernels
}
${
cuda_kernels
}
program tensor memory naive_buffer types
${
fluid_modules
}
protobuf
${
cuda_static_deps
}
)
endif
()
endif
()
bundle_static_library
(
paddle_api_light paddle_api_light_bundled bundle_light_api
)
bundle_static_library
(
paddle_api_light paddle_api_light_bundled bundle_light_api
)
#-----------------------------------------------------------------------------------------------------
#-----------------------------------------------------------------------------------------------------
...
...
lite/backends/cuda/CMakeLists.txt
浏览文件 @
9343782b
if
(
NOT LITE_WITH_CUDA
)
if
(
NOT LITE_WITH_CUDA
)
return
()
return
()
endif
()
endif
()
get_property
(
cuda_
static_deps GLOBAL PROPERTY CUDA_STATIC
_MODULES
)
get_property
(
cuda_
deps GLOBAL PROPERTY CUDA
_MODULES
)
nv_library
(
target_wrapper_cuda SRCS target_wrapper.cc DEPS
${
cuda_
static_
deps
}
)
nv_library
(
target_wrapper_cuda SRCS target_wrapper.cc DEPS
${
cuda_deps
}
)
nv_library
(
cuda_blas SRCS blas.cc DEPS
${
cuda_
static_
deps
}
)
nv_library
(
cuda_blas SRCS blas.cc DEPS
${
cuda_deps
}
)
add_subdirectory
(
math
)
add_subdirectory
(
math
)
lite/core/lite.map
浏览文件 @
9343782b
{
{
global:
global:
*paddle*;
*paddle*;
*touch_*;
*mir_pass_*;
local:
local:
*;
*;
};
};
编辑
预览
Markdown
is supported
0%
请重试
或
添加新附件
.
添加附件
取消
You are about to add
0
people
to the discussion. Proceed with caution.
先完成此消息的编辑!
取消
想要评论请
注册
或
登录