From 1d68850cb22ebcbda1e114ec3d586edb60dcff5e Mon Sep 17 00:00:00 2001 From: Anatoly Baksheev Date: Wed, 10 Oct 2012 22:16:42 +0400 Subject: [PATCH] Added CUDA fast math flag --- CMakeLists.txt | 1 + cmake/OpenCVDetectCUDA.cmake | 8 ++++++++ 2 files changed, 9 insertions(+) diff --git a/CMakeLists.txt b/CMakeLists.txt index 83bea076e6..25bf7c80ff 100644 --- a/CMakeLists.txt +++ b/CMakeLists.txt @@ -768,6 +768,7 @@ if(HAVE_CUDA) status(" Use CUBLAS:" HAVE_CUBLAS THEN YES ELSE NO) status(" NVIDIA GPU arch:" ${OPENCV_CUDA_ARCH_BIN}) status(" NVIDIA PTX archs:" ${OPENCV_CUDA_ARCH_PTX}) + status(" Use fast math:" CUDA_FAST_MATH THEN YES ELSE NO) endif() # ========================== python ========================== diff --git a/cmake/OpenCVDetectCUDA.cmake b/cmake/OpenCVDetectCUDA.cmake index 9b3fcd1f72..a777a466b9 100644 --- a/cmake/OpenCVDetectCUDA.cmake +++ b/cmake/OpenCVDetectCUDA.cmake @@ -78,6 +78,14 @@ if(CUDA_FOUND) set(OpenCV_CUDA_CC "${NVCC_FLAGS_EXTRA}") message(STATUS "CUDA NVCC target flags: ${CUDA_NVCC_FLAGS}") + + OCV_OPTION(CUDA_FAST_MATH "Enable --use_fast_math for CUDA compiler " OFF) + + if(ENABLE_CUDA_MATH) + set(CUDA_NVCC_FLAGS ${CUDA_NVCC_FLAGS} --use_fast_math) + endif() + + mark_as_advanced(CUDA_BUILD_CUBIN CUDA_BUILD_EMULATION CUDA_VERBOSE_BUILD CUDA_SDK_ROOT_DIR) unset(CUDA_npp_LIBRARY CACHE) find_cuda_helper_libs(npp) -- GitLab