Merge pull request #15 from stoneyang/hl_device_func

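Fixed a build failure caused by a duplicate definition of the double-precision atomicAdd(double*, double) when compiling for GPUs of compute capability 6.0 and newer, where CUDA already provides this overload natively.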

Merge pull request #15 from stoneyang/hl_device_func
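Fixed a build failure caused by a duplicate definition of the double-precision atomicAdd(double*, double) when compiling for GPUs of compute capability 6.0 and newer, where CUDA already provides this overload natively.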
f2b84d54 · liaogang · GitHub · df826899 · f2aa2747 · f2b84d54
显示空白变更内容
内联并排

Showing 1 changed file with 4 additions and 0 deletions

paddle/cuda/include/hl_device_functions.cuh +4 -0

未找到文件。
--- a/paddle/cuda/include/hl_device_functions.cuh
+++ b/paddle/cuda/include/hl_device_functions.cuh
@@ -16,6 +16,8 @@ limitations under the License. */
 #ifndef HL_DEVICE_FUNCTIONS_CUH_
 #define HL_DEVICE_FUNCTIONS_CUH_
+#if defined(__CUDA_ARCH__) && __CUDA_ARCH__ < 600
 namespace hppl {
 static __inline__ __device__ double atomicAdd(double* address, double val) {
@@ -38,4 +40,6 @@ static __inline__ __device__ double atomicAdd(double* address, double val) {
 using hppl::atomicAdd;
+#endif
 #endif /* HL_DEVICE_FUNCTIONS_CUH_ */