fix ln (#41918)

771a4144 · sneaxiy · GitHub · 6bd39b5e · 771a4144
隐藏空白更改
内联并排

Showing with 4 addition and 2 deletion

paddle/fluid/operators/layer_norm_kernel.cu.h paddle/fluid/operators/layer_norm_kernel.cu.h +4 -2

未找到文件。
--- a/paddle/fluid/operators/layer_norm_kernel.cu.h
+++ b/paddle/fluid/operators/layer_norm_kernel.cu.h
@@ -130,7 +130,9 @@ __forceinline__ __device__ U BlockReduceSum(U val, U *shared) {
                                            ##__VA_ARGS__)

 static __device__ __forceinline__ float real_sqrt(float x) { return sqrtf(x); }
-static __device__ __forceinline__ double real_sqrt(double x) { return sqrt(x); }
+static __device__ __forceinline__ double real_sqrt(double x) {
+  return ::sqrt(x);
+}

 template <typename T>
 struct PairForLayerNorm {
@@ -162,7 +164,7 @@ __inline__ __device__ float rsqrt_(const float val) {

 template <>
 __inline__ __device__ double rsqrt_(const double val) {
-  return rsqrt(val);
+  return ::rsqrt(val);
 }

 #if CUDA_ARCH_FP16_SUPPORTED(__CUDA_ARCH__)