Add macro guards to exclude NCCL code on Windows (#21422)

Remove NCCL-related code from Windows builds

Add macro guards to exclude NCCL code on Windows (#21422)
Remove NCCL-related code from Windows builds
a6b089c6 · hutuxian · GitHub · ebfb720a · a6b089c6 · a6b089c6
Showing with 15 additions and 1 deletion

paddle/fluid/operators/data_norm_op.cu paddle/fluid/operators/data_norm_op.cu +10 -1

python/paddle/fluid/tests/unittests/test_data_norm_op.py python/paddle/fluid/tests/unittests/test_data_norm_op.py +5 -0

未找到文件。
--- a/paddle/fluid/operators/data_norm_op.cu
+++ b/paddle/fluid/operators/data_norm_op.cu
@@ -16,9 +16,11 @@ limitations under the License. */
 #include <string>
 #include "paddle/fluid/framework/data_layout.h"
 #include "paddle/fluid/operators/data_norm_op.h"
-#include "paddle/fluid/platform/collective_helper.h"
 #include "paddle/fluid/platform/cuda_primitives.h"
+#if defined(PADDLE_WITH_CUDA) && !defined(_WIN32)
+#include "paddle/fluid/platform/collective_helper.h"
 #include "paddle/fluid/platform/nccl_helper.h"
+#endif
 namespace paddle {
 namespace operators {
@@ -176,6 +178,7 @@ class DataNormGradKernel<platform::CUDADeviceContext, T>
        d_batch_sum, d_batch_square_sum);
    if (need_sync_stats) {
+#if defined(PADDLE_WITH_CUDA) && !defined(_WIN32)
      auto comm = platform::NCCLCommContext::Instance().Get(0, ctx.GetPlace());
      PADDLE_ENFORCE_CUDA_SUCCESS(platform::dynload::ncclAllReduce(
          reinterpret_cast<const void *>(d_batch_size),
@@ -194,7 +197,13 @@ class DataNormGradKernel<platform::CUDADeviceContext, T>
        LOG(FATAL) << "Fail to sync nccl stream: "
                   << cudaGetErrorString(e_sync);
      }
+#else
+      PADDLE_THROW(platform::errors::PreconditionNotMet(
+          "PaddlePaddle should compile with GPU, and need_sync_stats connot be "
+          "supported on windows now."));
+#endif
    }
    T *batch_size_data =
        ctx.Output<Tensor>("BatchSize")->mutable_data<T>(ctx.GetPlace());
    T *batch_sum_data =

--- a/python/paddle/fluid/tests/unittests/test_data_norm_op.py
+++ b/python/paddle/fluid/tests/unittests/test_data_norm_op.py
@@ -287,6 +287,11 @@ class TestDataNormOpWithSyncStats(OpTest):
    def test_sync_stats(self):
        if not core.is_compiled_with_cuda():
            return
+        if os.name == 'nt':
+            print(
+                'Skip TestDataNormOpWithSyncStats because nccl is not supported on windows'
+            )
+            return
        x = fluid.layers.data(name='x', shape=[1], dtype='int64', lod_level=0)
        emb = layers.embedding(
            input=x,