未验证 提交 95575579 编写于 作者: B Bruno 提交者: GitHub

Use parentheses around min and max to enable Windows build (#449)

* Towards Windows build

* formatting
Co-authored-by: Bruno Cabral <bruno@potelo.com.br>
Co-authored-by: Jeff Rasley <jerasley@microsoft.com>
Co-authored-by: Olatunji Ruwase <olruwase@microsoft.com>
上级 7b8be2a7
......@@ -33,8 +33,8 @@
inline int DS_GET_BLOCKS(const int N)
{
return std::max(
std::min((N + DS_CUDA_NUM_THREADS - 1) / DS_CUDA_NUM_THREADS, DS_MAXIMUM_NUM_BLOCKS),
return (std::max)(
(std::min)((N + DS_CUDA_NUM_THREADS - 1) / DS_CUDA_NUM_THREADS, DS_MAXIMUM_NUM_BLOCKS),
// Use at least 1 block, since CUDA does not allow empty block
1);
}
......
......@@ -97,7 +97,7 @@ public:
template <typename Func>
int Run(int loops, Func f)
{
float fast_latency = std::numeric_limits<float>::max();
float fast_latency = (std::numeric_limits<float>::max)();
int fast_algo = 0;
for (int algo = (int)CUBLAS_GEMM_DEFAULT_TENSOR_OP;
......@@ -252,7 +252,7 @@ public:
template <typename Func>
int Run(int loops, Func f)
{
float fast_latency = std::numeric_limits<float>::max();
float fast_latency = (std::numeric_limits<float>::max)();
int fast_algo = 0;
for (int algo = (int)CUBLAS_GEMM_DEFAULT_TENSOR_OP;
......
......@@ -27,8 +27,8 @@ size_t get_workspace_size(int maxBatchSize,
{
size_t workSpacesize = 4 * (size_t(maxBatchSize) * seq_len * hidden_size);
if (training) {
workSpacesize += (std::max((size_t(maxBatchSize) * seq_len * intermediate_size),
2 * (size_t(maxBatchSize) * heads * seq_len * seq_len)));
workSpacesize += ((std::max)((size_t(maxBatchSize) * seq_len * intermediate_size),
2 * (size_t(maxBatchSize) * heads * seq_len * seq_len)));
if (gelu_checkpoint) workSpacesize += 2 * (size_t(maxBatchSize) * seq_len * hidden_size);
}
return workSpacesize * sizeof(T);
......
Markdown is supported
0% .
You are about to add 0 people to the discussion. Proceed with caution.
先完成此消息的编辑!
想要评论请 注册