// stream_callback_manager.cc

// Copyright (c) 2018 PaddlePaddle Authors. All Rights Reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

#include "paddle/fluid/platform/stream_callback_manager.h"
#include "paddle/fluid/platform/device/device_wrapper.h"

namespace paddle {
namespace platform {

#ifdef PADDLE_WITH_HIP
static void StreamCallbackFunc(gpuStream_t stream, gpuError_t status,
                               void *user_data)
24 25 26 27
#endif
#ifdef PADDLE_WITH_CUDA
#if CUDA_VERSION >= 10000
    static void CUDART_CB StreamCallbackFunc(void *user_data)
S
fix bug  
sneaxiy 已提交
28
#else
29 30 31 32 33 34 35
    static void CUDART_CB
    StreamCallbackFunc(cudaStream_t stream, cudaError_t status, void *user_data)
#endif
#endif

#if PADDLE_WITH_ASCEND_CL
        static void StreamCallbackFunc(void *user_data)
S
fix bug  
sneaxiy 已提交
36
#endif
F
fwenguang 已提交
37 38 39
#if PADDLE_WITH_MLU
            static void StreamCallbackFunc(void *user_data)
#endif
S
fix bug  
sneaxiy 已提交
40 41 42 43 44
{
  std::unique_ptr<std::function<void()>> func(
      reinterpret_cast<std::function<void()> *>(user_data));
  (*func)();
}
// Creates a manager bound to `stream`.
//
// The stream handle is stored by value; the internal thread pool is
// constructed with the argument 1 (presumably a single worker thread --
// confirm against the ThreadPool declaration).
template <typename Stream>
StreamCallbackManager<Stream>::StreamCallbackManager(const Stream stream)
    : stream_(stream),
      thread_pool_(1) {}
// Schedules `callback` to run after the work currently queued on `stream_`.
//
// Two heap objects are created:
//   * `callback_func` - the user's callback, moved onto the heap;
//   * `func`          - a wrapper that, when the device runtime fires it,
//                       enqueues `callback_func` on `thread_pool_` and records
//                       the resulting future in `last_future_` (under `mtx_`).
// `func` is deleted by StreamCallbackFunc after it runs; `callback_func` is
// deleted by the pool task after the user's callback returns.
//
// Until the wrapper has been handed to the runtime both objects are held by
// unique_ptr guards, so a registration call that fails by throwing no longer
// leaks them.
//
// @param callback  Callable to execute; taken by value and moved from.
template <typename Stream>
void StreamCallbackManager<Stream>::AddCallback(
    std::function<void()> callback) const {
  using Task = std::function<void()>;

  std::unique_ptr<Task> callback_guard(new Task(std::move(callback)));
  Task *callback_func = callback_guard.get();

  std::unique_ptr<Task> func_guard(new Task([this, callback_func] {
    std::lock_guard<std::mutex> lock(mtx_);
    last_future_ = thread_pool_.enqueue([callback_func] {
      // Takes over ownership so the callback is freed once it has run.
      std::unique_ptr<Task> releaser(callback_func);
      (*callback_func)();
    });
  }));
  Task *func = func_guard.get();

#ifdef PADDLE_WITH_HIP
  PADDLE_ENFORCE_GPU_SUCCESS(
      hipStreamAddCallback(stream_, StreamCallbackFunc, func, 0));
#endif
#ifdef PADDLE_WITH_CUDA
#if CUDA_VERSION >= 10000
  PADDLE_ENFORCE_GPU_SUCCESS(
      cudaLaunchHostFunc(stream_, StreamCallbackFunc, func));
#else
  PADDLE_ENFORCE_GPU_SUCCESS(
      cudaStreamAddCallback(stream_, StreamCallbackFunc, func, 0));
#endif
#endif

#ifdef PADDLE_WITH_ASCEND_CL
  VLOG(3) << "aclrtLaunchCallback at stream: " << stream_;
  // TODO(zhiqiu): failed to call aclrtLaunchCallback
  NPULaunchCallback(StreamCallbackFunc, func, ACL_CALLBACK_BLOCK, stream_);
#endif

#ifdef PADDLE_WITH_MLU
  // NOTE(review): nothing consumes `func` on MLU, so the callback is never
  // invoked and both heap objects stay allocated. They are deliberately not
  // destroyed here: destroying the callback early would release whatever it
  // captured before the stream has finished. TODO: confirm and wire up a real
  // host-callback launch for MLU.
  VLOG(3) << "MLULaunchCallback at stream: " << stream_
          << " Failed to call MLULaunchCallback, "
          << "because mlu not support StreamAddCallback yet. "
          << "function: " << func;
#endif

  // Hand-off complete: from here on the runtime callback / pool task own the
  // objects. release() only forgets the pointers and never dereferences them,
  // so it is safe even if the callback has already run and freed them.
  func_guard.release();
  callback_guard.release();
}

// Blocks until the stream has been synchronised and the most recently
// enqueued thread-pool task (if any) has finished.
//
// Step 1 synchronises `stream_` with the back end's own sync call.
// Step 2 waits on `last_future_` while holding `mtx_`, the same mutex the
// callback wrapper takes when it assigns `last_future_`.
template <typename Stream>
void StreamCallbackManager<Stream>::Wait() const {
#if defined(PADDLE_WITH_HIP) || defined(PADDLE_WITH_CUDA)
  platform::GpuStreamSync(stream_);
#endif
#if defined(PADDLE_WITH_MLU)
  PADDLE_ENFORCE_MLU_SUCCESS(cnrtQueueSync(stream_));
#endif
#if defined(PADDLE_WITH_ASCEND_CL)
  NPUStreamSync(stream_);
#endif

  std::lock_guard<std::mutex> guard(mtx_);
  // No task has been recorded yet (or the future was already consumed).
  if (!last_future_.valid()) {
    return;
  }
  last_future_.wait();
}

// Explicit instantiations: the member templates are defined in this
// translation unit, so each enabled back end instantiates the manager for its
// own stream handle type here.
#if defined(PADDLE_WITH_CUDA)
template struct StreamCallbackManager<gpuStream_t>;
#endif

#if defined(PADDLE_WITH_HIP)
template struct StreamCallbackManager<hipStream_t>;
#endif

#if defined(PADDLE_WITH_ASCEND_CL)
template struct StreamCallbackManager<aclrtStream>;
#endif

#if defined(PADDLE_WITH_MLU)
template struct StreamCallbackManager<mluStream>;
#endif
}  // namespace platform
}  // namespace paddle