// Copyright (c) 2018 PaddlePaddle Authors. All Rights Reserved. // // Licensed under the Apache License, Version 2.0 (the "License"); // you may not use this file except in compliance with the License. // You may obtain a copy of the License at // // http://www.apache.org/licenses/LICENSE-2.0 // // Unless required by applicable law or agreed to in writing, software // distributed under the License is distributed on an "AS IS" BASIS, // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. // See the License for the specific language governing permissions and // limitations under the License. #pragma once #include #include #include #include #include "ThreadPool.h" #include "paddle/fluid/platform/enforce.h" namespace paddle { namespace platform { using StreamCallback = std::function; class StreamCallbackManager; struct StreamCallbackContext { template inline StreamCallbackContext(const StreamCallbackManager *manager, Callback &&callback) : manager_(manager), callback_(callback) {} const StreamCallbackManager *manager_; // do not own StreamCallback callback_; }; class StreamCallbackManager { public: explicit inline StreamCallbackManager(cudaStream_t stream = nullptr) : stream_(stream), thread_pool_(new ThreadPool(1)) {} template inline void AddCallback(Callback &&callback) const { AddCallbackWithStreamAndErrorInfo( [=](cudaStream_t, cudaError_t) { callback(); }); } template inline void AddCallbackWithStreamAndErrorInfo(Callback &&callback) const { auto *stream_callback_context = new StreamCallbackContext(this, callback); PADDLE_ENFORCE(cudaStreamAddCallback( stream_, StreamCallbackManager::StreamCallbackFunc, stream_callback_context, 0)); } void Wait() const { thread_pool_.reset(new ThreadPool(1)); } private: const cudaStream_t stream_; mutable std::unique_ptr thread_pool_; // cudaStreamCallback cannot call CUDA API inside, so we have to use // thread_pool here static void CUDART_CB StreamCallbackFunc(cudaStream_t stream, cudaError_t status, void *user_data) { auto *callback_context_ptr = reinterpret_cast(user_data); callback_context_ptr->manager_->thread_pool_->enqueue([=]() { std::unique_ptr callback_context( callback_context_ptr); callback_context->callback_(stream, status); }); } }; } // namespace platform } // namespace paddle