// Copyright (c) 2021 PaddlePaddle Authors. All Rights Reserved. // // Licensed under the Apache License, Version 2.0 (the "License"); // you may not use this file except in compliance with the License. // You may obtain a copy of the License at // // http://www.apache.org/licenses/LICENSE-2.0 // // Unless required by applicable law or agreed to in writing, software // distributed under the License is distributed on an "AS IS" BASIS, // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. // See the License for the specific language governing permissions and // limitations under the License. #pragma once #include #include #include #include #include #include #include #include "paddle/fluid/distributed/fleet_executor/interceptor_message.pb.h" #include "paddle/fluid/platform/enforce.h" #include "paddle/fluid/platform/errors.h" #include "paddle/fluid/platform/macros.h" namespace paddle { namespace distributed { class TaskNode; class Interceptor { public: using MsgHandle = std::function; public: Interceptor() = delete; Interceptor(int64_t interceptor_id, TaskNode* node); virtual ~Interceptor(); // register interceptor handle void RegisterMsgHandle(MsgHandle handle); void Handle(const InterceptorMessage& msg); // return the interceptor id int64_t GetInterceptorId() const; // return the conditional var std::condition_variable& GetCondVar(); // Called by Carrier, enqueue an InterceptorMessage to remote mailbox bool EnqueueRemoteInterceptorMessage( const InterceptorMessage& interceptor_message); bool Send(int64_t dst_id, InterceptorMessage& msg); // NOLINT DISABLE_COPY_AND_ASSIGN(Interceptor); protected: TaskNode* GetTaskNode() const { return node_; } private: // pool the local mailbox, parse the Message void PoolTheMailbox(); // fetch all Message from remote mailbox to local mailbox // return true if remote mailbox not empty, otherwise return false bool FetchRemoteMailbox(); // interceptor id, handed from above layer int64_t interceptor_id_; // node need to be handled by this interceptor TaskNode* node_; // interceptor handle which process message MsgHandle handle_{nullptr}; // mutex to control read/write conflict for remote mailbox std::mutex remote_mailbox_mutex_; // interceptor runs PoolTheMailbox() function to poll local mailbox std::thread interceptor_thread_; // conditional variable for blocking the thread when // fetch an empty remote mailbox std::condition_variable cond_var_; // remote mailbox, written by EnqueueRemoteMessage() // read by FetchRemoteMailbox() std::queue remote_mailbox_; // local mailbox, written by FetchRemoteMailbox() // read by PoolTheMailbox() std::queue local_mailbox_; int64_t already_run_times_{0}; int64_t used_slot_nums_{0}; }; class InterceptorFactory { public: using CreateInterceptorFunc = std::unique_ptr (*)(int64_t, TaskNode*); using CreateInterceptorMap = std::unordered_map; static void Register(const std::string& type, CreateInterceptorFunc func); static std::unique_ptr Create(const std::string& type, int64_t id, TaskNode* node); }; template std::unique_ptr CreatorInterceptor(int64_t id, TaskNode* node) { return std::make_unique(id, node); } #define REGISTER_INTERCEPTOR(interceptor_type, interceptor_class) \ class __RegisterInterceptor_##interceptor_type { \ public: \ __RegisterInterceptor_##interceptor_type() { \ InterceptorFactory::Register(#interceptor_type, \ CreatorInterceptor); \ } \ void Touch() {} \ }; \ __RegisterInterceptor_##interceptor_type g_register_##interceptor_type; \ int TouchRegisterInterceptor_##interceptor_type() { \ g_register_##interceptor_type.Touch(); \ return 0; \ } #define USE_INTERCEPTOR(interceptor_type) \ extern int TouchRegisterInterceptor_##interceptor_type(); \ UNUSED static int use_interceptor_##interceptor_type = \ TouchRegisterInterceptor_##interceptor_type(); } // namespace distributed } // namespace paddle