/* Copyright (c) 2019 PaddlePaddle Authors. All Rights Reserved. Licensed under the Apache License, Version 2.0 (the "License"); you may not use this file except in compliance with the License. You may obtain a copy of the License at http://www.apache.org/licenses/LICENSE-2.0 Unless required by applicable law or agreed to in writing, software distributed under the License is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the License for the specific language governing permissions and limitations under the License. */ #pragma once #include #include #include #include #include #include #include #include #include #include #include "gflags/gflags.h" #include "paddle/fluid/framework/scope.h" #include "paddle/fluid/framework/variable.h" #include "paddle/fluid/operators/distributed/distributed.h" #include "paddle/fluid/operators/distributed/rpc_client.h" #include "paddle/fluid/operators/distributed/rpc_common.h" #include "paddle/fluid/operators/distributed_ops/send_recv_util.h" #include "paddle/fluid/operators/math/math_function.h" #include "paddle/fluid/operators/math/selected_rows_functor.h" #include "paddle/fluid/platform/device_context.h" #include "paddle/fluid/platform/enforce.h" #include "paddle/fluid/platform/place.h" DECLARE_bool(communicator_is_sgd_optimizer); namespace paddle { namespace operators { namespace distributed { using Scope = framework::Scope; using Variable = framework::Variable; template class BlockingQueue { public: explicit BlockingQueue(size_t capacity) : capacity_(capacity) { PADDLE_ENFORCE_GT(capacity_, 0, "The capacity must be greater than 0."); } bool Push(const T& elem) { { std::unique_lock lock(mutex_); cv_.wait(lock, [&] { return queue_.size() < capacity_; }); PADDLE_ENFORCE_LT(queue_.size(), capacity_); queue_.push_back(elem); } cv_.notify_one(); return true; } bool Push(T&& elem) { { std::unique_lock lock(mutex_); cv_.wait(lock, [&] { return queue_.size() < capacity_; }); PADDLE_ENFORCE_LT(queue_.size(), capacity_); queue_.emplace_back(std::move(elem)); } cv_.notify_one(); return true; } T Pop() { std::unique_lock lock(mutex_); cv_.wait(lock, [=] { return !queue_.empty(); }); T rc(std::move(queue_.front())); queue_.pop_front(); cv_.notify_one(); return rc; } size_t Cap() const { std::lock_guard lock(mutex_); return capacity_; } size_t Size() const { std::lock_guard lock(mutex_); return queue_.size(); } private: const size_t capacity_; std::deque queue_; mutable std::mutex mutex_; std::condition_variable cv_; }; template using EigenVector = framework::EigenVector; template inline void MergeVars(const std::string& var_name, const std::vector>& vars, Scope* scope, bool merge_add = true) { PADDLE_ENFORCE(!vars.empty(), "should have value to merge!"); auto cpu_place = platform::CPUPlace(); auto& var0 = vars[0]; auto* out_var = scope->Var(var_name); if (var0->IsType()) { auto dims = var0->Get().dims(); VLOG(3) << "merge " << var_name << " LoDTensor dims " << dims << "; merge add: " << merge_add; // init output tensor auto* out_t = out_var->GetMutable(); out_t->mutable_data(dims, cpu_place); // check the input dims for (auto& var : vars) { auto& var_t = var->Get(); PADDLE_ENFORCE_EQ(var_t.dims(), dims, "should have the same dims"); } // set output tensor to 0. auto cpu_ctx = paddle::platform::CPUDeviceContext(); math::SetConstant constant_functor; constant_functor(cpu_ctx, out_t, static_cast(0)); // sum all vars to out auto result = EigenVector::Flatten(*out_t); for (auto& var : vars) { auto& in_t = var->Get(); auto in = EigenVector::Flatten(in_t); result.device(*cpu_ctx.eigen_device()) = result + in; } if (!merge_add) { result.device(*cpu_ctx.eigen_device()) = result / static_cast(vars.size()); } } else if (var0->IsType()) { auto& slr0 = var0->Get(); auto* out_slr = out_var->GetMutable(); out_slr->mutable_rows()->clear(); out_slr->mutable_value()->mutable_data({{}}, cpu_place); std::vector inputs; inputs.reserve(vars.size()); for (auto& var : vars) { inputs.push_back(&var->Get()); } auto dev_ctx = paddle::platform::CPUDeviceContext(); if (merge_add) { math::scatter::MergeAdd merge_add; merge_add(dev_ctx, inputs, out_slr); } else { math::scatter::MergeAverage merge_average; merge_average(dev_ctx, inputs, out_slr); } VLOG(3) << "merge " << var_name << " SelectedRows height: " << slr0.height() << " dims: " << slr0.value().dims() << "; merge add: " << merge_add; } else { PADDLE_THROW("unsupported var type!"); } } using RpcCtxMap = std::unordered_map; class Communicator { public: Communicator(); explicit Communicator(const std::map& env_flags); virtual ~Communicator() {} virtual void SetEnvFlagsDefault(); virtual void Start() = 0; virtual void Stop() = 0; virtual bool IsRunning() { return running_; } virtual void Send(const std::string& var_name, const framework::Scope& scope) = 0; virtual void Send(const std::vector& sparse_var_names, const std::vector& sparse_var_tables, const framework::Scope& scope) = 0; virtual void Recv() = 0; virtual void InitImpl(const RpcCtxMap& send_varname_to_ctx, const RpcCtxMap& recv_varname_to_ctx, Scope* recv_scope) = 0; virtual void InitImpl(const paddle::framework::ProgramDesc& program, Scope* recv_scope) = 0; // for geo-sgd virtual void InitImpl( const paddle::framework::ProgramDesc& program, Scope* param_scope, std::map>>& vars_info, const int& trainers, const int& geo_need_push_nums) = 0; static Communicator* GetInstance() { return communicator_.get(); } static std::shared_ptr GetInstantcePtr() { return communicator_; } template static Communicator* InitInstance(const RpcCtxMap& send_varname_to_ctx, const RpcCtxMap& recv_varname_to_ctx, Scope* recv_scope) { std::call_once(init_flag_, &Communicator::InitWithRpcCtx, send_varname_to_ctx, recv_varname_to_ctx, recv_scope); return communicator_.get(); } template static Communicator* InitInstance( const paddle::framework::ProgramDesc& program, Scope* recv_scope, const std::map& env_flags) { std::call_once(init_flag_, &Communicator::InitWithProgram, program, recv_scope, std::ref(env_flags)); return communicator_.get(); } template static Communicator* InitInstance( const paddle::framework::ProgramDesc& program, Scope* training_scope, std::map>>& vars_info, const int& trainers, const int& geo_need_push_nums, const std::map& env_flags) { std::call_once(init_flag_, &Communicator::InitWithTranspilerInfo, program, training_scope, std::ref(vars_info), std::ref(trainers), std::ref(geo_need_push_nums), std::ref(env_flags)); return communicator_.get(); } // Init is called by InitInstance. template static void InitWithRpcCtx(const RpcCtxMap& send_varname_to_ctx, const RpcCtxMap& recv_varname_to_ctx, Scope* recv_scope) { if (communicator_.get() == nullptr) { communicator_.reset(new T()); communicator_->InitImpl(send_varname_to_ctx, recv_varname_to_ctx, recv_scope); } } template static void InitWithProgram(const paddle::framework::ProgramDesc& program, Scope* recv_scope, const std::map& env_flags) { if (communicator_.get() == nullptr) { communicator_.reset(new T(std::ref(env_flags))); communicator_->InitImpl(program, recv_scope); } } template static void InitWithTranspilerInfo( const paddle::framework::ProgramDesc& program, Scope* training_scope, std::map>>& vars_info, const int& trainers, const int& geo_need_push_nums, const std::map& env_flags) { if (communicator_.get() == nullptr) { communicator_.reset(new T(std::ref(env_flags))); communicator_->InitImpl(program, training_scope, std::ref(vars_info), std::ref(trainers), std::ref(geo_need_push_nums)); } } protected: bool running_ = false; static std::shared_ptr communicator_; static std::once_flag init_flag_; std::unordered_map env_flags_dict; }; using SparseIdsMap = std::unordered_map>>; class AsyncCommunicator : public Communicator { public: AsyncCommunicator() : Communicator() {} explicit AsyncCommunicator(const std::map& env_flags) : Communicator(env_flags) {} ~AsyncCommunicator(); void Start() override; void Stop() override; void Send(const std::string& var_name, const framework::Scope& scope) override; void Recv() override; void RecvAll(); void InitImpl(const RpcCtxMap& send_varname_to_ctx, const RpcCtxMap& recv_varname_to_ctx, Scope* recv_scope) override; void InitImpl(const paddle::framework::ProgramDesc& program, Scope* recv_scope) override; void SendThread(); void RecvThread(); void Send(const std::vector& sparse_var_names, const std::vector& sparse_var_tables, const framework::Scope& scope) override; void InitImpl( const paddle::framework::ProgramDesc& program, Scope* param_scope, std::map>>& vars_info, const int& trainers, const int& geo_need_push_nums) override; private: std::unordered_map>>> send_varname_to_queue_; RpcCtxMap send_varname_to_ctx_; RpcCtxMap recv_varname_to_ctx_; std::unique_ptr send_thread_{nullptr}; std::unique_ptr recv_thread_{nullptr}; Scope* recv_scope_; // should be global scope std::unique_ptr send_scope_; // an independent scope std::unique_ptr<::ThreadPool> send_threadpool_{nullptr}; std::unique_ptr<::ThreadPool> recv_threadpool_{nullptr}; std::atomic_uint grad_num_{0}; // the num of gradient sent since last recv }; class GeoSgdCommunicator : public Communicator { public: GeoSgdCommunicator() : Communicator() {} explicit GeoSgdCommunicator(const std::map& env_flags) : Communicator(env_flags) {} ~GeoSgdCommunicator(); void InitImpl( const paddle::framework::ProgramDesc& program, Scope* training_scope, std::map>>& vars_info, const int& trainers, const int& geo_need_push_nums) override; void Start() override; void Stop() override; void Send(const std::string& var_name, const framework::Scope& scope) override; void Send(const std::vector& sparse_var_names, const std::vector& sparse_var_tables, const framework::Scope& scope) override; void Recv() override; void InitImpl(const RpcCtxMap& send_varname_to_ctx, const RpcCtxMap& recv_varname_to_ctx, Scope* recv_scope) override; void InitImpl(const paddle::framework::ProgramDesc& program, Scope* recv_scope) override; private: void SendThread(); std::unordered_set SparseIdsMerge( const std::vector& ids_send_vec, const std::string& var_name, const std::string& splited_var_name); void SendUpdateDenseVars(const std::string& var_name, const std::string& splited_var_name); void SendUpdateSparseVars(const std::string& var_name, const std::string& splited_var_name, const std::unordered_set& ids_table); void RecvUpdateDenseVars(const std::string& var_name, const std::string& splited_var_name); void RecvUpdateSparseVars(const std::string& var_name, const std::string& splited_var_name); void GeoSgdDenseParamInit(framework::Scope* scope_x, framework::Scope* scope_y, const std::string var_name); void GeoSgdSparseParamInit(framework::Scope* scope_x, framework::Scope* scope_y, const std::string var_name); void RpcSend(const std::string& origin_var_name, const std::string& splited_var_name, const size_t& splited_var_index); void RpcRecv(const std::string& origin_var_name, const std::string& splited_var_name, const size_t& splited_var_index); const std::string VarToDeltaVar(const std::string var_name) { std::string delta_name = var_name; const std::string send_name = delta_name.append(".delta"); return send_name; } const std::string DeltaVarToVar(const std::string var_name) { std::string origin_name = var_name; origin_name.erase(origin_name.find(".delta"), 6); const std::string param_name = origin_name; return param_name; } size_t GetSplitedVarIndex(const std::string var_name, const std::string splited_var_name) { size_t index = 0; for (size_t i = 0; i < send_varname_to_ctx_[var_name].splited_var_names.size(); i++) { if (send_varname_to_ctx_[var_name].splited_var_names[i] == splited_var_name) { index = i; break; } } return index; } private: int trainer_nums_ = 1; size_t geo_need_push_nums_ = 100; bool is_geo_sgd_ = false; int send_var_nums_ = 0; RpcCtxMap send_varname_to_ctx_; RpcCtxMap recv_varname_to_ctx_; // parameter for local training Scope* training_scope_; // parameter for delta calc and send std::shared_ptr delta_scope_; // parameter for storage the pserver param after last recv std::shared_ptr old_scope_; // parameter on pserver std::shared_ptr pserver_scope_; // if var is sparse, using selected rows, bool=true std::unordered_map var_list_; std::shared_ptr>> need_push_queue_; std::vector ids_send_vec_; std::unordered_map> absolute_section_; std::unordered_map vars_first_dimension_; std::unique_ptr<::ThreadPool> send_threadpool_{nullptr}; std::unique_ptr send_thread_{nullptr}; size_t need_thread_nums_{0}; }; } // namespace distributed } // namespace operators } // namespace paddle