grpc_server.h 4.1 KB
Newer Older
1
/* Copyright (c) 2016 PaddlePaddle Authors. All Rights Reserved.
G
gongweibao 已提交
2 3 4 5 6 7 8 9 10 11 12 13 14 15 16

Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

    http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License. */

#pragma once

Y
Yi Wang 已提交
17 18 19
#include <string>
#include <thread>  // NOLINT
#include <utility>
20

Y
Yi Wang 已提交
21
#include "grpc++/grpc++.h"
T
typhoonzero 已提交
22
#include "paddle/fluid/framework/blocking_queue.h"
23
#include "paddle/fluid/framework/executor.h"
Y
Yi Wang 已提交
24
#include "paddle/fluid/framework/lod_tensor.h"
25
#include "paddle/fluid/framework/program_desc.h"
Y
Yi Wang 已提交
26 27 28
#include "paddle/fluid/framework/scope.h"
#include "paddle/fluid/framework/selected_rows.h"
#include "paddle/fluid/framework/var_type.h"
T
update  
typhoonzero 已提交
29
#include "paddle/fluid/operators/detail/grpc_service.h"
Y
Yi Wang 已提交
30 31
#include "paddle/fluid/operators/detail/send_recv.grpc.pb.h"
#include "paddle/fluid/operators/detail/send_recv.pb.h"
Y
yi.wu 已提交
32
#include "paddle/fluid/operators/detail/sendrecvop_utils.h"
G
gongweibao 已提交
33 34 35 36 37

namespace paddle {
namespace operators {
namespace detail {

38 39
// One received item: a string key together with a shared handle to the
// VariableResponse. The handle may be null (see AsyncGRPCServer::Push).
using ReceivedMessage =
    std::pair<std::string, std::shared_ptr<VariableResponse>>;
T
typhoonzero 已提交
40
// Blocking queue whose elements are ReceivedMessage pairs.
using ReceivedQueue = framework::BlockingQueue<ReceivedMessage>;
41

G
gongweibao 已提交
42 43 44
// Forward declaration only; the definition is not part of this header.
class RequestBase;

// A string paired with a sendrecv::VariableMessage (presumably the variable
// name, judging by the alias name).
using MessageWithName = std::pair<std::string, sendrecv::VariableMessage>;

45
class AsyncGRPCServer final {
G
gongweibao 已提交
46
 public:
Q
qiaolongfei 已提交
47
  explicit AsyncGRPCServer(const std::string &address, bool sync_mode)
T
wip  
typhoonzero 已提交
48
      : address_(address), sync_mode_(sync_mode), ready_(0) {}
G
gongweibao 已提交
49

T
typhoonzero 已提交
50
  ~AsyncGRPCServer() {}
T
done  
typhoonzero 已提交
51
  void WaitServerReady();
G
gongweibao 已提交
52 53
  void RunSyncUpdate();

T
typhoonzero 已提交
54
  // functions to sync server barrier status.
T
typhoonzero 已提交
55 56
  void WaitCond(int cond);
  void SetCond(int cond);
T
typhoonzero 已提交
57
  void WaitClientGet(int count);
G
gongweibao 已提交
58 59 60

  void SetScope(framework::Scope *scope) { scope_ = scope; }

Y
Yancey1989 已提交
61 62
  void SetDevCtx(const platform::DeviceContext *dev_ctx) { dev_ctx_ = dev_ctx; }

63 64 65 66
  void SetProgram(framework::ProgramDesc *program) { program_ = program; }

  void SetExecutor(framework::Executor *executor) { executor_ = executor; }

X
Xin Pan 已提交
67 68 69
  void SetPrefetchPreparedCtx(
      std::unique_ptr<framework::ExecutorPrepareContext> prepared) {
    prefetch_ctx_.reset(prepared.release());
Y
Yancey1989 已提交
70 71
  }

Q
qiaolongfei 已提交
72
  int GetSelectedPort() const { return selected_port_; }
T
typhoonzero 已提交
73

74
  const ReceivedMessage Get() { return this->var_recv_queue_.Pop(); }
G
gongweibao 已提交
75

76 77 78
  void Push(const std::string &msg_name) {
    this->var_recv_queue_.Push(std::make_pair(msg_name, nullptr));
  }
G
gongweibao 已提交
79 80 81 82

  void ShutDown();

 protected:
Y
Yi Wang 已提交
83 84
  void HandleRequest(::grpc::ServerCompletionQueue *cq,
                     const std::string &cq_name,
G
gongweibao 已提交
85 86 87
                     std::function<void()> TryToRegisterNewOne);
  void TryToRegisterNewSendOne();
  void TryToRegisterNewGetOne();
88
  void TryToRegisterNewPrefetchOne();
G
gongweibao 已提交
89 90 91 92 93
  void ShutdownQueue();

 private:
  std::mutex cq_mutex_;
  volatile bool is_shut_down_ = false;
94 95
  std::unique_ptr<::grpc::ServerCompletionQueue> cq_send_;
  std::unique_ptr<::grpc::ServerCompletionQueue> cq_get_;
96
  std::unique_ptr<::grpc::ServerCompletionQueue> cq_prefetch_;
G
gongweibao 已提交
97

98 99
  GrpcService::AsyncService service_;
  std::unique_ptr<::grpc::Server> server_;
G
gongweibao 已提交
100 101

  std::string address_;
Q
qiaolongfei 已提交
102
  const bool sync_mode_;
G
gongweibao 已提交
103
  framework::Scope *scope_;
Y
Yancey1989 已提交
104
  const platform::DeviceContext *dev_ctx_;
105

G
gongweibao 已提交
106
  // received variable from RPC, operators fetch variable from this queue.
T
typhoonzero 已提交
107
  framework::BlockingQueue<MessageWithName> var_get_queue_;
Q
qiaolongfei 已提交
108
  // client send variable to this queue.
109
  ReceivedQueue var_recv_queue_;
G
gongweibao 已提交
110 111

  // condition of the sub program
T
typhoonzero 已提交
112 113 114
  std::mutex barrier_mutex_;
  mutable int barrier_cond_step_;
  std::condition_variable barrier_condition_;
G
gongweibao 已提交
115 116 117

  std::unique_ptr<std::thread> t_send_;
  std::unique_ptr<std::thread> t_get_;
118 119
  std::unique_ptr<std::thread> t_prefetch_;

X
Xin Pan 已提交
120
  std::unique_ptr<framework::ExecutorPrepareContext> prefetch_ctx_;
121 122
  framework::ProgramDesc *program_;
  framework::Executor *executor_;
T
typhoonzero 已提交
123
  int selected_port_;
T
wip  
typhoonzero 已提交
124

T
done  
typhoonzero 已提交
125
  std::mutex mutex_ready_;
T
wip  
typhoonzero 已提交
126 127
  std::condition_variable condition_ready_;
  int ready_;
G
gongweibao 已提交
128 129 130 131 132
};

}  // namespace detail
}  // namespace operators
}  // namespace paddle