/* Copyright (c) 2016 PaddlePaddle Authors. All Rights Reserved.

Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

    http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License. */

#pragma once

Y
Yi Wang 已提交
17 18 19
#include <atomic>
#include <condition_variable>  // NOLINT
#include <functional>
#include <memory>
#include <mutex>  // NOLINT
#include <string>
#include <thread>  // NOLINT
#include <utility>
X
Xin Pan 已提交
20
#include <vector>
21

Y
Yi Wang 已提交
22
#include "grpc++/grpc++.h"
T
typhoonzero 已提交
23
#include "paddle/fluid/framework/blocking_queue.h"
24
#include "paddle/fluid/framework/executor.h"
Y
Yi Wang 已提交
25
#include "paddle/fluid/framework/lod_tensor.h"
26
#include "paddle/fluid/framework/program_desc.h"
Y
Yi Wang 已提交
27 28 29
#include "paddle/fluid/framework/scope.h"
#include "paddle/fluid/framework/selected_rows.h"
#include "paddle/fluid/framework/var_type.h"
T
update  
typhoonzero 已提交
30
#include "paddle/fluid/operators/detail/grpc_service.h"
Y
Yi Wang 已提交
31 32
#include "paddle/fluid/operators/detail/send_recv.grpc.pb.h"
#include "paddle/fluid/operators/detail/send_recv.pb.h"
Y
yi.wu 已提交
33
#include "paddle/fluid/operators/detail/sendrecvop_utils.h"
X
Xin Pan 已提交
34
#include "paddle/fluid/platform/profiler.h"
G
gongweibao 已提交
35 36 37 38 39

namespace paddle {
namespace operators {
namespace detail {

40 41
typedef std::pair<std::string, std::shared_ptr<VariableResponse>>
    ReceivedMessage;
T
typhoonzero 已提交
42
typedef framework::BlockingQueue<ReceivedMessage> ReceivedQueue;
43

G
gongweibao 已提交
44 45 46
typedef std::pair<std::string, sendrecv::VariableMessage> MessageWithName;
class RequestBase;

47
class AsyncGRPCServer final {
G
gongweibao 已提交
48
 public:
Q
qiaolongfei 已提交
49
  explicit AsyncGRPCServer(const std::string &address, bool sync_mode)
T
wip  
typhoonzero 已提交
50
      : address_(address), sync_mode_(sync_mode), ready_(0) {}
G
gongweibao 已提交
51

T
typhoonzero 已提交
52
  ~AsyncGRPCServer() {}
T
done  
typhoonzero 已提交
53
  void WaitServerReady();
G
gongweibao 已提交
54 55
  void RunSyncUpdate();

T
typhoonzero 已提交
56
  // functions to sync server barrier status.
T
typhoonzero 已提交
57 58
  void WaitCond(int cond);
  void SetCond(int cond);
T
typhoonzero 已提交
59
  void WaitClientGet(int count);
G
gongweibao 已提交
60 61 62

  void SetScope(framework::Scope *scope) { scope_ = scope; }

Y
Yancey1989 已提交
63 64
  void SetDevCtx(const platform::DeviceContext *dev_ctx) { dev_ctx_ = dev_ctx; }

65 66 67 68
  void SetProgram(framework::ProgramDesc *program) { program_ = program; }

  void SetExecutor(framework::Executor *executor) { executor_ = executor; }

X
Xin Pan 已提交
69 70 71
  void SetPrefetchPreparedCtx(
      std::unique_ptr<framework::ExecutorPrepareContext> prepared) {
    prefetch_ctx_.reset(prepared.release());
Y
Yancey1989 已提交
72 73
  }

Q
qiaolongfei 已提交
74
  int GetSelectedPort() const { return selected_port_; }
T
typhoonzero 已提交
75

76
  const ReceivedMessage Get() { return this->var_recv_queue_.Pop(); }
G
gongweibao 已提交
77

78 79 80
  void Push(const std::string &msg_name) {
    this->var_recv_queue_.Push(std::make_pair(msg_name, nullptr));
  }
G
gongweibao 已提交
81 82 83 84

  void ShutDown();

 protected:
Y
Yi Wang 已提交
85 86
  void HandleRequest(::grpc::ServerCompletionQueue *cq,
                     const std::string &cq_name,
X
Xin Pan 已提交
87 88 89 90
                     std::function<void(int)> TryToRegisterNewOne);
  void TryToRegisterNewSendOne(int i);
  void TryToRegisterNewGetOne(int i);
  void TryToRegisterNewPrefetchOne(int i);
G
gongweibao 已提交
91 92 93
  void ShutdownQueue();

 private:
X
Xin Pan 已提交
94 95
  static const int kSendReqsBufSize = 100;
  static const int kGetReqsBufSize = 100;
X
Xin Pan 已提交
96
  static const int kPrefetchReqsBufSize = 10;
X
Xin Pan 已提交
97

G
gongweibao 已提交
98 99
  std::mutex cq_mutex_;
  volatile bool is_shut_down_ = false;
100 101
  std::unique_ptr<::grpc::ServerCompletionQueue> cq_send_;
  std::unique_ptr<::grpc::ServerCompletionQueue> cq_get_;
102
  std::unique_ptr<::grpc::ServerCompletionQueue> cq_prefetch_;
G
gongweibao 已提交
103

X
Xin Pan 已提交
104 105
  RequestBase *send_reqs_[kSendReqsBufSize];
  RequestBase *get_reqs_[kGetReqsBufSize];
X
Xin Pan 已提交
106
  RequestBase *prefetch_reqs_[kPrefetchReqsBufSize];
X
Xin Pan 已提交
107

108 109
  GrpcService::AsyncService service_;
  std::unique_ptr<::grpc::Server> server_;
G
gongweibao 已提交
110 111

  std::string address_;
Q
qiaolongfei 已提交
112
  const bool sync_mode_;
G
gongweibao 已提交
113
  framework::Scope *scope_;
Y
Yancey1989 已提交
114
  const platform::DeviceContext *dev_ctx_;
115

G
gongweibao 已提交
116
  // received variable from RPC, operators fetch variable from this queue.
T
typhoonzero 已提交
117
  framework::BlockingQueue<MessageWithName> var_get_queue_;
Q
qiaolongfei 已提交
118
  // client send variable to this queue.
119
  ReceivedQueue var_recv_queue_;
G
gongweibao 已提交
120 121

  // condition of the sub program
T
typhoonzero 已提交
122 123 124
  std::mutex barrier_mutex_;
  mutable int barrier_cond_step_;
  std::condition_variable barrier_condition_;
G
gongweibao 已提交
125

X
Xin Pan 已提交
126 127
  std::vector<std::unique_ptr<std::thread>> t_sends_;
  std::vector<std::unique_ptr<std::thread>> t_gets_;
X
Xin Pan 已提交
128
  std::vector<std::unique_ptr<std::thread>> t_prefetchs_;
X
Xin Pan 已提交
129

130 131
  std::unique_ptr<std::thread> t_prefetch_;

X
Xin Pan 已提交
132
  std::unique_ptr<framework::ExecutorPrepareContext> prefetch_ctx_;
133 134
  framework::ProgramDesc *program_;
  framework::Executor *executor_;
T
typhoonzero 已提交
135
  int selected_port_;
T
wip  
typhoonzero 已提交
136

T
done  
typhoonzero 已提交
137
  std::mutex mutex_ready_;
T
wip  
typhoonzero 已提交
138 139
  std::condition_variable condition_ready_;
  int ready_;
G
gongweibao 已提交
140 141 142 143 144
};

};  // namespace detail
};  // namespace operators
};  // namespace paddle