grpc_server.h 4.0 KB
Newer Older
1
/* Copyright (c) 2016 PaddlePaddle Authors. All Rights Reserved.

Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

    http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License. */

#pragma once

Y
Yi Wang 已提交
17 18 19
#include <atomic>
#include <condition_variable>  // NOLINT
#include <functional>
#include <memory>
#include <mutex>  // NOLINT
#include <string>
#include <thread>  // NOLINT
#include <utility>
20

Y
Yi Wang 已提交
21
#include "grpc++/grpc++.h"
22
#include "paddle/fluid/framework/executor.h"
Y
Yi Wang 已提交
23
#include "paddle/fluid/framework/lod_tensor.h"
24
#include "paddle/fluid/framework/program_desc.h"
Y
Yi Wang 已提交
25 26 27
#include "paddle/fluid/framework/scope.h"
#include "paddle/fluid/framework/selected_rows.h"
#include "paddle/fluid/framework/var_type.h"
T
update  
typhoonzero 已提交
28
#include "paddle/fluid/operators/detail/grpc_service.h"
Y
Yi Wang 已提交
29 30
#include "paddle/fluid/operators/detail/send_recv.grpc.pb.h"
#include "paddle/fluid/operators/detail/send_recv.pb.h"
Y
yi.wu 已提交
31
#include "paddle/fluid/operators/detail/sendrecvop_utils.h"
Y
update  
yi.wu 已提交
32
#include "paddle/fluid/operators/detail/simple_block_queue.h"
G
gongweibao 已提交
33 34 35 36 37

namespace paddle {
namespace operators {
namespace detail {

38 39 40 41
// A string paired with a shared VariableResponse.
using ReceivedMessage =
    std::pair<std::string, std::shared_ptr<VariableResponse>>;
// SimpleBlockQueue specialised for ReceivedMessage elements.
using ReceivedQueue = SimpleBlockQueue<ReceivedMessage>;

G
gongweibao 已提交
42 43 44
// A string paired with a sendrecv::VariableMessage.
using MessageWithName = std::pair<std::string, sendrecv::VariableMessage>;
// Forward declaration only; the definition lives elsewhere.
class RequestBase;

45
class AsyncGRPCServer final {
G
gongweibao 已提交
46
 public:
Y
Yancey1989 已提交
47
  explicit AsyncGRPCServer(const std::string &address) : address_(address) {}
G
gongweibao 已提交
48 49 50

  void RunSyncUpdate();

T
typhoonzero 已提交
51
  // functions to sync server barrier status.
T
typhoonzero 已提交
52 53
  void WaitCond(int cond);
  void SetCond(int cond);
T
typhoonzero 已提交
54
  void WaitClientGet(int count);
G
gongweibao 已提交
55 56 57

  void SetScope(framework::Scope *scope) { scope_ = scope; }

Y
Yancey1989 已提交
58 59
  void SetDevCtx(const platform::DeviceContext *dev_ctx) { dev_ctx_ = dev_ctx; }

60 61 62 63 64 65
  void SetProgram(framework::ProgramDesc *program) { program_ = program; }

  void SetPrefetchBlkdId(int blkid) { prefetch_blk_id_ = blkid; }

  void SetExecutor(framework::Executor *executor) { executor_ = executor; }

Y
Yancey1989 已提交
66 67 68 69
  void SetPrefetchPreparedCtx(framework::ExecutorPrepareContext *prepared) {
    prefetch_ctx_ = prepared;
  }

T
typhoonzero 已提交
70 71
  int GetSelectedPort() { return selected_port_; }

72
  const ReceivedMessage Get() { return this->var_recv_queue_.Pop(); }
G
gongweibao 已提交
73

74 75 76
  void Push(const std::string &msg_name) {
    this->var_recv_queue_.Push(std::make_pair(msg_name, nullptr));
  }
G
gongweibao 已提交
77 78 79 80

  void ShutDown();

 protected:
Y
Yi Wang 已提交
81 82
  void HandleRequest(::grpc::ServerCompletionQueue *cq,
                     const std::string &cq_name,
G
gongweibao 已提交
83 84 85
                     std::function<void()> TryToRegisterNewOne);
  void TryToRegisterNewSendOne();
  void TryToRegisterNewGetOne();
86
  void TryToRegisterNewPrefetchOne();
G
gongweibao 已提交
87 88 89 90 91
  void ShutdownQueue();

 private:
  std::mutex cq_mutex_;
  volatile bool is_shut_down_ = false;
92 93
  std::unique_ptr<::grpc::ServerCompletionQueue> cq_send_;
  std::unique_ptr<::grpc::ServerCompletionQueue> cq_get_;
94
  std::unique_ptr<::grpc::ServerCompletionQueue> cq_prefetch_;
G
gongweibao 已提交
95

96 97
  GrpcService::AsyncService service_;
  std::unique_ptr<::grpc::Server> server_;
G
gongweibao 已提交
98 99 100

  std::string address_;
  framework::Scope *scope_;
Y
Yancey1989 已提交
101
  const platform::DeviceContext *dev_ctx_;
102

G
gongweibao 已提交
103
  // received variable from RPC, operators fetch variable from this queue.
104
  SimpleBlockQueue<MessageWithName> var_get_queue_;
Q
qiaolongfei 已提交
105
  // client send variable to this queue.
106
  ReceivedQueue var_recv_queue_;
G
gongweibao 已提交
107 108

  // condition of the sub program
T
typhoonzero 已提交
109 110 111
  std::mutex barrier_mutex_;
  mutable int barrier_cond_step_;
  std::condition_variable barrier_condition_;
G
gongweibao 已提交
112 113 114

  std::unique_ptr<std::thread> t_send_;
  std::unique_ptr<std::thread> t_get_;
115 116 117
  std::unique_ptr<std::thread> t_prefetch_;

  int prefetch_blk_id_;
Y
Yancey1989 已提交
118
  framework::ExecutorPrepareContext *prefetch_ctx_;
119 120
  framework::ProgramDesc *program_;
  framework::Executor *executor_;
T
typhoonzero 已提交
121
  int selected_port_;
G
gongweibao 已提交
122 123 124 125 126
};

};  // namespace detail
};  // namespace operators
};  // namespace paddle