send_op.cc 3.4 KB
Newer Older
武毅 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36
/* Copyright (c) 2016 PaddlePaddle Authors. All Rights Reserved.

   Licensed under the Apache License, Version 2.0 (the "License");
   you may not use this file except in compliance with the License.
   You may obtain a copy of the License at

   http://www.apache.org/licenses/LICENSE-2.0

   Unless required by applicable law or agreed to in writing, software
   distributed under the License is distributed on an "AS IS" BASIS,
   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
   See the License for the specific language governing permissions and
   limitations under the License. */

#include <ostream>

#include "paddle/framework/data_type.h"
#include "paddle/framework/framework.pb.h"
#include "paddle/framework/lod_tensor.h"
#include "paddle/framework/op_registry.h"

#include "paddle/operators/detail/send_recv_impl.h"
#include "paddle/operators/detail/simple_block_queue.h"

namespace paddle {
namespace operators {

// TODO(typhoonzero): this is a simple implementation which sends the
// input variables one at a time with blocking calls
class SendOp : public framework::OperatorBase {
 public:
  SendOp(const std::string &type, const framework::VariableNameMap &inputs,
         const framework::VariableNameMap &outputs,
         const framework::AttributeMap &attrs)
      : OperatorBase(type, inputs, outputs, attrs) {
    // init client when the operator is created at runtime.
T
typhoonzero 已提交
37 38 39 40 41
    std::vector<std::string> endpoints =
        Attr<std::vector<std::string>>("endpoints");
    for (auto ep : endpoints) {
      client_map_[ep].reset(new detail::RPCClient(
          grpc::CreateChannel(ep, grpc::InsecureChannelCredentials())));
武毅 已提交
42 43
    }
  }
T
typhoonzero 已提交
44

武毅 已提交
45 46
  void Run(const framework::Scope &scope,
           const platform::DeviceContext &dev_ctx) const override {
T
typhoonzero 已提交
47
    auto ins = Inputs("X");
T
typhoonzero 已提交
48 49 50 51
    std::vector<std::string> epmap = Attr<std::vector<std::string>>("epmap");
    // TODO(typhoonzero): use async calls to send multiple variable asyncly.
    for (size_t i = 0; i < ins.size(); ++i) {
      bool ret = client_map_[epmap[i]]->SendVariable(scope, ins[i]);
T
typhoonzero 已提交
52
      if (!ret) {
T
typhoonzero 已提交
53
        LOG(ERROR) << "send variable error: " << ins[i];
T
typhoonzero 已提交
54
      }
武毅 已提交
55
    }
T
typhoonzero 已提交
56 57
    // TODO(typhoonzero): support async optimization
    client_map_[epmap[0]]->Wait();
T
typhoonzero 已提交
58 59
    for (size_t i = 0; i < ins.size(); ++i) {
      bool ret = client_map_[epmap[i]]->GetVariable(scope, ins[i]);
T
typhoonzero 已提交
60
      if (!ret) {
T
typhoonzero 已提交
61
        LOG(ERROR) << "GetVariable error: " << ins[i];
T
typhoonzero 已提交
62
      }
武毅 已提交
63 64 65 66
    }
  }

 protected:
T
typhoonzero 已提交
67 68
  mutable std::unordered_map<std::string, std::shared_ptr<detail::RPCClient>>
      client_map_;
武毅 已提交
69 70 71 72
};

/**
 * Describes the send operator's proto: the duplicable input "X", the
 * "endpoints" and "epmap" string-vector attributes, and the operator comment.
 * Neither attribute is given a default value here.
 */
class SendOpMaker : public framework::OpProtoAndCheckerMaker {
 public:
  SendOpMaker(OpProto *proto, OpAttrChecker *op_checker)
      : OpProtoAndCheckerMaker(proto, op_checker) {
    AddInput("X", "(Tensor) Input tensor to be sent").AsDuplicable();
    AddComment(R"DOC(
Send operator

This operator will send tensor to recv_op
)DOC");
    // The descriptions no longer advertise a default endpoint: no SetDefault
    // is attached to either attribute.
    AddAttr<std::vector<std::string>>("endpoints",
                                      "(string vector) "
                                      "Server endpoints to send variables to.");
    AddAttr<std::vector<std::string>>("epmap",
                                      "(string vector) "
                                      "Server endpoints in the order of input "
                                      "variables for mapping");
  }
};

}  // namespace operators
}  // namespace paddle

// Short alias for the operator namespace, used by the registration below.
namespace ops = paddle::operators;

// Register the operator type `send`, pairing the SendOp implementation with
// SendOpMaker, which declares its input, attributes and comment.
REGISTER_OPERATOR(send, ops::SendOp, ops::SendOpMaker);