op_lite.h 7.2 KB
Newer Older
S
superjomn 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19
// Copyright (c) 2019 PaddlePaddle Authors. All Rights Reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

#pragma once

#include <glog/logging.h>
#include <boost/variant.hpp>
#include <map>
20
#include <memory>
S
superjomn 已提交
21 22 23 24
#include <string>
#include "paddle/fluid/framework/lod_tensor.h"
#include "paddle/fluid/framework/op_desc.h"
#include "paddle/fluid/framework/variable.h"
S
superjomn 已提交
25 26 27
#include "paddle/fluid/lite/core/context.h"
#include "paddle/fluid/lite/core/kernel.h"
#include "paddle/fluid/lite/core/scope.h"
S
superjomn 已提交
28 29 30 31 32 33 34 35 36 37 38 39

namespace paddle {
namespace lite {

// Variant that holds exactly one of: an int, a float, or a pointer to a
// framework::Variable.
using any_t = boost::variant<int, float, framework::Variable *>;
// Ordered map from a string key to an any_t value.
using anys_t = std::map<std::string, any_t>;

// Base type used by the registry factory. It carries no state.
struct Registry {
  // Intentionally does nothing; it only gives callers a member they can
  // invoke on a Registry-derived object.
  void Touch() { return; }
};

S
superjomn 已提交
40 41 42 43 44
// Forward declarations of the mir types that OpLite declares as friends.
namespace mir {
class Node;
class SSAGraph;
}  // namespace mir

45 46
// Forward declaration: OpLite stores a std::unique_ptr<OpInfo>, while the class
// itself is defined later in this file.
class OpInfo;

S
superjomn 已提交
47 48 49 50 51
/**
 * The base class of an light-weight operators, currently just used in inference
 * to eliminate overhead of some operations in current framework.
 *
 * The Operator are designed as follows:
S
update  
superjomn 已提交
52 53 54
 * - it can has some members to hold the argument and some other computation
 * resources,
 * - it should act like a function call, no more logic included.
S
superjomn 已提交
55 56 57
 */
class OpLite : public Registry {
 public:
S
update  
superjomn 已提交
58
  // The strategies to pick a kernel from candidates.
S
superjomn 已提交
59 60 61 62 63 64 65 66 67
  enum class KernelStrategy {
    // Return the user specified one.
    kStatic = 0,
    // Specify the expected kernel externally.
    kSpecified,
    // Run each kernel to evaluate and get the best kernel.
    kRuntime,
  };

S
superjomn 已提交
68
  OpLite() = default;
S
superjomn 已提交
69
  OpLite(const std::string &type) : op_type_(type) {}
70 71
  OpLite(const std::vector<Place> &valid_places)
      : valid_places_(valid_places) {}
S
superjomn 已提交
72

S
superjomn 已提交
73 74 75 76
  void SetValidPlaces(const std::vector<Place> &places) {
    valid_places_ = places;
  }
  const std::vector<Place> &valid_places() const { return valid_places_; }
S
update  
superjomn 已提交
77
  // Check the shape.
S
superjomn 已提交
78
  virtual bool CheckShape() const { return true; }
S
update  
superjomn 已提交
79
  // Inference the outputs' shape.
S
superjomn 已提交
80
  virtual bool InferShape() const { return true; }
S
update  
superjomn 已提交
81
  // Run this operator.
S
superjomn 已提交
82
  virtual bool Run();
S
update  
superjomn 已提交
83

S
superjomn 已提交
84
  // Link the external execution environ to internal context.
85 86
  bool Attach(const framework::OpDesc &opdesc, lite::Scope *scope);

S
superjomn 已提交
87 88
  const OpInfo *op_info() const { return op_info_.get(); }
  OpInfo *mutable_op_info() { return op_info_.get(); }
S
superjomn 已提交
89

S
update  
superjomn 已提交
90
  // Human-readable information.
S
superjomn 已提交
91 92
  virtual std::string DebugString() const = 0;

S
superjomn 已提交
93 94
  const Place &kernel_place() const { return kernel_place_; }

S
superjomn 已提交
95
  // NOTE This might be discarded.
S
update  
superjomn 已提交
96 97 98
  void PickKernel(const std::vector<Place> &valid_places,
                  KernelStrategy kernel_strategy = KernelStrategy::kStatic);

S
superjomn 已提交
99 100 101 102 103 104 105 106 107
  // Create all the kernels for the valid targets.
  std::vector<std::unique_ptr<KernelBase>> CreateKernels(
      const std::vector<Place> &places, const std::string &kernel_type = "");

  lite::Scope *scope() { return scope_; }

  // Assign op param to kernel.
  virtual void AttachKernel(KernelBase *kernel) = 0;

S
superjomn 已提交
108 109 110
  virtual ~OpLite() = default;

 protected:
S
superjomn 已提交
111 112 113 114
  // Attach it with the runtime environment.
  virtual bool AttachImpl(const framework::OpDesc &opdesc,
                          lite::Scope *scope) = 0;

S
superjomn 已提交
115 116
  // Specify the kernel to run by default. This will specify the value of
  // `kernel_place_`.
S
superjomn 已提交
117 118 119 120
  virtual void StaticPickKernel(const std::vector<Place> &valid_targets) {
    auto kernels = CreateKernels(valid_targets);
    kernel_ = std::move(kernels.front());
  }
S
superjomn 已提交
121

S
update  
superjomn 已提交
122 123 124 125 126 127
  // Wait until all the inputs' events are ready.
  void SyncInputEvents() {}

  // Record the output events, and that will tell all the dependent operators
  // some inputs are ready.
  void RecordOutputEvents() {}
S
superjomn 已提交
128

129 130 131
  const Tensor *GetTensor(lite::Scope *scope, const std::string &name) const;
  Tensor *GetMutableTensor(lite::Scope *scope, const std::string &name) const;

S
superjomn 已提交
132 133 134
  friend class mir::Node;
  friend class mir::SSAGraph;

S
superjomn 已提交
135
 protected:
S
superjomn 已提交
136
  lite::Scope *scope_{};
S
update  
superjomn 已提交
137 138
  std::unique_ptr<KernelBase> kernel_;
  std::string op_type_;
S
superjomn 已提交
139 140
  std::vector<Place> valid_places_;
  Place kernel_place_{TARGET(kHost), PRECISION(kFloat)};
S
superjomn 已提交
141
  std::unique_ptr<OpInfo> op_info_;
142 143 144 145 146 147 148 149
};

/*
 * Operator Information, such as some description. It will be shared by all the
 * kernels of the same operator.
 */
class OpInfo {
 public:
S
superjomn 已提交
150 151 152
  // To avoid the bugs from legancy framework::OpDesc, we use the ProtoBuf
  // message instead.
  void Build(const framework::proto::OpDesc &desc) {
153 154 155
    ExtractInputsAndOutputs(desc);
    CollectInputAndOutputArgnames(desc);
    CollectArguments(desc);
S
superjomn 已提交
156
    desc_.reset(new framework::proto::OpDesc(desc));
157 158
  }

S
superjomn 已提交
159 160 161 162 163
  const framework::proto::OpDesc &desc() const {
    CHECK(desc_) << "desc has't set";
    return *desc_;
  }
  framework::proto::OpDesc *mutable_desc() { return desc_.get(); }
164 165
  const std::list<std::string> &input_names() const { return input_names_; }
  const std::list<std::string> &output_names() const { return output_names_; }
S
superjomn 已提交
166
  const std::map<std::string, std::list<std::string>> &input_argument() const {
167 168
    return input_argument_;
  }
S
superjomn 已提交
169
  const std::map<std::string, std::list<std::string>> &output_argument() const {
170 171
    return output_argument_;
  }
S
superjomn 已提交
172 173
  bool GetInputArgname(const std::string &value_name, std::string *out) const;
  bool GetOutputArgname(const std::string &value_name, std::string *out) const;
174 175 176 177 178 179 180 181 182

  const std::list<std::string> &input_argnames() const {
    return input_argnames_;
  }
  const std::list<std::string> &output_argnames() const {
    return output_argnames_;
  }

 private:
S
superjomn 已提交
183 184 185
  void ExtractInputsAndOutputs(const framework::proto::OpDesc &opdesc) {
    for (const auto &item : opdesc.inputs()) {
      for (const auto &x : item.arguments()) {
186 187 188
        input_names_.push_back(x);
      }
    }
S
superjomn 已提交
189 190
    for (const auto &item : opdesc.outputs()) {
      for (const auto &x : item.arguments()) {
191 192 193 194 195
        output_names_.push_back(x);
      }
    }
  }

S
superjomn 已提交
196 197 198
  void CollectInputAndOutputArgnames(const framework::proto::OpDesc &opdesc) {
    for (const auto &item : opdesc.inputs()) {
      input_argnames_.push_back(item.parameter());
199
    }
S
superjomn 已提交
200 201
    for (const auto &item : opdesc.outputs()) {
      output_argnames_.push_back(item.parameter());
202 203 204
    }
  }

S
superjomn 已提交
205 206 207 208
  void CollectArguments(const framework::proto::OpDesc &opdesc) {
    for (const auto &item : opdesc.inputs()) {
      for (auto &x : item.arguments()) {
        input_argument_[item.parameter()].push_back(x);
209 210
      }
    }
S
superjomn 已提交
211 212 213
    for (const auto &item : opdesc.outputs()) {
      for (auto &x : item.arguments()) {
        output_argument_[item.parameter()].push_back(x);
214 215 216 217 218
      }
    }
  }

 private:
S
superjomn 已提交
219 220
  std::list<std::string> input_names_;
  std::list<std::string> output_names_;
221 222 223 224
  std::list<std::string> input_argnames_;
  std::list<std::string> output_argnames_;
  std::map<std::string, std::list<std::string>> input_argument_;
  std::map<std::string, std::list<std::string>> output_argument_;
S
superjomn 已提交
225 226
  // NOTE too heavy.
  std::unique_ptr<framework::proto::OpDesc> desc_;
S
superjomn 已提交
227 228 229 230
};

}  // namespace lite
}  // namespace paddle