op_lite.h 7.1 KB
Newer Older
S
superjomn 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19
// Copyright (c) 2019 PaddlePaddle Authors. All Rights Reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

#pragma once

#include <glog/logging.h>
#include <boost/variant.hpp>
#include <map>
20
#include <memory>
S
superjomn 已提交
21 22
#include <string>
#include "paddle/fluid/framework/variable.h"
S
superjomn 已提交
23 24 25
#include "paddle/fluid/lite/core/context.h"
#include "paddle/fluid/lite/core/kernel.h"
#include "paddle/fluid/lite/core/scope.h"
26
#include "paddle/fluid/lite/model_parser/compatible_pb.h"
S
superjomn 已提交
27 28 29 30 31 32 33 34 35 36 37 38

namespace paddle {
namespace lite {

// A value holding exactly one of: an int, a float, or a raw pointer to a
// framework::Variable.
using any_t = boost::variant<int, float, framework::Variable *>;
// A std::map (ordered by key) from a string name to an `any_t` value.
using anys_t = std::map<std::string, any_t>;

// Base type for the registry factory.
struct Registry {
  // Has no effect when called: the body is intentionally empty.
  void Touch() {
    // No-op.
  }
};

S
superjomn 已提交
39 40 41 42 43
// Forward declarations of the mir types that OpLite names as friends, so this
// header does not need their full definitions.
namespace mir {
class Node;
class SSAGraph;
}  // namespace mir

44 45
// Forward declaration: OpLite only holds and returns pointers to OpInfo; the
// class itself is defined further down in this header.
class OpInfo;

S
superjomn 已提交
46 47 48 49 50
/**
 * The base class of an light-weight operators, currently just used in inference
 * to eliminate overhead of some operations in current framework.
 *
 * The Operator are designed as follows:
S
update  
superjomn 已提交
51 52 53
 * - it can has some members to hold the argument and some other computation
 * resources,
 * - it should act like a function call, no more logic included.
S
superjomn 已提交
54 55 56
 */
class OpLite : public Registry {
 public:
S
update  
superjomn 已提交
57
  // The strategies to pick a kernel from candidates.
S
superjomn 已提交
58 59 60 61 62 63 64 65 66
  enum class KernelStrategy {
    // Return the user specified one.
    kStatic = 0,
    // Specify the expected kernel externally.
    kSpecified,
    // Run each kernel to evaluate and get the best kernel.
    kRuntime,
  };

S
superjomn 已提交
67
  OpLite() = default;
S
superjomn 已提交
68
  OpLite(const std::string &type) : op_type_(type) {}
69 70
  OpLite(const std::vector<Place> &valid_places)
      : valid_places_(valid_places) {}
S
superjomn 已提交
71

S
superjomn 已提交
72 73 74 75
  void SetValidPlaces(const std::vector<Place> &places) {
    valid_places_ = places;
  }
  const std::vector<Place> &valid_places() const { return valid_places_; }
S
update  
superjomn 已提交
76
  // Check the shape.
S
superjomn 已提交
77
  virtual bool CheckShape() const { return true; }
S
update  
superjomn 已提交
78
  // Inference the outputs' shape.
S
superjomn 已提交
79
  virtual bool InferShape() const { return true; }
S
update  
superjomn 已提交
80
  // Run this operator.
S
superjomn 已提交
81
  virtual bool Run();
S
update  
superjomn 已提交
82

S
superjomn 已提交
83
  // Link the external execution environ to internal context.
84
  bool Attach(const OpDesc &opdesc, lite::Scope *scope);
85

S
superjomn 已提交
86 87
  const OpInfo *op_info() const { return op_info_.get(); }
  OpInfo *mutable_op_info() { return op_info_.get(); }
S
superjomn 已提交
88

S
update  
superjomn 已提交
89
  // Human-readable information.
S
superjomn 已提交
90 91
  virtual std::string DebugString() const = 0;

S
superjomn 已提交
92 93
  const Place &kernel_place() const { return kernel_place_; }

S
superjomn 已提交
94
  // NOTE This might be discarded.
S
update  
superjomn 已提交
95 96 97
  void PickKernel(const std::vector<Place> &valid_places,
                  KernelStrategy kernel_strategy = KernelStrategy::kStatic);

S
superjomn 已提交
98 99 100 101 102 103 104 105 106
  // Create all the kernels for the valid targets.
  std::vector<std::unique_ptr<KernelBase>> CreateKernels(
      const std::vector<Place> &places, const std::string &kernel_type = "");

  lite::Scope *scope() { return scope_; }

  // Assign op param to kernel.
  virtual void AttachKernel(KernelBase *kernel) = 0;

S
superjomn 已提交
107 108 109
  virtual ~OpLite() = default;

 protected:
S
superjomn 已提交
110
  // Attach it with the runtime environment.
111
  virtual bool AttachImpl(const OpDesc &opdesc, lite::Scope *scope) = 0;
S
superjomn 已提交
112

S
superjomn 已提交
113 114
  // Specify the kernel to run by default. This will specify the value of
  // `kernel_place_`.
S
superjomn 已提交
115 116 117 118
  virtual void StaticPickKernel(const std::vector<Place> &valid_targets) {
    auto kernels = CreateKernels(valid_targets);
    kernel_ = std::move(kernels.front());
  }
S
superjomn 已提交
119

S
update  
superjomn 已提交
120 121 122 123 124 125
  // Wait until all the inputs' events are ready.
  void SyncInputEvents() {}

  // Record the output events, and that will tell all the dependent operators
  // some inputs are ready.
  void RecordOutputEvents() {}
S
superjomn 已提交
126

127 128 129
  const Tensor *GetTensor(lite::Scope *scope, const std::string &name) const;
  Tensor *GetMutableTensor(lite::Scope *scope, const std::string &name) const;

S
superjomn 已提交
130 131 132
  friend class mir::Node;
  friend class mir::SSAGraph;

S
superjomn 已提交
133
 protected:
S
superjomn 已提交
134
  lite::Scope *scope_{};
S
update  
superjomn 已提交
135 136
  std::unique_ptr<KernelBase> kernel_;
  std::string op_type_;
S
superjomn 已提交
137 138
  std::vector<Place> valid_places_;
  Place kernel_place_{TARGET(kHost), PRECISION(kFloat)};
S
superjomn 已提交
139
  std::unique_ptr<OpInfo> op_info_;
140 141 142 143 144 145 146 147
};

/*
 * Operator Information, such as some description. It will be shared by all the
 * kernels of the same operator.
 */
class OpInfo {
 public:
S
superjomn 已提交
148 149 150
  // To avoid the bugs from legancy framework::OpDesc, we use the ProtoBuf
  // message instead.
  void Build(const framework::proto::OpDesc &desc) {
151 152 153
    ExtractInputsAndOutputs(desc);
    CollectInputAndOutputArgnames(desc);
    CollectArguments(desc);
S
superjomn 已提交
154
    desc_.reset(new framework::proto::OpDesc(desc));
155 156
  }

S
superjomn 已提交
157 158 159 160 161
  const framework::proto::OpDesc &desc() const {
    CHECK(desc_) << "desc has't set";
    return *desc_;
  }
  framework::proto::OpDesc *mutable_desc() { return desc_.get(); }
162 163
  const std::list<std::string> &input_names() const { return input_names_; }
  const std::list<std::string> &output_names() const { return output_names_; }
S
superjomn 已提交
164
  const std::map<std::string, std::list<std::string>> &input_argument() const {
165 166
    return input_argument_;
  }
S
superjomn 已提交
167
  const std::map<std::string, std::list<std::string>> &output_argument() const {
168 169
    return output_argument_;
  }
S
superjomn 已提交
170 171
  bool GetInputArgname(const std::string &value_name, std::string *out) const;
  bool GetOutputArgname(const std::string &value_name, std::string *out) const;
172 173 174 175 176 177 178 179 180

  const std::list<std::string> &input_argnames() const {
    return input_argnames_;
  }
  const std::list<std::string> &output_argnames() const {
    return output_argnames_;
  }

 private:
S
superjomn 已提交
181 182 183
  void ExtractInputsAndOutputs(const framework::proto::OpDesc &opdesc) {
    for (const auto &item : opdesc.inputs()) {
      for (const auto &x : item.arguments()) {
184 185 186
        input_names_.push_back(x);
      }
    }
S
superjomn 已提交
187 188
    for (const auto &item : opdesc.outputs()) {
      for (const auto &x : item.arguments()) {
189 190 191 192 193
        output_names_.push_back(x);
      }
    }
  }

S
superjomn 已提交
194 195 196
  void CollectInputAndOutputArgnames(const framework::proto::OpDesc &opdesc) {
    for (const auto &item : opdesc.inputs()) {
      input_argnames_.push_back(item.parameter());
197
    }
S
superjomn 已提交
198 199
    for (const auto &item : opdesc.outputs()) {
      output_argnames_.push_back(item.parameter());
200 201 202
    }
  }

S
superjomn 已提交
203 204 205 206
  void CollectArguments(const framework::proto::OpDesc &opdesc) {
    for (const auto &item : opdesc.inputs()) {
      for (auto &x : item.arguments()) {
        input_argument_[item.parameter()].push_back(x);
207 208
      }
    }
S
superjomn 已提交
209 210 211
    for (const auto &item : opdesc.outputs()) {
      for (auto &x : item.arguments()) {
        output_argument_[item.parameter()].push_back(x);
212 213 214 215 216
      }
    }
  }

 private:
S
superjomn 已提交
217 218
  std::list<std::string> input_names_;
  std::list<std::string> output_names_;
219 220 221 222
  std::list<std::string> input_argnames_;
  std::list<std::string> output_argnames_;
  std::map<std::string, std::list<std::string>> input_argument_;
  std::map<std::string, std::list<std::string>> output_argument_;
S
superjomn 已提交
223 224
  // NOTE too heavy.
  std::unique_ptr<framework::proto::OpDesc> desc_;
S
superjomn 已提交
225 226 227 228
};

}  // namespace lite
}  // namespace paddle