/* Copyright (c) 2016 PaddlePaddle Authors. All Rights Reserved.

Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

    http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License. */

15 16
#pragma once

17
#include <algorithm>
#include <atomic>
#include <cstddef>
#include <memory>
#include <string>
#include <tuple>
#include <type_traits>
#include <typeindex>
#include <typeinfo>
#include <unordered_map>
#include <unordered_set>

#define GLOG_NO_ABBREVIATED_SEVERITIES  // msvc conflict logging with windows.h
#include "glog/logging.h"               // For VLOG()
#include "paddle/fluid/framework/attribute.h"
#include "paddle/fluid/framework/details/op_registry.h"
#include "paddle/fluid/framework/framework.pb.h"
#include "paddle/fluid/framework/grad_op_desc_maker.h"
#include "paddle/fluid/framework/op_desc.h"
#include "paddle/fluid/framework/operator.h"
#include "paddle/fluid/framework/scope.h"
#include "paddle/fluid/framework/shape_inference.h"
36 37 38

namespace paddle {
namespace framework {
X
Xin Pan 已提交
39

Y
Yu Yang 已提交
40 41 42 43
// Common base of all registrar types.
//
// In our design, each kind of registrable class (e.g. operators and kernels)
// has its own registry and registrar. Registration is performed by the
// constructor of a global registrar variable. Such a variable is not
// referenced by code that merely calls into package framework, so the linker
// would remove it from the generated binary. To avoid that removal, every
// registrar class provides Touch() and the USE_OP macros call it: as long as
// client code invokes USE_OP, the global registrar variable is kept.
class Registrar {
 public:
  // Intentionally empty; it only exists so that the registrar object can be
  // referenced from another translation unit.
  void Touch() {}
};
52

53
template <typename... ARGS>
Y
Yu Yang 已提交
54
struct OperatorRegistrar : public Registrar {
55
  explicit OperatorRegistrar(const char* op_type) {
56 57 58 59
    PADDLE_ENFORCE(!OpInfoMap::Instance().Has(op_type),
                   "'%s' is registered more than once.", op_type);
    static_assert(sizeof...(ARGS) != 0,
                  "OperatorRegistrar should be invoked at least by OpClass");
60
    OpInfo info;
61
    details::OperatorRegistrarRecursive<0, false, ARGS...>(op_type, &info);
Y
Yu Yang 已提交
62
    OpInfoMap::Instance().Insert(op_type, info);
63 64 65
  }
};

66 67
class OpRegistry {
 public:
Y
Yu Yang 已提交
68
  static std::unique_ptr<OperatorBase> CreateOp(const std::string& type,
Y
Yu Yang 已提交
69 70
                                                const VariableNameMap& inputs,
                                                const VariableNameMap& outputs,
71
                                                AttributeMap attrs);
Y
Yu Yang 已提交
72

73
  static std::unique_ptr<OperatorBase> CreateOp(const proto::OpDesc& op_desc);
Y
Yu Yang 已提交
74

Y
Yu Yang 已提交
75
  static std::unique_ptr<OperatorBase> CreateOp(const OpDesc& op_desc);
F
Fix bug  
fengjiayi 已提交
76
};
F
fengjiayi 已提交
77

78 79 80
// Primary template, declared only. The partial specializations on the boolean
// flag provide the recursive step (false) and the terminating no-op (true).
template <typename Place, bool kAtEnd, size_t kIndex, typename... Kernels>
struct OpKernelRegistrarFunctor;

81 82
template <typename PlaceType, typename T, typename Func>
inline void RegisterKernelClass(const char* op_type, const char* library_type,
X
Xin Pan 已提交
83
                                int customized_type_value, Func func) {
Y
yuyang18 已提交
84 85 86 87 88 89 90
  std::string library(library_type);
  std::string data_layout = "ANYLAYOUT";
  if (library == "MKLDNN") {
    data_layout = "MKLDNNLAYOUT";
  }
  OpKernelType key(ToDataType(std::type_index(typeid(T))), PlaceType(),
                   StringToDataLayout(data_layout),
X
Xin Pan 已提交
91
                   StringToLibraryType(library_type), customized_type_value);
92
  OperatorWithKernel::AllOpKernels()[op_type][key] = func;
Y
yuyang18 已提交
93 94
}

95 96 97 98
template <typename PlaceType, size_t I, typename... KernelTypes>
struct OpKernelRegistrarFunctor<PlaceType, false, I, KernelTypes...> {
  using KERNEL_TYPE =
      typename std::tuple_element<I, std::tuple<KernelTypes...>>::type;
99

X
Xin Pan 已提交
100 101
  void operator()(const char* op_type, const char* library_type,
                  int customized_type_value) const {
102
    using T = typename KERNEL_TYPE::ELEMENT_TYPE;
103
    RegisterKernelClass<PlaceType, T>(
X
Xin Pan 已提交
104 105 106
        op_type, library_type, customized_type_value,

        [](const framework::ExecutionContext& ctx) {
Y
yuyang18 已提交
107
          KERNEL_TYPE().Compute(ctx);
108
        });
109 110
    constexpr auto size = std::tuple_size<std::tuple<KernelTypes...>>::value;
    OpKernelRegistrarFunctor<PlaceType, I + 1 == size, I + 1, KernelTypes...>
111
        func;
X
Xin Pan 已提交
112
    func(op_type, library_type, customized_type_value);
113 114 115 116 117
  }
};

// Terminating case of the recursion: every kernel type has been handled, so
// the call does nothing.
template <typename PlaceType, size_t I, typename... KernelType>
struct OpKernelRegistrarFunctor<PlaceType, true, I, KernelType...> {
  void operator()(const char* op_type, const char* library_type,
                  int customized_type_value) const {}
};

M
mozga-intel 已提交
122 123
// User can register many kernel in one place. The data type could be
// different.
124
template <typename PlaceType, typename... KernelType>
F
fengjiayi 已提交
125 126
class OpKernelRegistrar : public Registrar {
 public:
X
Xin Pan 已提交
127 128
  explicit OpKernelRegistrar(const char* op_type, const char* library_type,
                             int customized_type_value) {
129
    OpKernelRegistrarFunctor<PlaceType, false, 0, KernelType...> func;
X
Xin Pan 已提交
130
    func(op_type, library_type, customized_type_value);
F
fengjiayi 已提交
131 132 133
  }
};

Y
yuyang18 已提交
134 135 136 137 138 139
// Primary template, declared only. The partial specializations on the boolean
// flag provide the recursive step (false) and the terminating no-op (true).
template <typename Place, bool kAtEnd, size_t kIndex, typename... Entries>
struct OpKernelRegistrarFunctorEx;

template <typename PlaceType, typename... DataTypeAndKernelType>
class OpKernelRegistrarEx : public Registrar {
 public:
X
Xin Pan 已提交
140 141
  explicit OpKernelRegistrarEx(const char* op_type, const char* library_type,
                               int customized_type_value) {
Y
yuyang18 已提交
142 143
    OpKernelRegistrarFunctorEx<PlaceType, false, 0, DataTypeAndKernelType...>
        func;
X
Xin Pan 已提交
144
    func(op_type, library_type, customized_type_value);
Y
yuyang18 已提交
145 146 147 148 149 150
  }
};

// Terminating case of the recursion: every pair has been handled, so the call
// does nothing.
template <typename PlaceType, size_t I, typename... DataTypeAndKernelType>
struct OpKernelRegistrarFunctorEx<PlaceType, true, I,
                                  DataTypeAndKernelType...> {
  void operator()(const char* op_type, const char* library_type,
                  int customized_type_value) const {}
};

template <typename PlaceType, size_t I, typename... DataTypeAndKernelType>
struct OpKernelRegistrarFunctorEx<PlaceType, false, I,
                                  DataTypeAndKernelType...> {
158
  using Functor =
Y
yuyang18 已提交
159 160 161 162 163 164
      typename std::tuple_element<I + 1,
                                  std::tuple<DataTypeAndKernelType...>>::type;
  using T =
      typename std::tuple_element<I,
                                  std::tuple<DataTypeAndKernelType...>>::type;

X
Xin Pan 已提交
165 166 167 168
  void operator()(const char* op_type, const char* library_type,
                  int customized_type_value) const {
    RegisterKernelClass<PlaceType, T>(op_type, library_type,
                                      customized_type_value, Functor());
Y
yuyang18 已提交
169 170 171 172 173 174

    constexpr auto size =
        std::tuple_size<std::tuple<DataTypeAndKernelType...>>::value;
    OpKernelRegistrarFunctorEx<PlaceType, I + 2 >= size, I + 2,
                               DataTypeAndKernelType...>
        func;
X
Xin Pan 已提交
175
    func(op_type, library_type, customized_type_value);
Y
yuyang18 已提交
176 177 178
  }
};

X
Xin Pan 已提交
179
// clang-format off
180 181 182
/**
 * Check that a macro is expanded in the GLOBAL NAMESPACE.
 *
 * A tag struct is declared in the current scope and a static_assert compares
 * its unqualified name with the same name qualified by a leading `::`. The two
 * only refer to the same type when the expansion happens in the global
 * namespace; anywhere else compilation fails.
 */
#define STATIC_ASSERT_GLOBAL_NAMESPACE(uniq_name, msg)                        \
  struct __test_global_namespace_##uniq_name##__ {};                          \
  static_assert(std::is_same<::__test_global_namespace_##uniq_name##__,       \
                             __test_global_namespace_##uniq_name##__>::value, \
                msg)

189 190 191 192 193 194 195 196
/*
  Registers an operator type. Must be expanded in the global namespace.

  The variadic arguments should be class types derived from one of the
  following classes:
    OpProtoAndCheckerMaker
    GradOpDescMakerBase
    VarTypeInference
    InferShapeBase

  Besides the static OperatorRegistrar object, the expansion defines
  TouchOpRegistrar_<op_type>(), which calls Touch() on that object and
  returns 0; USE_OP_ITSELF declares and calls this function.
*/
#define REGISTER_OPERATOR(op_type, op_class, ...)                        \
  STATIC_ASSERT_GLOBAL_NAMESPACE(                                        \
      __reg_op__##op_type,                                               \
      "REGISTER_OPERATOR must be called in global namespace");           \
  static ::paddle::framework::OperatorRegistrar<op_class, ##__VA_ARGS__> \
      __op_registrar_##op_type##__(#op_type);                            \
  int TouchOpRegistrar_##op_type() {                                     \
    __op_registrar_##op_type##__.Touch();                                \
    return 0;                                                            \
  }

F
WIP  
fengjiayi 已提交
208
// Shorthand for REGISTER_OPERATOR with the operator class and its maker class
// as the only registered types.
#define REGISTER_OP_WITHOUT_GRADIENT(op_type, op_class, op_maker_class) \
  REGISTER_OPERATOR(op_type, op_class, op_maker_class)
D
dongzhihong 已提交
210

D
dongzhihong 已提交
211
/**
 * Macro to register OperatorKernel.
 *
 * Expands to a static OpKernelRegistrar<place_class, ...> object constructed
 * with the stringified op_type and library_type plus customized_type_value,
 * and to a TouchOpKernelRegistrar_<op_type>_<library_type>_<customized_name>()
 * function that calls Touch() on that object and returns 0.
 * Must be expanded in the global namespace.
 */
#define REGISTER_OP_KERNEL_WITH_CUSTOM_TYPE(op_type, library_type,             \
                                            place_class, customized_name,      \
                                            customized_type_value, ...)        \
  STATIC_ASSERT_GLOBAL_NAMESPACE(                                              \
      __reg_op_kernel_##op_type##_##library_type##_##customized_name##__,      \
      "REGISTER_OP_KERNEL must be called in "                                  \
      "global namespace");                                                     \
  static ::paddle::framework::OpKernelRegistrar<place_class,                   \
                                                __VA_ARGS__>                   \
      __op_kernel_registrar_##op_type##_##library_type##_##customized_name##__(\
          #op_type, #library_type, customized_type_value);                     \
  int TouchOpKernelRegistrar_##op_type##_##library_type##_##customized_name() {\
    __op_kernel_registrar_##op_type##_##library_type##_##customized_name##__   \
        .Touch();                                                              \
    return 0;                                                                  \
  }
D
dongzhihong 已提交
230

X
Xin Pan 已提交
231 232 233 234 235 236
// REGISTER_OP_KERNEL_WITH_CUSTOM_TYPE with the customized name fixed to
// DEFAULT_TYPE and the customized type value fixed to
// OpKernelType::kDefaultCustomizedTypeValue.
#define REGISTER_OP_KERNEL(op_type, library_type, place_class, ...)       \
  REGISTER_OP_KERNEL_WITH_CUSTOM_TYPE(                                    \
      op_type, library_type, place_class, DEFAULT_TYPE,                   \
      ::paddle::framework::OpKernelType::kDefaultCustomizedTypeValue,     \
      __VA_ARGS__)

Q
QI JUN 已提交
237
// Registers kernels with library type CUDA on ::paddle::platform::CUDAPlace.
#define REGISTER_OP_CUDA_KERNEL(op_type, ...) \
  REGISTER_OP_KERNEL(op_type, CUDA, ::paddle::platform::CUDAPlace, __VA_ARGS__)
F
fengjiayi 已提交
239

F
fengjiayi 已提交
240 241
// Registers kernels with library type CPU on ::paddle::platform::CPUPlace.
#define REGISTER_OP_CPU_KERNEL(op_type, ...)                        \
  REGISTER_OP_KERNEL(op_type, CPU, ::paddle::platform::CPUPlace,    \
                     __VA_ARGS__)
Y
Yu Yang 已提交
242

X
Xin Pan 已提交
243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258
// Functor flavour of REGISTER_OP_KERNEL_WITH_CUSTOM_TYPE: the variadic
// arguments are handed to OpKernelRegistrarEx, which consumes them as
// (data type, functor type) pairs. The expansion also defines
// TouchOpKernelRegistrar_<op_type>_<library_type>_<customized_name>().
// Must be expanded in the global namespace.
#define REGISTER_OP_KERNEL_EX(op_type, library_type, place_class,              \
                              customized_name,                                 \
                              customized_type_value,                           \
                              ...)                                             \
  STATIC_ASSERT_GLOBAL_NAMESPACE(                                              \
      __reg_op_kernel_##op_type##_##library_type##_##customized_name##__,      \
      "REGISTER_OP_KERNEL_EX must be called in "                               \
      "global namespace");                                                     \
  static ::paddle::framework::OpKernelRegistrarEx<place_class,                 \
                                                  __VA_ARGS__>                 \
      __op_kernel_registrar_##op_type##_##library_type##_##customized_name##__(\
          #op_type, #library_type, customized_type_value);                     \
  int TouchOpKernelRegistrar_##op_type##_##library_type##_##customized_name() {\
    __op_kernel_registrar_##op_type##_##library_type##_##customized_name##__   \
        .Touch();                                                              \
    return 0;                                                                  \
  }

261
// REGISTER_OP_KERNEL_EX for library type CUDA on ::paddle::platform::CUDAPlace
// with the default customized name and type value.
#define REGISTER_OP_CUDA_KERNEL_FUNCTOR(op_type, ...)                 \
  REGISTER_OP_KERNEL_EX(                                              \
      op_type, CUDA, ::paddle::platform::CUDAPlace, DEFAULT_TYPE,     \
      ::paddle::framework::OpKernelType::kDefaultCustomizedTypeValue, \
      __VA_ARGS__)
Y
yuyang18 已提交
266

X
Xin Pan 已提交
267 268 269 270 271
// REGISTER_OP_KERNEL_EX for library type CPU on ::paddle::platform::CPUPlace
// with the default customized name and type value.
#define REGISTER_OP_CPU_KERNEL_FUNCTOR(op_type, ...)                      \
  REGISTER_OP_KERNEL_EX(                                                  \
      op_type, CPU, ::paddle::platform::CPUPlace, DEFAULT_TYPE,           \
      ::paddle::framework::OpKernelType::kDefaultCustomizedTypeValue,     \
      __VA_ARGS__)
Y
yuyang18 已提交
272

273
/**
 * Macro to mark what Operator and Kernel
 * we will use and tell the compiler to
 * link them into target.
 *
 * USE_OP_ITSELF declares TouchOpRegistrar_<op_type>() (defined by
 * REGISTER_OPERATOR) and calls it to initialize a static int, which creates a
 * reference to the operator's registrar.
 */
#define USE_OP_ITSELF(op_type)                             \
  STATIC_ASSERT_GLOBAL_NAMESPACE(                          \
      __use_op_itself_##op_type,                           \
      "USE_OP_ITSELF must be called in global namespace"); \
  extern int TouchOpRegistrar_##op_type();                 \
  UNUSED static int use_op_itself_##op_type##_ = TouchOpRegistrar_##op_type()
F
fengjiayi 已提交
284

X
Xin Pan 已提交
285 286 287 288 289 290 291 292
// Declares TouchOpKernelRegistrar_<op_type>_<LIBRARY_TYPE>_<customized_name>()
// (defined by the kernel registration macros) and calls it to initialize a
// static int, which creates a reference to that kernel registrar.
// Must be expanded in the global namespace.
#define USE_OP_DEVICE_KERNEL_WITH_CUSTOM_TYPE(op_type,                     \
                                              LIBRARY_TYPE,                \
                                              customized_name)             \
  STATIC_ASSERT_GLOBAL_NAMESPACE(                                          \
      __use_op_kernel_##op_type##_##LIBRARY_TYPE##_##customized_name##__,  \
      "USE_OP_DEVICE_KERNEL must be in global namespace");                 \
  extern int                                                               \
      TouchOpKernelRegistrar_##op_type##_##LIBRARY_TYPE##_##customized_name(); \
  UNUSED static int use_op_kernel_##op_type##_##LIBRARY_TYPE##_##customized_name##_ = /* NOLINT */ \
      TouchOpKernelRegistrar_##op_type##_##LIBRARY_TYPE##_##customized_name()

// USE_OP_DEVICE_KERNEL_WITH_CUSTOM_TYPE with the customized name fixed to
// DEFAULT_TYPE.
#define USE_OP_DEVICE_KERNEL(op_type, LIBRARY_TYPE)                   \
  USE_OP_DEVICE_KERNEL_WITH_CUSTOM_TYPE(op_type, LIBRARY_TYPE,        \
                                        DEFAULT_TYPE)
Y
Yu Yang 已提交
298

299 300
// TODO(fengjiayi): The following macros
// seem ugly; is there a better method?

// USE_OP_KERNEL references the CPU kernel registrar of op_type and, when
// PADDLE_WITH_CUDA is defined, the CUDA kernel registrar as well.
#ifndef PADDLE_WITH_CUDA
#define USE_OP_KERNEL(op_type) USE_OP_DEVICE_KERNEL(op_type, CPU)
#else
#define USE_OP_KERNEL(op_type)        \
  USE_OP_DEVICE_KERNEL(op_type, CPU); \
  USE_OP_DEVICE_KERNEL(op_type, CUDA)
#endif
309

310 311
// References only the operator registrar (no kernel). Note that the expansion
// itself ends with a semicolon.
#define USE_NO_KERNEL_OP(op_type) \
  USE_OP_ITSELF(op_type);

F
WIP  
fengjiayi 已提交
312 313 314
// References the operator registrar and its CPU kernel registrar. Note that
// the expansion itself ends with a semicolon.
#define USE_CPU_ONLY_OP(op_type)          \
  USE_OP_ITSELF(op_type);                 \
  USE_OP_DEVICE_KERNEL(op_type, CPU);
315

Q
QI JUN 已提交
316 317 318
// References the operator registrar and its CUDA kernel registrar.
#define USE_CUDA_ONLY_OP(op_type)         \
  USE_OP_ITSELF(op_type);                 \
  USE_OP_DEVICE_KERNEL(op_type, CUDA)
D
Dong Zhihong 已提交
319

F
WIP  
fengjiayi 已提交
320 321 322
// References the operator registrar and the kernel registrars selected by
// USE_OP_KERNEL.
#define USE_OP(op_type)           \
  USE_OP_ITSELF(op_type);         \
  USE_OP_KERNEL(op_type)
X
Xin Pan 已提交
323
// clang-format on
324

325 326
}  // namespace framework
}  // namespace paddle