op_registry.cc 10.7 KB
Newer Older
Y
Yan Chunwei 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21
// Copyright (c) 2019 PaddlePaddle Authors. All Rights Reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

#include "lite/core/op_registry.h"
#include <list>
#include <set>

namespace paddle {
namespace lite {

22 23 24 25
// Free-function shortcut for the string-to-string dictionary exposed by the
// global OpKernelInfoCollector.
// NOTE(review): judging by the name, this presumably maps an op type to the
// path of the source file that registers it -- confirm against the collector.
const std::map<std::string, std::string> &GetOp2PathDict() {
  auto &&collector = OpKernelInfoCollector::Global();
  return collector.GetOp2PathDict();
}

Y
Yan Chunwei 已提交
26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46
std::list<std::unique_ptr<KernelBase>> KernelRegistry::Create(
    const std::string &op_type,
    TargetType target,
    PrecisionType precision,
    DataLayoutType layout) {
  Place place{target, precision, layout};
  VLOG(5) << "creating " << op_type << " kernel for " << place.DebugString();
#define CREATE_KERNEL1(target__, precision__)                                \
  switch (layout) {                                                          \
    case DATALAYOUT(kNCHW):                                                  \
      return Create<TARGET(target__),                                        \
                    PRECISION(precision__),                                  \
                    DATALAYOUT(kNCHW)>(op_type);                             \
    case DATALAYOUT(kAny):                                                   \
      return Create<TARGET(target__),                                        \
                    PRECISION(precision__),                                  \
                    DATALAYOUT(kAny)>(op_type);                              \
    case DATALAYOUT(kNHWC):                                                  \
      return Create<TARGET(target__),                                        \
                    PRECISION(precision__),                                  \
                    DATALAYOUT(kNHWC)>(op_type);                             \
47 48 49 50 51 52 53 54 55 56 57 58
    case DATALAYOUT(kImageDefault):                                          \
      return Create<TARGET(target__),                                        \
                    PRECISION(precision__),                                  \
                    DATALAYOUT(kImageDefault)>(op_type);                     \
    case DATALAYOUT(kImageFolder):                                           \
      return Create<TARGET(target__),                                        \
                    PRECISION(precision__),                                  \
                    DATALAYOUT(kImageFolder)>(op_type);                      \
    case DATALAYOUT(kImageNW):                                               \
      return Create<TARGET(target__),                                        \
                    PRECISION(precision__),                                  \
                    DATALAYOUT(kImageNW)>(op_type);                          \
Y
Yan Chunwei 已提交
59 60 61 62 63 64 65 66 67 68 69 70 71 72
    default:                                                                 \
      LOG(FATAL) << "unsupported kernel layout " << DataLayoutToStr(layout); \
  }

#define CREATE_KERNEL(target__)                         \
  switch (precision) {                                  \
    case PRECISION(kFloat):                             \
      CREATE_KERNEL1(target__, kFloat);                 \
    case PRECISION(kInt8):                              \
      CREATE_KERNEL1(target__, kInt8);                  \
    case PRECISION(kFP16):                              \
      CREATE_KERNEL1(target__, kFP16);                  \
    case PRECISION(kAny):                               \
      CREATE_KERNEL1(target__, kAny);                   \
J
juncaipeng 已提交
73 74
    case PRECISION(kInt32):                             \
      CREATE_KERNEL1(target__, kInt32);                 \
75 76
    case PRECISION(kInt64):                             \
      CREATE_KERNEL1(target__, kInt64);                 \
Y
Yan Chunwei 已提交
77 78 79 80 81 82 83 84 85
    default:                                            \
      CHECK(false) << "not supported kernel precision " \
                   << PrecisionToStr(precision);        \
  }

  switch (target) {
    case TARGET(kHost): {
      CREATE_KERNEL(kHost);
    } break;
86
#if !defined(LITE_ON_TINY_PUBLISH) || defined(LITE_WITH_X86)
Y
Yan Chunwei 已提交
87 88 89
    case TARGET(kX86): {
      CREATE_KERNEL(kX86);
    } break;
90 91
#endif
#if !defined(LITE_ON_TINY_PUBLISH) || defined(LITE_WITH_CUDA)
Y
Yan Chunwei 已提交
92 93 94
    case TARGET(kCUDA): {
      CREATE_KERNEL(kCUDA);
    } break;
95 96
#endif
#if !defined(LITE_ON_TINY_PUBLISH) || defined(LITE_WITH_ARM)
Y
Yan Chunwei 已提交
97 98 99
    case TARGET(kARM): {
      CREATE_KERNEL(kARM);
    } break;
100 101
#endif
#if !defined(LITE_ON_TINY_PUBLISH) || defined(LITE_WITH_OPENCL)
Y
Yan Chunwei 已提交
102 103 104
    case TARGET(kOpenCL): {
      CREATE_KERNEL(kOpenCL);
    } break;
105 106
#endif
#if !defined(LITE_ON_TINY_PUBLISH) || defined(LITE_WITH_NPU)
Y
Yan Chunwei 已提交
107 108 109
    case TARGET(kNPU): {
      CREATE_KERNEL(kNPU);
    } break;
110 111
#endif
#if !defined(LITE_ON_TINY_PUBLISH) || defined(LITE_WITH_APU)
H
hong19860320 已提交
112 113 114
    case TARGET(kAPU): {
      CREATE_KERNEL(kAPU);
    } break;
115 116
#endif
#if !defined(LITE_ON_TINY_PUBLISH) || defined(LITE_WITH_XPU)
117 118 119
    case TARGET(kXPU): {
      CREATE_KERNEL(kXPU);
    } break;
120 121
#endif
#if !defined(LITE_ON_TINY_PUBLISH) || defined(LITE_WITH_FPGA)
Y
Yan Chunwei 已提交
122 123 124
    case TARGET(kFPGA): {
      CREATE_KERNEL(kFPGA);
    } break;
125 126
#endif
#if !defined(LITE_ON_TINY_PUBLISH) || defined(LITE_WITH_BM)
127 128 129
    case TARGET(kBM): {
      CREATE_KERNEL(kBM);
    } break;
130 131
#endif
#if !defined(LITE_ON_TINY_PUBLISH) || defined(LITE_WITH_MLU)
132 133 134
    case TARGET(kMLU): {
      CREATE_KERNEL(kMLU);
    } break;
135 136
#endif
#if !defined(LITE_ON_TINY_PUBLISH) || defined(LITE_WITH_RKNPU)
137 138 139
    case TARGET(kRKNPU): {
      CREATE_KERNEL(kRKNPU);
    } break;
140
#endif
Y
Yan Chunwei 已提交
141 142 143 144 145 146 147 148
    default:
      CHECK(false) << "not supported kernel target " << TargetToStr(target);
  }

#undef CREATE_KERNEL
  return std::list<std::unique_ptr<KernelBase>>();
}

149 150 151 152 153 154 155 156 157 158
// Fills `registries_` with one entry per supported
// (target, precision, layout) combination.
//
// Each entry stores a pointer to the instance returned by
// KernelRegistryForTarget<target, precision, layout>::Global(), keyed by the
// tuple of the three enum values. kHost combinations are always registered;
// every other target is registered only when LITE_ON_TINY_PUBLISH is not
// defined or when the corresponding LITE_WITH_* macro is defined.
KernelRegistry::KernelRegistry() : registries_() {
// Registers a single (target, precision, layout) combination. The macro has
// no trailing semicolon; each use supplies its own.
#define INIT_FOR(target__, precision__, layout__)            \
  registries_[std::make_tuple(TARGET(target__),              \
                              PRECISION(precision__),        \
                              DATALAYOUT(layout__))]         \
      .set<KernelRegistryForTarget<TARGET(target__),         \
                                   PRECISION(precision__),   \
                                   DATALAYOUT(layout__)> *>( \
          &KernelRegistryForTarget<TARGET(target__),         \
                                   PRECISION(precision__),   \
                                   DATALAYOUT(layout__)>::Global())

#if !defined(LITE_ON_TINY_PUBLISH) || defined(LITE_WITH_CUDA)
  INIT_FOR(kCUDA, kFloat, kNCHW);
  INIT_FOR(kCUDA, kFloat, kNHWC);
  INIT_FOR(kCUDA, kInt8, kNCHW);
  INIT_FOR(kCUDA, kFP16, kNCHW);
  INIT_FOR(kCUDA, kFP16, kNHWC);
  INIT_FOR(kCUDA, kAny, kNCHW);
  INIT_FOR(kCUDA, kAny, kAny);
  INIT_FOR(kCUDA, kInt8, kNHWC);
  INIT_FOR(kCUDA, kInt64, kNCHW);
  INIT_FOR(kCUDA, kInt64, kNHWC);
  INIT_FOR(kCUDA, kInt32, kNCHW);
  INIT_FOR(kCUDA, kInt32, kNHWC);
#endif

#if !defined(LITE_ON_TINY_PUBLISH) || defined(LITE_WITH_MLU)
  INIT_FOR(kMLU, kFloat, kNHWC);
  INIT_FOR(kMLU, kFloat, kNCHW);
  INIT_FOR(kMLU, kFP16, kNHWC);
  INIT_FOR(kMLU, kFP16, kNCHW);
  INIT_FOR(kMLU, kInt8, kNHWC);
  INIT_FOR(kMLU, kInt8, kNCHW);
  INIT_FOR(kMLU, kInt16, kNHWC);
  INIT_FOR(kMLU, kInt16, kNCHW);
#endif

  // Host kernels are registered unconditionally.
  INIT_FOR(kHost, kAny, kNCHW);
  INIT_FOR(kHost, kAny, kNHWC);
  INIT_FOR(kHost, kAny, kAny);
  INIT_FOR(kHost, kBool, kNCHW);
  INIT_FOR(kHost, kBool, kNHWC);
  INIT_FOR(kHost, kBool, kAny);
  INIT_FOR(kHost, kFloat, kNCHW);
  INIT_FOR(kHost, kFloat, kNHWC);
  INIT_FOR(kHost, kFloat, kAny);
  INIT_FOR(kHost, kFP16, kNCHW);
  INIT_FOR(kHost, kFP16, kNHWC);
  INIT_FOR(kHost, kFP16, kAny);
  INIT_FOR(kHost, kInt8, kNCHW);
  INIT_FOR(kHost, kInt8, kNHWC);
  INIT_FOR(kHost, kInt8, kAny);
  INIT_FOR(kHost, kInt16, kNCHW);
  INIT_FOR(kHost, kInt16, kNHWC);
  INIT_FOR(kHost, kInt16, kAny);
  INIT_FOR(kHost, kInt32, kNCHW);
  INIT_FOR(kHost, kInt32, kNHWC);
  INIT_FOR(kHost, kInt32, kAny);
  INIT_FOR(kHost, kInt64, kNCHW);
  INIT_FOR(kHost, kInt64, kNHWC);
  INIT_FOR(kHost, kInt64, kAny);

#if !defined(LITE_ON_TINY_PUBLISH) || defined(LITE_WITH_X86)
  INIT_FOR(kX86, kFloat, kNCHW);
  INIT_FOR(kX86, kAny, kNCHW);
  INIT_FOR(kX86, kAny, kAny);
  INIT_FOR(kX86, kInt64, kNCHW);
#endif

#if !defined(LITE_ON_TINY_PUBLISH) || defined(LITE_WITH_ARM)
  INIT_FOR(kARM, kFloat, kNCHW);
  INIT_FOR(kARM, kFloat, kNHWC);
  INIT_FOR(kARM, kInt8, kNCHW);
  INIT_FOR(kARM, kInt8, kNHWC);
  INIT_FOR(kARM, kAny, kNCHW);
  INIT_FOR(kARM, kAny, kAny);
  INIT_FOR(kARM, kInt32, kNCHW);
  INIT_FOR(kARM, kInt64, kNCHW);
#endif

#if !defined(LITE_ON_TINY_PUBLISH) || defined(LITE_WITH_OPENCL)
  INIT_FOR(kOpenCL, kFloat, kNCHW);
  INIT_FOR(kOpenCL, kFloat, kNHWC);
  INIT_FOR(kOpenCL, kAny, kNCHW);
  INIT_FOR(kOpenCL, kAny, kNHWC);
  INIT_FOR(kOpenCL, kFloat, kAny);
  INIT_FOR(kOpenCL, kInt8, kNCHW);
  INIT_FOR(kOpenCL, kAny, kAny);
  INIT_FOR(kOpenCL, kFP16, kNCHW);
  INIT_FOR(kOpenCL, kFP16, kNHWC);
  INIT_FOR(kOpenCL, kFP16, kImageDefault);
  INIT_FOR(kOpenCL, kFP16, kImageFolder);
  INIT_FOR(kOpenCL, kFP16, kImageNW);
  INIT_FOR(kOpenCL, kFloat, kImageDefault);
  INIT_FOR(kOpenCL, kFloat, kImageFolder);
  INIT_FOR(kOpenCL, kFloat, kImageNW);
  INIT_FOR(kOpenCL, kAny, kImageDefault);
  INIT_FOR(kOpenCL, kAny, kImageFolder);
  INIT_FOR(kOpenCL, kAny, kImageNW);
#endif

#if !defined(LITE_ON_TINY_PUBLISH) || defined(LITE_WITH_NPU)
  INIT_FOR(kNPU, kFloat, kNCHW);
  INIT_FOR(kNPU, kFloat, kNHWC);
  INIT_FOR(kNPU, kInt8, kNCHW);
  INIT_FOR(kNPU, kInt8, kNHWC);
  INIT_FOR(kNPU, kAny, kNCHW);
  INIT_FOR(kNPU, kAny, kNHWC);
  INIT_FOR(kNPU, kAny, kAny);
#endif

#if !defined(LITE_ON_TINY_PUBLISH) || defined(LITE_WITH_APU)
  INIT_FOR(kAPU, kInt8, kNCHW);
#endif

// kXPU has its own guard, matching the one used for the kXPU case in
// KernelRegistry::Create. Previously these registrations sat under the
// LITE_WITH_APU guard, so a tiny-publish build with XPU but without APU never
// registered them.
#if !defined(LITE_ON_TINY_PUBLISH) || defined(LITE_WITH_XPU)
  INIT_FOR(kXPU, kFloat, kNCHW);
  INIT_FOR(kXPU, kInt8, kNCHW);
  INIT_FOR(kXPU, kAny, kNCHW);
  INIT_FOR(kXPU, kAny, kAny);
#endif

#if !defined(LITE_ON_TINY_PUBLISH) || defined(LITE_WITH_FPGA)
  INIT_FOR(kFPGA, kFP16, kNHWC);
  INIT_FOR(kFPGA, kFP16, kAny);
  INIT_FOR(kFPGA, kFloat, kNHWC);
  INIT_FOR(kFPGA, kAny, kNHWC);
  INIT_FOR(kFPGA, kAny, kAny);
#endif

#if !defined(LITE_ON_TINY_PUBLISH) || defined(LITE_WITH_BM)
  INIT_FOR(kBM, kFloat, kNCHW);
  INIT_FOR(kBM, kInt8, kNCHW);
  INIT_FOR(kBM, kAny, kNCHW);
  INIT_FOR(kBM, kAny, kAny);
#endif

#if !defined(LITE_ON_TINY_PUBLISH) || defined(LITE_WITH_RKNPU)
  INIT_FOR(kRKNPU, kFloat, kNCHW);
  INIT_FOR(kRKNPU, kInt8, kNCHW);
  INIT_FOR(kRKNPU, kAny, kNCHW);
  INIT_FOR(kRKNPU, kAny, kAny);
#endif

#undef INIT_FOR
}

// Returns the shared KernelRegistry instance.
// The instance is heap-allocated the first time this function runs and is
// never deleted, so the returned reference stays valid for the remainder of
// the program.
KernelRegistry &KernelRegistry::Global() {
  static KernelRegistry *const instance = new KernelRegistry();
  return *instance;
}

}  // namespace lite
}  // namespace paddle