dynamic_loader.cc 14.0 KB
Newer Older
1
/* Copyright (c) 2016 PaddlePaddle Authors. All Rights Reserved.
Q
qijun 已提交
2 3 4 5 6 7 8 9 10 11 12 13

Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

    http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License. */
Y
Yi Wang 已提交
14
#include "paddle/fluid/platform/dynload/dynamic_loader.h"
15

Q
qijun 已提交
16
#include <string>
17
#include <vector>
18

Q
qijun 已提交
19 20
#include "gflags/gflags.h"
#include "glog/logging.h"
21
#include "paddle/fluid/platform/dynload/cupti_lib_path.h"
Y
Yi Wang 已提交
22
#include "paddle/fluid/platform/enforce.h"
Q
qijun 已提交
23 24 25 26 27 28 29 30

// Command-line flags that let the user point the loader at the directory
// holding each third-party library. An empty value means no user-specified
// directory is searched for that library.

// Directory containing the cuDNN library.
DEFINE_string(cudnn_dir, "",
              "Specify path for loading libcudnn.so. For instance, "
              "/usr/local/cudnn/lib. If empty [default], dlopen "
              "will search cudnn from LD_LIBRARY_PATH");

// Directory containing the CUDA toolkit libraries.
DEFINE_string(cuda_dir, "",
              "Specify path for loading cuda library, such as libcublas, "
              "libcurand, libcusolver. For instance, /usr/local/cuda/lib64. "
              "If default, dlopen will search cuda from LD_LIBRARY_PATH");

// Directory containing the NCCL library.
DEFINE_string(nccl_dir, "",
              "Specify path for loading nccl library, such as libnccl.so. "
              "For instance, /usr/local/cuda/lib64. If default, "
              "dlopen will search nccl from LD_LIBRARY_PATH");

// Directory containing the CUPTI library.
DEFINE_string(cupti_dir, "", "Specify path for loading cupti.so.");

// Directory containing the TensorRT library.
DEFINE_string(
    tensorrt_dir, "",
    "Specify path for loading tensorrt library, such as libnvinfer.so.");

// Directory containing the MKLML library.
DEFINE_string(mklml_dir, "", "Specify path for loading libmklml_intel.so.");

// Directory containing user-defined operator libraries.
DEFINE_string(op_dir, "", "Specify path for loading user-defined op library.");

Q
qijun 已提交
49 50
namespace paddle {
namespace platform {
Q
qijun 已提交
51
namespace dynload {
52 53 54 55 56 57

// Small holder for a single filesystem path. A freshly constructed node
// carries an empty path.
struct PathNode {
  PathNode() {}
  std::string path;
};

58
// Extra directory searched for the CUPTI library (passed as an extra search
// path by GetCUPTIDsoHandle). The value is taken from the CUPTI_LIB_PATH
// macro, which is not defined in this file.
static constexpr char cupti_lib_path[] = CUPTI_LIB_PATH;
59

60 61 62 63 64 65
// NOTE: Extra directory searched for CUDA libraries, chosen to match the
// default installation path of cuda: "<CUDA_TOOLKIT_ROOT_DIR>/bin" on Windows
// CUDA builds and "/usr/local/cuda/lib64" everywhere else.
#if defined(_WIN32) && defined(PADDLE_WITH_CUDA)
static constexpr char cuda_lib_path[] = CUDA_TOOLKIT_ROOT_DIR "/bin";
#else
static constexpr char cuda_lib_path[] = "/usr/local/cuda/lib64";
#endif
66 67

// Path stored by SetPaddleLibPath(). GetWarpCTCDsoHandle() uses it as the
// user-specified search directory; it is empty until SetPaddleLibPath() runs.
static PathNode s_py_site_pkg_path;
68

P
peizhilin 已提交
69
#if defined(_WIN32) && defined(PADDLE_WITH_CUDA)
// DLL file names of the CUDA libraries on Windows. Each constant may hold
// several candidate names separated by ';'; GetDsoHandleFromSearchPath splits
// the list and tries the candidates in order.
//
// The constants are pointers to const char: a string literal cannot legally
// initialize a plain `char*` in C++11 and later.
static constexpr const char* win_cudnn_lib =
    "cudnn64_" CUDNN_MAJOR_VERSION ".dll";
static constexpr const char* win_cublas_lib =
    "cublas64_" CUDA_VERSION_MAJOR CUDA_VERSION_MINOR
    ".dll;cublas64_" CUDA_VERSION_MAJOR ".dll";
#if CUDA_VERSION >= 11000
// For CUDA_VERSION >= 11000 the "_10" DLL names are appended as a final
// candidate.
static constexpr const char* win_curand_lib =
    "curand64_" CUDA_VERSION_MAJOR CUDA_VERSION_MINOR
    ".dll;curand64_" CUDA_VERSION_MAJOR ".dll;curand64_10.dll";
static constexpr const char* win_cusolver_lib =
    "cusolver64_" CUDA_VERSION_MAJOR CUDA_VERSION_MINOR
    ".dll;cusolver64_" CUDA_VERSION_MAJOR ".dll;cusolver64_10.dll";
#else
static constexpr const char* win_curand_lib =
    "curand64_" CUDA_VERSION_MAJOR CUDA_VERSION_MINOR
    ".dll;curand64_" CUDA_VERSION_MAJOR ".dll";
static constexpr const char* win_cusolver_lib =
    "cusolver64_" CUDA_VERSION_MAJOR CUDA_VERSION_MINOR
    ".dll;cusolver64_" CUDA_VERSION_MAJOR ".dll";
#endif  // CUDA_VERSION
#endif  // _WIN32 && PADDLE_WITH_CUDA

Q
qijun 已提交
91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107
// Concatenates two path fragments using '/' as the directory separator.
//
// If `part2` begins with '/', it is returned unchanged and `part1` is
// ignored. Otherwise the result is `part1`, followed by a single '/' when
// `part1` is non-empty and does not already end with one, followed by
// `part2`.
static inline std::string join(const std::string& part1,
                               const std::string& part2) {
  constexpr char kSeparator = '/';

  const bool part2_is_rooted = !part2.empty() && part2[0] == kSeparator;
  if (part2_is_rooted) {
    return part2;
  }

  std::string joined;
  joined.reserve(part1.size() + part2.size() + 1);
  joined.append(part1);
  const bool needs_separator =
      !joined.empty() && joined[joined.size() - 1] != kSeparator;
  if (needs_separator) {
    joined.push_back(kSeparator);
  }
  joined.append(part2);
  return joined;
}

108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125
// Splits `str` into the non-empty tokens delimited by any character contained
// in `separator` (a single space by default).
//
// Leading, trailing and repeated separators produce no empty tokens. An empty
// input, or one made only of separator characters, yields an empty vector.
static inline std::vector<std::string> split(
    const std::string& str, const std::string separator = " ") {
  std::vector<std::string> str_list;
  std::string::size_type first_pos = str.find_first_not_of(separator, 0);
  // Loop only while a token start exists, so substr() is never called with
  // npos as its position (that would throw std::out_of_range).
  while (std::string::npos != first_pos) {
    const std::string::size_type last_pos =
        str.find_first_of(separator, first_pos);
    // When last_pos is npos the count is clamped by substr(), giving the
    // remainder of the string.
    str_list.push_back(str.substr(first_pos, last_pos - first_pos));
    if (std::string::npos == last_pos) {
      break;
    }
    first_pos = str.find_first_not_of(separator, last_pos);
  }
  return str_list;
}

126 127 128 129 130
// Stores `py_site_pkg_path` in the file-level s_py_site_pkg_path so that later
// lookups in this file can use it as a search directory, and logs the new
// value at verbosity level 3.
void SetPaddleLibPath(const std::string& py_site_pkg_path) {
  s_py_site_pkg_path.path = py_site_pkg_path;
  VLOG(3) << "Set paddle lib path : " << py_site_pkg_path;
}

131 132 133 134 135 136 137 138 139 140 141 142 143 144
// Tries to open `dso_name` inside the directory `spec_path`.
//
// Returns nullptr without touching the loader when `spec_path` is empty;
// otherwise returns whatever dlopen() yields for the joined path (nullptr on
// failure).
static inline void* GetDsoHandleFromSpecificPath(const std::string& spec_path,
                                                 const std::string& dso_name,
                                                 int dynload_flags) {
  if (spec_path.empty()) {
    return nullptr;
  }
  // search xxx.so from custom path
  VLOG(3) << "Try to find library: " << dso_name
          << " from specific path: " << spec_path;
  const std::string full_path = join(spec_path, dso_name);
  return dlopen(full_path.c_str(), dynload_flags);
}

145 146
static inline void* GetDsoHandleFromDefaultPath(const std::string& dso_path,
                                                int dynload_flags) {
Q
qijun 已提交
147
  // default search from LD_LIBRARY_PATH/DYLD_LIBRARY_PATH
148
  // and /usr/local/lib path
149
  void* dso_handle = dlopen(dso_path.c_str(), dynload_flags);
150 151
  VLOG(3) << "Try to find library: " << dso_path
          << " from default system path.";
Q
qijun 已提交
152

153
// TODO(chenweihang): This path is used to search which libs?
Q
qijun 已提交
154 155 156 157
// DYLD_LIBRARY_PATH is disabled after Mac OS 10.11 to
// bring System Integrity Projection (SIP), if dso_handle
// is null, search from default package path in Mac OS.
#if defined(__APPLE__) || defined(__OSX__)
158 159 160
  if (nullptr == dso_handle) {
    dso_handle =
        dlopen(join("/usr/local/cuda/lib/", dso_path).c_str(), dynload_flags);
Q
qijun 已提交
161 162
  }
#endif
163 164

  return dso_handle;
Q
qijun 已提交
165 166
}

167 168 169 170 171 172 173 174 175 176 177 178 179 180
/*
 * We define three priorities for dynamic library search:
 *
 * First: Search for the path specified by the user
 * Second: Search the system default path
 * Third: Search for a special path corresponding to
 *        a specific library to adapt to changes and easy to expand.
 */

static inline void* GetDsoHandleFromSearchPath(
    const std::string& config_path, const std::string& dso_name,
    bool throw_on_error = true,
    const std::vector<std::string>& extra_paths = std::vector<std::string>(),
    const std::string& warning_msg = std::string()) {
D
dzhwinter 已提交
181
#if !defined(_WIN32)
Q
qijun 已提交
182
  int dynload_flags = RTLD_LAZY | RTLD_LOCAL;
D
dzhwinter 已提交
183 184 185
#else
  int dynload_flags = 0;
#endif  // !_WIN32
186 187 188 189 190 191 192 193 194 195 196 197 198 199 200
  std::vector<std::string> dso_names = split(dso_name, ";");
  void* dso_handle = nullptr;
  for (auto dso : dso_names) {
    // 1. search in user config path by FLAGS
    dso_handle = GetDsoHandleFromSpecificPath(config_path, dso, dynload_flags);
    // 2. search in extra paths
    if (nullptr == dso_handle) {
      for (auto path : extra_paths) {
        VLOG(3) << "extra_paths: " << path;
        dso_handle = GetDsoHandleFromSpecificPath(path, dso, dynload_flags);
      }
    }
    // 3. search in system default path
    if (nullptr == dso_handle) {
      dso_handle = GetDsoHandleFromDefaultPath(dso, dynload_flags);
201
    }
202
    if (nullptr != dso_handle) break;
203
  }
Q
qijun 已提交
204

205
  // 4. [If Failed for All dso_names] logging warning if exists
206 207 208 209
  if (nullptr == dso_handle && !warning_msg.empty()) {
    LOG(WARNING) << warning_msg;
  }

210
  // 5. [If Failed for All dso_names] logging or throw error info
211 212
  if (nullptr == dso_handle) {
    auto error_msg =
213 214 215 216 217 218 219 220 221 222 223 224 225
        "The third-party dynamic library (%s) that Paddle depends on is not "
        "configured correctly. (error code is %s)\n"
        "  Suggestions:\n"
        "  1. Check if the third-party dynamic library (e.g. CUDA, CUDNN) "
        "is installed correctly and its version is matched with paddlepaddle "
        "you installed.\n"
        "  2. Configure third-party dynamic library environment variables as "
        "follows:\n"
        "  - Linux: set LD_LIBRARY_PATH by `export LD_LIBRARY_PATH=...`\n"
        "  - Windows: set PATH by `set PATH=XXX;%PATH%`\n"
        "  - Mac: set  DYLD_LIBRARY_PATH by `export DYLD_LIBRARY_PATH=...` "
        "[Note: After Mac OS 10.11, using the DYLD_LIBRARY_PATH is "
        "impossible unless System Integrity Protection (SIP) is disabled.]";
D
dzhwinter 已提交
226 227 228 229 230
#if !defined(_WIN32)
    auto errorno = dlerror();
#else
    auto errorno = GetLastError();
#endif  // !_WIN32
231 232
    if (throw_on_error) {
      // NOTE: Special error report case, no need to change its format
233 234
      PADDLE_THROW(
          platform::errors::PreconditionNotMet(error_msg, dso_name, errorno));
235 236
    } else {
      LOG(WARNING) << string::Sprintf(error_msg, dso_name, errorno);
Q
qijun 已提交
237 238
    }
  }
239 240

  return dso_handle;
Q
qijun 已提交
241 242
}

243
void* GetCublasDsoHandle() {
Q
qijun 已提交
244
#if defined(__APPLE__) || defined(__OSX__)
245
  return GetDsoHandleFromSearchPath(FLAGS_cuda_dir, "libcublas.dylib");
P
peizhilin 已提交
246
#elif defined(_WIN32) && defined(PADDLE_WITH_CUDA)
247 248
  return GetDsoHandleFromSearchPath(FLAGS_cuda_dir, win_cublas_lib, true,
                                    {cuda_lib_path});
Q
qijun 已提交
249
#else
250
  return GetDsoHandleFromSearchPath(FLAGS_cuda_dir, "libcublas.so");
Q
qijun 已提交
251 252 253
#endif
}

254
void* GetCUDNNDsoHandle() {
Q
qijun 已提交
255
#if defined(__APPLE__) || defined(__OSX__)
256 257 258 259 260 261 262 263
  std::string mac_warn_meg(
      "Note: [Recommend] copy cudnn into /usr/local/cuda/ \n "
      "For instance, sudo tar -xzf "
      "cudnn-7.5-osx-x64-v5.0-ga.tgz -C /usr/local \n sudo "
      "chmod a+r /usr/local/cuda/include/cudnn.h "
      "/usr/local/cuda/lib/libcudnn*");
  return GetDsoHandleFromSearchPath(FLAGS_cudnn_dir, "libcudnn.dylib", false,
                                    {}, mac_warn_meg);
P
peizhilin 已提交
264
#elif defined(_WIN32) && defined(PADDLE_WITH_CUDA)
265 266 267 268 269 270 271 272 273 274
  std::string win_warn_meg(
      "Note: [Recommend] copy cudnn into CUDA installation directory. \n "
      "For instance, download cudnn-10.0-windows10-x64-v7.6.5.32.zip from "
      "NVIDIA's official website, \n"
      "then, unzip it and copy it into C:\\Program Files\\NVIDIA GPU Computing "
      "Toolkit\\CUDA/v10.0\n"
      "You should do this according to your CUDA installation directory and "
      "CUDNN version.");
  return GetDsoHandleFromSearchPath(FLAGS_cudnn_dir, win_cudnn_lib, true,
                                    {cuda_lib_path}, win_warn_meg);
Q
qijun 已提交
275
#else
276
  return GetDsoHandleFromSearchPath(FLAGS_cudnn_dir, "libcudnn.so", false,
277
                                    {cuda_lib_path});
Q
qijun 已提交
278 279 280
#endif
}

281
void* GetCUPTIDsoHandle() {
282
#if defined(__APPLE__) || defined(__OSX__)
283 284
  return GetDsoHandleFromSearchPath(FLAGS_cupti_dir, "libcupti.dylib", false,
                                    {cupti_lib_path});
285
#else
286 287
  return GetDsoHandleFromSearchPath(FLAGS_cupti_dir, "libcupti.so", false,
                                    {cupti_lib_path});
288 289 290
#endif
}

291
void* GetCurandDsoHandle() {
Q
qijun 已提交
292
#if defined(__APPLE__) || defined(__OSX__)
293
  return GetDsoHandleFromSearchPath(FLAGS_cuda_dir, "libcurand.dylib");
P
peizhilin 已提交
294
#elif defined(_WIN32) && defined(PADDLE_WITH_CUDA)
295 296
  return GetDsoHandleFromSearchPath(FLAGS_cuda_dir, win_curand_lib, true,
                                    {cuda_lib_path});
Q
qijun 已提交
297
#else
298
  return GetDsoHandleFromSearchPath(FLAGS_cuda_dir, "libcurand.so");
Q
qijun 已提交
299 300 301
#endif
}

G
Guo Sheng 已提交
302 303 304 305
// Loads the cuSOLVER library, looking in FLAGS_cuda_dir first. On Windows
// CUDA builds cuda_lib_path is searched as well. A load failure raises an
// error.
void* GetCusolverDsoHandle() {
#if defined(__APPLE__) || defined(__OSX__)
  const char* const lib_name = "libcusolver.dylib";
  const std::vector<std::string> fallback_dirs;
#elif defined(_WIN32) && defined(PADDLE_WITH_CUDA)
  const char* const lib_name = win_cusolver_lib;
  const std::vector<std::string> fallback_dirs = {cuda_lib_path};
#else
  const char* const lib_name = "libcusolver.so";
  const std::vector<std::string> fallback_dirs;
#endif
  return GetDsoHandleFromSearchPath(FLAGS_cuda_dir, lib_name, true,
                                    fallback_dirs);
}

313 314
void* GetNVRTCDsoHandle() {
#if defined(__APPLE__) || defined(__OSX__)
315
  return GetDsoHandleFromSearchPath(FLAGS_cuda_dir, "libnvrtc.dylib", false);
316
#else
317
  return GetDsoHandleFromSearchPath(FLAGS_cuda_dir, "libnvrtc.so", false);
318 319 320 321 322
#endif
}

void* GetCUDADsoHandle() {
#if defined(__APPLE__) || defined(__OSX__)
323
  return GetDsoHandleFromSearchPath(FLAGS_cuda_dir, "libcuda.dylib", false);
324
#else
325
  return GetDsoHandleFromSearchPath(FLAGS_cuda_dir, "libcuda.so", false);
326 327 328
#endif
}

329
void* GetWarpCTCDsoHandle() {
330 331 332
  std::string warpctc_dir = "";
  if (!s_py_site_pkg_path.path.empty()) {
    warpctc_dir = s_py_site_pkg_path.path;
333
  }
Q
qijun 已提交
334
#if defined(__APPLE__) || defined(__OSX__)
335
  return GetDsoHandleFromSearchPath(warpctc_dir, "libwarpctc.dylib");
P
peizhilin 已提交
336
#elif defined(_WIN32)
337
  return GetDsoHandleFromSearchPath(warpctc_dir, "warpctc.dll");
Q
qijun 已提交
338
#else
339
  return GetDsoHandleFromSearchPath(warpctc_dir, "libwarpctc.so");
Q
qijun 已提交
340 341 342
#endif
}

343
void* GetNCCLDsoHandle() {
344 345 346 347
  std::string warning_msg(
      "You may need to install 'nccl2' from NVIDIA official website: "
      "https://developer.nvidia.com/nccl/nccl-download"
      "before install PaddlePaddle.");
Y
Yu Yang 已提交
348
#if defined(__APPLE__) || defined(__OSX__)
349 350
  return GetDsoHandleFromSearchPath(FLAGS_nccl_dir, "libnccl.dylib", true, {},
                                    warning_msg);
Y
Yu Yang 已提交
351
#else
352 353
  return GetDsoHandleFromSearchPath(FLAGS_nccl_dir, "libnccl.so", true, {},
                                    warning_msg);
Y
Yu Yang 已提交
354 355 356
#endif
}

Y
Yan Chunwei 已提交
357 358 359
// Loads the TensorRT (nvinfer) library, looking in FLAGS_tensorrt_dir first
// on every platform. A load failure raises an error.
void* GetTensorRtDsoHandle() {
#if defined(__APPLE__) || defined(__OSX__)
  return GetDsoHandleFromSearchPath(FLAGS_tensorrt_dir, "libnvinfer.dylib");
#elif defined(_WIN32)
  // Use the TensorRT flag here as well, not the MKLML directory.
  return GetDsoHandleFromSearchPath(FLAGS_tensorrt_dir, "nvinfer.dll");
#else
  return GetDsoHandleFromSearchPath(FLAGS_tensorrt_dir, "libnvinfer.so");
#endif
}

367 368 369
// Loads the MKLML library, looking in FLAGS_mklml_dir first. A load failure
// raises an error.
void* GetMKLMLDsoHandle() {
#if defined(__APPLE__) || defined(__OSX__)
  const char* const lib_name = "libmklml_intel.dylib";
#elif defined(_WIN32)
  const char* const lib_name = "mklml.dll";
#else
  const char* const lib_name = "libmklml_intel.so";
#endif
  return GetDsoHandleFromSearchPath(FLAGS_mklml_dir, lib_name);
}

377 378
// Loads the user-defined operator library `dso_name`, looking in FLAGS_op_dir
// first.
//
// Apple builds and Windows CUDA builds do not load anything: they raise an
// Unimplemented error instead. On other builds a load failure raises an
// error from the search helper.
void* GetOpDsoHandle(const std::string& dso_name) {
#if defined(__APPLE__) || defined(__OSX__)
  PADDLE_THROW(platform::errors::Unimplemented(
      "Create custom cpp op outside framework do not support Apple."));
#elif defined(_WIN32) && defined(PADDLE_WITH_CUDA)
  PADDLE_THROW(platform::errors::Unimplemented(
      "Create custom cpp op outside framework do not support Windows."));
#else
  void* const op_handle = GetDsoHandleFromSearchPath(FLAGS_op_dir, dso_name);
  return op_handle;
#endif
}

Q
qijun 已提交
389
}  // namespace dynload
Q
qijun 已提交
390 391
}  // namespace platform
}  // namespace paddle