dynamic_loader.cc 10.5 KB
Newer Older
1
/* Copyright (c) 2016 PaddlePaddle Authors. All Rights Reserved.
Q
qijun 已提交
2 3 4 5 6 7 8 9 10 11 12 13

Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

    http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License. */
Y
Yi Wang 已提交
14
#include "paddle/fluid/platform/dynload/dynamic_loader.h"
15

Q
qijun 已提交
16
#include <memory>
17
#include <mutex>  // NOLINT
Q
qijun 已提交
18
#include <string>
19

Q
qijun 已提交
20 21
#include "gflags/gflags.h"
#include "glog/logging.h"
22
#include "paddle/fluid/platform/dynload/cupti_lib_path.h"
Y
Yi Wang 已提交
23
#include "paddle/fluid/platform/enforce.h"
D
dzhwinter 已提交
24
#include "paddle/fluid/platform/port.h"
Q
qijun 已提交
25 26 27 28 29 30 31 32

// Command-line flags that let the user override the directory searched for
// each dynamically loaded library. An empty value means "no override".

DEFINE_string(cudnn_dir, "",
              "Specify path for loading libcudnn.so. For instance, "
              "/usr/local/cudnn/lib. If empty [default], dlopen "
              "will search cudnn from LD_LIBRARY_PATH");

DEFINE_string(cuda_dir, "",
              "Specify path for loading cuda library, such as libcublas, "
              "libcurand, libcusolver. For instance, /usr/local/cuda/lib64. "
              "If default, dlopen will search cuda from LD_LIBRARY_PATH");

// The help text previously said "search cuda", copied from cuda_dir; this
// flag controls the nccl lookup.
DEFINE_string(nccl_dir, "",
              "Specify path for loading nccl library, such as libnccl.so. "
              "For instance, /usr/local/cuda/lib64. If default, "
              "dlopen will search nccl from LD_LIBRARY_PATH");

DEFINE_string(cupti_dir, "", "Specify path for loading cupti.so.");

DEFINE_string(
    tensorrt_dir, "",
    "Specify path for loading tensorrt library, such as libnvinfer.so.");

DEFINE_string(mklml_dir, "", "Specify path for loading libmklml_intel.so.");

DEFINE_string(op_dir, "", "Specify path for loading user-defined op library.");

Q
qijun 已提交
51 52
namespace paddle {
namespace platform {
Q
qijun 已提交
53
namespace dynload {
54 55 56 57 58 59

// Holder for a single filesystem path; the path starts out empty.
struct PathNode {
  PathNode() : path() {}
  std::string path;
};

60
static constexpr char cupti_lib_path[] = CUPTI_LIB_PATH;
61 62

static PathNode s_py_site_pkg_path;
63

P
peizhilin 已提交
64 65 66 67
// File names of the CUDA runtime DLLs on Windows. The version suffixes come
// from the PADDLE_CUDA_BINVER / PADDLE_CUDNN_BINVER macros, which are string
// literals concatenated at compile time.
// The pointee is `const char`: binding a string literal to a plain `char*`
// is ill-formed since C++11.
#if defined(_WIN32) && defined(PADDLE_WITH_CUDA)
static constexpr const char* win_cublas_lib =
    "cublas64_" PADDLE_CUDA_BINVER ".dll";
static constexpr const char* win_curand_lib =
    "curand64_" PADDLE_CUDA_BINVER ".dll";
static constexpr const char* win_cudnn_lib =
    "cudnn64_" PADDLE_CUDNN_BINVER ".dll";
static constexpr const char* win_cusolver_lib =
    "cusolver64_" PADDLE_CUDA_BINVER ".dll";
#endif

Q
qijun 已提交
72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88
// Concatenates two path fragments with a single '/' between them.
//
// If `part2` begins with '/', it is returned unchanged and `part1` is
// ignored. Otherwise the result is `part1`, followed by a '/' unless `part1`
// is empty or already ends with one, followed by `part2`.
static inline std::string join(const std::string& part1,
                               const std::string& part2) {
  constexpr char kSeparator = '/';

  // A second fragment that starts with the separator wins outright.
  const bool part2_is_rooted = !part2.empty() && part2.front() == kSeparator;
  if (part2_is_rooted) {
    return part2;
  }

  std::string joined;
  joined.reserve(part1.size() + part2.size() + 1);
  joined = part1;
  const bool needs_separator = !joined.empty() && joined.back() != kSeparator;
  if (needs_separator) {
    joined.push_back(kSeparator);
  }
  joined.append(part2);
  return joined;
}

89 90 91 92 93
// Records `py_site_pkg_path` in the file-level s_py_site_pkg_path holder and
// logs the new value at verbosity level 3.
void SetPaddleLibPath(const std::string& py_site_pkg_path) {
  std::string& stored_path = s_py_site_pkg_path.path;
  stored_path = py_site_pkg_path;
  VLOG(3) << "Set paddle lib path : " << stored_path;
}

94 95
static inline void* GetDsoHandleFromDefaultPath(const std::string& dso_path,
                                                int dynload_flags) {
M
minqiyang 已提交
96 97
  VLOG(3) << "Try to find library: " << dso_path
          << " from default system path.";
Q
qijun 已提交
98
  // default search from LD_LIBRARY_PATH/DYLD_LIBRARY_PATH
99
  // and /usr/local/lib path
100
  void* dso_handle = dlopen(dso_path.c_str(), dynload_flags);
Q
qijun 已提交
101 102 103 104 105

// DYLD_LIBRARY_PATH is disabled after Mac OS 10.11 to
// bring System Integrity Projection (SIP), if dso_handle
// is null, search from default package path in Mac OS.
#if defined(__APPLE__) || defined(__OSX__)
106 107 108 109
  if (nullptr == dso_handle) {
    dso_handle =
        dlopen(join("/usr/local/cuda/lib/", dso_path).c_str(), dynload_flags);
    if (nullptr == dso_handle) {
Q
qijun 已提交
110
      if (dso_path == "libcudnn.dylib") {
111 112 113 114 115
        LOG(WARNING) << "Note: [Recommend] copy cudnn into /usr/local/cuda/ \n "
                        "For instance, sudo tar -xzf "
                        "cudnn-7.5-osx-x64-v5.0-ga.tgz -C /usr/local \n sudo "
                        "chmod a+r /usr/local/cuda/include/cudnn.h "
                        "/usr/local/cuda/lib/libcudnn*";
Q
qijun 已提交
116 117 118 119
      }
    }
  }
#endif
120

121 122
  if (nullptr == dso_handle) {
    LOG(WARNING) << "Can not find library: " << dso_path
C
chengduo 已提交
123 124
                 << ". The process maybe hang. Please try to add the lib path "
                    "to LD_LIBRARY_PATH.";
125
  }
126
  return dso_handle;
Q
qijun 已提交
127 128
}

129 130 131
static inline void* GetDsoHandleFromSearchPath(const std::string& search_root,
                                               const std::string& dso_name,
                                               bool throw_on_error = true) {
D
dzhwinter 已提交
132
#if !defined(_WIN32)
Q
qijun 已提交
133
  int dynload_flags = RTLD_LAZY | RTLD_LOCAL;
D
dzhwinter 已提交
134 135 136
#else
  int dynload_flags = 0;
#endif  // !_WIN32
137
  void* dso_handle = nullptr;
Q
qijun 已提交
138 139 140

  std::string dlPath = dso_name;
  if (search_root.empty()) {
141
    dso_handle = GetDsoHandleFromDefaultPath(dlPath, dynload_flags);
Q
qijun 已提交
142 143 144
  } else {
    // search xxx.so from custom path
    dlPath = join(search_root, dso_name);
145
    dso_handle = dlopen(dlPath.c_str(), dynload_flags);
D
dzhwinter 已提交
146 147 148 149 150
#if !defined(_WIN32)
    auto errorno = dlerror();
#else
    auto errorno = GetLastError();
#endif  // !_WIN32
Q
qijun 已提交
151
    // if not found, search from default path
152
    if (nullptr == dso_handle) {
Q
qijun 已提交
153
      LOG(WARNING) << "Failed to find dynamic library: " << dlPath << " ("
D
dzhwinter 已提交
154
                   << errorno << ")";
J
JiabinYang 已提交
155 156 157 158 159 160
      if (dlPath.find("nccl") != std::string::npos) {
        std::cout
            << "You may need to install 'nccl2' from NVIDIA official website: "
            << "https://developer.nvidia.com/nccl/nccl-download"
            << "before install PaddlePaddle" << std::endl;
      }
Q
qijun 已提交
161
      dlPath = dso_name;
162
      dso_handle = GetDsoHandleFromDefaultPath(dlPath, dynload_flags);
Q
qijun 已提交
163 164
    }
  }
165 166 167 168 169 170 171 172
  auto error_msg =
      "Failed to find dynamic library: %s ( %s ) \n Please specify "
      "its path correctly using following ways: \n Method. set "
      "environment variable LD_LIBRARY_PATH on Linux or "
      "DYLD_LIBRARY_PATH on Mac OS. \n For instance, issue command: "
      "export LD_LIBRARY_PATH=... \n Note: After Mac OS 10.11, "
      "using the DYLD_LIBRARY_PATH is impossible unless System "
      "Integrity Protection (SIP) is disabled.";
D
dzhwinter 已提交
173 174 175 176 177
#if !defined(_WIN32)
  auto errorno = dlerror();
#else
  auto errorno = GetLastError();
#endif  // !_WIN32
178
  if (throw_on_error) {
D
dzhwinter 已提交
179
    PADDLE_ENFORCE(nullptr != dso_handle, error_msg, dlPath, errorno);
180
  } else if (nullptr == dso_handle) {
D
dzhwinter 已提交
181
    LOG(WARNING) << string::Sprintf(error_msg, dlPath, errorno);
182
  }
183 184

  return dso_handle;
Q
qijun 已提交
185 186
}

187
void* GetCublasDsoHandle() {
Q
qijun 已提交
188
#if defined(__APPLE__) || defined(__OSX__)
189
  return GetDsoHandleFromSearchPath(FLAGS_cuda_dir, "libcublas.dylib");
P
peizhilin 已提交
190 191
#elif defined(_WIN32) && defined(PADDLE_WITH_CUDA)
  return GetDsoHandleFromSearchPath(FLAGS_cuda_dir, win_cublas_lib);
Q
qijun 已提交
192
#else
193
  return GetDsoHandleFromSearchPath(FLAGS_cuda_dir, "libcublas.so");
Q
qijun 已提交
194 195 196
#endif
}

197
void* GetCUDNNDsoHandle() {
Q
qijun 已提交
198
#if defined(__APPLE__) || defined(__OSX__)
199
  return GetDsoHandleFromSearchPath(FLAGS_cudnn_dir, "libcudnn.dylib", false);
P
peizhilin 已提交
200 201
#elif defined(_WIN32) && defined(PADDLE_WITH_CUDA)
  return GetDsoHandleFromSearchPath(FLAGS_cudnn_dir, win_cudnn_lib);
Q
qijun 已提交
202
#else
203
  return GetDsoHandleFromSearchPath(FLAGS_cudnn_dir, "libcudnn.so", false);
Q
qijun 已提交
204 205 206
#endif
}

207
void* GetCUPTIDsoHandle() {
208 209 210 211 212
  std::string cupti_path = cupti_lib_path;
  if (!FLAGS_cupti_dir.empty()) {
    cupti_path = FLAGS_cupti_dir;
  }
#if defined(__APPLE__) || defined(__OSX__)
213
  return GetDsoHandleFromSearchPath(cupti_path, "libcupti.dylib", false);
214
#else
215
  return GetDsoHandleFromSearchPath(cupti_path, "libcupti.so", false);
216 217 218
#endif
}

219
void* GetCurandDsoHandle() {
Q
qijun 已提交
220
#if defined(__APPLE__) || defined(__OSX__)
221
  return GetDsoHandleFromSearchPath(FLAGS_cuda_dir, "libcurand.dylib");
P
peizhilin 已提交
222 223
#elif defined(_WIN32) && defined(PADDLE_WITH_CUDA)
  return GetDsoHandleFromSearchPath(FLAGS_cuda_dir, win_curand_lib);
Q
qijun 已提交
224
#else
225
  return GetDsoHandleFromSearchPath(FLAGS_cuda_dir, "libcurand.so");
Q
qijun 已提交
226 227 228
#endif
}

G
Guo Sheng 已提交
229 230 231 232
// Loads the cuSOLVER library, looking in FLAGS_cuda_dir first.
// On Windows builds with CUDA this always throws an Unavailable error instead
// of loading anything.
void* GetCusolverDsoHandle() {
#if defined(__APPLE__) || defined(__OSX__)
  const char* const lib_name = "libcusolver.dylib";
  return GetDsoHandleFromSearchPath(FLAGS_cuda_dir, lib_name);
#elif defined(_WIN32) && defined(PADDLE_WITH_CUDA)
  // TODO(guosheng): Fix cusolver support on windows.
  // return GetDsoHandleFromSearchPath(FLAGS_cuda_dir, win_cusolver_lib);
  PADDLE_THROW(platform::errors::Unavailable(
      "Cusolver loader cannot support Windows temporarily."));
#else
  const char* const lib_name = "libcusolver.so";
  return GetDsoHandleFromSearchPath(FLAGS_cuda_dir, lib_name);
#endif
}

242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257
// Loads the NVRTC library, looking in FLAGS_cuda_dir first. The default
// throw_on_error is used, so a failed load is enforced as an error.
void* GetNVRTCDsoHandle() {
#if defined(__APPLE__) || defined(__OSX__)
  const char* const lib_name = "libnvrtc.dylib";
#else
  const char* const lib_name = "libnvrtc.so";
#endif
  return GetDsoHandleFromSearchPath(FLAGS_cuda_dir, lib_name);
}

// Loads the CUDA driver library (libcuda), looking in FLAGS_cuda_dir first.
// The default throw_on_error is used, so a failed load is enforced as an
// error.
void* GetCUDADsoHandle() {
#if defined(__APPLE__) || defined(__OSX__)
  const char* const lib_name = "libcuda.dylib";
#else
  const char* const lib_name = "libcuda.so";
#endif
  return GetDsoHandleFromSearchPath(FLAGS_cuda_dir, lib_name);
}

258
void* GetWarpCTCDsoHandle() {
259 260 261
  std::string warpctc_dir = "";
  if (!s_py_site_pkg_path.path.empty()) {
    warpctc_dir = s_py_site_pkg_path.path;
262
  }
Q
qijun 已提交
263
#if defined(__APPLE__) || defined(__OSX__)
264
  return GetDsoHandleFromSearchPath(warpctc_dir, "libwarpctc.dylib");
P
peizhilin 已提交
265
#elif defined(_WIN32)
266
  return GetDsoHandleFromSearchPath(warpctc_dir, "warpctc.dll");
Q
qijun 已提交
267
#else
268
  return GetDsoHandleFromSearchPath(warpctc_dir, "libwarpctc.so");
Q
qijun 已提交
269 270 271
#endif
}

272
void* GetNCCLDsoHandle() {
Y
Yu Yang 已提交
273
#if defined(__APPLE__) || defined(__OSX__)
274
  return GetDsoHandleFromSearchPath(FLAGS_nccl_dir, "libnccl.dylib");
Y
Yu Yang 已提交
275
#else
276
  return GetDsoHandleFromSearchPath(FLAGS_nccl_dir, "libnccl.so");
Y
Yu Yang 已提交
277 278 279
#endif
}

Y
Yan Chunwei 已提交
280 281 282
// Loads the TensorRT inference library (nvinfer), looking in
// FLAGS_tensorrt_dir first. The default throw_on_error is used, so a failed
// load is enforced as an error.
//
// The Windows branch previously searched FLAGS_mklml_dir, which ignored the
// user's --tensorrt_dir setting; every platform now uses FLAGS_tensorrt_dir.
void* GetTensorRtDsoHandle() {
#if defined(__APPLE__) || defined(__OSX__)
  return GetDsoHandleFromSearchPath(FLAGS_tensorrt_dir, "libnvinfer.dylib");
#elif defined(_WIN32)
  return GetDsoHandleFromSearchPath(FLAGS_tensorrt_dir, "nvinfer.dll");
#else
  return GetDsoHandleFromSearchPath(FLAGS_tensorrt_dir, "libnvinfer.so");
#endif
}

290 291 292
// Loads the MKLML library, looking in FLAGS_mklml_dir first. The default
// throw_on_error is used, so a failed load is enforced as an error.
void* GetMKLMLDsoHandle() {
#if defined(__APPLE__) || defined(__OSX__)
  const char* const lib_name = "libmklml_intel.dylib";
#elif defined(_WIN32)
  const char* const lib_name = "mklml.dll";
#else
  const char* const lib_name = "libmklml_intel.so";
#endif
  return GetDsoHandleFromSearchPath(FLAGS_mklml_dir, lib_name);
}

300 301 302 303 304 305 306 307 308 309
// Loads a user-defined op library named `dso_name`, looking in FLAGS_op_dir
// first. Throws on Apple builds and on Windows builds with CUDA.
// NOTE(review): a Windows build without PADDLE_WITH_CUDA falls through to the
// generic branch even though the message says Windows is unsupported; confirm
// whether the guard should be `defined(_WIN32)` alone.
void* GetOpDsoHandle(const std::string& dso_name) {
#if defined(__APPLE__) || defined(__OSX__)
  PADDLE_THROW("Do not support Apple.");
#elif defined(_WIN32) && defined(PADDLE_WITH_CUDA)
  PADDLE_THROW("Do not support Windows.");
#else
  const std::string& op_search_root = FLAGS_op_dir;
  return GetDsoHandleFromSearchPath(op_search_root, dso_name);
#endif
}

Q
qijun 已提交
310
}  // namespace dynload
Q
qijun 已提交
311 312
}  // namespace platform
}  // namespace paddle