dynamic_loader.cc 10.6 KB
Newer Older
1
/* Copyright (c) 2016 PaddlePaddle Authors. All Rights Reserved.
Q
qijun 已提交
2 3 4 5 6 7 8 9 10 11 12 13

Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

    http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License. */
Y
Yi Wang 已提交
14
#include "paddle/fluid/platform/dynload/dynamic_loader.h"
15

Q
qijun 已提交
16
#include <memory>
17
#include <mutex>  // NOLINT
Q
qijun 已提交
18
#include <string>
19

Q
qijun 已提交
20 21
#include "gflags/gflags.h"
#include "glog/logging.h"
22
#include "paddle/fluid/platform/dynload/cupti_lib_path.h"
Y
Yi Wang 已提交
23
#include "paddle/fluid/platform/enforce.h"
D
dzhwinter 已提交
24
#include "paddle/fluid/platform/port.h"
Q
qijun 已提交
25 26 27 28 29 30 31 32

// Flag cudnn_dir: directory used as the search root when loading the cuDNN
// library (read by GetCUDNNDsoHandle). Defaults to the empty string.
DEFINE_string(cudnn_dir, "",
              "Specify path for loading libcudnn.so. For instance, "
              "/usr/local/cudnn/lib. If empty [default], dlopen "
              "will search cudnn from LD_LIBRARY_PATH");

// Flag cuda_dir: directory used as the search root by the cublas, curand,
// cusolver, nvrtc and cuda loaders in this file. Defaults to the empty string.
DEFINE_string(
    cuda_dir, "",
    "Specify path for loading cuda library, such as libcublas, "
    "libcurand, libcusolver. For instance, /usr/local/cuda/lib64. "
    "If default, dlopen will search cuda from LD_LIBRARY_PATH");
Q
qijun 已提交
35

Y
Yu Yang 已提交
36
// Flag nccl_dir: directory used as the search root when loading the NCCL
// library (read by GetNCCLDsoHandle). Defaults to the empty string.
DEFINE_string(nccl_dir, "",
              "Specify path for loading nccl library, such as libnccl.so. "
              "For instance, /usr/local/cuda/lib64. If default, "
              "dlopen will search nccl from LD_LIBRARY_PATH");

41 42
// Flag cupti_dir: when non-empty, overrides the compiled-in CUPTI library
// directory used by GetCUPTIDsoHandle.
DEFINE_string(cupti_dir, "", "Specify path for loading cupti.so.");

Y
Yan Chunwei 已提交
43 44 45 46
// Flag tensorrt_dir: directory used as the search root when loading the
// TensorRT (nvinfer) library. Defaults to the empty string.
DEFINE_string(
    tensorrt_dir, "",
    "Specify path for loading tensorrt library, such as libnvinfer.so.");

47 48
// Flag mklml_dir: directory used as the search root when loading the MKLML
// library (read by GetMKLMLDsoHandle). Defaults to the empty string.
DEFINE_string(mklml_dir, "", "Specify path for loading libmklml_intel.so.");

49 50
// Flag op_dir: directory used as the search root by GetOpDsoHandle when
// loading a user-defined operator library. Defaults to the empty string.
DEFINE_string(op_dir, "", "Specify path for loading user-defined op library.");

Q
qijun 已提交
51 52
namespace paddle {
namespace platform {
Q
qijun 已提交
53
namespace dynload {
54 55 56 57 58 59

// Small holder for a single path string; `path` starts out empty.
struct PathNode {
  PathNode() : path("") {}
  std::string path;
};

60
// Build-time CUPTI library directory (CUPTI_LIB_PATH); GetCUPTIDsoHandle uses
// it as the search root unless FLAGS_cupti_dir is set.
static constexpr char cupti_lib_path[] = CUPTI_LIB_PATH;
61
// Fallback cuDNN search directory used by GetCUDNNDsoHandle (in its branch
// that is neither Apple nor Windows+CUDA) when FLAGS_cudnn_dir is empty.
static constexpr char linux_cudnn_lib_path[] = "/usr/local/cuda/lib64";
62 63

// File-local path written by SetPaddleLibPath and read by GetWarpCTCDsoHandle
// as the search root for the warpctc library.
static PathNode s_py_site_pkg_path;
64

P
peizhilin 已提交
65 66 67 68
#if defined(_WIN32) && defined(PADDLE_WITH_CUDA)
// File names of the CUDA / cuDNN DLLs on Windows. The version suffix is spliced
// in from the PADDLE_CUDA_BINVER / PADDLE_CUDNN_BINVER macros.
// The pointee is declared const: binding a string literal to a plain `char*`
// is not valid C++11 and later.
static constexpr const char* win_cublas_lib =
    "cublas64_" PADDLE_CUDA_BINVER ".dll";
static constexpr const char* win_curand_lib =
    "curand64_" PADDLE_CUDA_BINVER ".dll";
static constexpr const char* win_cudnn_lib =
    "cudnn64_" PADDLE_CUDNN_BINVER ".dll";
static constexpr const char* win_cusolver_lib =
    "cusolver64_" PADDLE_CUDA_BINVER ".dll";
#endif

Q
qijun 已提交
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89
// Concatenates two path fragments using '/' as the separator.
//
// If `part2` begins with '/', it is returned unchanged and `part1` is ignored.
// Otherwise the result is `part1`, followed by a single '/' when `part1` is
// non-empty and does not already end with one, followed by `part2`.
static inline std::string join(const std::string& part1,
                               const std::string& part2) {
  constexpr char kSeparator = '/';

  const bool second_is_rooted = !part2.empty() && part2[0] == kSeparator;
  if (second_is_rooted) {
    return part2;
  }

  const bool needs_separator = !part1.empty() && part1.back() != kSeparator;

  std::string joined;
  joined.reserve(part1.size() + part2.size() + 1);
  joined.append(part1);
  if (needs_separator) {
    joined.push_back(kSeparator);
  }
  joined.append(part2);
  return joined;
}

90 91 92 93 94
// Stores `py_site_pkg_path` in the file-local s_py_site_pkg_path, which
// GetWarpCTCDsoHandle later reads as its search root, and logs the value at
// verbosity level 3.
void SetPaddleLibPath(const std::string& py_site_pkg_path) {
  VLOG(3) << "Set paddle lib path : " << py_site_pkg_path;
  s_py_site_pkg_path.path = py_site_pkg_path;
}

95 96
static inline void* GetDsoHandleFromDefaultPath(const std::string& dso_path,
                                                int dynload_flags) {
M
minqiyang 已提交
97 98
  VLOG(3) << "Try to find library: " << dso_path
          << " from default system path.";
Q
qijun 已提交
99
  // default search from LD_LIBRARY_PATH/DYLD_LIBRARY_PATH
100
  // and /usr/local/lib path
101
  void* dso_handle = dlopen(dso_path.c_str(), dynload_flags);
Q
qijun 已提交
102 103 104 105 106

// DYLD_LIBRARY_PATH is disabled after Mac OS 10.11 to
// bring System Integrity Projection (SIP), if dso_handle
// is null, search from default package path in Mac OS.
#if defined(__APPLE__) || defined(__OSX__)
107 108 109 110
  if (nullptr == dso_handle) {
    dso_handle =
        dlopen(join("/usr/local/cuda/lib/", dso_path).c_str(), dynload_flags);
    if (nullptr == dso_handle) {
Q
qijun 已提交
111
      if (dso_path == "libcudnn.dylib") {
112 113 114 115 116
        LOG(WARNING) << "Note: [Recommend] copy cudnn into /usr/local/cuda/ \n "
                        "For instance, sudo tar -xzf "
                        "cudnn-7.5-osx-x64-v5.0-ga.tgz -C /usr/local \n sudo "
                        "chmod a+r /usr/local/cuda/include/cudnn.h "
                        "/usr/local/cuda/lib/libcudnn*";
Q
qijun 已提交
117 118 119 120
      }
    }
  }
#endif
121

122 123
  if (nullptr == dso_handle) {
    LOG(WARNING) << "Can not find library: " << dso_path
C
chengduo 已提交
124 125
                 << ". The process maybe hang. Please try to add the lib path "
                    "to LD_LIBRARY_PATH.";
126
  }
127
  return dso_handle;
Q
qijun 已提交
128 129
}

130 131 132
static inline void* GetDsoHandleFromSearchPath(const std::string& search_root,
                                               const std::string& dso_name,
                                               bool throw_on_error = true) {
D
dzhwinter 已提交
133
#if !defined(_WIN32)
Q
qijun 已提交
134
  int dynload_flags = RTLD_LAZY | RTLD_LOCAL;
D
dzhwinter 已提交
135 136 137
#else
  int dynload_flags = 0;
#endif  // !_WIN32
138
  void* dso_handle = nullptr;
Q
qijun 已提交
139 140 141

  std::string dlPath = dso_name;
  if (search_root.empty()) {
142
    dso_handle = GetDsoHandleFromDefaultPath(dlPath, dynload_flags);
Q
qijun 已提交
143 144 145
  } else {
    // search xxx.so from custom path
    dlPath = join(search_root, dso_name);
146
    dso_handle = dlopen(dlPath.c_str(), dynload_flags);
D
dzhwinter 已提交
147 148 149 150 151
#if !defined(_WIN32)
    auto errorno = dlerror();
#else
    auto errorno = GetLastError();
#endif  // !_WIN32
Q
qijun 已提交
152
    // if not found, search from default path
153
    if (nullptr == dso_handle) {
Q
qijun 已提交
154
      LOG(WARNING) << "Failed to find dynamic library: " << dlPath << " ("
D
dzhwinter 已提交
155
                   << errorno << ")";
J
JiabinYang 已提交
156 157 158 159 160 161
      if (dlPath.find("nccl") != std::string::npos) {
        std::cout
            << "You may need to install 'nccl2' from NVIDIA official website: "
            << "https://developer.nvidia.com/nccl/nccl-download"
            << "before install PaddlePaddle" << std::endl;
      }
Q
qijun 已提交
162
      dlPath = dso_name;
163
      dso_handle = GetDsoHandleFromDefaultPath(dlPath, dynload_flags);
Q
qijun 已提交
164 165
    }
  }
166 167
  auto error_msg =
      "Failed to find dynamic library: %s ( %s ) \n Please specify "
168
      "its path correctly using following ways: \n   set "
169
      "environment variable LD_LIBRARY_PATH on Linux or "
170 171
      "DYLD_LIBRARY_PATH on Mac OS. \n   For instance, issue command: "
      "export LD_LIBRARY_PATH=... \n   Note: After Mac OS 10.11, "
172 173
      "using the DYLD_LIBRARY_PATH is impossible unless System "
      "Integrity Protection (SIP) is disabled.";
D
dzhwinter 已提交
174 175 176 177 178
#if !defined(_WIN32)
  auto errorno = dlerror();
#else
  auto errorno = GetLastError();
#endif  // !_WIN32
179
  if (throw_on_error) {
D
dzhwinter 已提交
180
    PADDLE_ENFORCE(nullptr != dso_handle, error_msg, dlPath, errorno);
181
  } else if (nullptr == dso_handle) {
D
dzhwinter 已提交
182
    LOG(WARNING) << string::Sprintf(error_msg, dlPath, errorno);
183
  }
184 185

  return dso_handle;
Q
qijun 已提交
186 187
}

188
void* GetCublasDsoHandle() {
Q
qijun 已提交
189
#if defined(__APPLE__) || defined(__OSX__)
190
  return GetDsoHandleFromSearchPath(FLAGS_cuda_dir, "libcublas.dylib");
P
peizhilin 已提交
191 192
#elif defined(_WIN32) && defined(PADDLE_WITH_CUDA)
  return GetDsoHandleFromSearchPath(FLAGS_cuda_dir, win_cublas_lib);
Q
qijun 已提交
193
#else
194
  return GetDsoHandleFromSearchPath(FLAGS_cuda_dir, "libcublas.so");
Q
qijun 已提交
195 196 197
#endif
}

198
void* GetCUDNNDsoHandle() {
Q
qijun 已提交
199
#if defined(__APPLE__) || defined(__OSX__)
200
  return GetDsoHandleFromSearchPath(FLAGS_cudnn_dir, "libcudnn.dylib", false);
P
peizhilin 已提交
201 202
#elif defined(_WIN32) && defined(PADDLE_WITH_CUDA)
  return GetDsoHandleFromSearchPath(FLAGS_cudnn_dir, win_cudnn_lib);
Q
qijun 已提交
203
#else
204 205 206 207 208
  std::string linux_cudnn_path = linux_cudnn_lib_path;
  if (!FLAGS_cudnn_dir.empty()) {
    linux_cudnn_path = FLAGS_cudnn_dir;
  }
  return GetDsoHandleFromSearchPath(linux_cudnn_path, "libcudnn.so", false);
Q
qijun 已提交
209 210 211
#endif
}

212
void* GetCUPTIDsoHandle() {
213 214 215 216 217
  std::string cupti_path = cupti_lib_path;
  if (!FLAGS_cupti_dir.empty()) {
    cupti_path = FLAGS_cupti_dir;
  }
#if defined(__APPLE__) || defined(__OSX__)
218
  return GetDsoHandleFromSearchPath(cupti_path, "libcupti.dylib", false);
219
#else
220
  return GetDsoHandleFromSearchPath(cupti_path, "libcupti.so", false);
221 222 223
#endif
}

224
void* GetCurandDsoHandle() {
Q
qijun 已提交
225
#if defined(__APPLE__) || defined(__OSX__)
226
  return GetDsoHandleFromSearchPath(FLAGS_cuda_dir, "libcurand.dylib");
P
peizhilin 已提交
227 228
#elif defined(_WIN32) && defined(PADDLE_WITH_CUDA)
  return GetDsoHandleFromSearchPath(FLAGS_cuda_dir, win_curand_lib);
Q
qijun 已提交
229
#else
230
  return GetDsoHandleFromSearchPath(FLAGS_cuda_dir, "libcurand.so");
Q
qijun 已提交
231 232 233
#endif
}

G
Guo Sheng 已提交
234 235 236 237
// Loads the cuSOLVER library, searching FLAGS_cuda_dir first. The file name is
// chosen per platform; errors are raised (default throw_on_error).
void* GetCusolverDsoHandle() {
#if defined(__APPLE__) || defined(__OSX__)
  const char* lib_name = "libcusolver.dylib";
#elif defined(_WIN32) && defined(PADDLE_WITH_CUDA)
  const char* lib_name = win_cusolver_lib;
#else
  const char* lib_name = "libcusolver.so";
#endif
  return GetDsoHandleFromSearchPath(FLAGS_cuda_dir, lib_name);
}

244 245
void* GetNVRTCDsoHandle() {
#if defined(__APPLE__) || defined(__OSX__)
246
  return GetDsoHandleFromSearchPath(FLAGS_cuda_dir, "libnvrtc.dylib", false);
247
#else
248
  return GetDsoHandleFromSearchPath(FLAGS_cuda_dir, "libnvrtc.so", false);
249 250 251 252 253
#endif
}

void* GetCUDADsoHandle() {
#if defined(__APPLE__) || defined(__OSX__)
254
  return GetDsoHandleFromSearchPath(FLAGS_cuda_dir, "libcuda.dylib", false);
255
#else
256
  return GetDsoHandleFromSearchPath(FLAGS_cuda_dir, "libcuda.so", false);
257 258 259
#endif
}

260
void* GetWarpCTCDsoHandle() {
261 262 263
  std::string warpctc_dir = "";
  if (!s_py_site_pkg_path.path.empty()) {
    warpctc_dir = s_py_site_pkg_path.path;
264
  }
Q
qijun 已提交
265
#if defined(__APPLE__) || defined(__OSX__)
266
  return GetDsoHandleFromSearchPath(warpctc_dir, "libwarpctc.dylib");
P
peizhilin 已提交
267
#elif defined(_WIN32)
268
  return GetDsoHandleFromSearchPath(warpctc_dir, "warpctc.dll");
Q
qijun 已提交
269
#else
270
  return GetDsoHandleFromSearchPath(warpctc_dir, "libwarpctc.so");
Q
qijun 已提交
271 272 273
#endif
}

274
void* GetNCCLDsoHandle() {
Y
Yu Yang 已提交
275
#if defined(__APPLE__) || defined(__OSX__)
276
  return GetDsoHandleFromSearchPath(FLAGS_nccl_dir, "libnccl.dylib");
Y
Yu Yang 已提交
277
#else
278
  return GetDsoHandleFromSearchPath(FLAGS_nccl_dir, "libnccl.so");
Y
Yu Yang 已提交
279 280 281
#endif
}

Y
Yan Chunwei 已提交
282 283 284
// Loads the TensorRT (nvinfer) library, searching FLAGS_tensorrt_dir first;
// errors are raised (default throw_on_error).
void* GetTensorRtDsoHandle() {
#if defined(__APPLE__) || defined(__OSX__)
  return GetDsoHandleFromSearchPath(FLAGS_tensorrt_dir, "libnvinfer.dylib");
#elif defined(_WIN32)
  // Use the TensorRT directory flag here as on the other platforms; the MKLML
  // directory has nothing to do with nvinfer.dll.
  return GetDsoHandleFromSearchPath(FLAGS_tensorrt_dir, "nvinfer.dll");
#else
  return GetDsoHandleFromSearchPath(FLAGS_tensorrt_dir, "libnvinfer.so");
#endif
}

292 293 294
// Loads the MKLML library, searching FLAGS_mklml_dir first. The file name is
// chosen per platform; errors are raised (default throw_on_error).
void* GetMKLMLDsoHandle() {
#if defined(__APPLE__) || defined(__OSX__)
  const char* lib_name = "libmklml_intel.dylib";
#elif defined(_WIN32)
  const char* lib_name = "mklml.dll";
#else
  const char* lib_name = "libmklml_intel.so";
#endif
  return GetDsoHandleFromSearchPath(FLAGS_mklml_dir, lib_name);
}

302 303 304 305 306 307 308 309 310 311
// Loads the user-defined operator library `dso_name`, searching FLAGS_op_dir
// first. Throws on Apple builds and on Windows builds with PADDLE_WITH_CUDA.
// NOTE(review): a Windows build without PADDLE_WITH_CUDA takes the generic
// branch below rather than throwing - confirm this is intended.
void* GetOpDsoHandle(const std::string& dso_name) {
#if defined(__APPLE__) || defined(__OSX__)
  PADDLE_THROW("Do not support Apple.");
#elif defined(_WIN32) && defined(PADDLE_WITH_CUDA)
  PADDLE_THROW("Do not support Windows.");
#else
  const std::string& op_search_root = FLAGS_op_dir;
  return GetDsoHandleFromSearchPath(op_search_root, dso_name);
#endif
}

Q
qijun 已提交
312
}  // namespace dynload
Q
qijun 已提交
313 314
}  // namespace platform
}  // namespace paddle