dynamic_loader.cc 10.3 KB
Newer Older
1
/* Copyright (c) 2016 PaddlePaddle Authors. All Rights Reserved.
Q
qijun 已提交
2 3 4 5 6 7 8 9 10 11 12 13

Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

    http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License. */
Y
Yi Wang 已提交
14
#include "paddle/fluid/platform/dynload/dynamic_loader.h"
15

Q
qijun 已提交
16
#include <memory>
17
#include <mutex>  // NOLINT
Q
qijun 已提交
18
#include <string>
19

Q
qijun 已提交
20 21
#include "gflags/gflags.h"
#include "glog/logging.h"
22
#include "paddle/fluid/platform/dynload/cupti_lib_path.h"
Y
Yi Wang 已提交
23
#include "paddle/fluid/platform/enforce.h"
D
dzhwinter 已提交
24
#include "paddle/fluid/platform/port.h"
Q
qijun 已提交
25 26 27 28 29 30 31 32 33 34 35

// Command-line flags naming the directories that are searched first when the
// corresponding shared library is loaded. Every flag defaults to the empty
// string; the loaders below then fall back to the default search path.

DEFINE_string(cudnn_dir, "",
              "Specify path for loading libcudnn.so. For instance, "
              "/usr/local/cudnn/lib. If empty [default], dlopen "
              "will search cudnn from LD_LIBRARY_PATH");

DEFINE_string(cuda_dir, "",
              "Specify path for loading cuda library, such as libcublas, "
              "libcurand. For instance, /usr/local/cuda/lib64. If default, "
              "dlopen will search cuda from LD_LIBRARY_PATH");

// The help text previously duplicated the cuda_dir description (libcublas,
// libcurand, "search cuda"); it now describes the nccl library this flag
// actually controls.
DEFINE_string(nccl_dir, "",
              "Specify path for loading nccl library, such as libnccl.so. "
              "For instance, /usr/local/nccl/lib. If empty [default], "
              "dlopen will search nccl from LD_LIBRARY_PATH");

DEFINE_string(cupti_dir, "", "Specify path for loading cupti.so.");

DEFINE_string(
    tensorrt_dir, "",
    "Specify path for loading tensorrt library, such as libnvinfer.so.");

DEFINE_string(mklml_dir, "", "Specify path for loading libmklml_intel.so.");

DEFINE_string(op_dir, "", "Specify path for loading user-defined op library.");

Q
qijun 已提交
51 52
namespace paddle {
namespace platform {
Q
qijun 已提交
53
namespace dynload {
54 55 56 57 58 59

// Small holder for a single path string. A freshly constructed node carries
// an empty path.
struct PathNode {
  PathNode() = default;

  std::string path;
};

60
// Search root used by GetCUPTIDsoHandle() when FLAGS_cupti_dir is empty. The
// value is whatever the CUPTI_LIB_PATH macro expands to (presumably provided
// by cupti_lib_path.h -- confirm).
static constexpr char cupti_lib_path[] = CUPTI_LIB_PATH;
61 62

// Path recorded by SetPaddleLibPath(); GetWarpCTCDsoHandle() uses it as the
// search root for the warpctc library. Empty until SetPaddleLibPath() runs.
static PathNode s_py_site_pkg_path;
63

P
peizhilin 已提交
64 65 66 67 68 69
#if defined(_WIN32) && defined(PADDLE_WITH_CUDA)
// File names of the CUDA DLLs on Windows. The version suffix is spliced in at
// compile time from PADDLE_CUDA_BINVER / PADDLE_CUDNN_BINVER.
//
// The pointers are declared `const char*` because they point at string
// literals; binding a literal to a plain `char*` is not valid standard C++.
static constexpr const char* win_cublas_lib =
    "cublas64_" PADDLE_CUDA_BINVER ".dll";
static constexpr const char* win_curand_lib =
    "curand64_" PADDLE_CUDA_BINVER ".dll";
static constexpr const char* win_cudnn_lib =
    "cudnn64_" PADDLE_CUDNN_BINVER ".dll";
// Referenced by GetCusolverDsoHandle(); it was previously used without ever
// being defined, which broke Windows CUDA builds.
static constexpr const char* win_cusolver_lib =
    "cusolver64_" PADDLE_CUDA_BINVER ".dll";
#endif

Q
qijun 已提交
70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86
// Joins two path components with '/'.
//
// - If `part2` begins with '/', it is treated as absolute and returned as is.
// - Otherwise the result is `part1`, a single '/' (added only when `part1` is
//   non-empty and does not already end with one), then `part2`.
static inline std::string join(const std::string& part1,
                               const std::string& part2) {
  constexpr char kSeparator = '/';

  const bool second_is_absolute = !part2.empty() && part2[0] == kSeparator;
  if (second_is_absolute) {
    return part2;
  }

  std::string joined;
  joined.reserve(part1.size() + part2.size() + 1);
  joined.append(part1);

  const bool needs_separator = !joined.empty() && joined.back() != kSeparator;
  if (needs_separator) {
    joined.push_back(kSeparator);
  }

  joined.append(part2);
  return joined;
}

87 88 89 90 91
// Records `py_site_pkg_path` in the file-level s_py_site_pkg_path node and
// logs the new value at verbosity level 3.
void SetPaddleLibPath(const std::string& py_site_pkg_path) {
  std::string& stored_path = s_py_site_pkg_path.path;
  stored_path = py_site_pkg_path;
  VLOG(3) << "Set paddle lib path : " << py_site_pkg_path;
}

92 93
static inline void* GetDsoHandleFromDefaultPath(const std::string& dso_path,
                                                int dynload_flags) {
M
minqiyang 已提交
94 95
  VLOG(3) << "Try to find library: " << dso_path
          << " from default system path.";
Q
qijun 已提交
96
  // default search from LD_LIBRARY_PATH/DYLD_LIBRARY_PATH
97
  // and /usr/local/lib path
98
  void* dso_handle = dlopen(dso_path.c_str(), dynload_flags);
Q
qijun 已提交
99 100 101 102 103

// DYLD_LIBRARY_PATH is disabled after Mac OS 10.11 to
// bring System Integrity Projection (SIP), if dso_handle
// is null, search from default package path in Mac OS.
#if defined(__APPLE__) || defined(__OSX__)
104 105 106 107
  if (nullptr == dso_handle) {
    dso_handle =
        dlopen(join("/usr/local/cuda/lib/", dso_path).c_str(), dynload_flags);
    if (nullptr == dso_handle) {
Q
qijun 已提交
108
      if (dso_path == "libcudnn.dylib") {
109 110 111 112 113
        LOG(WARNING) << "Note: [Recommend] copy cudnn into /usr/local/cuda/ \n "
                        "For instance, sudo tar -xzf "
                        "cudnn-7.5-osx-x64-v5.0-ga.tgz -C /usr/local \n sudo "
                        "chmod a+r /usr/local/cuda/include/cudnn.h "
                        "/usr/local/cuda/lib/libcudnn*";
Q
qijun 已提交
114 115 116 117
      }
    }
  }
#endif
118

119 120
  if (nullptr == dso_handle) {
    LOG(WARNING) << "Can not find library: " << dso_path
C
chengduo 已提交
121 122
                 << ". The process maybe hang. Please try to add the lib path "
                    "to LD_LIBRARY_PATH.";
123
  }
124
  return dso_handle;
Q
qijun 已提交
125 126
}

127 128 129
static inline void* GetDsoHandleFromSearchPath(const std::string& search_root,
                                               const std::string& dso_name,
                                               bool throw_on_error = true) {
D
dzhwinter 已提交
130
#if !defined(_WIN32)
Q
qijun 已提交
131
  int dynload_flags = RTLD_LAZY | RTLD_LOCAL;
D
dzhwinter 已提交
132 133 134
#else
  int dynload_flags = 0;
#endif  // !_WIN32
135
  void* dso_handle = nullptr;
Q
qijun 已提交
136 137 138

  std::string dlPath = dso_name;
  if (search_root.empty()) {
139
    dso_handle = GetDsoHandleFromDefaultPath(dlPath, dynload_flags);
Q
qijun 已提交
140 141 142
  } else {
    // search xxx.so from custom path
    dlPath = join(search_root, dso_name);
143
    dso_handle = dlopen(dlPath.c_str(), dynload_flags);
D
dzhwinter 已提交
144 145 146 147 148
#if !defined(_WIN32)
    auto errorno = dlerror();
#else
    auto errorno = GetLastError();
#endif  // !_WIN32
Q
qijun 已提交
149
    // if not found, search from default path
150
    if (nullptr == dso_handle) {
Q
qijun 已提交
151
      LOG(WARNING) << "Failed to find dynamic library: " << dlPath << " ("
D
dzhwinter 已提交
152
                   << errorno << ")";
J
JiabinYang 已提交
153 154 155 156 157 158
      if (dlPath.find("nccl") != std::string::npos) {
        std::cout
            << "You may need to install 'nccl2' from NVIDIA official website: "
            << "https://developer.nvidia.com/nccl/nccl-download"
            << "before install PaddlePaddle" << std::endl;
      }
Q
qijun 已提交
159
      dlPath = dso_name;
160
      dso_handle = GetDsoHandleFromDefaultPath(dlPath, dynload_flags);
Q
qijun 已提交
161 162
    }
  }
163 164 165 166 167 168 169 170
  auto error_msg =
      "Failed to find dynamic library: %s ( %s ) \n Please specify "
      "its path correctly using following ways: \n Method. set "
      "environment variable LD_LIBRARY_PATH on Linux or "
      "DYLD_LIBRARY_PATH on Mac OS. \n For instance, issue command: "
      "export LD_LIBRARY_PATH=... \n Note: After Mac OS 10.11, "
      "using the DYLD_LIBRARY_PATH is impossible unless System "
      "Integrity Protection (SIP) is disabled.";
D
dzhwinter 已提交
171 172 173 174 175
#if !defined(_WIN32)
  auto errorno = dlerror();
#else
  auto errorno = GetLastError();
#endif  // !_WIN32
176
  if (throw_on_error) {
D
dzhwinter 已提交
177
    PADDLE_ENFORCE(nullptr != dso_handle, error_msg, dlPath, errorno);
178
  } else if (nullptr == dso_handle) {
D
dzhwinter 已提交
179
    LOG(WARNING) << string::Sprintf(error_msg, dlPath, errorno);
180
  }
181 182

  return dso_handle;
Q
qijun 已提交
183 184
}

185
void* GetCublasDsoHandle() {
Q
qijun 已提交
186
#if defined(__APPLE__) || defined(__OSX__)
187
  return GetDsoHandleFromSearchPath(FLAGS_cuda_dir, "libcublas.dylib");
P
peizhilin 已提交
188 189
#elif defined(_WIN32) && defined(PADDLE_WITH_CUDA)
  return GetDsoHandleFromSearchPath(FLAGS_cuda_dir, win_cublas_lib);
Q
qijun 已提交
190
#else
191
  return GetDsoHandleFromSearchPath(FLAGS_cuda_dir, "libcublas.so");
Q
qijun 已提交
192 193 194
#endif
}

195
void* GetCUDNNDsoHandle() {
Q
qijun 已提交
196
#if defined(__APPLE__) || defined(__OSX__)
197
  return GetDsoHandleFromSearchPath(FLAGS_cudnn_dir, "libcudnn.dylib", false);
P
peizhilin 已提交
198 199
#elif defined(_WIN32) && defined(PADDLE_WITH_CUDA)
  return GetDsoHandleFromSearchPath(FLAGS_cudnn_dir, win_cudnn_lib);
Q
qijun 已提交
200
#else
201
  return GetDsoHandleFromSearchPath(FLAGS_cudnn_dir, "libcudnn.so", false);
Q
qijun 已提交
202 203 204
#endif
}

205
void* GetCUPTIDsoHandle() {
206 207 208 209 210
  std::string cupti_path = cupti_lib_path;
  if (!FLAGS_cupti_dir.empty()) {
    cupti_path = FLAGS_cupti_dir;
  }
#if defined(__APPLE__) || defined(__OSX__)
211
  return GetDsoHandleFromSearchPath(cupti_path, "libcupti.dylib", false);
212
#else
213
  return GetDsoHandleFromSearchPath(cupti_path, "libcupti.so", false);
214 215 216
#endif
}

217
void* GetCurandDsoHandle() {
Q
qijun 已提交
218
#if defined(__APPLE__) || defined(__OSX__)
219
  return GetDsoHandleFromSearchPath(FLAGS_cuda_dir, "libcurand.dylib");
P
peizhilin 已提交
220 221
#elif defined(_WIN32) && defined(PADDLE_WITH_CUDA)
  return GetDsoHandleFromSearchPath(FLAGS_cuda_dir, win_curand_lib);
Q
qijun 已提交
222
#else
223
  return GetDsoHandleFromSearchPath(FLAGS_cuda_dir, "libcurand.so");
Q
qijun 已提交
224 225 226
#endif
}

G
Guo Sheng 已提交
227 228 229 230 231 232 233 234 235 236
// Loads the cuSOLVER library, trying FLAGS_cuda_dir first. The file name
// depends on the platform; a failed load is enforced.
void* GetCusolverDsoHandle() {
#if defined(__APPLE__) || defined(__OSX__)
  const char* const lib_name = "libcusolver.dylib";
#elif defined(_WIN32) && defined(PADDLE_WITH_CUDA)
  const char* const lib_name = win_cusolver_lib;
#else
  const char* const lib_name = "libcusolver.so";
#endif
  return GetDsoHandleFromSearchPath(FLAGS_cuda_dir, lib_name);
}

237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252
// Loads the NVRTC library, trying FLAGS_cuda_dir first; a failed load is
// enforced.
void* GetNVRTCDsoHandle() {
#if defined(__APPLE__) || defined(__OSX__)
  const char* const lib_name = "libnvrtc.dylib";
#else
  const char* const lib_name = "libnvrtc.so";
#endif
  return GetDsoHandleFromSearchPath(FLAGS_cuda_dir, lib_name);
}

// Loads the CUDA driver library (libcuda), trying FLAGS_cuda_dir first; a
// failed load is enforced.
void* GetCUDADsoHandle() {
#if defined(__APPLE__) || defined(__OSX__)
  const char* const lib_name = "libcuda.dylib";
#else
  const char* const lib_name = "libcuda.so";
#endif
  return GetDsoHandleFromSearchPath(FLAGS_cuda_dir, lib_name);
}

253
void* GetWarpCTCDsoHandle() {
254 255 256
  std::string warpctc_dir = "";
  if (!s_py_site_pkg_path.path.empty()) {
    warpctc_dir = s_py_site_pkg_path.path;
257
  }
Q
qijun 已提交
258
#if defined(__APPLE__) || defined(__OSX__)
259
  return GetDsoHandleFromSearchPath(warpctc_dir, "libwarpctc.dylib");
P
peizhilin 已提交
260
#elif defined(_WIN32)
261
  return GetDsoHandleFromSearchPath(warpctc_dir, "warpctc.dll");
Q
qijun 已提交
262
#else
263
  return GetDsoHandleFromSearchPath(warpctc_dir, "libwarpctc.so");
Q
qijun 已提交
264 265 266
#endif
}

267
void* GetNCCLDsoHandle() {
Y
Yu Yang 已提交
268
#if defined(__APPLE__) || defined(__OSX__)
269
  return GetDsoHandleFromSearchPath(FLAGS_nccl_dir, "libnccl.dylib");
Y
Yu Yang 已提交
270
#else
271
  return GetDsoHandleFromSearchPath(FLAGS_nccl_dir, "libnccl.so");
Y
Yu Yang 已提交
272 273 274
#endif
}

Y
Yan Chunwei 已提交
275 276 277
// Loads the TensorRT inference library (nvinfer), trying FLAGS_tensorrt_dir
// first on every platform; a failed load is enforced.
void* GetTensorRtDsoHandle() {
#if defined(__APPLE__) || defined(__OSX__)
  return GetDsoHandleFromSearchPath(FLAGS_tensorrt_dir, "libnvinfer.dylib");
#elif defined(_WIN32)
  // This branch used to search FLAGS_mklml_dir, so the --tensorrt_dir flag
  // was silently ignored on Windows.
  return GetDsoHandleFromSearchPath(FLAGS_tensorrt_dir, "nvinfer.dll");
#else
  return GetDsoHandleFromSearchPath(FLAGS_tensorrt_dir, "libnvinfer.so");
#endif
}

285 286 287
// Loads the MKLML library, trying FLAGS_mklml_dir first; a failed load is
// enforced.
void* GetMKLMLDsoHandle() {
#if defined(__APPLE__) || defined(__OSX__)
  const char* const lib_name = "libmklml_intel.dylib";
#elif defined(_WIN32)
  const char* const lib_name = "mklml.dll";
#else
  const char* const lib_name = "libmklml_intel.so";
#endif
  return GetDsoHandleFromSearchPath(FLAGS_mklml_dir, lib_name);
}

295 296 297 298 299 300 301 302 303 304
// Loads a user-defined operator library named `dso_name`, trying FLAGS_op_dir
// first; a failed load is enforced.
//
// Mac OS builds and Windows builds with CUDA enabled reject the call through
// PADDLE_THROW instead of attempting to load anything.
void* GetOpDsoHandle(const std::string& dso_name) {
#if defined(__APPLE__) || defined(__OSX__)
  PADDLE_THROW("Do not support Apple.");
#elif defined(_WIN32) && defined(PADDLE_WITH_CUDA)
  PADDLE_THROW("Do not support Windows.");
#else
  void* const op_handle = GetDsoHandleFromSearchPath(FLAGS_op_dir, dso_name);
  return op_handle;
#endif
}

Q
qijun 已提交
305
}  // namespace dynload
Q
qijun 已提交
306 307
}  // namespace platform
}  // namespace paddle