/* Copyright (c) 2016 PaddlePaddle Authors. All Rights Reserved.

Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

    http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License. */
Y
Yi Wang 已提交
14
#include "paddle/fluid/platform/dynload/dynamic_loader.h"
15

Q
qijun 已提交
16
#include <memory>
17
#include <mutex>  // NOLINT
Q
qijun 已提交
18
#include <string>
19

Q
qijun 已提交
20 21
#include "gflags/gflags.h"
#include "glog/logging.h"
22
#include "paddle/fluid/platform/dynload/cupti_lib_path.h"
Y
Yi Wang 已提交
23
#include "paddle/fluid/platform/enforce.h"
D
dzhwinter 已提交
24
#include "paddle/fluid/platform/port.h"
Q
qijun 已提交
25 26 27 28 29 30 31 32 33 34 35

// --cudnn_dir: search root handed to GetDsoHandleFromSearchPath() by
// GetCUDNNDsoHandle(). Defaults to the empty string.
DEFINE_string(cudnn_dir, "",
              "Specify path for loading libcudnn.so. For instance, "
              "/usr/local/cudnn/lib. If empty [default], dlopen "
              "will search cudnn from LD_LIBRARY_PATH");

// --cuda_dir: search root shared by the cuBLAS, cuRAND, NVRTC and CUDA driver
// loaders in this file (GetCublasDsoHandle, GetCurandDsoHandle,
// GetNVRTCDsoHandle, GetCUDADsoHandle). Defaults to the empty string.
DEFINE_string(cuda_dir, "",
              "Specify path for loading cuda library, such as libcublas, "
              "libcurand. For instance, /usr/local/cuda/lib64. If default, "
              "dlopen will search cuda from LD_LIBRARY_PATH");

Y
Yu Yang 已提交
36 37 38 39 40
// --nccl_dir: search root used by GetNCCLDsoHandle(). Defaults to the empty
// string. The help text previously described the cuda libraries (copy-paste
// from --cuda_dir); it now describes NCCL.
DEFINE_string(nccl_dir, "",
              "Specify path for loading nccl library, such as libnccl.so. "
              "For instance, /usr/local/cuda/lib64. If empty [default], "
              "dlopen will search nccl from LD_LIBRARY_PATH");

41 42
// --cupti_dir: when non-empty, replaces the compiled-in cupti_lib_path as the
// search root in GetCUPTIDsoHandle().
DEFINE_string(cupti_dir, "", "Specify path for loading cupti.so.");

Y
Yan Chunwei 已提交
43 44 45 46
// --tensorrt_dir: search root consumed by GetTensorRtDsoHandle(). Defaults to
// the empty string.
DEFINE_string(
    tensorrt_dir, "",
    "Specify path for loading tensorrt library, such as libnvinfer.so.");

47 48
// --mklml_dir: search root consumed by GetMKLMLDsoHandle(). Defaults to the
// empty string.
DEFINE_string(mklml_dir, "", "Specify path for loading libmklml_intel.so.");

Q
qijun 已提交
49 50
namespace paddle {
namespace platform {
Q
qijun 已提交
51
namespace dynload {
52 53 54 55 56 57

// Small holder for one filesystem path. A default-constructed node carries an
// empty path.
struct PathNode {
  PathNode() : path() {}
  std::string path;
};

58
// Compile-time default directory for CUPTI, taken from the CUPTI_LIB_PATH
// macro (presumably provided by cupti_lib_path.h -- verify). Used by
// GetCUPTIDsoHandle() unless --cupti_dir is set.
static constexpr char cupti_lib_path[] = CUPTI_LIB_PATH;
59 60

// Path recorded by SetPaddleLibPath(); GetWarpCTCDsoHandle() uses it as the
// search root for the warpctc library. Empty until SetPaddleLibPath() runs.
static PathNode s_py_site_pkg_path;
61

P
peizhilin 已提交
62 63 64 65 66 67
#if defined(_WIN32) && defined(PADDLE_WITH_CUDA)
// Versioned DLL names for the CUDA libraries on Windows. The version suffix
// comes from the PADDLE_CUDA_BINVER / PADDLE_CUDNN_BINVER macros, which are
// expected to expand to string literals (presumably set by the build system --
// verify).
//
// The pointee must be `const char`: binding a string literal to a plain
// `char*` is ill-formed since C++11 and is only accepted as a compiler
// extension.
static constexpr const char* win_cublas_lib =
    "cublas64_" PADDLE_CUDA_BINVER ".dll";
static constexpr const char* win_curand_lib =
    "curand64_" PADDLE_CUDA_BINVER ".dll";
static constexpr const char* win_cudnn_lib =
    "cudnn64_" PADDLE_CUDNN_BINVER ".dll";
#endif

Q
qijun 已提交
68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84
// Concatenates two path fragments using '/' as the directory separator.
//
// - If `part2` starts with '/', it is returned unchanged and `part1` is
//   ignored.
// - Otherwise the result is `part1`, followed by a single '/' when `part1` is
//   non-empty and does not already end in one, followed by `part2`.
static inline std::string join(const std::string& part1,
                               const std::string& part2) {
  constexpr char kSeparator = '/';

  const bool part2_is_rooted = !part2.empty() && part2[0] == kSeparator;
  if (part2_is_rooted) {
    return part2;
  }

  const bool needs_separator = !part1.empty() && part1.back() != kSeparator;

  std::string joined;
  joined.reserve(part1.size() + part2.size() + 1);
  joined.append(part1);
  if (needs_separator) {
    joined.push_back(kSeparator);
  }
  joined.append(part2);
  return joined;
}

85 86 87 88 89
// Stores `py_site_pkg_path` in the file-level s_py_site_pkg_path holder and
// logs the new value at verbosity level 3.
void SetPaddleLibPath(const std::string& py_site_pkg_path) {
  s_py_site_pkg_path.path.assign(py_site_pkg_path);
  VLOG(3) << "Set paddle lib path : " << py_site_pkg_path;
}

90 91
static inline void* GetDsoHandleFromDefaultPath(const std::string& dso_path,
                                                int dynload_flags) {
M
minqiyang 已提交
92 93
  VLOG(3) << "Try to find library: " << dso_path
          << " from default system path.";
Q
qijun 已提交
94
  // default search from LD_LIBRARY_PATH/DYLD_LIBRARY_PATH
95
  // and /usr/local/lib path
96
  void* dso_handle = dlopen(dso_path.c_str(), dynload_flags);
Q
qijun 已提交
97 98 99 100 101

// DYLD_LIBRARY_PATH is disabled after Mac OS 10.11 to
// bring System Integrity Projection (SIP), if dso_handle
// is null, search from default package path in Mac OS.
#if defined(__APPLE__) || defined(__OSX__)
102 103 104 105
  if (nullptr == dso_handle) {
    dso_handle =
        dlopen(join("/usr/local/cuda/lib/", dso_path).c_str(), dynload_flags);
    if (nullptr == dso_handle) {
Q
qijun 已提交
106
      if (dso_path == "libcudnn.dylib") {
107 108 109 110 111
        LOG(WARNING) << "Note: [Recommend] copy cudnn into /usr/local/cuda/ \n "
                        "For instance, sudo tar -xzf "
                        "cudnn-7.5-osx-x64-v5.0-ga.tgz -C /usr/local \n sudo "
                        "chmod a+r /usr/local/cuda/include/cudnn.h "
                        "/usr/local/cuda/lib/libcudnn*";
Q
qijun 已提交
112 113 114 115
      }
    }
  }
#endif
116

117 118
  if (nullptr == dso_handle) {
    LOG(WARNING) << "Can not find library: " << dso_path
C
chengduo 已提交
119 120
                 << ". The process maybe hang. Please try to add the lib path "
                    "to LD_LIBRARY_PATH.";
121
  }
122
  return dso_handle;
Q
qijun 已提交
123 124
}

125 126 127
static inline void* GetDsoHandleFromSearchPath(const std::string& search_root,
                                               const std::string& dso_name,
                                               bool throw_on_error = true) {
D
dzhwinter 已提交
128
#if !defined(_WIN32)
Q
qijun 已提交
129
  int dynload_flags = RTLD_LAZY | RTLD_LOCAL;
D
dzhwinter 已提交
130 131 132
#else
  int dynload_flags = 0;
#endif  // !_WIN32
133
  void* dso_handle = nullptr;
Q
qijun 已提交
134 135 136

  std::string dlPath = dso_name;
  if (search_root.empty()) {
137
    dso_handle = GetDsoHandleFromDefaultPath(dlPath, dynload_flags);
Q
qijun 已提交
138 139 140
  } else {
    // search xxx.so from custom path
    dlPath = join(search_root, dso_name);
141
    dso_handle = dlopen(dlPath.c_str(), dynload_flags);
D
dzhwinter 已提交
142 143 144 145 146
#if !defined(_WIN32)
    auto errorno = dlerror();
#else
    auto errorno = GetLastError();
#endif  // !_WIN32
Q
qijun 已提交
147
    // if not found, search from default path
148
    if (nullptr == dso_handle) {
Q
qijun 已提交
149
      LOG(WARNING) << "Failed to find dynamic library: " << dlPath << " ("
D
dzhwinter 已提交
150
                   << errorno << ")";
J
JiabinYang 已提交
151 152 153 154 155 156
      if (dlPath.find("nccl") != std::string::npos) {
        std::cout
            << "You may need to install 'nccl2' from NVIDIA official website: "
            << "https://developer.nvidia.com/nccl/nccl-download"
            << "before install PaddlePaddle" << std::endl;
      }
Q
qijun 已提交
157
      dlPath = dso_name;
158
      dso_handle = GetDsoHandleFromDefaultPath(dlPath, dynload_flags);
Q
qijun 已提交
159 160
    }
  }
161 162 163 164 165 166 167 168
  auto error_msg =
      "Failed to find dynamic library: %s ( %s ) \n Please specify "
      "its path correctly using following ways: \n Method. set "
      "environment variable LD_LIBRARY_PATH on Linux or "
      "DYLD_LIBRARY_PATH on Mac OS. \n For instance, issue command: "
      "export LD_LIBRARY_PATH=... \n Note: After Mac OS 10.11, "
      "using the DYLD_LIBRARY_PATH is impossible unless System "
      "Integrity Protection (SIP) is disabled.";
D
dzhwinter 已提交
169 170 171 172 173
#if !defined(_WIN32)
  auto errorno = dlerror();
#else
  auto errorno = GetLastError();
#endif  // !_WIN32
174
  if (throw_on_error) {
D
dzhwinter 已提交
175
    PADDLE_ENFORCE(nullptr != dso_handle, error_msg, dlPath, errorno);
176
  } else if (nullptr == dso_handle) {
D
dzhwinter 已提交
177
    LOG(WARNING) << string::Sprintf(error_msg, dlPath, errorno);
178
  }
179 180

  return dso_handle;
Q
qijun 已提交
181 182
}

183
void* GetCublasDsoHandle() {
Q
qijun 已提交
184
#if defined(__APPLE__) || defined(__OSX__)
185
  return GetDsoHandleFromSearchPath(FLAGS_cuda_dir, "libcublas.dylib");
P
peizhilin 已提交
186 187
#elif defined(_WIN32) && defined(PADDLE_WITH_CUDA)
  return GetDsoHandleFromSearchPath(FLAGS_cuda_dir, win_cublas_lib);
Q
qijun 已提交
188
#else
189
  return GetDsoHandleFromSearchPath(FLAGS_cuda_dir, "libcublas.so");
Q
qijun 已提交
190 191 192
#endif
}

193
void* GetCUDNNDsoHandle() {
Q
qijun 已提交
194
#if defined(__APPLE__) || defined(__OSX__)
195
  return GetDsoHandleFromSearchPath(FLAGS_cudnn_dir, "libcudnn.dylib", false);
P
peizhilin 已提交
196 197
#elif defined(_WIN32) && defined(PADDLE_WITH_CUDA)
  return GetDsoHandleFromSearchPath(FLAGS_cudnn_dir, win_cudnn_lib);
Q
qijun 已提交
198
#else
199
  return GetDsoHandleFromSearchPath(FLAGS_cudnn_dir, "libcudnn.so", false);
Q
qijun 已提交
200 201 202
#endif
}

203
void* GetCUPTIDsoHandle() {
204 205 206 207 208
  std::string cupti_path = cupti_lib_path;
  if (!FLAGS_cupti_dir.empty()) {
    cupti_path = FLAGS_cupti_dir;
  }
#if defined(__APPLE__) || defined(__OSX__)
209
  return GetDsoHandleFromSearchPath(cupti_path, "libcupti.dylib", false);
210
#else
211
  return GetDsoHandleFromSearchPath(cupti_path, "libcupti.so", false);
212 213 214
#endif
}

215
void* GetCurandDsoHandle() {
Q
qijun 已提交
216
#if defined(__APPLE__) || defined(__OSX__)
217
  return GetDsoHandleFromSearchPath(FLAGS_cuda_dir, "libcurand.dylib");
P
peizhilin 已提交
218 219
#elif defined(_WIN32) && defined(PADDLE_WITH_CUDA)
  return GetDsoHandleFromSearchPath(FLAGS_cuda_dir, win_curand_lib);
Q
qijun 已提交
220
#else
221
  return GetDsoHandleFromSearchPath(FLAGS_cuda_dir, "libcurand.so");
Q
qijun 已提交
222 223 224
#endif
}

225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240
// Loads the NVRTC library, using --cuda_dir as the preferred search root.
void* GetNVRTCDsoHandle() {
#if defined(__APPLE__) || defined(__OSX__)
  const char* const lib_name = "libnvrtc.dylib";
#else
  const char* const lib_name = "libnvrtc.so";
#endif
  return GetDsoHandleFromSearchPath(FLAGS_cuda_dir, lib_name);
}

// Loads libcuda, using --cuda_dir as the preferred search root.
void* GetCUDADsoHandle() {
#if defined(__APPLE__) || defined(__OSX__)
  const char* const lib_name = "libcuda.dylib";
#else
  const char* const lib_name = "libcuda.so";
#endif
  return GetDsoHandleFromSearchPath(FLAGS_cuda_dir, lib_name);
}

241
void* GetWarpCTCDsoHandle() {
242 243 244
  std::string warpctc_dir = "";
  if (!s_py_site_pkg_path.path.empty()) {
    warpctc_dir = s_py_site_pkg_path.path;
245
  }
Q
qijun 已提交
246
#if defined(__APPLE__) || defined(__OSX__)
247
  return GetDsoHandleFromSearchPath(warpctc_dir, "libwarpctc.dylib");
P
peizhilin 已提交
248
#elif defined(_WIN32)
249
  return GetDsoHandleFromSearchPath(warpctc_dir, "warpctc.dll");
Q
qijun 已提交
250
#else
251
  return GetDsoHandleFromSearchPath(warpctc_dir, "libwarpctc.so");
Q
qijun 已提交
252 253 254
#endif
}

255
void* GetNCCLDsoHandle() {
Y
Yu Yang 已提交
256
#if defined(__APPLE__) || defined(__OSX__)
257
  return GetDsoHandleFromSearchPath(FLAGS_nccl_dir, "libnccl.dylib");
Y
Yu Yang 已提交
258
#else
259
  return GetDsoHandleFromSearchPath(FLAGS_nccl_dir, "libnccl.so");
Y
Yu Yang 已提交
260 261 262
#endif
}

Y
Yan Chunwei 已提交
263 264 265
// Loads the TensorRT runtime (nvinfer), using --tensorrt_dir as the preferred
// search root on every platform.
//
// The Windows branch previously passed --mklml_dir, so --tensorrt_dir was
// ignored there; it now uses the same flag as the other branches.
void* GetTensorRtDsoHandle() {
#if defined(__APPLE__) || defined(__OSX__)
  return GetDsoHandleFromSearchPath(FLAGS_tensorrt_dir, "libnvinfer.dylib");
#elif defined(_WIN32)
  return GetDsoHandleFromSearchPath(FLAGS_tensorrt_dir, "nvinfer.dll");
#else
  return GetDsoHandleFromSearchPath(FLAGS_tensorrt_dir, "libnvinfer.so");
#endif
}

273 274 275
// Loads the MKLML library, using --mklml_dir as the preferred search root.
void* GetMKLMLDsoHandle() {
#if defined(__APPLE__) || defined(__OSX__)
  const char* const lib_name = "libmklml_intel.dylib";
#elif defined(_WIN32)
  const char* const lib_name = "mklml.dll";
#else
  const char* const lib_name = "libmklml_intel.so";
#endif
  return GetDsoHandleFromSearchPath(FLAGS_mklml_dir, lib_name);
}

Q
qijun 已提交
283
}  // namespace dynload
Q
qijun 已提交
284 285
}  // namespace platform
}  // namespace paddle