dynamic_loader.cc 8.9 KB
Newer Older
1
/* Copyright (c) 2016 PaddlePaddle Authors. All Rights Reserved.
Q
qijun 已提交
2 3 4 5 6 7 8 9 10 11 12 13

Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

    http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License. */
Y
Yi Wang 已提交
14
#include "paddle/fluid/platform/dynload/dynamic_loader.h"
15

Q
qijun 已提交
16
#include <memory>
17
#include <mutex>  // NOLINT
Q
qijun 已提交
18
#include <string>
19

Q
qijun 已提交
20 21
#include "gflags/gflags.h"
#include "glog/logging.h"
22
#include "paddle/fluid/platform/dynload/cupti_lib_path.h"
23
#include "paddle/fluid/platform/dynload/warpctc_lib_path.h"
Y
Yi Wang 已提交
24
#include "paddle/fluid/platform/enforce.h"
D
dzhwinter 已提交
25
#include "paddle/fluid/platform/port.h"
Q
qijun 已提交
26 27 28 29 30 31 32 33 34 35 36 37 38

// --cudnn_dir: search root handed to GetDsoHandleFromSearchPath() by
// GetCUDNNDsoHandle(). Defaults to the empty string.
DEFINE_string(cudnn_dir, "",
              "Specify path for loading libcudnn.so. For instance, "
              "/usr/local/cudnn/lib. If empty [default], dlopen "
              "will search cudnn from LD_LIBRARY_PATH");

// --cuda_dir: search root used by GetCublasDsoHandle() and
// GetCurandDsoHandle(). Defaults to the empty string.
DEFINE_string(cuda_dir, "",
              "Specify path for loading cuda library, such as libcublas, "
              "libcurand. For instance, /usr/local/cuda/lib64. If default, "
              "dlopen will search cuda from LD_LIBRARY_PATH");

// --warpctc_dir: when non-empty, GetWarpCTCDsoHandle() uses it instead of the
// compiled-in warpctc_lib_path. Defaults to the empty string.
DEFINE_string(warpctc_dir, "", "Specify path for loading libwarpctc.so.");

Y
Yu Yang 已提交
39 40 41 42 43
// --nccl_dir: search root handed to GetDsoHandleFromSearchPath() by
// GetNCCLDsoHandle(). Defaults to the empty string.
DEFINE_string(nccl_dir, "",
              "Specify path for loading nccl library, such as libnccl.so. "
              "If empty [default], dlopen will search nccl from "
              "LD_LIBRARY_PATH");

44 45
// --cupti_dir: when non-empty, GetCUPTIDsoHandle() uses it instead of the
// compiled-in cupti_lib_path. Defaults to the empty string.
DEFINE_string(cupti_dir, "", "Specify path for loading cupti.so.");

Y
Yan Chunwei 已提交
46 47 48 49
// --tensorrt_dir: search root handed to GetDsoHandleFromSearchPath() by
// GetTensorRtDsoHandle(). Defaults to the empty string.
DEFINE_string(
    tensorrt_dir, "",
    "Specify path for loading tensorrt library, such as libnvinfer.so.");

50 51
// --mklml_dir: search root handed to GetDsoHandleFromSearchPath() by
// GetMKLMLDsoHandle(). Defaults to the empty string.
DEFINE_string(mklml_dir, "", "Specify path for loading libmklml_intel.so.");

Q
qijun 已提交
52 53
namespace paddle {
namespace platform {
Q
qijun 已提交
54
namespace dynload {
55
// Compiled-in CUPTI search directory, taken from the CUPTI_LIB_PATH macro
// (presumably provided by cupti_lib_path.h -- confirm). GetCUPTIDsoHandle()
// falls back to it when FLAGS_cupti_dir is empty.
static constexpr char cupti_lib_path[] = CUPTI_LIB_PATH;
56
// Compiled-in WarpCTC search directory, taken from the WARPCTC_LIB_PATH macro
// (presumably provided by warpctc_lib_path.h -- confirm).
// GetWarpCTCDsoHandle() falls back to it when FLAGS_warpctc_dir is empty.
static constexpr char warpctc_lib_path[] = WARPCTC_LIB_PATH;
57

P
peizhilin 已提交
58 59 60 61 62 63
#if defined(_WIN32) && defined(PADDLE_WITH_CUDA)
// File names of the CUDA DLLs on Windows. The version suffix is spliced in at
// compile time by adjacent string-literal concatenation with the
// PADDLE_CUDA_BINVER / PADDLE_CUDNN_BINVER macros.
//
// These are declared as constexpr char arrays rather than `constexpr char*`:
// the latter is a const pointer to *non-const* char, and initialising it from
// a string literal is ill-formed since C++11.
static constexpr char win_cublas_lib[] = "cublas64_" PADDLE_CUDA_BINVER ".dll";
static constexpr char win_curand_lib[] = "curand64_" PADDLE_CUDA_BINVER ".dll";
static constexpr char win_cudnn_lib[] = "cudnn64_" PADDLE_CUDNN_BINVER ".dll";
#endif

Q
qijun 已提交
64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80
// Joins two path fragments with a single '/' between them.
//
// If `part2` already begins with '/', it is treated as absolute and returned
// unchanged (`part1` is ignored). Otherwise the result is `part1`, followed by
// a '/' unless `part1` is empty or already ends with one, followed by `part2`.
static inline std::string join(const std::string& part1,
                               const std::string& part2) {
  constexpr char kSeparator = '/';

  const bool second_is_absolute = !part2.empty() && part2[0] == kSeparator;
  if (second_is_absolute) {
    return part2;
  }

  const bool needs_separator = !part1.empty() && part1.back() != kSeparator;

  std::string joined;
  joined.reserve(part1.size() + part2.size() + 1);
  joined.append(part1);
  if (needs_separator) {
    joined.push_back(kSeparator);
  }
  joined.append(part2);
  return joined;
}

81 82
static inline void* GetDsoHandleFromDefaultPath(const std::string& dso_path,
                                                int dynload_flags) {
M
minqiyang 已提交
83 84
  VLOG(3) << "Try to find library: " << dso_path
          << " from default system path.";
Q
qijun 已提交
85
  // default search from LD_LIBRARY_PATH/DYLD_LIBRARY_PATH
86
  // and /usr/local/lib path
87
  void* dso_handle = dlopen(dso_path.c_str(), dynload_flags);
Q
qijun 已提交
88 89 90 91 92

// DYLD_LIBRARY_PATH is disabled after Mac OS 10.11 to
// bring System Integrity Projection (SIP), if dso_handle
// is null, search from default package path in Mac OS.
#if defined(__APPLE__) || defined(__OSX__)
93 94 95 96
  if (nullptr == dso_handle) {
    dso_handle =
        dlopen(join("/usr/local/cuda/lib/", dso_path).c_str(), dynload_flags);
    if (nullptr == dso_handle) {
Q
qijun 已提交
97
      if (dso_path == "libcudnn.dylib") {
98 99 100 101 102
        LOG(WARNING) << "Note: [Recommend] copy cudnn into /usr/local/cuda/ \n "
                        "For instance, sudo tar -xzf "
                        "cudnn-7.5-osx-x64-v5.0-ga.tgz -C /usr/local \n sudo "
                        "chmod a+r /usr/local/cuda/include/cudnn.h "
                        "/usr/local/cuda/lib/libcudnn*";
Q
qijun 已提交
103 104 105 106
      }
    }
  }
#endif
107

108 109
  if (nullptr == dso_handle) {
    LOG(WARNING) << "Can not find library: " << dso_path
C
chengduo 已提交
110 111
                 << ". The process maybe hang. Please try to add the lib path "
                    "to LD_LIBRARY_PATH.";
112
  }
113
  return dso_handle;
Q
qijun 已提交
114 115
}

116 117 118
static inline void* GetDsoHandleFromSearchPath(const std::string& search_root,
                                               const std::string& dso_name,
                                               bool throw_on_error = true) {
D
dzhwinter 已提交
119
#if !defined(_WIN32)
Q
qijun 已提交
120
  int dynload_flags = RTLD_LAZY | RTLD_LOCAL;
D
dzhwinter 已提交
121 122 123
#else
  int dynload_flags = 0;
#endif  // !_WIN32
124
  void* dso_handle = nullptr;
Q
qijun 已提交
125 126 127

  std::string dlPath = dso_name;
  if (search_root.empty()) {
128
    dso_handle = GetDsoHandleFromDefaultPath(dlPath, dynload_flags);
Q
qijun 已提交
129 130 131
  } else {
    // search xxx.so from custom path
    dlPath = join(search_root, dso_name);
132
    dso_handle = dlopen(dlPath.c_str(), dynload_flags);
D
dzhwinter 已提交
133 134 135 136 137
#if !defined(_WIN32)
    auto errorno = dlerror();
#else
    auto errorno = GetLastError();
#endif  // !_WIN32
Q
qijun 已提交
138
    // if not found, search from default path
139
    if (nullptr == dso_handle) {
Q
qijun 已提交
140
      LOG(WARNING) << "Failed to find dynamic library: " << dlPath << " ("
D
dzhwinter 已提交
141
                   << errorno << ")";
J
JiabinYang 已提交
142 143 144 145 146 147
      if (dlPath.find("nccl") != std::string::npos) {
        std::cout
            << "You may need to install 'nccl2' from NVIDIA official website: "
            << "https://developer.nvidia.com/nccl/nccl-download"
            << "before install PaddlePaddle" << std::endl;
      }
Q
qijun 已提交
148
      dlPath = dso_name;
149
      dso_handle = GetDsoHandleFromDefaultPath(dlPath, dynload_flags);
Q
qijun 已提交
150 151
    }
  }
152 153 154 155 156 157 158 159
  auto error_msg =
      "Failed to find dynamic library: %s ( %s ) \n Please specify "
      "its path correctly using following ways: \n Method. set "
      "environment variable LD_LIBRARY_PATH on Linux or "
      "DYLD_LIBRARY_PATH on Mac OS. \n For instance, issue command: "
      "export LD_LIBRARY_PATH=... \n Note: After Mac OS 10.11, "
      "using the DYLD_LIBRARY_PATH is impossible unless System "
      "Integrity Protection (SIP) is disabled.";
D
dzhwinter 已提交
160 161 162 163 164
#if !defined(_WIN32)
  auto errorno = dlerror();
#else
  auto errorno = GetLastError();
#endif  // !_WIN32
165
  if (throw_on_error) {
D
dzhwinter 已提交
166
    PADDLE_ENFORCE(nullptr != dso_handle, error_msg, dlPath, errorno);
167
  } else if (nullptr == dso_handle) {
D
dzhwinter 已提交
168
    LOG(WARNING) << string::Sprintf(error_msg, dlPath, errorno);
169
  }
170 171

  return dso_handle;
Q
qijun 已提交
172 173
}

174
void* GetCublasDsoHandle() {
Q
qijun 已提交
175
#if defined(__APPLE__) || defined(__OSX__)
176
  return GetDsoHandleFromSearchPath(FLAGS_cuda_dir, "libcublas.dylib");
P
peizhilin 已提交
177 178
#elif defined(_WIN32) && defined(PADDLE_WITH_CUDA)
  return GetDsoHandleFromSearchPath(FLAGS_cuda_dir, win_cublas_lib);
Q
qijun 已提交
179
#else
180
  return GetDsoHandleFromSearchPath(FLAGS_cuda_dir, "libcublas.so");
Q
qijun 已提交
181 182 183
#endif
}

184
void* GetCUDNNDsoHandle() {
Q
qijun 已提交
185
#if defined(__APPLE__) || defined(__OSX__)
186
  return GetDsoHandleFromSearchPath(FLAGS_cudnn_dir, "libcudnn.dylib", false);
P
peizhilin 已提交
187 188
#elif defined(_WIN32) && defined(PADDLE_WITH_CUDA)
  return GetDsoHandleFromSearchPath(FLAGS_cudnn_dir, win_cudnn_lib);
Q
qijun 已提交
189
#else
190
  return GetDsoHandleFromSearchPath(FLAGS_cudnn_dir, "libcudnn.so", false);
Q
qijun 已提交
191 192 193
#endif
}

194
void* GetCUPTIDsoHandle() {
195 196 197 198 199
  std::string cupti_path = cupti_lib_path;
  if (!FLAGS_cupti_dir.empty()) {
    cupti_path = FLAGS_cupti_dir;
  }
#if defined(__APPLE__) || defined(__OSX__)
200
  return GetDsoHandleFromSearchPath(cupti_path, "libcupti.dylib", false);
201
#else
202
  return GetDsoHandleFromSearchPath(cupti_path, "libcupti.so", false);
203 204 205
#endif
}

206
void* GetCurandDsoHandle() {
Q
qijun 已提交
207
#if defined(__APPLE__) || defined(__OSX__)
208
  return GetDsoHandleFromSearchPath(FLAGS_cuda_dir, "libcurand.dylib");
P
peizhilin 已提交
209 210
#elif defined(_WIN32) && defined(PADDLE_WITH_CUDA)
  return GetDsoHandleFromSearchPath(FLAGS_cuda_dir, win_curand_lib);
Q
qijun 已提交
211
#else
212
  return GetDsoHandleFromSearchPath(FLAGS_cuda_dir, "libcurand.so");
Q
qijun 已提交
213 214 215
#endif
}

216
void* GetWarpCTCDsoHandle() {
217 218 219 220
  std::string warpctc_dir = warpctc_lib_path;
  if (!FLAGS_warpctc_dir.empty()) {
    warpctc_dir = FLAGS_warpctc_dir;
  }
Q
qijun 已提交
221
#if defined(__APPLE__) || defined(__OSX__)
222
  return GetDsoHandleFromSearchPath(warpctc_dir, "libwarpctc.dylib");
P
peizhilin 已提交
223
#elif defined(_WIN32)
224
  return GetDsoHandleFromSearchPath(warpctc_dir, "warpctc.dll");
Q
qijun 已提交
225
#else
226
  return GetDsoHandleFromSearchPath(warpctc_dir, "libwarpctc.so");
Q
qijun 已提交
227 228 229
#endif
}

230
void* GetNCCLDsoHandle() {
Y
Yu Yang 已提交
231
#if defined(__APPLE__) || defined(__OSX__)
232
  return GetDsoHandleFromSearchPath(FLAGS_nccl_dir, "libnccl.dylib");
Y
Yu Yang 已提交
233
#else
234
  return GetDsoHandleFromSearchPath(FLAGS_nccl_dir, "libnccl.so");
Y
Yu Yang 已提交
235 236 237
#endif
}

Y
Yan Chunwei 已提交
238 239 240 241 242 243 244 245
// Loads the TensorRT inference library (libnvinfer), using FLAGS_tensorrt_dir
// as the search root, and returns its handle. throw_on_error is left at its
// default.
void* GetTensorRtDsoHandle() {
#if defined(__APPLE__) || defined(__OSX__)
  const char* const lib_name = "libnvinfer.dylib";
#else
  const char* const lib_name = "libnvinfer.so";
#endif
  return GetDsoHandleFromSearchPath(FLAGS_tensorrt_dir, lib_name);
}

246 247 248
// Loads the MKLML shared library, using FLAGS_mklml_dir as the search root,
// and returns its handle. The file name is chosen per platform;
// throw_on_error is left at its default.
void* GetMKLMLDsoHandle() {
#if defined(__APPLE__) || defined(__OSX__)
  const char* const lib_name = "libmklml_intel.dylib";
#elif defined(_WIN32)
  const char* const lib_name = "mklml.dll";
#else
  const char* const lib_name = "libmklml_intel.so";
#endif
  return GetDsoHandleFromSearchPath(FLAGS_mklml_dir, lib_name);
}

Q
qijun 已提交
256
}  // namespace dynload
Q
qijun 已提交
257 258
}  // namespace platform
}  // namespace paddle