enforce.h 10.3 KB
Newer Older
1
/* Copyright (c) 2016 PaddlePaddle Authors. All Rights Reserved.
2 3 4 5 6 7 8 9 10 11 12 13 14 15 16

Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

    http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License. */

#pragma once

17 18
#include <dlfcn.h>     // for dladdr
#include <execinfo.h>  // for backtrace
19 20 21 22 23 24 25 26 27 28 29 30 31

#ifdef __GNUC__
#include <cxxabi.h>  // for __cxa_demangle
#endif               // __GNUC__

#ifdef PADDLE_WITH_CUDA
#include <cublas_v2.h>
#include <cudnn.h>
#include <curand.h>
#include <thrust/system/cuda/error.h>
#include <thrust/system_error.h>
#endif  // PADDLE_WITH_CUDA

Y
Yu Yang 已提交
32
#include <iomanip>
L
liaogang 已提交
33
#include <memory>
34 35 36
#include <sstream>
#include <stdexcept>
#include <string>
37

38
#include "glog/logging.h"
Y
Yi Wang 已提交
39
#include "paddle/fluid/platform/macros.h"
40 41
#include "paddle/fluid/string/printf.h"
#include "paddle/fluid/string/to_string.h"
42

43
#ifdef PADDLE_WITH_CUDA
Y
Yi Wang 已提交
44 45 46
#include "paddle/fluid/platform/dynload/cublas.h"
#include "paddle/fluid/platform/dynload/cudnn.h"
#include "paddle/fluid/platform/dynload/curand.h"
Y
Yi Wang 已提交
47
#ifndef __APPLE__
Y
Yi Wang 已提交
48
#include "paddle/fluid/platform/dynload/nccl.h"
Y
Yi Wang 已提交
49 50
#endif  // __APPLE__
#endif  // PADDLE_WITH_CUDA
51 52 53 54

namespace paddle {
namespace platform {

L
liaogang 已提交
55 56 57 58 59 60 61 62 63 64 65
#ifdef __GNUC__
// Converts a mangled C++ symbol `name` into its readable form using
// abi::__cxa_demangle. If the demangler reports a non-zero status, the input
// is returned unchanged.
inline std::string demangle(std::string name) {
  // Owns the buffer handed back by __cxa_demangle and releases it via free().
  using DemangledBuffer = std::unique_ptr<char, void (*)(void*)>;

  int status = -4;  // placeholder value; silences "uninitialized" warnings
  const DemangledBuffer readable{
      abi::__cxa_demangle(name.c_str(), nullptr, nullptr, &status), std::free};
  if (status != 0) {
    return name;
  }
  return readable.get();
}
#else
// No demangler on this toolchain: the symbol is returned as-is.
inline std::string demangle(std::string name) { return name; }
#endif

66 67 68 69
struct EnforceNotMet : public std::exception {
  std::exception_ptr exp_;
  std::string err_str_;
  EnforceNotMet(std::exception_ptr e, const char* f, int l) : exp_(e) {
Y
Yu Yang 已提交
70
    static constexpr int TRACE_STACK_LIMIT = 100;
71 72 73
    try {
      std::rethrow_exception(exp_);
    } catch (const std::exception& exp) {
Y
Yu Yang 已提交
74
      std::ostringstream sout;
75

Y
Yu Yang 已提交
76
      sout << string::Sprintf("%s at [%s:%d]", exp.what(), f, l) << std::endl;
77 78
      sout << "PaddlePaddle Call Stacks: " << std::endl;

Y
Yu Yang 已提交
79
      void* call_stack[TRACE_STACK_LIMIT];
80 81 82 83 84
      auto size = backtrace(call_stack, TRACE_STACK_LIMIT);
      auto symbols = backtrace_symbols(call_stack, size);

      Dl_info info;
      for (int i = 0; i < size; ++i) {
L
liaogang 已提交
85 86
        if (dladdr(call_stack[i], &info) && info.dli_sname) {
          auto demangled = demangle(info.dli_sname);
87 88 89 90 91
          auto addr_offset = static_cast<char*>(call_stack[i]) -
                             static_cast<char*>(info.dli_saddr);
          sout << string::Sprintf("%-3d %*0p %s + %zd\n", i,
                                  2 + sizeof(void*) * 2, call_stack[i],
                                  demangled, addr_offset);
92
        } else {
93
          sout << string::Sprintf("%-3d %*0p\n", i, 2 + sizeof(void*) * 2,
94 95
                                  call_stack[i]);
        }
Y
Yu Yang 已提交
96
      }
97
      free(symbols);
Y
Yu Yang 已提交
98
      err_str_ = sout.str();
99 100 101 102 103 104
    }
  }

  const char* what() const noexcept { return err_str_.c_str(); }
};

L
liaogang 已提交
105 106 107 108 109
// Because most enforce conditions evaluate to true, we can use
// __builtin_expect to tell the compiler that the failure branch is unlikely,
// so that it optimizes for the common (success) path.
// This generates faster binary code. __builtin_expect is a GCC/Clang compiler
// builtin, not a part of the C++ standard.
// For more details, please check https://stackoverflow.com/a/43870188/724872.
110 111
// Yields 1 when `expr` converts to true and 0 otherwise, while hinting to the
// compiler that the expected outcome is 0 (false).
#define UNLIKELY(expr) __builtin_expect(static_cast<bool>(expr), 0)

L
liaogang 已提交
112 113
template <typename... Args>
inline typename std::enable_if<sizeof...(Args) != 0, void>::type throw_on_error(
Y
Yu Yang 已提交
114
    bool stat, const Args&... args) {
L
liaogang 已提交
115
  if (UNLIKELY(!(stat))) {
116
#ifndef REPLACE_ENFORCE_GLOG
117
    throw std::runtime_error(string::Sprintf(args...));
118 119 120
#else
    LOG(FATAL) << string::Sprintf(args...);
#endif
L
liaogang 已提交
121 122 123
  }
}

124
#ifdef PADDLE_WITH_CUDA
125 126

template <typename... Args>
L
liaogang 已提交
127 128
inline typename std::enable_if<sizeof...(Args) != 0, void>::type throw_on_error(
    cudaError_t e, const Args&... args) {
L
liaogang 已提交
129
  if (UNLIKELY(e)) {
130
#ifndef REPLACE_ENFORCE_GLOG
131 132
    throw thrust::system_error(e, thrust::cuda_category(),
                               string::Sprintf(args...));
133 134 135
#else
    LOG(FATAL) << string::Sprintf(args...);
#endif
136 137 138 139
  }
}

template <typename... Args>
L
liaogang 已提交
140 141
inline typename std::enable_if<sizeof...(Args) != 0, void>::type throw_on_error(
    curandStatus_t stat, const Args&... args) {
142
  if (stat != CURAND_STATUS_SUCCESS) {
143
#ifndef REPLACE_ENFORCE_GLOG
144 145
    throw thrust::system_error(cudaErrorLaunchFailure, thrust::cuda_category(),
                               string::Sprintf(args...));
146 147 148
#else
    LOG(FATAL) << string::Sprintf(args...);
#endif
149 150 151 152
  }
}

template <typename... Args>
L
liaogang 已提交
153 154
inline typename std::enable_if<sizeof...(Args) != 0, void>::type throw_on_error(
    cudnnStatus_t stat, const Args&... args) {
155 156 157
  if (stat == CUDNN_STATUS_SUCCESS) {
    return;
  } else {
158
#ifndef REPLACE_ENFORCE_GLOG
159 160
    throw std::runtime_error(platform::dynload::cudnnGetErrorString(stat) +
                             string::Sprintf(args...));
161 162 163
#else
    LOG(FATAL) << string::Sprintf(args...);
#endif
164 165 166 167
  }
}

template <typename... Args>
L
liaogang 已提交
168 169
inline typename std::enable_if<sizeof...(Args) != 0, void>::type throw_on_error(
    cublasStatus_t stat, const Args&... args) {
L
liaogang 已提交
170
  std::string err;
171 172 173
  if (stat == CUBLAS_STATUS_SUCCESS) {
    return;
  } else if (stat == CUBLAS_STATUS_NOT_INITIALIZED) {
L
liaogang 已提交
174
    err = "CUBLAS: not initialized, ";
175
  } else if (stat == CUBLAS_STATUS_ALLOC_FAILED) {
L
liaogang 已提交
176
    err = "CUBLAS: alloc failed, ";
177
  } else if (stat == CUBLAS_STATUS_INVALID_VALUE) {
L
liaogang 已提交
178
    err = "CUBLAS: invalid value, ";
179
  } else if (stat == CUBLAS_STATUS_ARCH_MISMATCH) {
L
liaogang 已提交
180
    err = "CUBLAS: arch mismatch, ";
181
  } else if (stat == CUBLAS_STATUS_MAPPING_ERROR) {
L
liaogang 已提交
182
    err = "CUBLAS: mapping error, ";
183
  } else if (stat == CUBLAS_STATUS_EXECUTION_FAILED) {
L
liaogang 已提交
184
    err = "CUBLAS: execution failed, ";
185
  } else if (stat == CUBLAS_STATUS_INTERNAL_ERROR) {
L
liaogang 已提交
186
    err = "CUBLAS: internal error, ";
187
  } else if (stat == CUBLAS_STATUS_NOT_SUPPORTED) {
L
liaogang 已提交
188
    err = "CUBLAS: not supported, ";
189
  } else if (stat == CUBLAS_STATUS_LICENSE_ERROR) {
L
liaogang 已提交
190
    err = "CUBLAS: license error, ";
191
  }
192
#ifndef REPLACE_ENFORCE_GLOG
193
  throw std::runtime_error(err + string::Sprintf(args...));
194 195 196
#else
  LOG(FATAL) << err << string::Sprintf(args...);
#endif
197 198
}

Y
Yi Wang 已提交
199
#ifndef __APPLE__
Y
Yu Yang 已提交
200 201 202 203 204 205
// Reports a failure when the NCCL result `stat` is not ncclSuccess.
//
// The message is the NCCL error description for `stat` followed by the text
// produced by string::Sprintf(args...). Depending on REPLACE_ENFORCE_GLOG the
// failure is either logged with LOG(FATAL) or thrown as std::runtime_error.
template <typename... Args>
inline typename std::enable_if<sizeof...(Args) != 0, void>::type throw_on_error(
    ncclResult_t stat, const Args&... args) {
  if (stat == ncclSuccess) {
    return;
  }
#ifdef REPLACE_ENFORCE_GLOG
  LOG(FATAL) << platform::dynload::ncclGetErrorString(stat)
             << string::Sprintf(args...);
#else
  throw std::runtime_error(platform::dynload::ncclGetErrorString(stat) +
                           string::Sprintf(args...));
#endif
}
Y
Yi Wang 已提交
215
#endif  // __APPLE__
216
#endif  // PADDLE_WITH_CUDA
217

L
liaogang 已提交
218 219 220 221 222
// Convenience overload for checks without a custom message: delegates to the
// two-argument throw_on_error overload for `T`, passing an empty format
// string.
template <typename T>
inline void throw_on_error(T e) {
  const char kEmptyFormat[] = "";
  throw_on_error(e, kEmptyFormat);
}

Q
qijun 已提交
223 224 225 226 227 228
// Unconditionally throws EnforceNotMet. The arguments are a printf-style
// format string plus values, formatted with Sprintf; the resulting text is
// wrapped in a std::runtime_error and tagged with the current file and line.
// All names are globally qualified so the macro expands the same way in any
// namespace.
#define PADDLE_THROW(...)                                                \
  do {                                                                   \
    throw ::paddle::platform::EnforceNotMet(                             \
        std::make_exception_ptr(                                         \
            std::runtime_error(::paddle::string::Sprintf(__VA_ARGS__))), \
        __FILE__, __LINE__);                                             \
  } while (false)
L
liaogang 已提交
230

231
// PADDLE_ENFORCE(status_or_condition, fmt, args...)
//
// Passes its arguments to ::paddle::platform::throw_on_error.
//
// Default mode: any exception raised by throw_on_error is caught and rethrown
// as EnforceNotMet tagged with the current file and line.
//
// REPLACE_ENFORCE_GLOG mode: throw_on_error is called directly (it reports
// failures through LOG(FATAL)).
//
// Both variants are single statements without a trailing semicolon, so
// `if (c) PADDLE_ENFORCE(x); else ...` is valid in either mode.
#ifndef REPLACE_ENFORCE_GLOG
#define PADDLE_ENFORCE(...)                                             \
  do {                                                                  \
    try {                                                               \
      ::paddle::platform::throw_on_error(__VA_ARGS__);                  \
    } catch (...) {                                                     \
      throw ::paddle::platform::EnforceNotMet(std::current_exception(), \
                                              __FILE__, __LINE__);      \
    }                                                                   \
  } while (false)
#else
#define PADDLE_ENFORCE(...)                          \
  do {                                               \
    ::paddle::platform::throw_on_error(__VA_ARGS__); \
  } while (false)
#endif
244

S
Superjom 已提交
245 246 247 248 249 250 251
/*
 * Some enforce helpers here, usage:
 *    int a = 1;
 *    int b = 2;
 *    PADDLE_ENFORCE_EQ(a, b);
 *
 *    will raise an exception described as follows:
 *    "enforce a == b failed, 1 != 2" with detailed stack information.
 *
 *    extra messages are also supported, for example:
 *    PADDLE_ENFORCE_EQ(a, b,
 *                      "some simple enforce failed between %d numbers", 2)
 */

// Binary comparison checks. Each one forwards to __PADDLE_BINARY_COMPARE with
// the operator that must hold and the inverse operator shown in the failure
// message. Anything after the two operands is an optional printf-style
// message (format string plus arguments).
#define PADDLE_ENFORCE_EQ(lhs, rhs, ...) \
  __PADDLE_BINARY_COMPARE(lhs, rhs, ==, !=, __VA_ARGS__)
#define PADDLE_ENFORCE_NE(lhs, rhs, ...) \
  __PADDLE_BINARY_COMPARE(lhs, rhs, !=, ==, __VA_ARGS__)
#define PADDLE_ENFORCE_GT(lhs, rhs, ...) \
  __PADDLE_BINARY_COMPARE(lhs, rhs, >, <=, __VA_ARGS__)
#define PADDLE_ENFORCE_GE(lhs, rhs, ...) \
  __PADDLE_BINARY_COMPARE(lhs, rhs, >=, <, __VA_ARGS__)
#define PADDLE_ENFORCE_LT(lhs, rhs, ...) \
  __PADDLE_BINARY_COMPARE(lhs, rhs, <, >=, __VA_ARGS__)
#define PADDLE_ENFORCE_LE(lhs, rhs, ...) \
  __PADDLE_BINARY_COMPARE(lhs, rhs, <=, >, __VA_ARGS__)
270 271 272 273 274 275 276 277 278 279
// Throws (via PADDLE_THROW) when `__VAL` compares equal to nullptr.
//
// The failure message is "<expression text> should not be null", followed on
// the next line by the optional printf-style message given after `__VAL`.
// The expression text is passed as a "%s" argument rather than pasted into the
// format string, so an expression containing '%' (e.g. `table[i % n]`) cannot
// be misread as a format directive.
#define PADDLE_ENFORCE_NOT_NULL(__VAL, ...)                    \
  do {                                                         \
    if (UNLIKELY(nullptr == (__VAL))) {                        \
      PADDLE_THROW("%s should not be null\n%s", #__VAL,        \
                   ::paddle::string::Sprintf("" __VA_ARGS__)); \
    }                                                          \
  } while (0)

// Shared implementation of the PADDLE_ENFORCE_{EQ,NE,GT,GE,LT,LE} helpers.
//
//   lhs, rhs : the operands to compare
//   cmp      : operator that must hold between them
//   inv_cmp  : inverse operator, used only in the failure text
//   ...      : optional printf-style message (format string plus arguments)
//
// On failure it throws via PADDLE_THROW with the text
// "enforce <lhs> <cmp> <rhs> failed, <lhs value> <inv_cmp> <rhs value>"
// followed by the optional message on the next line.
// Note: both operands are evaluated a second time when the failure message is
// built, so they should be free of side effects.
#define __PADDLE_BINARY_COMPARE(lhs, rhs, cmp, inv_cmp, ...)      \
  do {                                                            \
    if (UNLIKELY(!((lhs)cmp(rhs)))) {                             \
      PADDLE_THROW("enforce %s " #cmp " %s failed, %s " #inv_cmp  \
                   " %s\n%s",                                     \
                   #lhs, #rhs, paddle::string::to_string(lhs),    \
                   paddle::string::to_string(rhs),                \
                   paddle::string::Sprintf("" __VA_ARGS__));      \
    }                                                             \
  } while (false)
S
add EQ  
Superjom 已提交
288

289 290
}  // namespace platform
}  // namespace paddle