/* Copyright (c) 2016 Baidu, Inc. All Rights Reserve. Licensed under the Apache License, Version 2.0 (the "License"); you may not use this file except in compliance with the License. You may obtain a copy of the License at http://www.apache.org/licenses/LICENSE-2.0 Unless required by applicable law or agreed to in writing, software distributed under the License is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the License for the specific language governing permissions and limitations under the License. */ #include "Util.h" #include #include #include #include #include #include #include #include #include "paddle/utils/Logging.h" #include "CommandLineParser.h" #include "CustomStackTrace.h" #include "Thread.h" #include "ThreadLocal.h" #include "Version.h" #include "StringUtil.h" P_DEFINE_int32(seed, 1, "random number seed. 0 for srand(time)"); #ifdef WITH_GOOGLE_PERFTOOLS /* In order to use google profiler, you need to install gperftools, which can be obtained at: https://gperftools.googlecode.com/files/gperftools-2.0.tar.gz gperftools should be configured with --enable-frame-pointers Then link the executable with -lprofiler. After you start the application, you can use kill -s signal PID to start/stop profiling. The profile data will be stored in file FLAGS_profile_data_file, which can be analyzed by pprof. */ #include P_DEFINE_int32(profile_signal, 12, "signal for switch google profiler"); P_DEFINE_string(profile_data_file, "gperf.prof", "file for storing profile data"); static void profilerSwitch(int signalNumber) { bool static started = false; if (!started) { if (ProfilerStart(FLAGS_profile_data_file.c_str())) { LOG(INFO) << "Profiler started"; } else { LOG(WARNING) << "Can't turn on cpu profiling for " << FLAGS_profile_data_file; } } else { ProfilerStop(); LOG(INFO) << "Profiler stopped"; } started = !started; } static void installProfilerSwitch() { sighandler_t oldHandler = signal(FLAGS_profile_signal, profilerSwitch); if (!oldHandler) { LOG(INFO) << "Using signal " << FLAGS_profile_signal << " to turn on/off profiler"; } else { LOG(WARNING) << "Signal " << FLAGS_profile_signal << " is already in use\n"; } } #else static void installProfilerSwitch() {} #endif // WITH_GOOGLE_PERFTOOLS namespace paddle { pid_t getTID() { #if defined(__APPLE__) || defined(__OSX__) pid_t tid = syscall(SYS_thread_selfid); #else #ifndef __NR_gettid #define __NR_gettid 224 #endif pid_t tid = syscall(__NR_gettid); #endif CHECK_NE(tid, -1); return tid; } static bool g_initialized = false; typedef std::pair> PriorityFuncPair; typedef std::vector InitFuncList; static InitFuncList* g_initFuncs = nullptr; static std::once_flag g_onceFlag; void registerInitFunction(std::function func, int priority) { if (g_initialized) { LOG(FATAL) << "registerInitFunction() should only called before initMain()"; } if (!g_initFuncs) { g_initFuncs = new InitFuncList(); } g_initFuncs->push_back(std::make_pair(priority, func)); } void runInitFunctions() { std::call_once(g_onceFlag, []() { LOG(INFO) << "Calling runInitFunctions"; if (g_initFuncs) { std::sort(g_initFuncs->begin(), g_initFuncs->end(), [](const PriorityFuncPair& x, const PriorityFuncPair& y) { return x.first > y.first; }); for (auto& f : *g_initFuncs) { f.second(); } delete g_initFuncs; g_initFuncs = nullptr; } g_initialized = true; LOG(INFO) << "Call runInitFunctions done."; }); } void initMain(int argc, char** argv) { initializeLogging(argc, argv); installLayerStackTracer(); std::string line; for (int i = 0; i < argc; ++i) { line += argv[i]; line += ' '; } LOG(INFO) << "commandline: " << line; ParseCommandLineFlags(&argc, argv, true); CHECK_EQ(argc, 1) << "Unknown commandline argument: " << argv[1]; installProfilerSwitch(); _MM_SET_FLUSH_ZERO_MODE(_MM_FLUSH_ZERO_ON); _MM_SET_DENORMALS_ZERO_MODE(_MM_DENORMALS_ZERO_ON); if (FLAGS_seed == 0) { unsigned int t = time(NULL); srand(t); ThreadLocalRand::initSeed(t); LOG(INFO) << "random number seed=" << t; } else { srand(FLAGS_seed); ThreadLocalRand::initSeed(FLAGS_seed); } if (FLAGS_use_gpu) { // This is the initialization of the CUDA environment, // need before runInitFunctions. // TODO(hedaoyuan) Can be considered in the runInitFunctions, // but to ensure that it is the first to initialize. hl_start(); hl_init(FLAGS_gpu_id); } version::printVersion(); runInitFunctions(); } std::string readFile(const std::string& fileName) { std::ifstream is(fileName); // get length of file: is.seekg(0, is.end); size_t length = is.tellg(); is.seekg(0, is.beg); std::string str(length, (char)0); CHECK(is.read(&str[0], length)) << "Fail to read file: " << fileName; return str; } namespace path { std::string basename(const std::string& path) { size_t pos = path.rfind(sep); ++pos; return path.substr(pos, std::string::npos); } std::string dirname(const std::string& path) { size_t pos = path.rfind(sep); if (pos == std::string::npos) return std::string(); return path.substr(0, pos); } std::string join(const std::string& part1, const std::string& part2) { if (!part2.empty() && part2.front() == sep) { return part2; } std::string ret; ret.reserve(part1.size() + part2.size() + 1); ret = part1; if (!ret.empty() && ret.back() != sep) { ret += sep; } ret += part2; return ret; } } // namespace path void copyFileToPath(const std::string& file, const std::string& dir) { LOG(INFO) << "copy " << file << " to " << dir; std::string fileName = path::basename(file); std::string dst = path::join(dir, fileName); std::ifstream source(file, std::ios_base::binary); std::ofstream dest(dst, std::ios_base::binary); CHECK(source) << "Fail to open " << file; CHECK(dest) << "Fail to open " << dst; dest << source.rdbuf(); source.close(); dest.close(); } bool fileExist(const char* filename) { return (access(filename, 0) == 0); } void touchFile(const char* filename) { if (!fileExist(filename)) { std::ofstream os(filename); } } int isDir(const char* path) { struct stat s_buf; if (stat(path, &s_buf)) { return 0; } return S_ISDIR(s_buf.st_mode); } void rmDir(const char* folderName) { if (isDir(folderName)) { DIR* dp; struct dirent* ep; std::string buf; dp = opendir(folderName); while ((ep = readdir(dp)) != NULL) { if (strcmp(ep->d_name, ".") && strcmp(ep->d_name, "..")) { buf = std::string(folderName) + "/" + std::string(ep->d_name); if (isDir(buf.c_str())) { rmDir(buf.c_str()); } else { remove(buf.c_str()); } } } closedir(dp); rmdir(folderName); } } void mkDir(const char* filename) { if (mkdir(filename, 0755)) { CHECK(errno == EEXIST) << filename << "mkdir failed!"; } } void mkDirRecursively(const char *dir) { struct stat sb; if (!stat(dir, &sb)) return; mkDirRecursively(path::dirname(dir).c_str()); mkDir(dir); } void loadFileList(const std::string& fileListFileName, std::vector& fileList) { std::ifstream is(fileListFileName); CHECK(is) << "Fail to open " << fileListFileName; std::string line; while (is) { if (!getline(is, line)) break; fileList.push_back(line); } } double getMemoryUsage() { FILE* fp = fopen("/proc/meminfo", "r"); CHECK(fp) << "failed to fopen /proc/meminfo"; size_t bufsize = 256 * sizeof(char); char* buf = new (std::nothrow) char[bufsize]; CHECK(buf); int totalMem = -1; int freeMem = -1; int bufMem = -1; int cacheMem = -1; while (getline(&buf, &bufsize, fp) >= 0) { if (0 == strncmp(buf, "MemTotal", 8)) { if (1 != sscanf(buf, "%*s%d", &totalMem)) { LOG(FATAL) << "failed to get MemTotal from string: [" << buf << "]"; } } else if (0 == strncmp(buf, "MemFree", 7)) { if (1 != sscanf(buf, "%*s%d", &freeMem)) { LOG(FATAL) << "failed to get MemFree from string: [" << buf << "]"; } } else if (0 == strncmp(buf, "Buffers", 7)) { if (1 != sscanf(buf, "%*s%d", &bufMem)) { LOG(FATAL) << "failed to get Buffers from string: [" << buf << "]"; } } else if (0 == strncmp(buf, "Cached", 6)) { if (1 != sscanf(buf, "%*s%d", &cacheMem)) { LOG(FATAL) << "failed to get Cached from string: [" << buf << "]"; } } if (totalMem != -1 && freeMem != -1 && bufMem != -1 && cacheMem != -1) { break; } } CHECK(totalMem != -1 && freeMem != -1 && bufMem != -1 && cacheMem != -1) << "failed to get all information"; fclose(fp); delete[] buf; double usedMem = 1.0 - 1.0 * (freeMem + bufMem + cacheMem) / totalMem; return usedMem; } SyncThreadPool* getGlobalSyncThreadPool() { static std::unique_ptr syncThreadPool; if (syncThreadPool && syncThreadPool->getNumThreads() != (size_t)FLAGS_trainer_count) { LOG(WARNING) << "trainer_count changed in training process!"; syncThreadPool.reset(nullptr); } if (!syncThreadPool) { syncThreadPool.reset(new SyncThreadPool(FLAGS_trainer_count)); } return syncThreadPool.get(); } size_t calculateServiceNum(const std::string& pservers, int ports_num) { std::vector hosts; str::split(pservers, ',', &hosts); return hosts.size() * ports_num; } void memcpyWithCheck(void* dest, const void* src, size_t num, const void* srcEnd) { int minus = (char*)srcEnd - (char*)src - num; CHECK_LE(0, minus) << "memcpyWithCheck: copy " << num << " bytes data out of range."; memcpy(dest, src, num); } hl_activation_mode_t hlActiveType(const std::string& type) { if (type == "sigmoid") { return HL_ACTIVATION_SIGMOID; } else if (type == "relu") { return HL_ACTIVATION_RELU; } else if (type == "tanh") { return HL_ACTIVATION_TANH; } else if (type == "linear") { return HL_ACTIVATION_LINEAR; } else { LOG(FATAL) << "Do not support activation type " << type; } } } // namespace paddle