From 1bdea0a8d2fffe282c741712ade39d3604472fb9 Mon Sep 17 00:00:00 2001
From: wanghaoshuang <wanghaoshuang@baidu.com>
Date: Tue, 24 Apr 2018 13:41:39 +0800
Subject: [PATCH] Add init interface for customized devices.

---
 paddle/fluid/framework/init.cc | 73 ++++++++++++++++++++++++++++++++++
 paddle/fluid/framework/init.h  |  4 ++
 paddle/fluid/inference/io.cc   |  2 +
 paddle/fluid/inference/io.h    |  2 +
 4 files changed, 81 insertions(+)
diff --git a/paddle/fluid/framework/init.cc b/paddle/fluid/framework/init.cc
index 75c557fa42..3ce37041cb 100644
--- a/paddle/fluid/framework/init.cc
+++ b/paddle/fluid/framework/init.cc
@@ -15,19 +15,40 @@ limitations under the License. */
 #include <algorithm>
+#include <sstream>
 #include <stdexcept>
 #include <string>
+#include <vector>
 
 #include "paddle/fluid/framework/init.h"
 #include "paddle/fluid/framework/operator.h"
 #include "paddle/fluid/platform/device_context.h"
 #include "paddle/fluid/platform/place.h"
 #include "paddle/fluid/string/piece.h"
 
 namespace paddle {
 namespace framework {
 
+DEFINE_string(devices, "", "The devices to be used.");  // comma-separated ids
+DEFINE_bool(init_p2p, true, "Whether to init p2p.");    // forwarded by Init()
+
 std::once_flag gflags_init_flag;
 std::once_flag p2p_init_flag;
 
+using paddle::platform::DeviceContextPool;
+
+// Parses gflags once, then initializes the comma-separated --devices ids.
+void Init(int argc, char **argv) {
+  std::call_once(gflags_init_flag,
+                 [&]() { google::ParseCommandLineFlags(&argc, &argv, true); });
+  std::vector<int> devices;
+  std::string token;
+  std::istringstream tokenStream(FLAGS_devices);
+  while (std::getline(tokenStream, token, ',')) {
+    if (token.empty()) continue;  // stoi("") throws; allow ",0" and "0,,1"
+    devices.push_back(std::stoi(token));
+  }
+  InitDevices(FLAGS_init_p2p, devices);
+}
+
 void InitGflags(std::vector<std::string> &argv) {
   std::call_once(gflags_init_flag, [&]() {
     int argc = argv.size();
@@ -64,6 +85,30 @@ void InitP2P(int count) {
 #endif
 }
 
+// Tries to enable CUDA peer access for every ordered pair of distinct ids in
+// `devices`; the body runs at most once, guarded by p2p_init_flag.
+void InitP2P(std::vector<int> devices) {
+#ifdef PADDLE_WITH_CUDA
+  std::call_once(p2p_init_flag, [&]() {
+    for (const int src : devices) {
+      for (const int dst : devices) {
+        if (src == dst) continue;
+        int peer_ok = -1;
+        PADDLE_ENFORCE(cudaDeviceCanAccessPeer(&peer_ok, src, dst),
+                       "Failed to test P2P access.");
+        if (peer_ok == 1) {
+          cudaSetDevice(src);
+          cudaDeviceEnablePeerAccess(dst, 0);
+        } else {
+          LOG(WARNING) << "Cannot enable P2P access from " << src << " to "
+                       << dst;
+        }
+      }
+    }
+  });
+#endif
+}
+
 void InitDevices(bool init_p2p) {
   /*Init all avaiable devices by default */
 
@@ -91,6 +136,34 @@ void InitDevices(bool init_p2p) {
   platform::DeviceContextPool::Init(places);
 }
 
+// Registers the valid GPU ids of `devices`, then the CPU, as pool places.
+void InitDevices(bool init_p2p, const std::vector<int> devices) {
+  int count = 0;  // stays 0 without CUDA or when the device query throws
+#ifdef PADDLE_WITH_CUDA
+  try {
+    count = platform::GetCUDADeviceCount();
+  } catch (const std::exception &exp) {
+    LOG(WARNING) << "Compiled with WITH_GPU, but no GPU found in runtime.";
+  }
+#else
+  LOG(WARNING)
+      << "'CUDA' is not supported, Please re-compile with WITH_GPU option";
+#endif
+  std::vector<int> usable;  // ids in [0, count); the only ones P2P may touch
+  std::vector<platform::Place> places;
+  for (const int id : devices) {
+    if (id < 0 || id >= count) {  // also rejects negative ids
+      LOG(WARNING) << "Invalid devices id.";
+      continue;
+    }
+    usable.push_back(id);
+    places.emplace_back(platform::CUDAPlace(id));
+  }
+  if (init_p2p) InitP2P(usable);  // skipped ids never reach the peer probe
+  places.emplace_back(platform::CPUPlace());
+  platform::DeviceContextPool::Init(places);
+}
+
 void InitGLOG(const std::string &prog_name) {
   // glog will not hold the ARGV[0] inside.
   // Use strdup to alloc a new string.
diff --git a/paddle/fluid/framework/init.h b/paddle/fluid/framework/init.h
index fae98a60b5..38604d232c 100644
--- a/paddle/fluid/framework/init.h
+++ b/paddle/fluid/framework/init.h
@@ -20,11 +20,15 @@ limitations under the License. */
 namespace paddle {
 namespace framework {
 
+void Init(int argc, char **argv);  // parses gflags, then inits --devices
+
 void InitGflags(std::vector<std::string> &argv);
 
 void InitGLOG(const std::string &prog_name);
 
 void InitDevices(bool init_p2p);
 
+void InitDevices(bool init_p2p, const std::vector<int> devices);  // CUDA ids
+
 }  // namespace framework
 }  // namespace paddle
diff --git a/paddle/fluid/inference/io.cc b/paddle/fluid/inference/io.cc
index 78d2f16746..74068d9dbe 100644
--- a/paddle/fluid/inference/io.cc
+++ b/paddle/fluid/inference/io.cc
@@ -28,6 +28,8 @@ namespace inference {
 // linking the inference shared library.
 void Init(bool init_p2p) { framework::InitDevices(init_p2p); }
 
+void Init(int argc, char** argv) { framework::Init(argc, argv); }  // forwarder
+
 void ReadBinaryFile(const std::string& filename, std::string* contents) {
   std::ifstream fin(filename, std::ios::in | std::ios::binary);
   PADDLE_ENFORCE(static_cast<bool>(fin), "Cannot open file %s", filename);
diff --git a/paddle/fluid/inference/io.h b/paddle/fluid/inference/io.h
index ba3e45099a..988b8aebbe 100644
--- a/paddle/fluid/inference/io.h
+++ b/paddle/fluid/inference/io.h
@@ -27,6 +27,8 @@ namespace inference {
 
 void Init(bool init_p2p);
 
+void Init(int argc, char** argv);  // forwards to framework::Init
+
 void LoadPersistables(framework::Executor* executor, framework::Scope* scope,
                       const framework::ProgramDesc& main_program,
                       const std::string& dirname,
-- 
GitLab