未验证 提交 6b7d4845 编写于 作者: T Thunderbrook 提交者: GitHub

add shard_id (#40261)

* shard_id

* format
上级 64223620
...@@ -148,7 +148,7 @@ void PSGPUWrapper::PreBuildTask(std::shared_ptr<HeterContext> gpu_task) { ...@@ -148,7 +148,7 @@ void PSGPUWrapper::PreBuildTask(std::shared_ptr<HeterContext> gpu_task) {
t.join(); t.join();
} }
timeline.Pause(); timeline.Pause();
VLOG(1) << "GpuPs build task cost " << timeline.ElapsedSec() << " seconds."; VLOG(0) << "GpuPs build task cost " << timeline.ElapsedSec() << " seconds.";
} else { } else {
CHECK(data_set_name.find("MultiSlotDataset") != std::string::npos); CHECK(data_set_name.find("MultiSlotDataset") != std::string::npos);
VLOG(0) << "ps_gpu_wrapper use MultiSlotDataset"; VLOG(0) << "ps_gpu_wrapper use MultiSlotDataset";
...@@ -182,7 +182,7 @@ void PSGPUWrapper::PreBuildTask(std::shared_ptr<HeterContext> gpu_task) { ...@@ -182,7 +182,7 @@ void PSGPUWrapper::PreBuildTask(std::shared_ptr<HeterContext> gpu_task) {
t.join(); t.join();
} }
timeline.Pause(); timeline.Pause();
VLOG(1) << "GpuPs build task cost " << timeline.ElapsedSec() << " seconds."; VLOG(0) << "GpuPs build task cost " << timeline.ElapsedSec() << " seconds.";
} }
timeline.Start(); timeline.Start();
...@@ -300,7 +300,7 @@ void PSGPUWrapper::BuildPull(std::shared_ptr<HeterContext> gpu_task) { ...@@ -300,7 +300,7 @@ void PSGPUWrapper::BuildPull(std::shared_ptr<HeterContext> gpu_task) {
int32_t cnt = 0; int32_t cnt = 0;
while (true) { while (true) {
auto tt = fleet_ptr->pslib_ptr_->_worker_ptr->pull_sparse_ptr( auto tt = fleet_ptr->pslib_ptr_->_worker_ptr->pull_sparse_ptr(
reinterpret_cast<char**>(local_ptr[i].data()), this->table_id_, i, reinterpret_cast<char**>(local_ptr[i].data()), this->table_id_,
local_keys[i].data(), key_size); local_keys[i].data(), key_size);
bool flag = true; bool flag = true;
...@@ -378,8 +378,8 @@ void PSGPUWrapper::BuildPull(std::shared_ptr<HeterContext> gpu_task) { ...@@ -378,8 +378,8 @@ void PSGPUWrapper::BuildPull(std::shared_ptr<HeterContext> gpu_task) {
int32_t cnt = 0; int32_t cnt = 0;
while (true) { while (true) {
auto tt = fleet_ptr->pslib_ptr_->_worker_ptr->pull_sparse_ptr( auto tt = fleet_ptr->pslib_ptr_->_worker_ptr->pull_sparse_ptr(
reinterpret_cast<char**>(local_dim_ptr[i][j].data()), this->table_id_, i, reinterpret_cast<char**>(local_dim_ptr[i][j].data()),
local_dim_keys[i][j].data(), key_size); this->table_id_, local_dim_keys[i][j].data(), key_size);
bool flag = true; bool flag = true;
tt.wait(); tt.wait();
...@@ -431,7 +431,7 @@ void PSGPUWrapper::BuildPull(std::shared_ptr<HeterContext> gpu_task) { ...@@ -431,7 +431,7 @@ void PSGPUWrapper::BuildPull(std::shared_ptr<HeterContext> gpu_task) {
t.join(); t.join();
} }
timeline.Pause(); timeline.Pause();
VLOG(1) << "pull sparse from CpuPS into GpuPS cost " << timeline.ElapsedSec() VLOG(0) << "pull sparse from CpuPS into GpuPS cost " << timeline.ElapsedSec()
<< " seconds."; << " seconds.";
if (multi_node_) { if (multi_node_) {
auto gloo_wrapper = paddle::framework::GlooWrapper::GetInstance(); auto gloo_wrapper = paddle::framework::GlooWrapper::GetInstance();
...@@ -603,7 +603,7 @@ void PSGPUWrapper::BuildPull(std::shared_ptr<HeterContext> gpu_task) { ...@@ -603,7 +603,7 @@ void PSGPUWrapper::BuildPull(std::shared_ptr<HeterContext> gpu_task) {
t.join(); t.join();
} }
timeline.Pause(); timeline.Pause();
VLOG(1) << "GpuPs prepare for build hbm cost " << timeline.ElapsedSec() VLOG(0) << "GpuPs prepare for build hbm cost " << timeline.ElapsedSec()
<< " seconds."; << " seconds.";
} }
...@@ -746,7 +746,7 @@ void PSGPUWrapper::BeginPass() { ...@@ -746,7 +746,7 @@ void PSGPUWrapper::BeginPass() {
"[BeginPass] after build_task, current task is not null.")); "[BeginPass] after build_task, current task is not null."));
} }
VLOG(1) << "BeginPass end, cost time: " << timer.ElapsedSec() << "s"; VLOG(0) << "BeginPass end, cost time: " << timer.ElapsedSec() << "s";
} }
void PSGPUWrapper::EndPass() { void PSGPUWrapper::EndPass() {
...@@ -769,7 +769,7 @@ void PSGPUWrapper::EndPass() { ...@@ -769,7 +769,7 @@ void PSGPUWrapper::EndPass() {
current_task_ = nullptr; current_task_ = nullptr;
gpu_free_channel_->Put(current_task_); gpu_free_channel_->Put(current_task_);
timer.Pause(); timer.Pause();
VLOG(1) << "EndPass end, cost time: " << timer.ElapsedSec() << "s"; VLOG(0) << "EndPass end, cost time: " << timer.ElapsedSec() << "s";
} }
void PSGPUWrapper::PullSparse(const paddle::platform::Place& place, void PSGPUWrapper::PullSparse(const paddle::platform::Place& place,
......
Markdown is supported
0% .
You are about to add 0 people to the discussion. Proceed with caution.
先完成此消息的编辑!
想要评论请 注册