未验证 提交 08fa98f7 编写于 作者: Z Zeng Jinle 提交者: GitHub

Fix gpu_info PADDLE_ENFORCE_GT when fraction_of_gpu_memory_to_use=1.0 (#18950)

* fix gpu_info, test=develop

* fix reserving gpu memory calculation bug, add fraction=1 unittest, test=develop

* fix bug again for reserving size, test=develop
上级 3ab1866c
...@@ -208,6 +208,31 @@ TEST(BuddyAllocator, AllocFromAvailable) { ...@@ -208,6 +208,31 @@ TEST(BuddyAllocator, AllocFromAvailable) {
TestBuddyAllocator(&buddy_allocator, 10 << 10); TestBuddyAllocator(&buddy_allocator, 10 << 10);
TestBuddyAllocator(&buddy_allocator, 10 << 20); TestBuddyAllocator(&buddy_allocator, 10 << 20);
TestBuddyAllocator(&buddy_allocator, static_cast<size_t>(1 << 30)); TestBuddyAllocator(&buddy_allocator, static_cast<size_t>(1 << 30));
if (p) {
EXPECT_TRUE(cudaFree(p) == cudaSuccess);
}
}
TEST(BuddyAllocator, AllocFromAvailableWhenFractionIsOne) {
FLAGS_fraction_of_gpu_memory_to_use = 1.0;
FLAGS_initial_gpu_memory_in_mb = 0;
FLAGS_reallocate_gpu_memory_in_mb = 0;
void* p = nullptr;
EXPECT_TRUE(cudaMalloc(&p, static_cast<size_t>(4) << 30) == cudaSuccess);
// BuddyAllocator should be able to alloc the remaining GPU
BuddyAllocator buddy_allocator(
std::unique_ptr<SystemAllocator>(new GPUAllocator(TEST_GPU_ID)),
platform::GpuMinChunkSize(), platform::GpuMaxChunkSize());
TestBuddyAllocator(&buddy_allocator, static_cast<size_t>(1) << 30);
TestBuddyAllocator(&buddy_allocator, static_cast<size_t>(5) << 30);
if (p) {
EXPECT_TRUE(cudaFree(p) == cudaSuccess);
}
} }
#endif #endif
......
...@@ -230,12 +230,15 @@ void GpuMemoryUsage(size_t *available, size_t *total) { ...@@ -230,12 +230,15 @@ void GpuMemoryUsage(size_t *available, size_t *total) {
size_t GpuAvailableMemToAlloc() { size_t GpuAvailableMemToAlloc() {
size_t total = 0; size_t total = 0;
size_t available = 0; size_t available = 0;
size_t reserving = static_cast<size_t>(fraction_reserve_gpu_memory * total);
GpuMemoryUsage(&available, &total); GpuMemoryUsage(&available, &total);
size_t reserving =
static_cast<size_t>(fraction_reserve_gpu_memory * available);
// If available size is less than minimum chunk size, no usable memory exists // If available size is less than minimum chunk size, no usable memory exists
size_t available_to_alloc = available - reserving;
size_t min_chunk_size = GpuMinChunkSize(); size_t min_chunk_size = GpuMinChunkSize();
size_t available_to_alloc = if (available_to_alloc < min_chunk_size) {
std::min(available > min_chunk_size ? available : 0, total - reserving); available_to_alloc = 0;
}
VLOG(10) << "GPU usage " << (available >> 20) << "M/" << (total >> 20) VLOG(10) << "GPU usage " << (available >> 20) << "M/" << (total >> 20)
<< "M, " << (available_to_alloc >> 20) << "M available to allocate"; << "M, " << (available_to_alloc >> 20) << "M available to allocate";
return available_to_alloc; return available_to_alloc;
...@@ -255,7 +258,7 @@ static size_t GpuAllocSize(bool realloc) { ...@@ -255,7 +258,7 @@ static size_t GpuAllocSize(bool realloc) {
size_t alloc_bytes = size_t alloc_bytes =
(flag_mb > 0ul ? flag_mb << 20 : available_to_alloc * (flag_mb > 0ul ? flag_mb << 20 : available_to_alloc *
FLAGS_fraction_of_gpu_memory_to_use); FLAGS_fraction_of_gpu_memory_to_use);
PADDLE_ENFORCE_GT(available_to_alloc, alloc_bytes, PADDLE_ENFORCE_GE(available_to_alloc, alloc_bytes,
"No enough available GPU memory"); "No enough available GPU memory");
VLOG(10) << "Alloc size is " << (alloc_bytes >> 20) VLOG(10) << "Alloc size is " << (alloc_bytes >> 20)
<< " MiB, is it Re-alloc: " << realloc; << " MiB, is it Re-alloc: " << realloc;
......
Markdown is supported
0% .
You are about to add 0 people to the discussion. Proceed with caution.
先完成此消息的编辑!
想要评论请 注册