memory.cc 4.1 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15
/* Copyright (c) 2016 PaddlePaddle Authors. All Rights Reserved.

Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

    http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License. */

#include "paddle/memory/memory.h"
16

L
liaogang 已提交
17 18
#include "glog/logging.h"

L
liaogang 已提交
19 20
#include "paddle/memory/detail/buddy_allocator.h"
#include "paddle/memory/detail/system_allocator.h"
L
liaogang 已提交
21 22 23
#include "paddle/platform/gpu_info.h"

// Flag declared here but not defined in this file. Its value is read (as
// FLAGS_fraction_of_gpu_memory_to_use) when a GPU buddy allocator is first
// created, to log the fraction of GPU memory each device uses.
DECLARE_double(fraction_of_gpu_memory_to_use);
L
liaogang 已提交
24

25 26 27
namespace paddle {
namespace memory {

28 29 30
// Shorthand so the functions below can name detail::BuddyAllocator without the
// `detail::` qualifier.
using BuddyAllocator = detail::BuddyAllocator;

// Returns the single buddy allocator used for every CPU allocation made
// through this file.
//
// The allocator is built on the first call from a fresh detail::CPUAllocator
// and the platform's CPU min/max chunk sizes. It is never deleted here, so the
// same pointer is returned by every subsequent call.
BuddyAllocator* GetCPUBuddyAllocator() {
  // A function-local static initializer runs exactly once, and since C++11 the
  // language serializes concurrent first calls. This replaces a hand-written
  // "if (a == nullptr) a = new ..." check, which could build two allocators if
  // the first calls arrived from different threads at the same time.
  static BuddyAllocator* const a = new BuddyAllocator(
      new detail::CPUAllocator, platform::CpuMinChunkSize(),
      platform::CpuMaxChunkSize());
  return a;
}

L
liaogang 已提交
40 41
// CPU specialization of Alloc: requests `size` bytes from the CPU buddy
// allocator and returns whatever pointer the allocator hands back. The request
// and the resulting pointer are both traced at verbosity level 10.
template <>
void* Alloc<platform::CPUPlace>(platform::CPUPlace place, size_t size) {
  VLOG(10) << "Allocate " << size << " bytes on " << platform::Place(place);

  BuddyAllocator* allocator = GetCPUBuddyAllocator();
  void* block = allocator->Alloc(size);

  VLOG(10) << "  pointer=" << block;
  return block;
}

// CPU specialization of Free: traces the pointer at verbosity level 10, then
// hands it back to the CPU buddy allocator.
template <>
void Free<platform::CPUPlace>(platform::CPUPlace place, void* p) {
  VLOG(10) << "Free pointer=" << p << " on " << platform::Place(place);

  BuddyAllocator* allocator = GetCPUBuddyAllocator();
  allocator->Free(p);
}

// CPU specialization of Used: reports the CPU buddy allocator's Used() value.
// `place` only selects this specialization; its value is not read.
template <>
size_t Used<platform::CPUPlace>(platform::CPUPlace place) {
  BuddyAllocator* allocator = GetCPUBuddyAllocator();
  return allocator->Used();
}

59
#ifdef PADDLE_WITH_CUDA
L
liaogang 已提交
60

61
// Returns the buddy allocator for GPU `gpu_id`, creating it on first use.
//
// Side effect: every call makes `gpu_id` the current device through
// platform::SetDeviceId, whether or not an allocator has to be created.
//
// `gpu_id` indexes the per-device table directly; no range check is done in
// this function.
// NOTE(review): presumably platform::SetDeviceId rejects invalid ids before
// the table is touched -- confirm against its implementation.
BuddyAllocator* GetGPUBuddyAllocator(int gpu_id) {
  // One slot per device reported by GetCUDADeviceCount(). The trailing "()"
  // value-initializes the array, so every slot starts out as nullptr. Using a
  // function-local static initializer means the table is allocated exactly
  // once, and the language (C++11 and later) serializes concurrent first calls.
  static BuddyAllocator** const as =
      new BuddyAllocator*[platform::GetCUDADeviceCount()]();

  // Switch devices before constructing the allocator: the chunk-size queries
  // below are issued after the device has been selected.
  platform::SetDeviceId(gpu_id);

  // NOTE(review): filling an individual slot is still an unsynchronized
  // check-then-set. If first use of the same device can happen on several
  // threads at once, this needs a lock or std::call_once -- confirm with
  // callers.
  if (as[gpu_id] == nullptr) {
    as[gpu_id] = new BuddyAllocator(new detail::GPUAllocator,
                                    platform::GpuMinChunkSize(),
                                    platform::GpuMaxChunkSize());
    VLOG(10) << "\n\nNOTE: each GPU device use "
             << FLAGS_fraction_of_gpu_memory_to_use * 100
             << "% of GPU memory.\n"
             << "You can set GFlags environment variable '"
             << "FLAGS_fraction_of_gpu_memory_to_use"
             << "' to change the fraction of GPU usage.\n\n";
  }
  return as[gpu_id];
}

L
liaogang 已提交
85
template <>
D
dzhwinter 已提交
86
size_t Used<platform::CUDAPlace>(platform::CUDAPlace place) {
87
  return GetGPUBuddyAllocator(place.device)->Used();
L
liaogang 已提交
88
}
L
liaogang 已提交
89

L
liaogang 已提交
90
template <>
D
dzhwinter 已提交
91
void* Alloc<platform::CUDAPlace>(platform::CUDAPlace place, size_t size) {
92 93 94 95 96 97 98 99 100 101 102 103
  auto* buddy_allocator = GetGPUBuddyAllocator(place.device);
  auto* ptr = buddy_allocator->Alloc(size);
  if (ptr == nullptr) {
    int cur_dev = platform::GetCurrentDeviceId();
    platform::SetDeviceId(place.device);
    size_t avail, total;
    platform::GpuMemoryUsage(avail, total);
    LOG(WARNING) << "Cannot allocate " << size << " bytes in GPU "
                 << place.device << ", available " << avail << " bytes";
    LOG(WARNING) << "total " << total;
    LOG(WARNING) << "GpuMinChunkSize " << platform::GpuMinChunkSize();
    LOG(WARNING) << "GpuMaxChunkSize " << platform::GpuMaxChunkSize();
D
dzhwinter 已提交
104
    LOG(WARNING) << "GPU memory used: " << Used<platform::CUDAPlace>(place);
105 106 107
    platform::SetDeviceId(cur_dev);
  }
  return ptr;
108 109
}

L
liaogang 已提交
110
template <>
D
dzhwinter 已提交
111
void Free<platform::CUDAPlace>(platform::CUDAPlace place, void* p) {
112
  GetGPUBuddyAllocator(place.device)->Free(p);
113 114
}

L
Luo Tao 已提交
115
#endif
116

117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132
// Visitor overload for CPU places: forwards to the CPU specialization of Used.
size_t Usage::operator()(const platform::CPUPlace& cpu) const {
  const size_t used_bytes = Used<platform::CPUPlace>(cpu);
  return used_bytes;
}

// Visitor overload for CUDA places. In builds without PADDLE_WITH_CUDA there
// is no GPU allocator, so the call is rejected via PADDLE_THROW; otherwise it
// forwards to the CUDA specialization of Used.
size_t Usage::operator()(const platform::CUDAPlace& gpu) const {
#ifndef PADDLE_WITH_CUDA
  PADDLE_THROW("'CUDAPlace' is not supported in CPU only device.");
#else
  return Used<platform::CUDAPlace>(gpu);
#endif
}

// Returns the Used() figure for whichever concrete place `p` currently holds,
// by dispatching a Usage visitor over the variant.
size_t memory_usage(const platform::Place& p) {
  Usage usage_visitor;
  return boost::apply_visitor(usage_visitor, p);
}

133 134
}  // namespace memory
}  // namespace paddle