/* Copyright (c) 2016 PaddlePaddle Authors. All Rights Reserved.

Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

    http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License. */

Y
Yi Wang 已提交
15
#include "paddle/fluid/memory/memory.h"
16

L
liaogang 已提交
17 18
#include "glog/logging.h"

Y
Yi Wang 已提交
19 20 21
#include "paddle/fluid/memory/detail/buddy_allocator.h"
#include "paddle/fluid/memory/detail/system_allocator.h"
#include "paddle/fluid/platform/gpu_info.h"
L
liaogang 已提交
22 23

// Brings FLAGS_fraction_of_gpu_memory_to_use into scope; this file only reads
// it, to report the configured fraction in the GPU allocator log messages.
DECLARE_double(fraction_of_gpu_memory_to_use);
L
liaogang 已提交
24

25 26 27
namespace paddle {
namespace memory {

28 29 30
// Local shorthand for detail::BuddyAllocator, the allocator type handed out by
// the Get*BuddyAllocator() accessors in this file.
using BuddyAllocator = detail::BuddyAllocator;

// Returns the single buddy allocator used for CPU memory.
//
// The allocator is built on the first call from a detail::CPUAllocator and the
// platform's CPU min/max chunk sizes; every later call returns the same
// pointer. This function never deletes it.
BuddyAllocator* GetCPUBuddyAllocator() {
  // A function-local static initializer runs exactly once, and since C++11
  // concurrent first calls wait for that one initialization to finish. The
  // earlier "if (a == nullptr) a = new ..." form had no such guarantee: two
  // threads racing on the first call could each construct an allocator.
  static BuddyAllocator* const allocator = new BuddyAllocator(
      new detail::CPUAllocator, platform::CpuMinChunkSize(),
      platform::CpuMaxChunkSize());
  return allocator;
}

L
liaogang 已提交
40
template <>
C
chengduoZH 已提交
41
void* Alloc<platform::CPUPlace>(platform::CPUPlace place, size_t size,
C
chengduoZH 已提交
42
                                bool is_pinned) {
43
  VLOG(10) << "Allocate " << size << " bytes on " << platform::Place(place);
44
  void* p = GetCPUBuddyAllocator()->Alloc(size);
45
  VLOG(10) << "  pointer=" << p;
46
  return p;
L
liaogang 已提交
47 48 49
}

template <>
C
chengduoZH 已提交
50
void Free<platform::CPUPlace>(platform::CPUPlace place, void* p,
C
chengduoZH 已提交
51
                              bool is_pinned) {
52
  VLOG(10) << "Free pointer=" << p << " on " << platform::Place(place);
L
liaogang 已提交
53 54 55 56 57 58 59 60
  GetCPUBuddyAllocator()->Free(p);
}

// CPU specialization of Used: forwards to the CPU buddy allocator's Used()
// and returns its result. `place` is not read.
template <>
size_t Used<platform::CPUPlace>(platform::CPUPlace place) {
  BuddyAllocator* const cpu_allocator = GetCPUBuddyAllocator();
  return cpu_allocator->Used();
}

61
#ifdef PADDLE_WITH_CUDA
L
liaogang 已提交
62

63
// Returns the buddy allocator for device `gpu_id`, creating it on first use.
//
// A table with one slot per CUDA device is allocated on the first call. Every
// call makes `gpu_id` the current device (platform::SetDeviceId) before the
// slot is inspected, so the device stays selected after this returns.
//
// `gpu_id` is used as an index without a range check.
// NOTE(review): the lazy initialization is unsynchronized -- confirm callers
// serialize first use per device.
BuddyAllocator* GetGPUBuddyAllocator(int gpu_id) {
  static BuddyAllocator** per_device = nullptr;
  if (per_device == nullptr) {
    const int device_count = platform::GetCUDADeviceCount();
    // The trailing "()" value-initializes the array, so every slot starts out
    // as a null pointer.
    per_device = new BuddyAllocator*[device_count]();
  }

  platform::SetDeviceId(gpu_id);

  BuddyAllocator*& slot = per_device[gpu_id];
  if (slot == nullptr) {
    slot = new BuddyAllocator(new detail::GPUAllocator,
                              platform::GpuMinChunkSize(),
                              platform::GpuMaxChunkSize());
    VLOG(10) << "\n\nNOTE: each GPU device use "
             << FLAGS_fraction_of_gpu_memory_to_use * 100
             << "% of GPU memory.\n"
             << "You can set GFlags environment variable '"
             << "FLAGS_fraction_of_gpu_memory_to_use"
             << "' to change the fraction of GPU usage.\n\n";
  }
  return slot;
}

C
chengduoZH 已提交
87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110
// Returns the buddy allocator built on detail::CUDAPinnedAllocator for device
// `gpu_id`, creating it on first use.
//
// A table with one slot per CUDA device is allocated on the first call. Every
// call makes `gpu_id` the current device (platform::SetDeviceId) before the
// slot is inspected. The allocator is sized with the GPU min/max chunk sizes.
//
// `gpu_id` is used as an index without a range check.
// NOTE(review): the lazy initialization is unsynchronized -- confirm callers
// serialize first use per device.
BuddyAllocator* GetCUDAPinnedBuddyAllocator(int gpu_id) {
  static BuddyAllocator** per_device = nullptr;
  if (per_device == nullptr) {
    const int device_count = platform::GetCUDADeviceCount();
    // The trailing "()" value-initializes the array, so every slot starts out
    // as a null pointer.
    per_device = new BuddyAllocator*[device_count]();
  }

  platform::SetDeviceId(gpu_id);

  BuddyAllocator*& slot = per_device[gpu_id];
  if (slot == nullptr) {
    slot = new BuddyAllocator(new detail::CUDAPinnedAllocator,
                              platform::GpuMinChunkSize(),
                              platform::GpuMaxChunkSize());
    VLOG(10) << "\n\nNOTE: each GPU device use "
             << FLAGS_fraction_of_gpu_memory_to_use * 100
             << "% of GPU memory.\n"
             << "You can set GFlags environment variable '"
             << "FLAGS_fraction_of_gpu_memory_to_use"
             << "' to change the fraction of GPU usage.\n\n";
  }
  return slot;
}

L
liaogang 已提交
111
template <>
D
dzhwinter 已提交
112
size_t Used<platform::CUDAPlace>(platform::CUDAPlace place) {
113
  return GetGPUBuddyAllocator(place.device)->Used();
L
liaogang 已提交
114
}
L
liaogang 已提交
115

L
liaogang 已提交
116
template <>
C
chengduoZH 已提交
117
void* Alloc<platform::CUDAPlace>(platform::CUDAPlace place, size_t size,
C
chengduoZH 已提交
118
                                 bool is_pinned) {
C
chengduoZH 已提交
119
  void* ptr;
C
chengduoZH 已提交
120
  if (is_pinned) {
C
chengduoZH 已提交
121 122 123 124 125 126 127
    auto* buddy_allocator = GetCUDAPinnedBuddyAllocator(place.device);
    ptr = buddy_allocator->Alloc(size);
  } else {
    auto* buddy_allocator = GetGPUBuddyAllocator(place.device);
    ptr = buddy_allocator->Alloc(size);
  }

128 129 130 131 132 133 134 135 136 137
  if (ptr == nullptr) {
    int cur_dev = platform::GetCurrentDeviceId();
    platform::SetDeviceId(place.device);
    size_t avail, total;
    platform::GpuMemoryUsage(avail, total);
    LOG(WARNING) << "Cannot allocate " << size << " bytes in GPU "
                 << place.device << ", available " << avail << " bytes";
    LOG(WARNING) << "total " << total;
    LOG(WARNING) << "GpuMinChunkSize " << platform::GpuMinChunkSize();
    LOG(WARNING) << "GpuMaxChunkSize " << platform::GpuMaxChunkSize();
D
dzhwinter 已提交
138
    LOG(WARNING) << "GPU memory used: " << Used<platform::CUDAPlace>(place);
139 140 141
    platform::SetDeviceId(cur_dev);
  }
  return ptr;
142 143
}

L
liaogang 已提交
144
template <>
C
chengduoZH 已提交
145
void Free<platform::CUDAPlace>(platform::CUDAPlace place, void* p,
C
chengduoZH 已提交
146 147
                               bool is_pinned) {
  if (is_pinned) {
C
chengduoZH 已提交
148 149 150 151
    GetCUDAPinnedBuddyAllocator(place.device)->Free(p);
  } else {
    GetGPUBuddyAllocator(place.device)->Free(p);
  }
152 153
}

L
Luo Tao 已提交
154
#endif
155

156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171
// Visitor overload for CPU places: returns Used() for `cpu`.
size_t Usage::operator()(const platform::CPUPlace& cpu) const {
  return Used<platform::CPUPlace>(cpu);
}

// Visitor overload for CUDA places: returns Used() for `gpu` when the build
// defines PADDLE_WITH_CUDA; otherwise raises through PADDLE_THROW.
size_t Usage::operator()(const platform::CUDAPlace& gpu) const {
#ifndef PADDLE_WITH_CUDA
  PADDLE_THROW("'CUDAPlace' is not supported in CPU only device.");
#else
  return Used<platform::CUDAPlace>(gpu);
#endif
}

// Returns the result of applying a Usage visitor to `p`, i.e. the Usage
// overload matching whichever place type `p` currently holds.
size_t memory_usage(const platform::Place& p) {
  Usage usage_visitor;
  return boost::apply_visitor(usage_visitor, p);
}

172 173
}  // namespace memory
}  // namespace paddle