diff --git a/paddle/fluid/memory/allocation/CMakeLists.txt b/paddle/fluid/memory/allocation/CMakeLists.txt
index b2be837832336b2e5e08291feae67333854ae676..2f69b5c0c8619b09453dbb66cb40f0a18ba204d8 100644
--- a/paddle/fluid/memory/allocation/CMakeLists.txt
+++ b/paddle/fluid/memory/allocation/CMakeLists.txt
@@ -2,6 +2,7 @@ cc_library(allocator SRCS allocator.cc DEPS place)
 cc_library(cpu_allocator SRCS cpu_allocator.cc DEPS allocator)
 cc_library(best_fit_allocator SRCS best_fit_allocator.cc DEPS allocator)
 cc_library(locked_allocator SRCS locked_allocator.cc DEPS allocator)
+cc_library(buffered_allocator SRCS buffered_allocator.cc DEPS allocator)
 
 if (WITH_GPU)
   nv_library(cuda_allocator SRCS cuda_allocator.cc DEPS allocator cuda_device_guard)
@@ -51,7 +52,8 @@ cc_library(allocator_facade SRCS allocator_facade.cc DEPS
         auto_increment_allocator
         zero_size_allocator
         conditional_allocator
-        retry_allocator)
+        retry_allocator
+        buffered_allocator)
 
 nv_test(allocation_and_eigen_test SRCS allocation_and_eigen_test.cu DEPS allocator_facade)
 
diff --git a/paddle/fluid/memory/allocation/allocator.h b/paddle/fluid/memory/allocation/allocator.h
index e117a2d1537a899e3d0fe990e2aece38c1cfbd63..9c838362d975b5b7c99f5196da7f757286126242 100644
--- a/paddle/fluid/memory/allocation/allocator.h
+++ b/paddle/fluid/memory/allocation/allocator.h
@@ -12,22 +12,6 @@
 // See the License for the specific language governing permissions and
 // limitations under the License.
 
-#include <utility>
-
-// Copyright (c) 2018 PaddlePaddle Authors. All Rights Reserved.
-//
-// Licensed under the Apache License, Version 2.0 (the "License");
-// you may not use this file except in compliance with the License.
-// You may obtain a copy of the License at
-//
-//     http://www.apache.org/licenses/LICENSE-2.0
-//
-// Unless required by applicable law or agreed to in writing, software
-// distributed under the License is distributed on an "AS IS" BASIS,
-// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-// See the License for the specific language governing permissions and
-// limitations under the License.
-
 #pragma once
 #include <memory>
 #include <string>
@@ -141,11 +125,7 @@ class Allocator {
 // a manally managed allocator.
 class UnmanagedAllocator : public Allocator {
  public:
-  virtual void Free(Allocation* allocation) = 0;
-
-  void FreeUniquePtr(std::unique_ptr<Allocation> allocation) {
-    Free(allocation.get());
-  }
+  virtual void FreeUniquePtr(std::unique_ptr<Allocation> allocation) = 0;
 };
 
 // The allocation will be managed by smart pointers. i.e., users do not need
diff --git a/paddle/fluid/memory/allocation/best_fit_allocator.cc b/paddle/fluid/memory/allocation/best_fit_allocator.cc
index 8cc943c861acff4abb148bde1397343f03e896b1..b903fa437bb5d4aae1a0d152263d2ec70c8034b3 100644
--- a/paddle/fluid/memory/allocation/best_fit_allocator.cc
+++ b/paddle/fluid/memory/allocation/best_fit_allocator.cc
@@ -104,8 +104,8 @@ BestFitAllocator::ListIt BestFitAllocator::SplitChunk(size_t request_size,
   return to_use_it;
 }
 
-void BestFitAllocator::Free(Allocation* allocation) {
-  auto* bf_allocation = dynamic_cast<BestFitAllocation*>(allocation);
+void BestFitAllocator::FreeUniquePtr(std::unique_ptr<Allocation> allocation) {
+  auto* bf_allocation = dynamic_cast<BestFitAllocation*>(allocation.get());
   auto chunk_it = bf_allocation->ChunkIterator();
   PADDLE_ENFORCE(!chunk_it->is_free);
   chunk_it->is_free = true;
diff --git a/paddle/fluid/memory/allocation/best_fit_allocator.h b/paddle/fluid/memory/allocation/best_fit_allocator.h
index da62bc4bb61e09f8b49cdc5e67f7932aa21a860e..405306bba7b17abe7305740d1b700185076f8ee8 100644
--- a/paddle/fluid/memory/allocation/best_fit_allocator.h
+++ b/paddle/fluid/memory/allocation/best_fit_allocator.h
@@ -109,7 +109,7 @@ class BestFitAllocator : public UnmanagedAllocator {
 
   std::unique_ptr<Allocation> Allocate(size_t size,
                                        Attr attr = kDefault) override;
-  void Free(Allocation* allocation) override;
+  void FreeUniquePtr(std::unique_ptr<Allocation> allocation) override;
 
   size_t NumFreeChunks() const;
 
diff --git a/paddle/fluid/memory/allocation/buffered_allocator.cc b/paddle/fluid/memory/allocation/buffered_allocator.cc
new file mode 100644
index 0000000000000000000000000000000000000000..1eb1d3c7e8d402e1d889d7ec0f1ed82acae64758
--- /dev/null
+++ b/paddle/fluid/memory/allocation/buffered_allocator.cc
@@ -0,0 +1,176 @@
+// Copyright (c) 2018 PaddlePaddle Authors. All Rights Reserved.
+//
+// Licensed under the Apache License, Version 2.0 (the "License");
+// you may not use this file except in compliance with the License.
+// You may obtain a copy of the License at
+//
+//     http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing, software
+// distributed under the License is distributed on an "AS IS" BASIS,
+// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+// See the License for the specific language governing permissions and
+// limitations under the License.
+
+#include "paddle/fluid/memory/allocation/buffered_allocator.h"
+#include <algorithm>
+#include <limits>
+#include <utility>
+
+namespace paddle {
+namespace memory {
+namespace allocation {
+
+// Default plan: bucket boundaries at every power of two (1, 2, 4, ...).
+BufferedAllocator::BufferedAllocator(std::unique_ptr<Allocator>&& allocator) {
+  constexpr size_t kNumBits = 8 * sizeof(size_t);
+  std::vector<size_t> pow2_plan;
+  for (size_t b = 0; b < kNumBits; ++b) pow2_plan.push_back(size_t{1} << b);
+  InitAndEnforceCheck(std::move(allocator), pow2_plan);
+}
+
+BufferedAllocator::BufferedAllocator(std::unique_ptr<Allocator>&& allocator,
+                                     const std::vector<size_t>& division_plan) {
+  InitAndEnforceCheck(std::move(allocator), division_plan);  // validates both
+}
+
+BufferedAllocator::~BufferedAllocator() {  // drain the whole pool
+  for (auto& bucket : allocations_) {
+    for (auto it = bucket.begin(); it != bucket.end(); ++it) {
+      underlying_allocator_->FreeUniquePtr(std::move(it->second));
+    }
+  }
+}
+
+void BufferedAllocator::InitAndEnforceCheck(
+    std::unique_ptr<Allocator>&& allocator,
+    const std::vector<size_t>& division_plan) {
+  // Check the dynamic type BEFORE releasing: if the check fails, the caller's
+  // unique_ptr still owns the allocator, so nothing is leaked.
+  auto* raw = dynamic_cast<UnmanagedAllocator*>(allocator.get());
+  PADDLE_ENFORCE_NOT_NULL(
+      raw, "Underlying allocator of BufferedAllocator must be unmanaged");
+  underlying_allocator_.reset(raw);
+  static_cast<void>(allocator.release());  // ownership transferred just above
+  if (underlying_allocator_->IsAllocThreadSafe()) mtx_.reset(new std::mutex());
+  constexpr size_t kMax = std::numeric_limits<size_t>::max();
+  if (division_plan.empty()) {
+    division_plan_.assign({0, kMax});
+  } else {
+    auto from = division_plan.front() == 0 ? division_plan.begin() + 1
+                                           : division_plan.begin();
+    auto to = division_plan.back() == kMax ? division_plan.end() - 1
+                                           : division_plan.end();
+    division_plan_.reserve(to - from + 2);
+    division_plan_.push_back(0);
+    division_plan_.insert(division_plan_.end(), from, to);
+    division_plan_.push_back(kMax);
+    for (size_t i = 1; i < division_plan_.size(); ++i) {
+      PADDLE_ENFORCE_LT(division_plan_[i - 1], division_plan_[i],
+                        "Division plan must be strictly sorted");
+    }
+  }
+  allocations_.resize(division_plan_.size() - 1);
+}
+
+void BufferedAllocator::InsertAllocationImpl(
+    std::unique_ptr<Allocation>&& allocation) {
+  // Read the size first: `allocation` is moved from in the emplace below.
+  const size_t bytes = allocation->size();
+  auto& bucket = allocations_[GetListIndex(bytes)];
+  bucket.emplace(bytes, std::move(allocation));
+}
+
+void BufferedAllocator::InsertAllocation(
+    std::unique_ptr<Allocation>&& allocation) {
+  // Take the pool lock only when a mutex was created for this allocator.
+  std::unique_lock<std::mutex> guard;
+  if (mtx_ != nullptr) {
+    guard = std::unique_lock<std::mutex>(*mtx_);
+  }
+  InsertAllocationImpl(std::move(allocation));
+}
+
+bool BufferedAllocator::Match(const std::unique_ptr<Allocation>& allocation,
+                              size_t size) {
+  return size >= allocation->size() / 2;  // reuse only if <= ~2x the request
+}
+
+size_t BufferedAllocator::GetListIndex(size_t size) {
+  // Exclude the kMax sentinel so size == SIZE_MAX stays inside allocations_.
+  auto first = division_plan_.begin(), last = division_plan_.end() - 1;
+  return static_cast<size_t>(std::upper_bound(first, last, size) - first) - 1;
+}
+
+std::unique_ptr<Allocation> BufferedAllocator::RemoveAllocationImpl(
+    size_t size) {
+  auto& bucket = allocations_[GetListIndex(size)];
+  // Smallest buffered allocation in this bucket that can hold the request.
+  auto candidate = bucket.lower_bound(size);
+  if (candidate == bucket.end() || !Match(candidate->second, size)) {
+    // Nothing large enough here, or the best fit is more than about twice
+    // the requested size: report a miss so the caller allocates afresh.
+    return nullptr;
+  }
+  std::unique_ptr<Allocation> reused = std::move(candidate->second);
+  bucket.erase(candidate);
+  return reused;
+}
+
+std::unique_ptr<Allocation> BufferedAllocator::RemoveAllocation(size_t size) {
+  // An empty unique_lock guards nothing; it is armed only if mtx_ exists.
+  std::unique_lock<std::mutex> guard;
+  if (mtx_ != nullptr) {
+    guard = std::unique_lock<std::mutex>(*mtx_);
+  }
+  return RemoveAllocationImpl(size);
+}
+
+std::unique_ptr<Allocation> BufferedAllocator::Allocate(size_t size,
+                                                        Allocator::Attr attr) {
+  // Fast path: reuse a buffered allocation of a suitable size, if any.
+  auto cached = RemoveAllocation(size);
+  if (cached) return cached;
+  // Miss: fall through to the underlying allocator.
+  try {
+    return underlying_allocator_->Allocate(size, attr);
+  } catch (BadAlloc&) {
+    // Allocation failed: release buffered memory, then retry exactly once.
+    FreeAllocations(size);
+    return underlying_allocator_->Allocate(size, attr);
+  }
+}
+
+void BufferedAllocator::FreeAllocationsImpl(size_t size) {
+  if (UNLIKELY(size == 0)) return;
+  size_t freed_bytes = 0;
+  for (auto& bucket : allocations_) {
+    // Inside each bucket, give back the largest allocation first.
+    while (!bucket.empty()) {
+      auto largest = --bucket.end();
+      freed_bytes += largest->second->size();
+      underlying_allocator_->FreeUniquePtr(std::move(largest->second));
+      bucket.erase(largest);
+      if (freed_bytes >= size) return;
+    }
+  }
+}
+
+void BufferedAllocator::FreeAllocations(size_t size) {
+  // Take the pool lock only when a mutex was created for this allocator.
+  std::unique_lock<std::mutex> guard;
+  if (mtx_ != nullptr) {
+    guard = std::unique_lock<std::mutex>(*mtx_);
+  }
+  FreeAllocationsImpl(size);
+}
+
+void BufferedAllocator::FreeUniquePtr(std::unique_ptr<Allocation> allocation) {
+  InsertAllocation(std::move(allocation));  // buffered for reuse, not freed
+}
+
+bool BufferedAllocator::IsAllocThreadSafe() const { return mtx_ != nullptr; }
+
+}  // namespace allocation
+}  // namespace memory
+}  // namespace paddle
diff --git a/paddle/fluid/memory/allocation/buffered_allocator.h b/paddle/fluid/memory/allocation/buffered_allocator.h
new file mode 100644
index 0000000000000000000000000000000000000000..630b3ad800d90711fe4fdee7650efdd828aac45e
--- /dev/null
+++ b/paddle/fluid/memory/allocation/buffered_allocator.h
@@ -0,0 +1,70 @@
+// Copyright (c) 2018 PaddlePaddle Authors. All Rights Reserved.
+//
+// Licensed under the Apache License, Version 2.0 (the "License");
+// you may not use this file except in compliance with the License.
+// You may obtain a copy of the License at
+//
+//     http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing, software
+// distributed under the License is distributed on an "AS IS" BASIS,
+// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+// See the License for the specific language governing permissions and
+// limitations under the License.
+
+#pragma once
+#include <cstdint>
+#include <map>
+#include <memory>
+#include <mutex>
+#include <vector>
+#include "paddle/fluid/memory/allocation/allocator.h"
+
+namespace paddle {
+namespace memory {
+namespace allocation {
+
+// NOTE(zjl): BufferedAllocator keeps freed allocations in a size-bucketed
+// pool and hands them out again for later requests of a similar size.
+// It reports itself thread-safe exactly when its underlying allocator does;
+// otherwise the pool is accessed without any locking.
+class BufferedAllocator : public UnmanagedAllocator {
+ public:
+  explicit BufferedAllocator(std::unique_ptr<Allocator>&& allocator);
+
+  BufferedAllocator(std::unique_ptr<Allocator>&& allocator,
+                    const std::vector<size_t>& division_plan);
+
+  ~BufferedAllocator();  // frees everything still held in the pool
+
+  std::unique_ptr<Allocation> Allocate(size_t size, Allocator::Attr) override;
+
+  void FreeUniquePtr(std::unique_ptr<Allocation> allocation) override;
+
+  bool IsAllocThreadSafe() const override;  // true iff a mutex was created
+
+ private:
+  void InitAndEnforceCheck(std::unique_ptr<Allocator>&& allocator,
+                           const std::vector<size_t>& division_plan);
+
+  void InsertAllocation(std::unique_ptr<Allocation>&& allocation);
+  void InsertAllocationImpl(std::unique_ptr<Allocation>&& allocation);
+
+  static bool Match(const std::unique_ptr<Allocation>& allocation, size_t size);
+  std::unique_ptr<Allocation> RemoveAllocation(size_t size);  // null on miss
+  std::unique_ptr<Allocation> RemoveAllocationImpl(size_t size);
+
+  void FreeAllocations(size_t size);  // stops once >= size bytes are freed
+  void FreeAllocationsImpl(size_t size);
+
+  size_t GetListIndex(size_t size);  // index into allocations_ for `size`
+
+  std::unique_ptr<UnmanagedAllocator> underlying_allocator_;  // owned
+  std::vector<std::multimap<size_t, std::unique_ptr<Allocation>>> allocations_;
+  std::vector<size_t> division_plan_;  // strictly increasing, 0 .. SIZE_MAX
+  std::unique_ptr<std::mutex> mtx_;  // null if underlying isn't thread-safe
+};
+
+}  // namespace allocation
+}  // namespace memory
+}  // namespace paddle
diff --git a/paddle/fluid/memory/allocation/cpu_allocator.cc b/paddle/fluid/memory/allocation/cpu_allocator.cc
index 3133627bf7202f4fa9d9fd5ec2e62376133779a9..3714c0da746474db1a89f7cbb93a50ebdbb9ee02 100644
--- a/paddle/fluid/memory/allocation/cpu_allocator.cc
+++ b/paddle/fluid/memory/allocation/cpu_allocator.cc
@@ -29,8 +29,8 @@ std::unique_ptr<Allocation> CPUAllocator::Allocate(size_t size, Attr attr) {
   }
   return std::unique_ptr<Allocation>(new CPUAllocation(ptr, size));
 }
-void CPUAllocator::Free(Allocation* allocation) {
-  PADDLE_ENFORCE_NOT_NULL(dynamic_cast<CPUAllocation*>(allocation));
+void CPUAllocator::FreeUniquePtr(std::unique_ptr<Allocation> allocation) {
+  PADDLE_ENFORCE_NOT_NULL(dynamic_cast<CPUAllocation*>(allocation.get()));
   free(allocation->ptr());
 }
 
diff --git a/paddle/fluid/memory/allocation/cpu_allocator.h b/paddle/fluid/memory/allocation/cpu_allocator.h
index b2df77f1227c658e6ba83075fbc0f46340305334..0852a58e577732a73a5bc6d924204533b6558c68 100644
--- a/paddle/fluid/memory/allocation/cpu_allocator.h
+++ b/paddle/fluid/memory/allocation/cpu_allocator.h
@@ -36,7 +36,7 @@ class CPUAllocator : public UnmanagedAllocator {
   constexpr static size_t kAlignment = 64u;
   std::unique_ptr<Allocation> Allocate(size_t size,
                                        Attr attr = kDefault) override;
-  void Free(Allocation* allocation) override;
+  void FreeUniquePtr(std::unique_ptr<Allocation> allocation) override;
   bool IsAllocThreadSafe() const override;
 };
 }  // namespace allocation
diff --git a/paddle/fluid/memory/allocation/cuda_allocator.cc b/paddle/fluid/memory/allocation/cuda_allocator.cc
index 7b477c53ea2ead54073658a015ca7dc5a41309eb..20a62ea067c0b85be1f5b41a1f2adfddcc38f7d6 100644
--- a/paddle/fluid/memory/allocation/cuda_allocator.cc
+++ b/paddle/fluid/memory/allocation/cuda_allocator.cc
@@ -35,9 +35,9 @@ std::unique_ptr<Allocation> CUDAAllocator::Allocate(size_t size, Attr attr) {
       new CUDAAllocation(ptr, size, platform::Place(place_)));
 }
 
-void CUDAAllocator::Free(Allocation* allocation) {
+void CUDAAllocator::FreeUniquePtr(std::unique_ptr<Allocation> allocation) {
   platform::CUDADeviceGuard guard(place_.device);
-  auto* cuda_allocation = dynamic_cast<CUDAAllocation*>(allocation);
+  auto* cuda_allocation = dynamic_cast<CUDAAllocation*>(allocation.get());
   PADDLE_ENFORCE_NOT_NULL(cuda_allocation);
   PADDLE_ENFORCE_EQ(boost::get<platform::CUDAPlace>(cuda_allocation->place()),
                     place_);
diff --git a/paddle/fluid/memory/allocation/cuda_allocator.h b/paddle/fluid/memory/allocation/cuda_allocator.h
index dea01e60890741877a387e5588fae8703dd202ac..33556413df9acc3858e1afead92e3a2b375a106c 100644
--- a/paddle/fluid/memory/allocation/cuda_allocator.h
+++ b/paddle/fluid/memory/allocation/cuda_allocator.h
@@ -34,7 +34,7 @@ class CUDAAllocator : public UnmanagedAllocator {
       : place_(boost::get<platform::CUDAPlace>(place)) {}
   std::unique_ptr<Allocation> Allocate(size_t size,
                                        Attr attr = kDefault) override;
-  void Free(Allocation* allocation) override;
+  void FreeUniquePtr(std::unique_ptr<Allocation> allocation) override;
   bool IsAllocThreadSafe() const override;
 
  private:
diff --git a/paddle/fluid/memory/allocation/locked_allocator.cc b/paddle/fluid/memory/allocation/locked_allocator.cc
index dea87229f9143efb1d0efbe121bf923c6df0810a..0b9f1f753146e4c4e97a2a0402e8d0b1524324cd 100644
--- a/paddle/fluid/memory/allocation/locked_allocator.cc
+++ b/paddle/fluid/memory/allocation/locked_allocator.cc
@@ -27,12 +27,12 @@ std::unique_ptr<Allocation> LockedAllocator::Allocate(size_t size, Attr attr) {
     return underlying_allocator_->Allocate(size, attr);
   }
 }
-void LockedAllocator::Free(Allocation *allocation) {
+void LockedAllocator::FreeUniquePtr(std::unique_ptr<Allocation> allocation) {
   if (underlying_allocator_->IsAllocThreadSafe()) {
-    return underlying_allocator_->Free(allocation);
+    return underlying_allocator_->FreeUniquePtr(std::move(allocation));
   } else {
     std::lock_guard<std::mutex> guard(mtx_);
-    return underlying_allocator_->Free(allocation);
+    return underlying_allocator_->FreeUniquePtr(std::move(allocation));
   }
 }
 bool LockedAllocator::IsAllocThreadSafe() const { return true; }
diff --git a/paddle/fluid/memory/allocation/locked_allocator.h b/paddle/fluid/memory/allocation/locked_allocator.h
index d6b877ba4f7da3e191624b94eb832b7aa8c0069f..952622f534477dc01afc51788f58ba142481f7e9 100644
--- a/paddle/fluid/memory/allocation/locked_allocator.h
+++ b/paddle/fluid/memory/allocation/locked_allocator.h
@@ -27,7 +27,7 @@ class LockedAllocator : public UnmanagedAllocator {
   explicit LockedAllocator(std::unique_ptr<Allocator>&& underlying_allocator);
   std::unique_ptr<Allocation> Allocate(size_t size,
                                        Attr attr = kDefault) override;
-  void Free(Allocation* allocation) override;
+  void FreeUniquePtr(std::unique_ptr<Allocation> allocation) override;
   bool IsAllocThreadSafe() const override;
 
  private:
diff --git a/paddle/fluid/memory/allocation/naive_managed_allocator_test.cc b/paddle/fluid/memory/allocation/naive_managed_allocator_test.cc
index 027fdec26def0208ff961688799b472a2be0f671..bb7440d394621f92c8a1bac97c1b5444caacd042 100644
--- a/paddle/fluid/memory/allocation/naive_managed_allocator_test.cc
+++ b/paddle/fluid/memory/allocation/naive_managed_allocator_test.cc
@@ -31,7 +31,9 @@ class StubAllocator : public UnmanagedAllocator {
     return std::unique_ptr<Allocation>(
         new Allocation(nullptr, size, platform::CPUPlace()));
   }
-  void Free(Allocation* allocation) override { counter_.fetch_sub(1); }
+  void FreeUniquePtr(std::unique_ptr<Allocation> allocation) override {
+    --counter_;  // atomic decrement, same effect as fetch_sub(1)
+  }
   bool IsAllocThreadSafe() const override { return true; }
 
   std::atomic<int> counter_{0};
diff --git a/paddle/fluid/memory/allocation/pinned_allocator.cc b/paddle/fluid/memory/allocation/pinned_allocator.cc
index 650dab1b27c8095b3bd1c6d33cff20a2d0d7c5de..581dd64aaf2bd95452f342b3f7a4beba3c9aa032 100644
--- a/paddle/fluid/memory/allocation/pinned_allocator.cc
+++ b/paddle/fluid/memory/allocation/pinned_allocator.cc
@@ -32,8 +32,8 @@ std::unique_ptr<Allocation> CPUPinnedAllocator::Allocate(size_t size,
       new CPUPinnedAllocation(ptr, size));
 }
 
-void CPUPinnedAllocator::Free(Allocation* allocation) {
-  PADDLE_ENFORCE_NOT_NULL(dynamic_cast<CPUPinnedAllocation*>(allocation));
+void CPUPinnedAllocator::FreeUniquePtr(std::unique_ptr<Allocation> allocation) {
+  PADDLE_ENFORCE_NOT_NULL(dynamic_cast<CPUPinnedAllocation*>(allocation.get()));
   PADDLE_ENFORCE(cudaFreeHost(allocation->ptr()));
 }
 
diff --git a/paddle/fluid/memory/allocation/pinned_allocator.h b/paddle/fluid/memory/allocation/pinned_allocator.h
index d001a91d893e759ae838c93f6e104f5ed4b3a00b..b0d7e9091eff0d185499b2d9fe40216743845105 100644
--- a/paddle/fluid/memory/allocation/pinned_allocator.h
+++ b/paddle/fluid/memory/allocation/pinned_allocator.h
@@ -29,7 +29,7 @@ class CPUPinnedAllocation : public Allocation {
 class CPUPinnedAllocator : public UnmanagedAllocator {
  public:
   std::unique_ptr<Allocation> Allocate(size_t size, Attr attr) override;
-  void Free(Allocation* allocation) override;
+  void FreeUniquePtr(std::unique_ptr<Allocation> allocation) override;
   bool IsAllocThreadSafe() const override;
 };
 
diff --git a/paddle/fluid/memory/allocation/retry_allocator.cc b/paddle/fluid/memory/allocation/retry_allocator.cc
index 9a4ff2f51d08713b425f2a21c3287b71a1857327..9dc568ef2ab6d4ce79e2c923311a53cf0cede278 100644
--- a/paddle/fluid/memory/allocation/retry_allocator.cc
+++ b/paddle/fluid/memory/allocation/retry_allocator.cc
@@ -75,7 +75,7 @@ Allocation* RetryAllocator::AllocateImpl(size_t size, Allocator::Attr attr) {
 }
 void RetryAllocator::FreeUnderlyingAllocation(
     std::unique_ptr<Allocation>&& allocation) {
-  underlying_allocator_->Free(allocation.get());
+  underlying_allocator_->FreeUniquePtr(std::move(allocation));
   {
     // notify all waited allocators, they can try to allocate memory after free.
     std::lock_guard<std::mutex> lock(mutex_);