Paddle/paddle/fluid/memory/allocation/allocator_facade.cc


// Copyright (c) 2018 PaddlePaddle Authors. All Rights Reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
#include "paddle/fluid/memory/allocation/allocator.h"
#include <gflags/gflags.h>
#include <map>
#include <unordered_map>
#include <vector>
#include "paddle/fluid/memory/allocation/aligned_allocator.h"
#include "paddle/fluid/memory/allocation/allocator_facade.h"
#include "paddle/fluid/memory/allocation/auto_increment_allocator.h"
#include "paddle/fluid/memory/allocation/best_fit_allocator.h"
#include "paddle/fluid/memory/allocation/conditional_allocator.h"
#include "paddle/fluid/memory/allocation/cpu_allocator.h"
#include "paddle/fluid/memory/allocation/locked_allocator.h"
#include "paddle/fluid/memory/allocation/retry_allocator.h"
#include "paddle/fluid/memory/allocation/zero_size_allocator.h"
#include "paddle/fluid/platform/cpu_info.h"
#include "paddle/fluid/platform/place.h"
#ifdef PADDLE_WITH_CUDA
#include "paddle/fluid/memory/allocation/cuda_allocator.h"
#include "paddle/fluid/memory/allocation/pinned_allocator.h"
#include "paddle/fluid/platform/cuda_device_guard.h"
#include "paddle/fluid/platform/gpu_info.h"
#endif
DEFINE_int64(
    gpu_allocator_retry_time, 0,
    "The retry time (milliseconds) when allocator fails "
    "to allocate memory. No retry if this value is not greater than 0");

namespace paddle {
namespace memory {
namespace allocation {
// TODO(yy): Dirty code here. This class should be configurable in runtime.
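// CPUManagedAllocator simply forwards every request to an underlying
// CPUAllocator; no chunking or caching is applied on the CPU path.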
class CPUManagedAllocator : public Allocator {
 public:
  CPUManagedAllocator() : normal_allocator_(new CPUAllocator()) {}

  AllocationPtr Allocate(size_t size, Attr attr) override {
    return normal_allocator_->Allocate(size, attr);
  }

  bool IsAllocThreadSafe() const override { return true; }

 private:
  std::shared_ptr<Allocator> normal_allocator_;
};

// TODO(yy): Dirty code here. This class should be configurable in runtime.
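// ChunkedManagedAllocator pre-allocates large chunks from a system allocator
// and serves small requests from best-fit allocators built on those chunks;
// requests of max_chunk_size_ bytes or more bypass the chunks and go straight
// to the raw system allocator (see the ConditionalAllocator set up below).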
class ChunkedManagedAllocator : public Allocator {
 public:
  explicit ChunkedManagedAllocator(std::unique_ptr<Allocator> system_allocator,
                                   size_t max_chunk_size, size_t capacity = 1,
                                   int64_t retry_time = -1)
      : max_chunk_size_(max_chunk_size), retry_time_(retry_time) {
    raw_allocator_ = std::move(system_allocator);

    if (max_chunk_size_ == 0) {
      default_allocator_ = raw_allocator_;
    } else {
      if (capacity == 1) {
        VLOG(10) << "Create BestFitAllocator with chunk_size "
                 << max_chunk_size_;
        default_allocator_ = BestFitAllocatorCreator();
      } else {
        VLOG(10) << "Create AutoIncrementAllocator with chunk_size "
                 << max_chunk_size_ << " and capacity " << capacity;
        default_allocator_ = std::make_shared<AutoIncrementAllocator>(
            [this] { return std::move(BestFitAllocatorCreator()); }, capacity);
      }
    }

    auto* cond_allocator = new ConditionalAllocator();
    cond_allocator
        ->AddAllocator(
            [this](size_t size, Attr attr) { return size < max_chunk_size_; },
            default_allocator_)
        .AddAllocator(
            [](size_t size, Attr attr) {
              return true;  // default case
            },
            raw_allocator_);
    default_allocator_.reset(cond_allocator);
  }
  ~ChunkedManagedAllocator() {
    // Specify destruct order.
    default_allocator_.reset();
    chunks_.clear();
    raw_allocator_.reset();
  }

  AllocationPtr Allocate(size_t size, Attr attr) override {
    return default_allocator_->Allocate(size, attr);
  }
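  // Carves a new chunk of max_chunk_size_ bytes out of raw_allocator_ and
  // builds a thread-safe, 64-byte-aligned best-fit allocator on top of it,
  // optionally wrapped in a RetryAllocator when retry_time_ is positive.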
  std::shared_ptr<Allocator> BestFitAllocatorCreator() {
    chunks_.emplace_back(raw_allocator_->Allocate(max_chunk_size_));
    auto* allocation = chunks_.back().get();
    std::unique_ptr<Allocator> unmanaged_allocator(new LockedAllocator(
        std::unique_ptr<Allocator>(new BestFitAllocator(allocation))));

    if (retry_time_ <= 0) {
      VLOG(10) << "Create NaiveManagedAllocator without retry";
      return std::make_shared<AlignedAllocator<64u>>(
          std::move(unmanaged_allocator));
    } else {
      VLOG(10) << "Create RetryAllocator with retry_time " << retry_time_
               << "ms";
      auto tmp = std::make_shared<RetryAllocator>(
          std::move(unmanaged_allocator), static_cast<size_t>(retry_time_));
      return std::make_shared<AlignedAllocator<64u>>(tmp);
    }
  }
  bool IsAllocThreadSafe() const override { return true; }

 protected:
  size_t max_chunk_size_;
  int64_t retry_time_;
  std::vector<AllocationPtr> chunks_;
  std::shared_ptr<Allocator> raw_allocator_;
  std::shared_ptr<Allocator> default_allocator_;
};

#ifdef PADDLE_WITH_CUDA
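// Capacity is the number of max-size chunks that fit into the memory
// currently available on the device; AutoIncrementAllocator lazily creates
// up to that many best-fit chunks on demand.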
class CUDAManagedAllocator : public ChunkedManagedAllocator {
 public:
  explicit CUDAManagedAllocator(int dev_id)
      : ChunkedManagedAllocator(
            std::unique_ptr<Allocator>(
                new CUDAAllocator(platform::CUDAPlace(dev_id))),
            GetMaxChunkSize(dev_id), GetCapacity(dev_id), GetRetryTime()) {}

 private:
  static size_t GetMaxChunkSize(int dev_id) {
    platform::CUDADeviceGuard guard(dev_id);
    return platform::GpuMaxChunkSize();
  }

  static size_t GetCapacity(int dev_id) {
    platform::CUDADeviceGuard guard(dev_id);
    size_t available, total;
    platform::GpuMemoryUsage(&available, &total);
    size_t max_chunk_size = platform::GpuMaxChunkSize();
    return max_chunk_size == 0 ? 0 : available / max_chunk_size;
  }

  static int64_t GetRetryTime() { return FLAGS_gpu_allocator_retry_time; }
};

class CUDAPinnedManagedAllocator : public ChunkedManagedAllocator {
 public:
  CUDAPinnedManagedAllocator()
      : ChunkedManagedAllocator(
            std::unique_ptr<Allocator>(new CPUPinnedAllocator()),
            platform::CUDAPinnedMaxChunkSize(), GetCapacity(),
            -1 /* never retry */) {}

 private:
  static size_t GetCapacity() {
    size_t total = platform::CpuTotalPhysicalMemory();
    size_t max_chunk_size = platform::CUDAPinnedMaxChunkSize();
    return max_chunk_size == 0 ? 0 : total / max_chunk_size;
  }
};
#endif
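
// Owns one allocator per Place; the map is populated once at construction
// and consulted on every subsequent allocation request.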
class AllocatorFacadePrivate {
 public:
  std::map<platform::Place, std::shared_ptr<Allocator>> allocators_;

  ~AllocatorFacadePrivate() = default;

  AllocatorFacadePrivate() {
    InitCPUAllocator();
    InitCUDAAllocator();
    InitCUDAPinnedAllocator();
    WrapZeroSizeAllocator();
  }

 private:
  void InitCPUAllocator() {
    allocators_[platform::CPUPlace()] =
        std::make_shared<CPUManagedAllocator>();
  }
  void InitCUDAAllocator() {
#ifdef PADDLE_WITH_CUDA
    int device_count = platform::GetCUDADeviceCount();
    for (int dev_id = 0; dev_id < device_count; ++dev_id) {
      allocators_[platform::CUDAPlace(dev_id)] =
          std::make_shared<CUDAManagedAllocator>(dev_id);
    }
#endif
  }

  void InitCUDAPinnedAllocator() {
#ifdef PADDLE_WITH_CUDA
    allocators_[platform::CUDAPinnedPlace()] =
        std::make_shared<CUDAPinnedManagedAllocator>();
#endif
  }
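  // Wrap every registered allocator so that zero-byte requests are answered
  // with a dummy allocation instead of reaching the underlying allocator.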
  void WrapZeroSizeAllocator() {
    for (auto& pair : allocators_) {
      pair.second =
          std::make_shared<ZeroSizeAllocator>(pair.second, pair.first);
    }
  }
};

// Pimpl. Make interface clean.
AllocatorFacade::AllocatorFacade() : m_(new AllocatorFacadePrivate()) {}
AllocatorFacade::~AllocatorFacade() { delete m_; }

AllocatorFacade& AllocatorFacade::Instance() {
  static AllocatorFacade instance;
  return instance;
}

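// AllocShared hands the raw allocation to a shared_ptr whose
// AllocationDeleter returns the memory to the allocator that produced it.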
std::shared_ptr<Allocation> AllocatorFacade::AllocShared(
    const platform::Place& place, size_t size, Allocator::Attr attr) {
  return std::shared_ptr<Allocation>(
      m_->allocators_.at(place)->Allocate(size, attr).release(),
      AllocationDeleter());
}

AllocationPtr AllocatorFacade::Alloc(const platform::Place& place, size_t size,
                                     Allocator::Attr attr) {
  return m_->allocators_.at(place)->Allocate(size, attr);
}

} // namespace allocation
} // namespace memory
} // namespace paddle