You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
212 lines
5.6 KiB
212 lines
5.6 KiB
/**
|
|
* Copyright 2019-2020 Huawei Technologies Co., Ltd
|
|
*
|
|
* Licensed under the Apache License, Version 2.0 (the "License");
|
|
* you may not use this file except in compliance with the License.
|
|
* You may obtain a copy of the License at
|
|
*
|
|
* http://www.apache.org/licenses/LICENSE-2.0
|
|
*
|
|
* Unless required by applicable law or agreed to in writing, software
|
|
* distributed under the License is distributed on an "AS IS" BASIS,
|
|
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
* See the License for the specific language governing permissions and
|
|
* limitations under the License.
|
|
*/
|
|
|
|
#ifndef GE_GRAPH_MANAGER_GRAPH_CACHING_ALLOCATOR_H_
|
|
#define GE_GRAPH_MANAGER_GRAPH_CACHING_ALLOCATOR_H_
|
|
|
|
#include <iostream>
|
|
#include <map>
|
|
#include <memory>
|
|
#include <mutex>
|
|
#include <string>
|
|
#include <vector>
|
|
#include <set>
|
|
#include <unordered_map>
|
|
#include <unordered_set>
|
|
|
|
#include "framework/common/ge_inner_error_codes.h"
|
|
#include "graph/node.h"
|
|
#include "graph/manager/block_memory.h"
|
|
#include "runtime/mem.h"
|
|
|
|
namespace ge {
|
|
// All block sizes are rounded to at least 512 bytes.
constexpr size_t kRoundBlockSize = 512;

// Bin size units.
// NOTE(review): presumably multipliers used when sizing the block bins; they are
// not referenced in this header - confirm against the implementation file.
constexpr size_t kBinSizeUnit4 = 4;
constexpr size_t kBinSizeUnit8 = 8;
constexpr size_t kBinSizeUnit32 = 32;
constexpr size_t kBinSizeUnit128 = 128;
constexpr size_t kBinSizeUnit256 = 256;
constexpr size_t kBinSizeUnit512 = 512;

// Split when malloc size <= small block size * kSplitThreshold.
constexpr double kSplitThreshold = 0.5;

// Byte-size units, each derived from the previous one.
constexpr size_t kKByteSize = 1024;
constexpr size_t kMByteSize = kKByteSize * kKByteSize;  // 1048576 = 1024 * 1024
constexpr size_t kGByteSize = kKByteSize * kMByteSize;  // 1073741824 = 1024 * 1024 * 1024

// Number of entries in CachingAllocator::free_block_bins_.
constexpr uint32_t kNumBins = 7;

// Forward declaration; CachingAllocator only stores a pointer to it.
class MemoryAllocator;
|
|
|
|
class CachingAllocator {
|
|
public:
|
|
explicit CachingAllocator(rtMemType_t memory_type);
|
|
|
|
CachingAllocator(const CachingAllocator &) = delete;
|
|
|
|
CachingAllocator &operator=(const CachingAllocator &) = delete;
|
|
|
|
virtual ~CachingAllocator() = default;
|
|
|
|
///
|
|
/// @ingroup ge_graph
|
|
/// @brief caching allocator init
|
|
/// @param [in] device id
|
|
/// @return Status of init
|
|
///
|
|
Status Initialize(uint32_t device_id = 0);
|
|
|
|
///
|
|
/// @ingroup ge_graph
|
|
/// @brief memory allocator finalize, release cached memory
|
|
/// @return void
|
|
///
|
|
void Finalize(uint32_t device_id = 0);
|
|
|
|
///
|
|
/// @ingroup ge_graph
|
|
/// @brief malloc memory
|
|
/// @param [in] size memory size
|
|
/// @param [in] try to reuse the same memory
|
|
/// @param [in] device id
|
|
/// @return memory address
|
|
///
|
|
uint8_t *Malloc(size_t size, uint8_t *org_ptr = nullptr, uint32_t device_id = 0);
|
|
|
|
///
|
|
/// @ingroup ge_graph
|
|
/// @brief free memory
|
|
/// @param [in] device_id device id
|
|
/// @param [out] memory_ptr memory address ptr
|
|
/// @return Status result of function
|
|
///
|
|
Status Free(uint8_t *memory_addr, uint32_t device_id = 0);
|
|
|
|
private:
|
|
|
|
///
|
|
/// @ingroup ge_graph
|
|
/// @brief extend cache by size
|
|
/// @param [in] memory size
|
|
/// @param [in] device id
|
|
/// @return Status result of function
|
|
///
|
|
Status TryExtendCache(size_t size, uint32_t device_id);
|
|
|
|
///
|
|
/// @ingroup ge_graph
|
|
/// @brief find free block by size
|
|
/// @param [in] memory size
|
|
/// @param [in] device_id device id
|
|
/// @return block ptr
|
|
///
|
|
Block *FindFreeBlock(size_t size, uint8_t *org_ptr, uint32_t device_id);
|
|
|
|
///
|
|
/// @ingroup ge_graph
|
|
/// @brief get the right bin based on size
|
|
/// @param [in] original malloc size
|
|
/// @return block bin
|
|
///
|
|
BlockBin *GetBlockBin(size_t size);
|
|
|
|
///
|
|
/// @ingroup ge_graph
|
|
/// @brief add memory to right bin based on size
|
|
/// @param [in] memory ptr
|
|
/// @param [in] memory size
|
|
/// @param [in] device_id device id
|
|
/// @return Status result of function
|
|
///
|
|
Status AddToBlockBin(uint8_t *ptr, size_t size, uint32_t device_id);
|
|
|
|
///
|
|
/// @ingroup ge_graph
|
|
/// @brief free block to right bin
|
|
/// @param [in] block ptr
|
|
/// @return void
|
|
///
|
|
void FreeBlock(Block* block);
|
|
|
|
///
|
|
/// @ingroup ge_graph
|
|
/// @brief free all cached blocks to right bin and release the memory when memory is not enough
|
|
/// @return free cached memory size
|
|
///
|
|
size_t FreeCachedBlocks();
|
|
|
|
///
|
|
/// @ingroup ge_graph
|
|
/// @brief free allocated and cached blocks and release the memory when process exit
|
|
/// @return void
|
|
///
|
|
void FreeBlocks();
|
|
|
|
///
|
|
/// @ingroup ge_graph
|
|
/// @brief free block bins when process exit
|
|
/// @return void
|
|
///
|
|
void FreeBlockBins();
|
|
|
|
///
|
|
/// @ingroup ge_graph
|
|
/// @brief If a split block is freed, try merging with the original block
|
|
/// @param [inout] dest block ptr
|
|
/// @param [in] src block ptr
|
|
/// @param [out] block bin
|
|
/// @return void
|
|
///
|
|
void MergeBlocks(Block *dst, Block *src, BlockBin &bin);
|
|
|
|
///
|
|
/// @ingroup ge_graph
|
|
/// @brief If the allocated memory size is too much smaller than the memory block, try to split the memory block
|
|
/// @param [in] original block ptr
|
|
/// @param [in] allocated memory size
|
|
/// @param [in] block bin
|
|
/// @param [in] device id
|
|
/// @return splited block ptr
|
|
///
|
|
Block *SplitBlock(Block *block, size_t size, BlockBin &bin, uint32_t device_id);
|
|
|
|
///
|
|
/// @ingroup ge_graph
|
|
/// @brief print the memory info in pool
|
|
/// @return void
|
|
///
|
|
void PrintStatics();
|
|
|
|
private:
|
|
rtMemType_t memory_type_;
|
|
|
|
// device memory allocator
|
|
MemoryAllocator *memory_allocator_;
|
|
|
|
// lock around all operations
|
|
mutable std::recursive_mutex mutex_;
|
|
|
|
// allocated blocks by memory pointer
|
|
std::unordered_map<uint8_t *, Block *> allocated_blocks_;
|
|
|
|
// block bins by different block size
|
|
BlockBin *free_block_bins_[kNumBins];
|
|
|
|
// malloced memorys from device
|
|
std::map<size_t, size_t> malloced_memory_;
|
|
};
|
|
} // namespace ge
|
|
#endif // GE_GRAPH_MANAGER_GRAPH_CACHING_ALLOCATOR_H_
|