You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
graphengine/ge/single_op/stream_resource.cc

230 lines
7.5 KiB

5 years ago
/**
* Copyright 2019-2020 Huawei Technologies Co., Ltd
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
#include "single_op/stream_resource.h"
#include "framework/common/debug/ge_log.h"
#include "framework/common/debug/log.h"
#include "runtime/rt.h"
#include "single_op/single_op_model.h"
5 years ago
namespace ge {
namespace {
// Size in bytes (1 MiB) of the device buffer requested by StreamResource::Init().
constexpr uint32_t kFuzzDeviceBufferSize = 1024U * 1024U;
}  // namespace
4 years ago
// Stores the caller-supplied resource id. The constructor body is empty, so no
// device memory is requested here; that happens in Init().
StreamResource::StreamResource(uintptr_t resource_id)
    : resource_id_(resource_id) {}
5 years ago
// Releases every device allocation tracked by this object: each non-null entry
// of memory_list_, each non-null entry of weight_list_, and device_buffer_.
// A failing rtFree is only logged; the remaining allocations are still freed.
StreamResource::~StreamResource() {
  for (auto workspace : memory_list_) {
    if (workspace == nullptr) {
      continue;
    }
    if (rtFree(workspace) != RT_ERROR_NONE) {
      GELOGE(RT_FAILED, "[Free][Rt] failed.");
    }
  }

  for (auto weight_mem : weight_list_) {
    if (weight_mem == nullptr) {
      continue;
    }
    if (rtFree(weight_mem) != RT_ERROR_NONE) {
      GELOGE(RT_FAILED, "[Free][Rt] failed.");
    }
  }

  if (device_buffer_ == nullptr) {
    return;
  }
  if (rtFree(device_buffer_) != RT_ERROR_NONE) {
    GELOGE(RT_FAILED, "[Free][Rt] failed.");
  }
}
// Allocates device_buffer_: kFuzzDeviceBufferSize bytes of RT_MEMORY_HBM obtained
// through rtMalloc (the destructor frees it again).
//
// Returns SUCCESS when the allocation succeeds, RT_FAILED when rtMalloc reports
// an error.
Status StreamResource::Init() {
  const auto rt_ret = rtMalloc(&device_buffer_, kFuzzDeviceBufferSize, RT_MEMORY_HBM);
  if (rt_ret != RT_ERROR_NONE) {
    // Propagate the failure: reporting SUCCESS here would leave callers believing
    // device_buffer_ is usable when nothing was allocated.
    GELOGE(RT_FAILED, "[Malloc][Rt] failed.");
    return RT_FAILED;
  }
  return SUCCESS;
}
// Looks up `key` in op_map_ while holding mu_.
// Returns the SingleOp stored for `key`, or nullptr when there is no entry.
SingleOp *StreamResource::GetOperator(const uint64_t key) {
  std::lock_guard<std::mutex> guard(mu_);
  const auto found = op_map_.find(key);
  return (found != op_map_.end()) ? found->second.get() : nullptr;
}
// Looks up `key` in dynamic_op_map_ while holding mu_.
// Returns the DynamicSingleOp stored for `key`, or nullptr when there is no entry.
DynamicSingleOp *StreamResource::GetDynamicOperator(const uint64_t key) {
  std::lock_guard<std::mutex> guard(mu_);
  const auto found = dynamic_op_map_.find(key);
  if (found != dynamic_op_map_.end()) {
    return found->second.get();
  }
  return nullptr;
}
// Returns the stream handle currently stored in stream_.
rtStream_t StreamResource::GetStream() const {
  return stream_;
}
4 years ago
// Replaces the stored stream handle with `stream`.
void StreamResource::SetStream(rtStream_t stream) {
  stream_ = stream;
}
4 years ago
uint8_t *StreamResource::DoMallocMemory(const std::string &purpose,
size_t size,
size_t &max_allocated,
std::vector<uint8_t *> &allocated) {
if (size == 0) {
GELOGD("Mem size == 0");
return nullptr;
}
5 years ago
if (size <= max_allocated && !allocated.empty()) {
GELOGD("reuse last memory");
return allocated.back();
}
if (!allocated.empty()) {
uint8_t *current_buffer = allocated.back();
allocated.pop_back();
if (rtStreamSynchronize(stream_) != RT_ERROR_NONE) {
GELOGW("Failed to invoke rtStreamSynchronize");
}
(void) rtFree(current_buffer);
}
5 years ago
uint8_t *buffer = nullptr;
auto ret = rtMalloc(reinterpret_cast<void **>(&buffer), size, RT_MEMORY_HBM);
if (ret != RT_ERROR_NONE) {
GELOGE(RT_FAILED, "[RtMalloc][Memory] failed, size = %zu, ret = %d", size, ret);
4 years ago
REPORT_INNER_ERROR("E19999", "rtMalloc failed, size = %zu, ret = %d.", size, ret);
5 years ago
return nullptr;
}
GE_PRINT_DYNAMIC_MEMORY(rtMalloc, purpose.c_str(), size)
5 years ago
ret = rtMemset(buffer, size, 0U, size);
if (ret != RT_ERROR_NONE) {
GELOGE(RT_FAILED, "[RtMemset][Memory] failed, ret = %d", ret);
4 years ago
REPORT_INNER_ERROR("E19999", "rtMemset failed, ret = %d.", ret);
5 years ago
auto rt_ret = rtFree(buffer);
GE_IF_BOOL_EXEC(rt_ret != RT_ERROR_NONE, GELOGE(RT_FAILED, "[RtFree][Memory] failed"));
5 years ago
return nullptr;
}
GELOGD("Malloc new memory succeeded. size = %zu", size);
max_allocated = size;
allocated.emplace_back(buffer);
return buffer;
}
uint8_t *StreamResource::MallocMemory(const std::string &purpose, size_t size, bool holding_lock) {
5 years ago
GELOGD("To Malloc memory, size = %zu", size);
if (holding_lock) {
return DoMallocMemory(purpose, size, max_memory_size_, memory_list_);
} else {
std::lock_guard<std::mutex> lk(stream_mu_);
return DoMallocMemory(purpose, size, max_memory_size_, memory_list_);
}
5 years ago
}
uint8_t *StreamResource::MallocWeight(const std::string &purpose, size_t size) {
5 years ago
GELOGD("To Malloc weight, size = %zu", size);
uint8_t *buffer = nullptr;
auto ret = rtMalloc(reinterpret_cast<void **>(&buffer), size, RT_MEMORY_HBM);
if (ret != RT_ERROR_NONE) {
GELOGE(RT_FAILED, "[RtMalloc][Memory] failed, size = %zu, ret = %d", size, ret);
4 years ago
REPORT_INNER_ERROR("E19999", "rtMalloc failed, size = %zu, ret = %d.", size, ret);
return nullptr;
}
GE_PRINT_DYNAMIC_MEMORY(rtMalloc, purpose.c_str(), size)
weight_list_.emplace_back(buffer);
5 years ago
return buffer;
}
// Returns, through `*single_op`, the DynamicSingleOp associated with `model_id`.
//
// mu_ is held for the whole call. If dynamic_op_map_ already has an entry for
// `model_id`, that entry is returned. Otherwise a SingleOpModel is initialised
// from `model_data`, a new DynamicSingleOp is built from it, stored in
// dynamic_op_map_, and returned. The map keeps ownership; `*single_op` is a
// non-owning pointer.
//
// Returns SUCCESS on success, the status of SingleOpModel::Init or
// BuildDynamicOp when either fails, or the status produced by GE_CHECK_NOTNULL
// when the operator object cannot be allocated. `*single_op` is written only
// on success.
Status StreamResource::BuildDynamicOperator(const ModelData &model_data,
                                            DynamicSingleOp **single_op,
                                            const uint64_t model_id) {
  const std::string model_name = std::to_string(model_id);
  std::lock_guard<std::mutex> lk(mu_);
  auto it = dynamic_op_map_.find(model_id);
  if (it != dynamic_op_map_.end()) {
    *single_op = it->second.get();
    return SUCCESS;
  }

  SingleOpModel model(model_name, model_data.model_data, model_data.model_len);
  auto ret = model.Init();
  if (ret != SUCCESS) {
    GELOGE(ret, "[Init][SingleOpModel] failed. model = %s, ret = %u", model_name.c_str(), ret);
    REPORT_CALL_ERROR("E19999", "SingleOpModel init failed, model = %s, ret = %u", model_name.c_str(), ret);
    return ret;
  }

  auto new_op = std::unique_ptr<DynamicSingleOp>(new(std::nothrow) DynamicSingleOp(resource_id_, &stream_mu_, stream_));
  GE_CHECK_NOTNULL(new_op);

  GELOGI("To build operator: %s", model_name.c_str());
  // Capture the build status explicitly: `ret` still holds Init()'s SUCCESS here,
  // so logging it would always print a stale code instead of the real failure.
  const Status build_ret = model.BuildDynamicOp(*this, *new_op);
  GE_CHK_STATUS_RET(build_ret,
                    "[Build][DynamicOp]failed. op = %s, ret = %u", model_name.c_str(), build_ret);

  *single_op = new_op.get();
  dynamic_op_map_[model_id] = std::move(new_op);
  return SUCCESS;
}
// Returns, through `*single_op`, the SingleOp associated with `model_id`.
//
// mu_ is held for the whole call. If op_map_ already has an entry for
// `model_id`, that entry is returned. Otherwise a SingleOpModel is initialised
// from `model_data`, a new SingleOp is built from it, stored in op_map_, and
// returned. The map keeps ownership; `*single_op` is a non-owning pointer.
//
// Returns SUCCESS on success, the status of SingleOpModel::Init or BuildOp when
// either fails, or ACL_ERROR_GE_MEMORY_ALLOCATION when the operator object
// cannot be allocated. `*single_op` is written only on success.
Status StreamResource::BuildOperator(const ModelData &model_data, SingleOp **single_op, const uint64_t model_id) {
  const std::string model_name = std::to_string(model_id);
  std::lock_guard<std::mutex> lk(mu_);
  auto it = op_map_.find(model_id);
  if (it != op_map_.end()) {
    *single_op = it->second.get();
    return SUCCESS;
  }

  SingleOpModel model(model_name, model_data.model_data, model_data.model_len);
  auto ret = model.Init();
  if (ret != SUCCESS) {
    GELOGE(ret, "[Init][SingleOpModel] failed. model = %s, ret = %u", model_name.c_str(), ret);
    REPORT_CALL_ERROR("E19999", "SingleOpModel init failed, model = %s, ret = %u", model_name.c_str(), ret);
    return ret;
  }

  auto new_op = std::unique_ptr<SingleOp>(new(std::nothrow) SingleOp(this, &stream_mu_, stream_));
  if (new_op == nullptr) {
    GELOGE(ACL_ERROR_GE_MEMORY_ALLOCATION, "[New][SingleOp] failed.");
    REPORT_CALL_ERROR("E19999", "new SingleOp failed.");
    return ACL_ERROR_GE_MEMORY_ALLOCATION;
  }

  GELOGI("To build operator: %s", model_name.c_str());
  // Capture the build status explicitly: `ret` still holds Init()'s SUCCESS here,
  // so logging it would always print a stale code instead of the real failure.
  const Status build_ret = model.BuildOp(*this, *new_op);
  GE_CHK_STATUS_RET(build_ret, "[Build][Op] failed. op = %s, ret = %u", model_name.c_str(), build_ret);

  *single_op = new_op.get();
  op_map_[model_id] = std::move(new_op);
  return SUCCESS;
}
// Returns the last buffer recorded in memory_list_, or nullptr when the list
// is empty.
const uint8_t *StreamResource::GetMemoryBase() const {
  return memory_list_.empty() ? nullptr : memory_list_.back();
}
5 years ago
} // namespace ge