You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
88 lines
3.4 KiB
88 lines
3.4 KiB
/**
|
|
* Copyright 2020 Huawei Technologies Co., Ltd
|
|
*
|
|
* Licensed under the Apache License, Version 2.0 (the "License");
|
|
* you may not use this file except in compliance with the License.
|
|
* You may obtain a copy of the License at
|
|
*
|
|
* http://www.apache.org/licenses/LICENSE-2.0
|
|
*
|
|
* Unless required by applicable law or agreed to in writing, software
|
|
* distributed under the License is distributed on an "AS IS" BASIS,
|
|
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
* See the License for the specific language governing permissions and
|
|
* limitations under the License.
|
|
*/
|
|
|
|
#ifndef GE_GRAPH_LOAD_NEW_MODEL_MANAGER_ZERO_COPY_OFFSET_H_
|
|
#define GE_GRAPH_LOAD_NEW_MODEL_MANAGER_ZERO_COPY_OFFSET_H_
|
|
|
|
#include <map>
|
|
#include <set>
|
|
#include <string>
|
|
#include <vector>
|
|
|
|
#include "external/ge/ge_api_error_codes.h"
|
|
#include "framework/common/ge_types.h"
|
|
#include "graph/debug/ge_attr_define.h"
|
|
#include "graph/load/model_manager/zero_copy_task.h"
|
|
#include "graph/utils/attr_utils.h"
|
|
#include "graph/utils/tensor_utils.h"
|
|
#include "runtime/mem.h"
|
|
#include "task_info/task_info.h"
|
|
|
|
using std::map;
|
|
using std::set;
|
|
using std::string;
|
|
using std::vector;
|
|
|
|
namespace ge {
|
|
class ZeroCopyOffset {
|
|
public:
|
|
ZeroCopyOffset();
|
|
~ZeroCopyOffset();
|
|
|
|
Status InitInputDataInfo(int64_t output_size, void *virtual_addr, const OpDescPtr &op_desc, bool &fusion_flag);
|
|
void SetInputOutsideAddrs(int64_t output_offset, void *addr, bool fusion_flag, set<const void *> &real_virtual_addrs);
|
|
|
|
void IsL2Fusion(const vector<int64_t> &fusion_basic_addrs, const int64_t &tensor_addr, bool &fusion_flag);
|
|
Status InitOutputDataInfo(const vector<int64_t> &input_size_list, const vector<void *> &virtual_addr_list,
|
|
const OpDescPtr &op_desc, const size_t &idx, bool &fusion_flag);
|
|
void SetOutputOutsideAddrs(const int64_t &input_offset, const bool &fusion_flag, void *addr,
|
|
std::vector<void *> &tensor_addrs);
|
|
void SetOutsideAddrsValue(ZeroCopyTask &zero_copy_task, void *outside_addr, void *args, size_t offset);
|
|
|
|
// basic_addr of l2-fusion
|
|
void *GetBasicAddr() const { return basic_addr_; }
|
|
// total num of out_of_data/in_of_phonyconcat
|
|
uint32_t GetDataCount() const { return data_count_; }
|
|
uint32_t GetAddrCount() const { return addr_count_; }
|
|
// value of *data_info_ from davinci_model
|
|
std::vector<std::pair<int64_t, void *>> GetDataInfo() const { return data_info_; }
|
|
// relative_offset from zero_copy_relative_offset_
|
|
std::vector<int64_t> GetRelativeOffset() const { return relative_offset_; }
|
|
// data_size of Data/Netoutput
|
|
int64_t GetDataSize() const { return data_size_; }
|
|
// value of *outside_addrs_ from davinci_model
|
|
const std::vector<std::map<const void *, std::vector<void *>>> &GetOutsideAddrs() const { return outside_addrs_; }
|
|
// name of op
|
|
std::string GetOpName() const { return op_name_; }
|
|
const bool IsRelativeOffsetValid() const { return valid_relative_offset_; }
|
|
|
|
private:
|
|
void *basic_addr_ = nullptr;
|
|
std::string op_name_;
|
|
uint32_t data_count_ = 0;
|
|
std::vector<std::pair<int64_t, void *>> data_info_;
|
|
vector<int64_t> relative_offset_;
|
|
int64_t data_size_ = 0;
|
|
uint32_t addr_count_ = 0;
|
|
std::vector<std::map<const void *, std::vector<void *>>> outside_addrs_;
|
|
|
|
std::vector<int64_t> zero_copy_basic_offset_;
|
|
std::vector<int64_t> zero_copy_relative_offset_;
|
|
bool valid_relative_offset_ = false;
|
|
};
|
|
} // namespace ge
|
|
#endif // GE_GRAPH_LOAD_NEW_MODEL_MANAGER_ZERO_COPY_OFFSET_H_
|