You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
graphengine/ge/host_kernels/concat_offset_kernel.cc

107 lines
4.1 KiB

/**
* Copyright 2020 Huawei Technologies Co., Ltd
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
#include "host_kernels/concat_offset_kernel.h"
#include <memory>
#include "common/ge_inner_error_codes.h"
#include "common/op/ge_op_utils.h"
#include "common/types.h"
#include "framework/common/debug/ge_log.h"
#include "graph/utils/type_utils.h"
#include "inc/kernel_factory.h"
namespace ge {
namespace {
const size_t kConcatOffsetInputIndexZero = 0;
const size_t kConcatOffsetInputIndexOne = 1;
const int kNumOne = 1;
} // namespace
Status ConcatOffsetKernel::Compute(const OpDescPtr op_desc_ptr, const vector<ConstGeTensorPtr> &input,
vector<GeTensorPtr> &v_output) {
GELOGI("ConcatOffsetKernel in.");
if (op_desc_ptr == nullptr) {
GELOGE(PARAM_INVALID, "input opdesc is nullptr.");
return PARAM_INVALID;
}
// validate attrs
int N = 0;
if (!(AttrUtils::GetInt(op_desc_ptr, "N", N))) {
GELOGW("Attr %s does not exist.", "N");
return NOT_CHANGED;
}
// follow IR def, the first input is concat_dim
ConstGeTensorPtr input_0 = input[kConcatOffsetInputIndexZero];
GE_CHECK_NOTNULL(input_0);
int32_t concat_dim = *(const_cast<int32_t *>(reinterpret_cast<const int32_t *>(input_0->GetData().data())));
// validate inputs
if ((static_cast<int>(input.size()) != (N + kNumOne)) || (input.size() <= kConcatOffsetInputIndexOne)) {
GELOGW("The number of input for concat offset must be equal to %d, and must be more than one.", (N + kNumOne));
return NOT_CHANGED;
}
// calculate ouput dim
GeShape output_shape = input[kConcatOffsetInputIndexOne]->GetTensorDesc().GetShape();
int64_t output_size = output_shape.GetShapeSize();
if (concat_dim >= output_size) {
GELOGW("Concat dim is bigger than the size of output_shape.");
return NOT_CHANGED;
}
GELOGI("Output shape size is %ld", output_size);
int32_t offset = 0;
if (output_size < 0) {
GELOGE(FAILED, "Index is negative.");
return FAILED;
}
unique_ptr<int32_t[]> buf(new (std::nothrow) int32_t[output_size]());
if (buf == nullptr) {
GELOGE(MEMALLOC_FAILED, "new buf failed");
return INTERNAL_ERROR;
}
for (size_t i = 0; i < static_cast<size_t>(N); i++) {
buf[concat_dim] = offset;
// generate output, index 0 can always gets a GeTensorDesc object from any OpDescPtr.
auto output_tensor_desc = op_desc_ptr->GetOutputDesc(0);
GeTensorPtr output_ptr = MakeShared<GeTensor>(output_tensor_desc);
if (output_ptr == nullptr) {
GELOGW("Failed to fold node %s, out of memeory", op_desc_ptr->GetName().c_str());
return NOT_CHANGED;
}
output_ptr->MutableTensorDesc().SetDataType(DT_INT32);
output_ptr->MutableTensorDesc().SetShape(output_shape);
GE_IF_BOOL_EXEC(output_ptr->SetData(reinterpret_cast<uint8_t *>(buf.get()),
static_cast<size_t>(sizeof(DT_INT32) * output_size)) != GRAPH_SUCCESS,
GELOGW("set data failed");
return NOT_CHANGED);
v_output.push_back(output_ptr);
// caculate offset
const int32_t *input_shape =
reinterpret_cast<const int32_t *>(input[i + kConcatOffsetInputIndexOne]->GetData().data());
int64_t input_dim = input_shape[concat_dim]; // this index is valid, checked before
if (input_dim > (INT64_MAX - offset)) {
GELOGE(PARAM_INVALID, " %d and %ld addition can result in overflow!.", offset, input_dim);
return INTERNAL_ERROR;
}
offset += input_dim;
}
GELOGI("ConcatOffsetKernel success.");
return SUCCESS;
}
REGISTER_KERNEL(CONCATOFFSET, ConcatOffsetKernel);
} // namespace ge