You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
136 lines
5.3 KiB
136 lines
5.3 KiB
/* Copyright (c) 2016 PaddlePaddle Authors. All Rights Reserved.
|
|
|
|
Licensed under the Apache License, Version 2.0 (the "License");
|
|
you may not use this file except in compliance with the License.
|
|
You may obtain a copy of the License at
|
|
|
|
http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
Unless required by applicable law or agreed to in writing, software
|
|
distributed under the License is distributed on an "AS IS" BASIS,
|
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
See the License for the specific language governing permissions and
|
|
limitations under the License. */
|
|
|
|
#include "paddle/operators/sequence_concat_op.h"
|
|
|
|
namespace paddle {
|
|
namespace operators {
|
|
|
|
class SequenceConcatOp : public framework::OperatorWithKernel {
|
|
public:
|
|
using framework::OperatorWithKernel::OperatorWithKernel;
|
|
|
|
void InferShape(framework::InferShapeContext* ctx) const override {
|
|
PADDLE_ENFORCE(ctx->HasInputs("X"),
|
|
"Inputs(X) of SequenceConcatOp should not be null.");
|
|
PADDLE_ENFORCE(ctx->HasOutput("Out"),
|
|
"Output(Out) of SequenceConcatOp should not be null.");
|
|
const size_t level = static_cast<size_t>(ctx->Attrs().Get<int>("level"));
|
|
const size_t axis = static_cast<size_t>(ctx->Attrs().Get<int>("axis"));
|
|
PADDLE_ENFORCE(level == 0UL || level == 1UL,
|
|
"The sequence_concat operator only accepts sequence "
|
|
"or a nested sequence as its input.");
|
|
auto ins_dims = ctx->GetInputsDim("X");
|
|
framework::DDim out_dims = ins_dims[0];
|
|
const size_t n = ins_dims.size();
|
|
for (size_t i = 1; i < n; ++i) {
|
|
out_dims[axis] += ins_dims[i][axis];
|
|
}
|
|
ctx->SetOutputDim("Out", out_dims);
|
|
}
|
|
};
|
|
|
|
// Declares the inputs, output, attributes and user-facing documentation of
// the sequence_concat operator.
class SequenceConcatOpMaker : public framework::OpProtoAndCheckerMaker {
 public:
  SequenceConcatOpMaker(OpProto* proto, OpAttrChecker* op_checker)
      : OpProtoAndCheckerMaker(proto, op_checker) {
    // "X" is duplicable: the operator takes a list of tensors to concatenate.
    AddInput("X",
             "(LodTensorArray) Input is a vector of LoDTensor, "
             "each of which is a variable-length sequence or nested sequence.")
        .AsDuplicable();
    AddOutput("Out",
              "(LoDTensor), Variable-length output of "
              "sequence_concat Op.");
    AddAttr<int>("axis",
                 "(int, default 0) "
                 "The axis along which the inputs will be joined. "
                 "If axis is 0, the inputs will be joined with LoD index.")
        .SetDefault(0);
    AddAttr<int>("level",
                 "(int, default 0) "
                 "The level at which the inputs will be joined. "
                 "If the level is 0, the inputs will be joined at the nested "
                 "sequence level. "
                 "If the level is 1, the inputs will be joined at the "
                 "sequence level. "
                 "The level should be less than the level number of inputs.")
        .SetDefault(0);
    // Operator-level documentation shown to users; the cases illustrate how
    // the LoD and the dimensions of the output relate to those of the inputs.
    AddComment(R"DOC(
The sequence_concat operator concatenates multiple LoDTensors.
It only supports sequence (LoD Tensor with level number is 1)
or a nested sequence (LoD tensor with level number is 2) as its input.
- Case1:
  If the axis is other than 0(here, axis is 1 and level is 1),
  each input should have the same LoD information and the LoD
  information of the output keeps the same as the input.

  LoD(x0) = {{0,2,4}, {0,1,2,3,4}}; Dims(x0) = (4,3,4)
  LoD(x1) = {{0,2,4}, {0,1,2,3,4}}; Dims(x1) = (4,4,4)
  LoD(Out) = {{0,2,4}, {0,1,2,3,4}}; Dims(Out) = (4,7,4)

- Case2:
  If the axis is 0(here, level is 0), the inputs are concatenated along
  time steps, the LoD information of the output needs to be re-computed.
  The LoD information of level-1 should be same.

  LoD(x0) = {{0,2,4}, {0,1,2,3,4}}; Dims(x0) = (4,3,4)
  LoD(x1) = {{0,2,4}, {0,1,3,5,7}}; Dims(x1) = (7,3,4)
  LoD(Out) = {{0,2,4}, {0,2,5,8,11}}; Dims(Out) = (11,3,4)

- Case3:
  If the axis is 0(here, level is 1).

  LoD(x0) = {{0,2,4}, {0,1,2,3,4}}; Dims(x0) = (4,3,4)
  LoD(x1) = {{0,3,4}, {0,1,3,5,7}}; Dims(x1) = (7,3,4)
  LoD(Out) = {{0,5,8}, {0,1,2,3,5,7,8,9,11}}; Dims(Out) = (11,3,4)

- Case4:
  If the LoD number is 1, axis is 0, level is 0

  LoD(x0) = {{0,1,2,3,4}}; Dims(x0) = (4,3,4)
  LoD(x1) = {{0,1,3,5,7}}; Dims(x1) = (7,3,4)
  LoD(Out) = {{0,2,5,8,11}}; Dims(Out) = (11,3,4)

NOTE: The levels of all the inputs should be the same.
    )DOC");
  }
};
|
|
|
|
class SequenceConcatGradOp : public framework::OperatorWithKernel {
|
|
public:
|
|
using framework::OperatorWithKernel::OperatorWithKernel;
|
|
|
|
void InferShape(framework::InferShapeContext* ctx) const override {
|
|
PADDLE_ENFORCE(ctx->HasInput(framework::GradVarName("Out")),
|
|
"The gradient of Out should not be null.");
|
|
PADDLE_ENFORCE(ctx->HasOutputs(framework::GradVarName("X")),
|
|
"The gradient of X should not be null.");
|
|
ctx->SetOutputsDim(framework::GradVarName("X"), ctx->GetInputsDim("X"));
|
|
}
|
|
};
|
|
|
|
} // namespace operators
|
|
} // namespace paddle
|
|
|
|
namespace ops = paddle::operators;
|
|
REGISTER_OP_EX(sequence_concat, ops::SequenceConcatOp,
|
|
ops::SequenceConcatOpMaker, sequence_concat_grad,
|
|
ops::SequenceConcatGradOp, false);
|
|
REGISTER_OP_CPU_KERNEL(
|
|
sequence_concat,
|
|
ops::SequenceConcatOpKernel<paddle::platform::CPUDeviceContext, float>);
|
|
REGISTER_OP_CPU_KERNEL(
|
|
sequence_concat_grad,
|
|
ops::SequenceConcatGradOpKernel<paddle::platform::CPUDeviceContext, float>);
|