|
|
|
@ -90,108 +90,143 @@ template <typename Place, typename T>
|
|
|
|
|
class SequenceProjectFunctor {
|
|
|
|
|
public:
|
|
|
|
|
void operator()(const platform::DeviceContext& context,
|
|
|
|
|
const framework::LoDTensor* in,
|
|
|
|
|
const framework::LoDTensor* padding_data,
|
|
|
|
|
framework::LoDTensor* col, bool padding_trainable,
|
|
|
|
|
framework::LoDTensor& in, framework::LoDTensor& padding_data,
|
|
|
|
|
framework::LoDTensor& col, bool padding_trainable,
|
|
|
|
|
int context_start, int context_length, int context_stride,
|
|
|
|
|
int up_pad, int down_pad) {
|
|
|
|
|
auto lod_level_0 = in->lod()[0];
|
|
|
|
|
int up_pad, int down_pad, bool gradient, bool input_grad,
|
|
|
|
|
bool pad_grad) {
|
|
|
|
|
auto lod_level_0 = in.lod()[0];
|
|
|
|
|
|
|
|
|
|
paddle::operators::math::Im2ColFunctor<
|
|
|
|
|
paddle::operators::math::ColFormat::kOCF, Place, float>
|
|
|
|
|
im2col_ocf;
|
|
|
|
|
paddle::operators::math::Col2ImFunctor<
|
|
|
|
|
paddle::operators::math::ColFormat::kOCF, Place, float>
|
|
|
|
|
col2im_ocf;
|
|
|
|
|
|
|
|
|
|
int input_row_begin, input_row_end;
|
|
|
|
|
int sequence_height, sequence_width;
|
|
|
|
|
sequence_width = in->dims()[1];
|
|
|
|
|
|
|
|
|
|
for (int i = 0; i < static_cast<int>(lod_level_0.size()) - 1; ++i) {
|
|
|
|
|
input_row_begin = (context_start > 0)
|
|
|
|
|
? static_cast<int>(lod_level_0[i]) + context_start
|
|
|
|
|
: static_cast<int>(lod_level_0[i]);
|
|
|
|
|
input_row_end = static_cast<int>(lod_level_0[i + 1]);
|
|
|
|
|
|
|
|
|
|
framework::Tensor out_t =
|
|
|
|
|
col->Slice(static_cast<int>(lod_level_0[i]),
|
|
|
|
|
static_cast<int>(lod_level_0[i + 1]));
|
|
|
|
|
|
|
|
|
|
sequence_height = static_cast<int>(out_t.dims()[0]);
|
|
|
|
|
|
|
|
|
|
if (input_row_begin < input_row_end) {
|
|
|
|
|
framework::Tensor in_t = in->Slice(input_row_begin, input_row_end);
|
|
|
|
|
|
|
|
|
|
std::vector<int64_t> output_shape(
|
|
|
|
|
{sequence_height, 1, 1, context_length,
|
|
|
|
|
sequence_width}); // output_height, output_width,
|
|
|
|
|
// input_channels, filter_height, filter_width
|
|
|
|
|
|
|
|
|
|
out_t.Resize(framework::make_ddim(output_shape));
|
|
|
|
|
|
|
|
|
|
std::vector<int64_t> input_shape(
|
|
|
|
|
{1, input_row_end - input_row_begin,
|
|
|
|
|
sequence_width}); // input_channels, input_height, input_width
|
|
|
|
|
in_t.Resize(framework::make_ddim(input_shape));
|
|
|
|
|
|
|
|
|
|
im2col_ocf(context, in_t, out_t,
|
|
|
|
|
/*stride_height*/ context_stride, /*stride_width*/ 1, up_pad,
|
|
|
|
|
down_pad, 0, 0);
|
|
|
|
|
sequence_width = in.dims()[1];
|
|
|
|
|
input_grad = gradient && input_grad;
|
|
|
|
|
pad_grad = gradient && pad_grad;
|
|
|
|
|
|
|
|
|
|
if (!gradient || input_grad) {
|
|
|
|
|
for (int i = 0; i < static_cast<int>(lod_level_0.size()) - 1; ++i) {
|
|
|
|
|
input_row_begin = (context_start > 0)
|
|
|
|
|
? static_cast<int>(lod_level_0[i]) + context_start
|
|
|
|
|
: static_cast<int>(lod_level_0[i]);
|
|
|
|
|
input_row_end = static_cast<int>(lod_level_0[i + 1]);
|
|
|
|
|
|
|
|
|
|
framework::Tensor out_t =
|
|
|
|
|
col.Slice(static_cast<int>(lod_level_0[i]),
|
|
|
|
|
static_cast<int>(lod_level_0[i + 1]));
|
|
|
|
|
|
|
|
|
|
sequence_height = static_cast<int>(out_t.dims()[0]);
|
|
|
|
|
|
|
|
|
|
if (input_row_begin < input_row_end) {
|
|
|
|
|
framework::Tensor in_t = in.Slice(input_row_begin, input_row_end);
|
|
|
|
|
|
|
|
|
|
std::vector<int64_t> output_shape(
|
|
|
|
|
{sequence_height, 1, 1, context_length,
|
|
|
|
|
sequence_width}); // output_height, output_width,
|
|
|
|
|
// input_channels, filter_height, filter_width
|
|
|
|
|
|
|
|
|
|
out_t.Resize(framework::make_ddim(output_shape));
|
|
|
|
|
|
|
|
|
|
std::vector<int64_t> input_shape(
|
|
|
|
|
{1, input_row_end - input_row_begin,
|
|
|
|
|
sequence_width}); // input_channels, input_height, input_width
|
|
|
|
|
in_t.Resize(framework::make_ddim(input_shape));
|
|
|
|
|
|
|
|
|
|
if (gradient) {
|
|
|
|
|
col2im_ocf(context, in_t, out_t,
|
|
|
|
|
/*stride_height*/ context_stride, /*stride_width*/ 1,
|
|
|
|
|
up_pad, down_pad, 0, 0);
|
|
|
|
|
} else {
|
|
|
|
|
im2col_ocf(context, in_t, out_t,
|
|
|
|
|
/*stride_height*/ context_stride, /*stride_width*/ 1,
|
|
|
|
|
up_pad, down_pad, 0, 0);
|
|
|
|
|
}
|
|
|
|
|
out_t.Resize(framework::make_ddim(
|
|
|
|
|
{sequence_height, context_length * sequence_width}));
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
}
|
|
|
|
|
if (!gradient || pad_grad) {
|
|
|
|
|
if (padding_trainable) {
|
|
|
|
|
// add up trainable data
|
|
|
|
|
out_t.Resize(framework::make_ddim(
|
|
|
|
|
{sequence_height * context_length, sequence_width}));
|
|
|
|
|
|
|
|
|
|
if (up_pad > 0) { // add up pad
|
|
|
|
|
int padding_rows = std::min(
|
|
|
|
|
up_pad, static_cast<int>(lod_level_0[i + 1] - lod_level_0[i]));
|
|
|
|
|
|
|
|
|
|
for (int k = 0; k < padding_rows; ++k) {
|
|
|
|
|
int padding_size =
|
|
|
|
|
k + context_length < up_pad ? context_length : up_pad - k;
|
|
|
|
|
framework::Tensor out_t_sub = out_t.Slice(
|
|
|
|
|
k * context_length, k * context_length + padding_size);
|
|
|
|
|
framework::Tensor w_sub = padding_data->Slice(k, k + padding_size);
|
|
|
|
|
// in this block, using EigenVector<T>::Flatten is ok too.
|
|
|
|
|
auto out_t_sub_e = EigenMatrix<T>::From(out_t_sub);
|
|
|
|
|
auto w_sub_e = EigenMatrix<T>::From(w_sub);
|
|
|
|
|
out_t_sub_e.device(*context.GetEigenDevice<Place>()) = w_sub_e;
|
|
|
|
|
for (int i = 0; i < static_cast<int>(lod_level_0.size()) - 1; ++i) {
|
|
|
|
|
framework::Tensor out_t =
|
|
|
|
|
col.Slice(static_cast<int>(lod_level_0[i]),
|
|
|
|
|
static_cast<int>(lod_level_0[i + 1]));
|
|
|
|
|
|
|
|
|
|
sequence_height = static_cast<int>(out_t.dims()[0]);
|
|
|
|
|
|
|
|
|
|
// add up trainable data
|
|
|
|
|
out_t.Resize(framework::make_ddim(
|
|
|
|
|
{sequence_height * context_length, sequence_width}));
|
|
|
|
|
|
|
|
|
|
if (up_pad > 0) { // add up pad
|
|
|
|
|
int padding_rows = std::min(
|
|
|
|
|
up_pad, static_cast<int>(lod_level_0[i + 1] - lod_level_0[i]));
|
|
|
|
|
|
|
|
|
|
for (int k = 0; k < padding_rows; ++k) {
|
|
|
|
|
int padding_size =
|
|
|
|
|
k + context_length < up_pad ? context_length : up_pad - k;
|
|
|
|
|
framework::Tensor out_t_sub = out_t.Slice(
|
|
|
|
|
k * context_length, k * context_length + padding_size);
|
|
|
|
|
framework::Tensor w_sub = padding_data.Slice(k, k + padding_size);
|
|
|
|
|
// in this block, using EigenVector<T>::Flatten is ok too.
|
|
|
|
|
auto out_t_sub_e = EigenMatrix<T>::From(out_t_sub);
|
|
|
|
|
auto w_sub_e = EigenMatrix<T>::From(w_sub);
|
|
|
|
|
if (gradient) {
|
|
|
|
|
w_sub_e.device(*context.GetEigenDevice<Place>()) =
|
|
|
|
|
w_sub_e + out_t_sub_e;
|
|
|
|
|
} else {
|
|
|
|
|
out_t_sub_e.device(*context.GetEigenDevice<Place>()) = w_sub_e;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
if (down_pad > 0) { // add down pad
|
|
|
|
|
int down_pad_begin_row =
|
|
|
|
|
std::max(0,
|
|
|
|
|
(sequence_height - context_start - context_length) + 1) +
|
|
|
|
|
1;
|
|
|
|
|
int padding_begin = std::max(0, context_start - sequence_height);
|
|
|
|
|
int padding_size =
|
|
|
|
|
sequence_height - context_start >= context_length
|
|
|
|
|
? 1
|
|
|
|
|
: context_length - (sequence_height - context_start);
|
|
|
|
|
if (context_start >= sequence_height) padding_size = context_length;
|
|
|
|
|
int padding_idx = padding_begin;
|
|
|
|
|
for (int t = 0; t + down_pad_begin_row <= sequence_height;
|
|
|
|
|
++t, ++padding_size) {
|
|
|
|
|
if (down_pad > 0) { // add down pad
|
|
|
|
|
int down_pad_begin_row =
|
|
|
|
|
std::max(
|
|
|
|
|
0, (sequence_height - context_start - context_length) + 1) +
|
|
|
|
|
1;
|
|
|
|
|
int padding_begin = std::max(0, context_start - sequence_height);
|
|
|
|
|
int padding_size =
|
|
|
|
|
sequence_height - context_start >= context_length
|
|
|
|
|
? 1
|
|
|
|
|
: context_length - (sequence_height - context_start);
|
|
|
|
|
if (context_start >= sequence_height) padding_size = context_length;
|
|
|
|
|
if (padding_size > context_length) {
|
|
|
|
|
padding_size = context_length;
|
|
|
|
|
padding_idx++;
|
|
|
|
|
int padding_idx = padding_begin;
|
|
|
|
|
for (int t = 0; t + down_pad_begin_row <= sequence_height;
|
|
|
|
|
++t, ++padding_size) {
|
|
|
|
|
if (context_start >= sequence_height)
|
|
|
|
|
padding_size = context_length;
|
|
|
|
|
if (padding_size > context_length) {
|
|
|
|
|
padding_size = context_length;
|
|
|
|
|
padding_idx++;
|
|
|
|
|
}
|
|
|
|
|
if (padding_begin > 0 || sequence_height == context_start)
|
|
|
|
|
padding_idx = padding_begin + t;
|
|
|
|
|
framework::Tensor out_t_sub = out_t.Slice(
|
|
|
|
|
(down_pad_begin_row + t) * context_length - padding_size,
|
|
|
|
|
(down_pad_begin_row + t) * context_length);
|
|
|
|
|
framework::Tensor w_sub = padding_data.Slice(
|
|
|
|
|
up_pad + padding_idx, up_pad + padding_idx + padding_size);
|
|
|
|
|
auto out_t_sub_e = EigenMatrix<T>::From(out_t_sub);
|
|
|
|
|
auto w_sub_e = EigenMatrix<T>::From(w_sub);
|
|
|
|
|
if (gradient) {
|
|
|
|
|
w_sub_e.device(*context.GetEigenDevice<Place>()) =
|
|
|
|
|
w_sub_e + out_t_sub_e;
|
|
|
|
|
} else {
|
|
|
|
|
out_t_sub_e.device(*context.GetEigenDevice<Place>()) = w_sub_e;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
if (padding_begin > 0 || sequence_height == context_start)
|
|
|
|
|
padding_idx = padding_begin + t;
|
|
|
|
|
framework::Tensor out_t_sub = out_t.Slice(
|
|
|
|
|
(down_pad_begin_row + t) * context_length - padding_size,
|
|
|
|
|
(down_pad_begin_row + t) * context_length);
|
|
|
|
|
framework::Tensor w_sub = padding_data->Slice(
|
|
|
|
|
up_pad + padding_idx, up_pad + padding_idx + padding_size);
|
|
|
|
|
auto out_t_sub_e = EigenMatrix<T>::From(out_t_sub);
|
|
|
|
|
auto w_sub_e = EigenMatrix<T>::From(w_sub);
|
|
|
|
|
out_t_sub_e.device(*context.GetEigenDevice<Place>()) = w_sub_e;
|
|
|
|
|
}
|
|
|
|
|
out_t.Resize(framework::make_ddim(
|
|
|
|
|
{sequence_height, context_length * sequence_width}));
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
out_t.Resize(framework::make_ddim(
|
|
|
|
|
{sequence_height, context_length * sequence_width}));
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
};
|
|
|
|
|