Paddle/paddle/operators/math/sequence2batch.h

/* Copyright (c) 2016 PaddlePaddle Authors. All Rights Reserve.

Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

   http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License. */

#pragma once
#include <algorithm>
#include <vector>

#include "paddle/framework/lod_tensor.h"
#include "paddle/framework/tensor.h"
#include "paddle/platform/device_context.h"

namespace paddle {
namespace operators {
namespace math {

// Functor that copies matrix rows between two LoDTensors, selecting rows
// through an index array. Only the declaration of the call operator is
// visible in this header; the definition is presumably provided per
// Place/T elsewhere (TODO confirm).
template <typename Place, typename T>
class CopyMatrixRowsFunctor {
 public:
  // If is_src_index is true,
  // copy the indexed rows of input src to the output dst.
  // If is_src_index is false,
  // copy the input src to the indexed rows of output dst.
  // The indexed rows are based on the input index.
  //
  // Parameters:
  //   context      - device context the copy is issued on.
  //   src          - tensor the rows are read from.
  //   index        - array of row indices; the callers in this file pass one
  //                  entry per row of the tensor being rearranged.
  //   dst          - tensor the rows are written to.
  //   is_src_index - selects whether `index` addresses rows of src (true)
  //                  or rows of dst (false).
  void operator()(const platform::DeviceContext& context,
                  const framework::LoDTensor& src, const size_t* index,
                  framework::LoDTensor& dst, const bool is_src_index);
};

// Rearranges a one-level LoDTensor, whose rows are grouped sequence by
// sequence, into "batch" order, where rows are grouped by time step: first
// step 0 of every sequence, then step 1 of every sequence still running, and
// so on. Within a time step the sequences appear in descending-length order.
template <typename Place, typename T>
class LoDTensor2BatchFunctor {
 public:
  // Parameters:
  //   context    - device context forwarded to CopyMatrixRowsFunctor.
  //   lod_tensor - input; must carry exactly one LoD level with at least one
  //                sequence, and its last offset must equal dims()[0].
  //   batch      - output; receives a two-level LoD (see below) and the
  //                reordered rows.
  //                NOTE(review): this function never resizes `batch`;
  //                presumably the caller allocates it with the shape of
  //                `lod_tensor` - confirm.
  //   is_reverse - when true each sequence is traversed from its last row to
  //                its first.
  //
  // The LoD written to `batch` has two levels:
  //   level 0: start position of every time step in the batch layout,
  //   level 1: for every row of the batch layout, the row index in the input.
  void operator()(const platform::DeviceContext& context,
                  const framework::LoDTensor& lod_tensor,
                  framework::LoDTensor& batch, const bool is_reverse) const {
    // Binding through `const auto&` is valid whether lod() hands back a
    // reference or a temporary (the temporary's lifetime is extended).
    const auto& lods = lod_tensor.lod();
    PADDLE_ENFORCE_EQ(lods.size(), 1UL, "Only support one level sequence now.");
    const auto& lod = lods[0];

    // A level describes N sequences with N + 1 offsets. Reject levels with
    // no sequence: otherwise `lod.size() - 1` wraps around for an empty
    // level and `seq_info[0]` below reads from an empty vector.
    const bool has_sequence = lod.size() > 1UL;
    PADDLE_ENFORCE_EQ(has_sequence, true,
                      "The input LoDTensor should have at least one sequence.");

    // The index table below is sized from the tensor height but filled from
    // the LoD offsets, so both must describe the same number of rows.
    const auto dims = lod_tensor.dims();
    const size_t num_rows = static_cast<size_t>(dims[0]);
    PADDLE_ENFORCE_EQ(lod[lod.size() - 1], num_rows,
                      "The last LoD offset should equal the input height.");

    // Calculate the length of each sequence and
    // sort sequence index by the length.
    // example:  sequences = {s0, s1, s2}
    //           s0: 0 0 0 0, s1: 1 1 1 1 1, s2: 2 2 2
    //           seq_info[3] = {(4, 5, 1), (0, 4, 0), (9, 3, 2)}
    //           (each entry is (start, length, seq_idx))
    struct SeqInfo {
      SeqInfo(size_t start, size_t length, size_t seq_idx)
          : start(start), length(length), seq_idx(seq_idx) {}
      size_t start;
      size_t length;
      size_t seq_idx;
    };

    const size_t num_seq = lod.size() - 1;
    std::vector<SeqInfo> seq_info;
    seq_info.reserve(num_seq);
    for (size_t seq_id = 0; seq_id < num_seq; ++seq_id) {
      const size_t begin = lod[seq_id];
      const size_t end = lod[seq_id + 1];
      seq_info.emplace_back(begin, end - begin, seq_id);
    }

    std::sort(seq_info.begin(), seq_info.end(),
              [](const SeqInfo& a, const SeqInfo& b) {
                return a.length > b.length;
              });

    // calculate the start position of each batch
    // (num_batch equals the max length of the sequences)
    // example:  sequences = {s0, s1, s2}
    //           s0: 0 0 0 0, s1: 1 1 1 1 1, s2: 2 2 2
    //           num_batch = 5,
    //           batchIndex = {b0, b1, b2, b3, b4}
    //           b0: 1 0 2, b1: 1 0 2, b2: 1 0 2, b3: 1 0, b4: 1
    //           batch_start_positions[6] = {0, 3, 6, 9, 11, 12}
    //           seq2batch_idx[12] = {4, 0, 9,
    //                                5, 1, 10,
    //                                6, 2, 11,
    //                                7, 3,
    //                                8}

    // The batch number represents batch size after rearranging the
    // input LoDTensor. It is also the maximum length of input sequence.

    paddle::framework::LoD batch_lods;
    batch_lods.push_back(std::vector<size_t>{0});
    batch_lods.push_back(std::vector<size_t>{0});

    // batch_lods[0] is the start positions for batch LoDTensor
    const size_t num_batch = seq_info[0].length;
    batch_lods[0].resize(num_batch + 1);
    // batch_lods[1] is the raw index in the input LoDTensor
    batch_lods[1].resize(num_rows);

    size_t* batch_starts = batch_lods[0].data();
    size_t* seq2batch_idx = batch_lods[1].data();
    batch_starts[0] = 0;
    for (size_t n = 0; n < num_batch; ++n) {
      size_t batch_id = batch_starts[n];
      for (const SeqInfo& info : seq_info) {
        // seq_info is sorted by descending length: once one sequence has
        // ended at step n, every following one has ended as well.
        if (n >= info.length) {
          break;
        }
        seq2batch_idx[batch_id] = is_reverse
                                      ? info.start + info.length - 1 - n
                                      : info.start + n;
        ++batch_id;
      }
      batch_starts[n + 1] = batch_id;
    }
    batch.set_lod(batch_lods);

    // seq2batch_idx still points into the local batch_lods, which outlives
    // this call.
    CopyMatrixRowsFunctor<Place, T> to_batch;
    to_batch(context, lod_tensor, seq2batch_idx, batch, true);
  }
};

// Inverse of LoDTensor2BatchFunctor: scatters the rows of a batch-ordered
// tensor back to the sequence-ordered positions recorded in the second LoD
// level of `batch`.
template <typename Place, typename T>
class Batch2LoDTensorFunctor {
 public:
  // Parameters:
  //   context    - device context forwarded to CopyMatrixRowsFunctor.
  //   batch      - input in batch order; must carry a two-level LoD whose
  //                level 1 holds, for every row, its destination row index.
  //   lod_tensor - output; must already carry a non-empty LoD whose last
  //                offset of level 0 equals its own height, the height of
  //                `batch` and the number of indices in `batch`.
  void operator()(const platform::DeviceContext& context,
                  const framework::LoDTensor& batch,
                  framework::LoDTensor& lod_tensor) const {
    // Binding through `const auto&` is valid whether lod() hands back a
    // reference or a temporary (the temporary's lifetime is extended).
    const auto& in_lod = batch.lod();
    PADDLE_ENFORCE_EQ(in_lod.size(), 2UL,
                      "The LoD size of input `batch` should be 2.");

    // Keep the whole LoD bound before indexing it, and make sure level 0
    // exists and is non-empty: otherwise `[0]` is out of range and
    // `size() - 1` wraps around.
    const auto& out_lods = lod_tensor.lod();
    const bool has_out_lod = out_lods.size() > 0UL && out_lods[0].size() > 0UL;
    PADDLE_ENFORCE_EQ(has_out_lod, true,
                      "The output `lod_tensor` should have a non-empty LoD.");
    const auto& out_lod = out_lods[0];

    // Total number of rows described by the output LoD.
    const size_t num = out_lod[out_lod.size() - 1];
    PADDLE_ENFORCE_EQ(num, static_cast<size_t>(lod_tensor.dims()[0]));
    PADDLE_ENFORCE_EQ(num, in_lod[1].size());
    PADDLE_ENFORCE_EQ(num, static_cast<size_t>(batch.dims()[0]));

    // is_src_index == false: row i of `batch` is written to row index[i] of
    // `lod_tensor`.
    const size_t* index = in_lod[1].data();
    CopyMatrixRowsFunctor<Place, T> to_seq;
    to_seq(context, batch, index, lod_tensor, false);
  }
};

}  // namespace math
}  // namespace operators
}  // namespace paddle
Add LSTM Operators. 7 years ago			`/* Copyright (c) 2016 PaddlePaddle Authors. All Rights Reserve.`

			`Licensed under the Apache License, Version 2.0 (the "License");`
			`you may not use this file except in compliance with the License.`
			`You may obtain a copy of the License at`

			`http://www.apache.org/licenses/LICENSE-2.0`

			`Unless required by applicable law or agreed to in writing, software`
			`distributed under the License is distributed on an "AS IS" BASIS,`
			`WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.`
			`See the License for the specific language governing permissions and`
			`limitations under the License. */`

LSTM Operator forward implementation. 7 years ago			`#pragma once`
			`#include "paddle/framework/lod_tensor.h"`
			`#include "paddle/framework/tensor.h"`
			`#include "paddle/platform/device_context.h"`

Add LSTM Operators. 7 years ago			`namespace paddle {`
			`namespace operators {`
			`namespace math {`

Add lstm implementation. 7 years ago			`template <typename Place, typename T>`
			`class CopyMatrixRowsFunctor {`
			`public:`
			`// If is_src_index is true,`
			`// copy the indexed rows of input src to the output dst.`
			`// If is_src_index is false,`
			`// copy the input src to the indexed rows of output dst.`
			`// The indexed rows are based on the input index.`
			`void operator()(const platform::DeviceContext& context,`
LSTM Operator forward implementation. 7 years ago			`const framework::LoDTensor& src, const size_t* index,`
			`framework::LoDTensor& dst, const bool is_src_index);`
Add lstm implementation. 7 years ago			`};`

Add LSTM Operators. 7 years ago			`template <typename Place, typename T>`
			`class LoDTensor2BatchFunctor {`
			`public:`
			`void operator()(const platform::DeviceContext& context,`
			`const framework::LoDTensor& lod_tensor,`
			`framework::LoDTensor& batch, const bool is_reverse) const {`
LSTM Operator forward implementation. 7 years ago			`auto lods = lod_tensor.lod();`
			`PADDLE_ENFORCE_EQ(lods.size(), 1UL, "Only support one level sequence now.");`
Add LSTM Operators. 7 years ago			`auto lod = lods[0];`

			`// Calculate the length of each sequence and`
			`// sort sequence index by the length.`
			`// example: sequences = {s0, s1, s2}`
			`// s0: 0 0 0 0, s1: 1 1 1 1 1, s2: 2 2 2`
			`// seq_info[3] = {(4, 5, 1), (0, 4, 0), (9, 3, 2)}`
			`//`
			`struct SeqInfo {`
			`SeqInfo(int start, int length, int seq_idx)`
LSTM Operator forward implementation. 7 years ago			`: start(start), length(length), seq_idx(seq_idx) {}`
Add LSTM Operators. 7 years ago			`int start;`
			`int length;`
			`int seq_idx;`
			`};`

			`std::vector<SeqInfo> seq_info;`
Add unit testing for forwad implementation. 7 years ago			`for (size_t seq_id = 0; seq_id < lod.size() - 1; ++seq_id) {`
Add LSTM Operators. 7 years ago			`int length = lod[seq_id + 1] - lod[seq_id];`
			`seq_info.emplace_back(lod[seq_id], length, seq_id);`
			`}`

			`std::sort(seq_info.begin(), seq_info.end(),`
			`[](SeqInfo a, SeqInfo b) { return a.length > b.length; });`

			`// calculate the start position of each batch`
			`// (numBatch equal the maxLength of sequences)`
			`// example: sequences = {s0, s1, s2}`
			`// s0: 0 0 0 0, s1: 1 1 1 1 1, s2: 2 2 2`
			`// num_batch = 5,`
			`// batchIndex = {b0, b1, b2, b3, b4}`
			`// b0: 1 0 2, b1: 1 0 2, b2: 1 0 2, b3: 1 0, b4: 1`
			`// batch_start_positions[6] = {0, 3, 6, 9, 11, 12}`
			`// seq2batch_idx[12] = {4, 0, 9,`
			`// 5, 1, 10,`
			`// 6, 2, 11,`
			`// 7, 3,`
			`// 8}`

			`// The batch number represents batch size after rearranging the`
			`// input LodTensor. It is also the maximum length of input sequence.`
Add unit testing for forwad implementation. 7 years ago
			`paddle::framework::LoD batch_lods;`
			`batch_lods.push_back(std::vector<size_t>{0});`
			`batch_lods.push_back(std::vector<size_t>{0});`

Add LSTM Operators. 7 years ago			`// batch_lods[0] is the start positions for batch LoDTensor`
			`int num_batch = (size_t)seq_info[0].length;`
LSTM Operator forward implementation. 7 years ago			`batch_lods[0].resize(num_batch + 1);`
Add LSTM Operators. 7 years ago			`// batch_lods[1] is the raw index in the input LoDTensor`
LSTM Operator forward implementation. 7 years ago			`auto dims = lod_tensor.dims();`
			`batch_lods[1].resize(dims[0]);`
Add LSTM Operators. 7 years ago
LSTM Operator forward implementation. 7 years ago			`size_t* batch_starts = batch_lods[0].data();`
			`size_t* seq2batch_idx = batch_lods[1].data();`
Add LSTM Operators. 7 years ago			`batch_starts[0] = 0;`
			`for (size_t n = 0; n < num_batch; n++) {`
			`int batch_id = batch_starts[n];`
			`for (size_t i = 0; i < seq_info.size(); ++i) {`
			`size_t seq_len = seq_info[i].length;`
			`int start = seq_info[i].start;`
			`if (n < seq_len) {`
			`if (!is_reverse) {`
			`seq2batch_idx[batch_id] = start + n;`
			`} else {`
			`seq2batch_idx[batch_id] = start + seq_len - 1 - n;`
			`}`
			`batch_id++;`
			`} else {`
			`break;`
			`}`
			`}`
			`batch_starts[n + 1] = batch_id;`
			`}`
Add unit testing for forwad implementation. 7 years ago			`batch.set_lod(batch_lods);`
Add lstm implementation. 7 years ago
			`CopyMatrixRowsFunctor<Place, T> to_batch;`
LSTM Operator forward implementation. 7 years ago			`to_batch(context, lod_tensor, seq2batch_idx, batch, true);`
Add LSTM Operators. 7 years ago			`}`
Add lstm implementation. 7 years ago			`};`
Add LSTM Operators. 7 years ago
			`template <typename Place, typename T>`
LSTM Operator forward implementation. 7 years ago			`class Batch2LoDTensorFunctor {`
Add LSTM Operators. 7 years ago			`public:`
			`void operator()(const platform::DeviceContext& context,`
			`const framework::LoDTensor& batch,`
LSTM Operator forward implementation. 7 years ago			`framework::LoDTensor& lod_tensor) const {`
			`auto in_lod = batch.lod();`
			`PADDLE_ENFORCE_EQ(in_lod.size(), 2UL,`
			"The LoD size of input `batch` should be 2.");
Add unit testing for forwad implementation. 7 years ago			`auto out_lod = lod_tensor.lod()[0];`
			`auto num = out_lod[out_lod.size() - 1];`
			`PADDLE_ENFORCE_EQ(num, lod_tensor.dims()[0]);`
			`PADDLE_ENFORCE_EQ(num, in_lod[1].size());`
			`PADDLE_ENFORCE_EQ(num, batch.dims()[0]);`
LSTM Operator forward implementation. 7 years ago			`CopyMatrixRowsFunctor<Place, T> to_seq;`
Add unit testing for forwad implementation. 7 years ago			`size_t* index = in_lod[1].data();`
LSTM Operator forward implementation. 7 years ago			`to_seq(context, batch, index, lod_tensor, false);`
			`}`
Add lstm implementation. 7 years ago			`};`
Add LSTM Operators. 7 years ago
			`} // namespace math`
			`} // namespace operators`
			`} // namespace paddle`