Paddle/paddle/fluid/operators/math/concat.cc

/* Copyright (c) 2018 paddlepaddle Authors. All Rights Reserved.

Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

    http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License. */

#include "paddle/fluid/operators/math/concat.h"
#include <vector>

namespace paddle {
namespace operators {
namespace math {

/*
 * Concatenates the tensors in `input` along `axis` into `output` on the CPU.
 *
 * Each input is treated as a row-major 2-D block [rows, cols_i], where
 * `rows` is the product of the first `axis` extents of input[0] and
 * cols_i = input[i].numel() / rows. Row k of the output is row k of every
 * input laid end to end, in input order.
 *
 * All tensors' dimension should be the same and the values of
 * each dimension must be the same, except the axis dimension. This is NOT
 * verified here.
 * NOTE(review): `output` is assumed to already hold room for
 * rows * sum(cols_i) elements of T -- confirm against the callers.
 *
 * An empty `input` raises std::out_of_range (same as ConcatGradFunctor does
 * for an empty `outputs`).
 */
template <typename T>
class ConcatFunctor<platform::CPUDeviceContext, T> {
 public:
  void operator()(const platform::CPUDeviceContext& context,
                  const std::vector<framework::Tensor>& input, const int axis,
                  framework::Tensor* output) {
    // TODO(zcd): Add input data validity checking
    const size_t num = input.size();

    // Sizes and offsets are kept in 64 bits: numel() of a large tensor (and
    // the row * column products below) does not fit in a 32-bit int.
    int64_t rows = 1;
    // .at() instead of [] so that an empty input fails loudly instead of
    // reading out of bounds.
    auto dim_0 = input.at(0).dims();
    for (int i = 0; i < axis; ++i) {
      rows *= dim_0[i];
    }
    if (rows == 0) {
      // A zero extent before `axis` means there is nothing to copy; returning
      // here also avoids dividing by zero below.
      return;
    }

    int64_t out_cols = 0;
    std::vector<int64_t> input_cols(num);
    for (size_t i = 0; i < num; ++i) {
      const int64_t t_cols = input[i].numel() / rows;
      out_cols += t_cols;
      input_cols[i] = t_cols;
    }
    auto cpu_place = boost::get<platform::CPUPlace>(context.GetPlace());

    // computation
    T* const out_data = output->data<T>();  // loop-invariant
    for (int64_t k = 0; k < rows; ++k) {
      T* dst_ptr = out_data + k * out_cols;
      int64_t col_idx = 0;  // write offset inside output row k
      for (size_t j = 0; j < num; ++j) {
        const int64_t col_len = input_cols[j];
        const T* src_ptr = input[j].data<T>() + k * col_len;
        memory::Copy(cpu_place, dst_ptr + col_idx, cpu_place, src_ptr,
                     sizeof(T) * col_len);
        col_idx += col_len;
      }
    }
  }
};

/*
 * Splits `input` along `axis` into the tensors of `outputs` on the CPU; the
 * copy pattern is the reverse of ConcatFunctor.
 *
 * `input` is treated as a row-major 2-D block [input_rows, input_cols], where
 * `input_rows` is the product of the first `axis` extents of outputs[0] and
 * input_cols is the sum of cols_i = outputs[i].numel() / input_rows. Row k of
 * `input` is cut into consecutive segments of cols_i elements, and segment i
 * is written to row k of outputs[i].
 *
 * All tensors' dimension should be the same and the values of
 * each dimension must be the same, except the axis dimension. This is NOT
 * verified here.
 * NOTE(review): every tensor in `outputs` is assumed to be already sized by
 * the caller -- confirm against the callers.
 *
 * An empty `outputs` raises std::out_of_range (from vector::at).
 */
template <typename T>
class ConcatGradFunctor<platform::CPUDeviceContext, T> {
 public:
  void operator()(const platform::CPUDeviceContext& context,
                  const framework::Tensor& input, const int axis,
                  std::vector<framework::Tensor>* outputs) {
    // TODO(zcd): Add input data validity checking
    const size_t num = outputs->size();

    // Sizes and offsets are kept in 64 bits: numel() of a large tensor (and
    // the row * column products below) does not fit in a 32-bit int.
    int64_t input_rows = 1;
    auto dim_0 = outputs->at(0).dims();
    for (int i = 0; i < axis; ++i) {
      input_rows *= dim_0[i];
    }
    if (input_rows == 0) {
      // A zero extent before `axis` means there is nothing to copy; returning
      // here also avoids dividing by zero below.
      return;
    }

    int64_t input_cols = 0;
    std::vector<int64_t> output_cols(num);
    for (size_t i = 0; i < num; ++i) {
      const int64_t t_cols = outputs->at(i).numel() / input_rows;
      input_cols += t_cols;
      output_cols[i] = t_cols;
    }
    auto cpu_place = boost::get<platform::CPUPlace>(context.GetPlace());

    // computation
    const T* const in_data = input.data<T>();  // loop-invariant
    for (int64_t k = 0; k < input_rows; ++k) {
      const T* src_ptr = in_data + k * input_cols;
      int64_t col_idx = 0;  // read offset inside input row k
      for (size_t j = 0; j < num; ++j) {
        const int64_t col_len = output_cols[j];
        T* dst_ptr = outputs->at(j).data<T>() + k * col_len;
        memory::Copy(cpu_place, dst_ptr, cpu_place, src_ptr + col_idx,
                     sizeof(T) * col_len);
        col_idx += col_len;
      }
    }
  }
};

// Explicit instantiations of the CPU specializations defined above. The
// member definitions live in this .cc file, so these are the element types
// this file emits code for: int, int64_t, float and double.
// NOTE(review): presumably a new element type needs a line added to both
// lists below -- confirm that no other translation unit instantiates them.
template class ConcatFunctor<platform::CPUDeviceContext, int>;
template class ConcatFunctor<platform::CPUDeviceContext, int64_t>;
template class ConcatFunctor<platform::CPUDeviceContext, float>;
template class ConcatFunctor<platform::CPUDeviceContext, double>;

// Same set of element types for the gradient (split) functor.
template class ConcatGradFunctor<platform::CPUDeviceContext, int>;
template class ConcatGradFunctor<platform::CPUDeviceContext, int64_t>;
template class ConcatGradFunctor<platform::CPUDeviceContext, float>;
template class ConcatGradFunctor<platform::CPUDeviceContext, double>;

}  // namespace math
}  // namespace operators
}  // namespace paddle
refine concat_op 7 years ago			`/* Copyright (c) 2018 paddlepaddle Authors. All Rights Reserved.`

			`Licensed under the Apache License, Version 2.0 (the "License");`
			`you may not use this file except in compliance with the License.`
			`You may obtain a copy of the License at`

			`http://www.apache.org/licenses/LICENSE-2.0`

			`Unless required by applicable law or agreed to in writing, software`
			`distributed under the License is distributed on an "AS IS" BASIS,`
			`WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.`
			`See the License for the specific language governing permissions and`
			`limitations under the License. */`

			`#include "paddle/fluid/operators/math/concat.h"`
Fix more CPPLint issues in fluid/operators/math (#10276) * Fix CPPLint issues in lstm_cpu_kernel.h * Fix CPPLint issues in math/math_function_test * Fix CPPLint issues in math/math_function_test * Fix CPPLint issues in math/concat.cc * Fix CPPLint issues in math/concat.cc * Fix CPPLint issues in math/concat.cc * Fix CPPLint issues in math/gru_cpu_kernel * Fix CPPLint issues in math/selected_rows_functor_test.cu * Fix compile error * Fix compile error 7 years ago			`#include <vector>`
refine concat_op 7 years ago
			`namespace paddle {`
			`namespace operators {`
			`namespace math {`

			`/*`
follow comments and refine code 7 years ago			`* All tensors' dimension should be the same and the values of`
Merge branch 'develop' of https://github.com/PaddlePaddle/Paddle into feature/fix_concat 7 years ago			`* each dimension must be the same, except the axis dimension.`
refine concat_op 7 years ago			`*/`
			`template <typename T>`
			`class ConcatFunctor<platform::CPUDeviceContext, T> {`
			`public:`
			`void operator()(const platform::CPUDeviceContext& context,`
get max threads of GPU 7 years ago			`const std::vector<framework::Tensor>& input, const int axis,`
refine concat_op 7 years ago			`framework::Tensor* output) {`
follow comments and refine code 7 years ago			`// TODO(zcd): Add input data validity checking`
refine concat_op 7 years ago			`int num = input.size();`

			`int rows = 1;`
			`auto dim_0 = input[0].dims();`
			`for (int i = 0; i < axis; ++i) {`
			`rows *= dim_0[i];`
			`}`
			`int out_rows = rows, out_cols = 0;`

get max threads of GPU 7 years ago			`std::vector<int64_t> input_cols(input.size());`
refine concat_op 7 years ago			`for (int i = 0; i < num; ++i) {`
			`int t_cols = input[i].numel() / rows;`
			`out_cols += t_cols;`
get max threads of GPU 7 years ago			`input_cols[i] = t_cols;`
refine concat_op 7 years ago			`}`
Fix compilation for gcc5.4 The error is: paddle/fluid/operators/math/concat.cc:47:72: error: invalid initialization of non-const reference of type 'paddle::platform::CPUPlace&' from an rvalue of type 'paddle::platform::CPUPlace' auto& cpu_place = boost::get<platform::CPUPlace>(context.GetPlace()); Should not use reference for cpu_place. 7 years ago			`auto cpu_place = boost::get<platform::CPUPlace>(context.GetPlace());`
get max threads of GPU 7 years ago
refine concat_op 7 years ago			`// computation`
get max threads of GPU 7 years ago			`for (int k = 0; k < out_rows; ++k) {`
refine concat_op 7 years ago			`T* dst_ptr = output->data<T>() + k * out_cols;`
			`int col_idx = 0;`
			`for (int j = 0; j < num; ++j) {`
get max threads of GPU 7 years ago			`int col_len = input_cols[j];`
refine concat_op 7 years ago			`const T* src_prt = input[j].data<T>() + k * col_len;`
			`memory::Copy(cpu_place, dst_ptr + col_idx, cpu_place, src_prt,`
			`sizeof(T) * col_len);`
			`col_idx += col_len;`
			`}`
			`}`
get max threads of GPU 7 years ago			`}`
			`};`

follow comments and refine code 7 years ago			`/*`
			`* All tensors' dimension should be the same and the values of`
Merge branch 'develop' of https://github.com/PaddlePaddle/Paddle into feature/fix_concat 7 years ago			`* each dimension must be the same, except the axis dimension.`
follow comments and refine code 7 years ago			`*/`
get max threads of GPU 7 years ago			`template <typename T>`
			`class ConcatGradFunctor<platform::CPUDeviceContext, T> {`
			`public:`
			`void operator()(const platform::CPUDeviceContext& context,`
			`const framework::Tensor& input, const int axis,`
Fix more CPPLint issues in fluid/operators/math (#10276) * Fix CPPLint issues in lstm_cpu_kernel.h * Fix CPPLint issues in math/math_function_test * Fix CPPLint issues in math/math_function_test * Fix CPPLint issues in math/concat.cc * Fix CPPLint issues in math/concat.cc * Fix CPPLint issues in math/concat.cc * Fix CPPLint issues in math/gru_cpu_kernel * Fix CPPLint issues in math/selected_rows_functor_test.cu * Fix compile error * Fix compile error 7 years ago			`std::vector<framework::Tensor>* outputs) {`
follow comments and refine code 7 years ago			`// TODO(zcd): Add input data validity checking`
Fix more CPPLint issues in fluid/operators/math (#10276) * Fix CPPLint issues in lstm_cpu_kernel.h * Fix CPPLint issues in math/math_function_test * Fix CPPLint issues in math/math_function_test * Fix CPPLint issues in math/concat.cc * Fix CPPLint issues in math/concat.cc * Fix CPPLint issues in math/concat.cc * Fix CPPLint issues in math/gru_cpu_kernel * Fix CPPLint issues in math/selected_rows_functor_test.cu * Fix compile error * Fix compile error 7 years ago			`int num = outputs->size();`
refine concat_op 7 years ago
get max threads of GPU 7 years ago			`int input_rows = 1;`
Fix more CPPLint issues in fluid/operators/math (#10276) * Fix CPPLint issues in lstm_cpu_kernel.h * Fix CPPLint issues in math/math_function_test * Fix CPPLint issues in math/math_function_test * Fix CPPLint issues in math/concat.cc * Fix CPPLint issues in math/concat.cc * Fix CPPLint issues in math/concat.cc * Fix CPPLint issues in math/gru_cpu_kernel * Fix CPPLint issues in math/selected_rows_functor_test.cu * Fix compile error * Fix compile error 7 years ago			`auto dim_0 = outputs->at(0).dims();`
get max threads of GPU 7 years ago			`for (int i = 0; i < axis; ++i) {`
			`input_rows *= dim_0[i];`
			`}`
			`int input_cols = 0;`

Fix more CPPLint issues in fluid/operators/math (#10276) * Fix CPPLint issues in lstm_cpu_kernel.h * Fix CPPLint issues in math/math_function_test * Fix CPPLint issues in math/math_function_test * Fix CPPLint issues in math/concat.cc * Fix CPPLint issues in math/concat.cc * Fix CPPLint issues in math/concat.cc * Fix CPPLint issues in math/gru_cpu_kernel * Fix CPPLint issues in math/selected_rows_functor_test.cu * Fix compile error * Fix compile error 7 years ago			`std::vector<int64_t> output_cols(outputs->size());`
get max threads of GPU 7 years ago			`for (int i = 0; i < num; ++i) {`
Fix more CPPLint issues in fluid/operators/math (#10276) * Fix CPPLint issues in lstm_cpu_kernel.h * Fix CPPLint issues in math/math_function_test * Fix CPPLint issues in math/math_function_test * Fix CPPLint issues in math/concat.cc * Fix CPPLint issues in math/concat.cc * Fix CPPLint issues in math/concat.cc * Fix CPPLint issues in math/gru_cpu_kernel * Fix CPPLint issues in math/selected_rows_functor_test.cu * Fix compile error * Fix compile error 7 years ago			`int t_cols = outputs->at(i).numel() / input_rows;`
get max threads of GPU 7 years ago			`input_cols += t_cols;`
			`output_cols[i] = t_cols;`
			`}`
Fix compilation for gcc5.4 The error is: paddle/fluid/operators/math/concat.cc:47:72: error: invalid initialization of non-const reference of type 'paddle::platform::CPUPlace&' from an rvalue of type 'paddle::platform::CPUPlace' auto& cpu_place = boost::get<platform::CPUPlace>(context.GetPlace()); Should not use reference for cpu_place. 7 years ago			`auto cpu_place = boost::get<platform::CPUPlace>(context.GetPlace());`
get max threads of GPU 7 years ago
			`// computation`
			`for (int k = 0; k < input_rows; ++k) {`
			`const T* src_ptr = input.data<T>() + k * input_cols;`
			`int col_idx = 0;`
			`for (int j = 0; j < num; ++j) {`
			`int col_len = output_cols[j];`
Fix more CPPLint issues in fluid/operators/math (#10276) * Fix CPPLint issues in lstm_cpu_kernel.h * Fix CPPLint issues in math/math_function_test * Fix CPPLint issues in math/math_function_test * Fix CPPLint issues in math/concat.cc * Fix CPPLint issues in math/concat.cc * Fix CPPLint issues in math/concat.cc * Fix CPPLint issues in math/gru_cpu_kernel * Fix CPPLint issues in math/selected_rows_functor_test.cu * Fix compile error * Fix compile error 7 years ago			`T* dst_ptr = outputs->at(j).data<T>() + k * col_len;`
get max threads of GPU 7 years ago			`memory::Copy(cpu_place, dst_ptr, cpu_place, src_ptr + col_idx,`
			`sizeof(T) * col_len);`
			`col_idx += col_len;`
			`}`
			`}`
refine concat_op 7 years ago			`}`
			`};`

			`template class ConcatFunctor<platform::CPUDeviceContext, int>;`
			`template class ConcatFunctor<platform::CPUDeviceContext, int64_t>;`
			`template class ConcatFunctor<platform::CPUDeviceContext, float>;`
			`template class ConcatFunctor<platform::CPUDeviceContext, double>;`

get max threads of GPU 7 years ago			`template class ConcatGradFunctor<platform::CPUDeviceContext, int>;`
			`template class ConcatGradFunctor<platform::CPUDeviceContext, int64_t>;`
			`template class ConcatGradFunctor<platform::CPUDeviceContext, float>;`
			`template class ConcatGradFunctor<platform::CPUDeviceContext, double>;`

refine concat_op 7 years ago			`} // namespace math`
			`} // namespace operators`
			`} // namespace paddle`