Paddle/paddle/fluid/operators/cross_entropy_op.h

/* Copyright (c) 2016 PaddlePaddle Authors. All Rights Reserved.

Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

    http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License. */

#pragma once
#include "paddle/fluid/framework/eigen.h"
#include "paddle/fluid/framework/op_registry.h"
#include "paddle/fluid/operators/math/cross_entropy.h"
#include "paddle/fluid/operators/math/math_function.h"

namespace paddle {
namespace operators {

// Shorthand for the framework tensor type used by the kernels in this file.
using Tensor = framework::Tensor;
// Alias template forwarding to framework::EigenMatrix. The storage order
// parameter defaults to Eigen::RowMajor and the index type defaults to
// Eigen::DenseIndex, so callers normally only spell out the element type T.
template <typename T, int MajorType = Eigen::RowMajor,
          typename IndexType = Eigen::DenseIndex>
using EigenMatrix = framework::EigenMatrix<T, MajorType, IndexType>;

// CPU forward kernel of the cross-entropy operator.
//
// Compute() fetches the "X" and "Label" inputs and the "Y" output from the
// execution context, requests writable storage of element type T for "Y" on
// the current place, and delegates the actual computation to
// math::CrossEntropyFunctor, passing along the "soft_label" attribute.
template <typename T>
class CrossEntropyOpKernel : public framework::OpKernel<T> {
 public:
  void Compute(const framework::ExecutionContext& ctx) const override {
    // This kernel is CPU-only; refuse to run on any other place.
    PADDLE_ENFORCE(platform::is_cpu_place(ctx.GetPlace()),
                   "This kernel only runs on CPU.");

    const Tensor* input = ctx.Input<Tensor>("X");
    const Tensor* target = ctx.Input<Tensor>("Label");
    Tensor* out = ctx.Output<Tensor>("Y");
    // Obtain the output buffer before the functor writes into it.
    out->mutable_data<T>(ctx.GetPlace());

    const auto& dev_ctx =
        ctx.template device_context<platform::CPUDeviceContext>();
    const bool use_soft_label = ctx.Attr<bool>("soft_label");

    math::CrossEntropyFunctor<platform::CPUDeviceContext, T> cross_entropy;
    cross_entropy(dev_ctx, out, input, target, use_soft_label);
  }
};

// CPU backward kernel of the cross-entropy operator.
//
// Inputs read from the execution context: "X", "Label" and the gradient of
// "Y". Output written: the gradient of "X", whose storage is requested here
// on the current place.
//
// soft_label == true:
//   dX = -(Label * dY / X) element-wise, where dY is tiled class_num times
//   along the second dimension so that it lines up with X and Label.
// soft_label == false ("Label" is read as int64_t class indices, one per row):
//   dX is zero everywhere except dX[i, Label[i]] = -dY[i] / X[i, Label[i]].
template <typename T>
class CrossEntropyGradientOpKernel : public framework::OpKernel<T> {
 public:
  void Compute(const framework::ExecutionContext& ctx) const override {
    // This kernel is CPU-only; refuse to run on any other place.
    PADDLE_ENFORCE(platform::is_cpu_place(ctx.GetPlace()),
                   "This kernel only runs on CPU.");
    const Tensor* x = ctx.Input<Tensor>("X");
    const Tensor* dy = ctx.Input<Tensor>(framework::GradVarName("Y"));
    const Tensor* label = ctx.Input<Tensor>("Label");
    Tensor* dx = ctx.Output<Tensor>(framework::GradVarName("X"));
    T* dx_data = dx->mutable_data<T>(ctx.GetPlace());

    // The class count is the extent of X's second dimension.
    const int64_t class_num = x->dims()[1];
    if (ctx.Attr<bool>("soft_label")) {
      auto x_mat = EigenMatrix<T>::From(*x);
      auto dy_mat = EigenMatrix<T>::From(*dy);
      auto lbl_mat = EigenMatrix<T>::From(*label);
      auto dx_mat = EigenMatrix<T>::From(*dx);

      // Repeat dY class_num times along the second dimension, then combine
      // element-wise with Label and X.
      dx_mat.device(*ctx.template device_context<platform::CPUDeviceContext>()
                         .eigen_device()) =
          -(lbl_mat *
            dy_mat.broadcast(Eigen::DSizes<int64_t, 2>(1, class_num)) / x_mat);
    } else {
      const int64_t batch_size = x->dims()[0];
      const T* dy_data = dy->data<T>();
      const T* x_data = x->data<T>();
      const int64_t* label_data = label->data<int64_t>();

      // Every entry that is not selected by a label has a zero gradient, so
      // clear the whole output first and then fill in one entry per row.
      math::SetConstant<platform::CPUDeviceContext, T> functor;
      functor(ctx.template device_context<platform::CPUDeviceContext>(), dx, 0);

      for (int64_t i = 0; i < batch_size; ++i) {
        // The label must lie in [0, class_num). Both bounds have to hold
        // (&&, not ||); otherwise the index computed below would address
        // memory outside row i of X and dX.
        PADDLE_ASSERT(label_data[i] >= 0 && label_data[i] < class_num);
        const int64_t index = i * class_num + label_data[i];
        dx_data[index] = -dy_data[i] / x_data[index];
      }
    }
  }
};

}  // namespace operators
}  // namespace paddle
Fix the grammar in copyright. (#8403) 7 years ago			`/* Copyright (c) 2016 PaddlePaddle Authors. All Rights Reserved.`
add cross-entropy-op (#2965) * add cross-entropy-op * add infershape and compute * implement Infershape and compute of onehotcrossentropy op 8 years ago
			`Licensed under the Apache License, Version 2.0 (the "License");`
			`you may not use this file except in compliance with the License.`
			`You may obtain a copy of the License at`

			`http://www.apache.org/licenses/LICENSE-2.0`

			`Unless required by applicable law or agreed to in writing, software`
			`distributed under the License is distributed on an "AS IS" BASIS,`
			`WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.`
			`See the License for the specific language governing permissions and`
			`limitations under the License. */`

			`#pragma once`
Correct #include path 7 years ago			`#include "paddle/fluid/framework/eigen.h"`
			`#include "paddle/fluid/framework/op_registry.h"`
			`#include "paddle/fluid/operators/math/cross_entropy.h"`
			`#include "paddle/fluid/operators/math/math_function.h"`
add cross-entropy-op (#2965) * add cross-entropy-op * add infershape and compute * implement Infershape and compute of onehotcrossentropy op 8 years ago
			`namespace paddle {`
			`namespace operators {`

"net op alias" 8 years ago			`using Tensor = framework::Tensor;`
update the backward kernel. 8 years ago			`template <typename T, int MajorType = Eigen::RowMajor,`
			`typename IndexType = Eigen::DenseIndex>`
			`using EigenMatrix = framework::EigenMatrix<T, MajorType, IndexType>;`
"net op alias" 8 years ago
Implement GPU kernel for cross entropy operator. 8 years ago			`template <typename T>`
Add Skeleton of Double support 7 years ago			`class CrossEntropyOpKernel : public framework::OpKernel<T> {`
Reformat paddle/operators/* strictly following Google Style Guide 8 years ago			`public:`
"net op alias" 8 years ago			`void Compute(const framework::ExecutionContext& ctx) const override {`
Implement GPU kernel for cross entropy operator. 8 years ago			`PADDLE_ENFORCE(platform::is_cpu_place(ctx.GetPlace()),`
fix backward op. 7 years ago			`"This kernel only runs on CPU.");`
update the backward kernel. 8 years ago			`const Tensor* x = ctx.Input<Tensor>("X");`
			`const Tensor* labels = ctx.Input<Tensor>("Label");`
			`Tensor* y = ctx.Output<Tensor>("Y");`
cross entropy as a functor to avoid duplicated codes. 7 years ago			`y->mutable_data<T>(ctx.GetPlace());`
update the backward kernel. 8 years ago
Refine device context (#6433) There are mainly following fixes: - take `DeviceContext` as the template parameter of math functors and OpKernel instead of `Place` - remove `eigen_device` interface in base class `DeviceContext` - remove `GetEigenDevice` interface in `ExecutionContext` and base class `DeviceContext` - remove unused `platform::EigenDeviceConverter` - rename `REGISTER_OP_GPU_KERNEL` to `REGISTER_OP_CUDA_KERNEL` - rename `USE_GPU_ONLY_OP` to `USE_CUDA_ONLY_OP` 7 years ago			`math::CrossEntropyFunctor<platform::CPUDeviceContext, T>()(`
			`ctx.template device_context<platform::CPUDeviceContext>(), y, x, labels,`
			`ctx.Attr<bool>("soft_label"));`
crossentropy grad op (#3186) * init cross entropy graident * add crossentropy grad op * remove details * fix static compile 8 years ago			`}`
			`};`

Implement GPU kernel for cross entropy operator. 8 years ago			`template <typename T>`
Add Skeleton of Double support 7 years ago			`class CrossEntropyGradientOpKernel : public framework::OpKernel<T> {`
crossentropy grad op (#3186) * init cross entropy graident * add crossentropy grad op * remove details * fix static compile 8 years ago			`public:`
"net op alias" 8 years ago			`void Compute(const framework::ExecutionContext& ctx) const override {`
Implement GPU kernel for cross entropy operator. 8 years ago			`PADDLE_ENFORCE(platform::is_cpu_place(ctx.GetPlace()),`
fix backward op. 7 years ago			`"This kernel only runs on CPU.");`
			`const Tensor* x = ctx.Input<Tensor>("X");`
			`const Tensor* dy = ctx.Input<Tensor>(framework::GradVarName("Y"));`
			`const Tensor* label = ctx.Input<Tensor>("Label");`
			`Tensor* dx = ctx.Output<Tensor>(framework::GradVarName("X"));`
			`T* dx_data = dx->mutable_data<T>(ctx.GetPlace());`
crossentropy grad op (#3186) * init cross entropy graident * add crossentropy grad op * remove details * fix static compile 8 years ago
support sparse output for lookup table grad op (#5145) * add sparse support for sum op * typo fix * fix gpu build error * fix unittest error * typo fix * infer var type and shape in op_test * follow comments * fix build error * bypass some unittests depend on NetOp * support sparse output for lookup table grad op * refine codes * fix gpu build error * fix lookup table grad gpu kernel * fix ci * fix ci * fix ci * fix bug in lookup_table_grad op * fix bug in test_word2vec * register double kernel for some operators * set is_sparse=True in test_word2vec * fix lookup table grad op CUDA kernel bug * disable test_modified_huber_loss_op temporarily * disable test_lstm_unit_op temporarily 7 years ago			`int64_t class_num = x->dims()[1];`
Change Name convention of operator attributes (#4807) * Change dataType to data_type Follow PEP8 * Change name_convention to fit PEP8 7 years ago			`if (ctx.Attr<bool>("soft_label")) {`
fix backward op. 7 years ago			`auto x_mat = EigenMatrix<T>::From(*x);`
			`auto dy_mat = EigenMatrix<T>::From(*dy);`
			`auto lbl_mat = EigenMatrix<T>::From(*label);`
			`auto dx_mat = EigenMatrix<T>::From(*dx);`

Refine device context (#6433) There are mainly following fixes: - take `DeviceContext` as the template parameter of math functors and OpKernel instead of `Place` - remove `eigen_device` interface in base class `DeviceContext` - remove `GetEigenDevice` interface in `ExecutionContext` and base class `DeviceContext` - remove unused `platform::EigenDeviceConverter` - rename `REGISTER_OP_GPU_KERNEL` to `REGISTER_OP_CUDA_KERNEL` - rename `USE_GPU_ONLY_OP` to `USE_CUDA_ONLY_OP` 7 years ago			`dx_mat.device(*ctx.template device_context<platform::CPUDeviceContext>()`
			`.eigen_device()) =`
support sparse output for lookup table grad op (#5145) * add sparse support for sum op * typo fix * fix gpu build error * fix unittest error * typo fix * infer var type and shape in op_test * follow comments * fix build error * bypass some unittests depend on NetOp * support sparse output for lookup table grad op * refine codes * fix gpu build error * fix lookup table grad gpu kernel * fix ci * fix ci * fix ci * fix bug in lookup_table_grad op * fix bug in test_word2vec * register double kernel for some operators * set is_sparse=True in test_word2vec * fix lookup table grad op CUDA kernel bug * disable test_modified_huber_loss_op temporarily * disable test_lstm_unit_op temporarily 7 years ago			`-(lbl_mat *`
			`dy_mat.broadcast(Eigen::DSizes<int64_t, 2>(1, class_num)) / x_mat);`
Add soft-label support for cross-entropy operator. 8 years ago			`} else {`
support sparse output for lookup table grad op (#5145) * add sparse support for sum op * typo fix * fix gpu build error * fix unittest error * typo fix * infer var type and shape in op_test * follow comments * fix build error * bypass some unittests depend on NetOp * support sparse output for lookup table grad op * refine codes * fix gpu build error * fix lookup table grad gpu kernel * fix ci * fix ci * fix ci * fix bug in lookup_table_grad op * fix bug in test_word2vec * register double kernel for some operators * set is_sparse=True in test_word2vec * fix lookup table grad op CUDA kernel bug * disable test_modified_huber_loss_op temporarily * disable test_lstm_unit_op temporarily 7 years ago			`int64_t batch_size = x->dims()[0];`
fix backward op. 7 years ago			`const T* dy_data = dy->data<T>();`
			`const T* x_data = x->data<T>();`
support sparse output for lookup table grad op (#5145) * add sparse support for sum op * typo fix * fix gpu build error * fix unittest error * typo fix * infer var type and shape in op_test * follow comments * fix build error * bypass some unittests depend on NetOp * support sparse output for lookup table grad op * refine codes * fix gpu build error * fix lookup table grad gpu kernel * fix ci * fix ci * fix ci * fix bug in lookup_table_grad op * fix bug in test_word2vec * register double kernel for some operators * set is_sparse=True in test_word2vec * fix lookup table grad op CUDA kernel bug * disable test_modified_huber_loss_op temporarily * disable test_lstm_unit_op temporarily 7 years ago			`const int64_t* label_data = label->data<int64_t>();`
fix backward op. 7 years ago
Refine device context (#6433) There are mainly following fixes: - take `DeviceContext` as the template parameter of math functors and OpKernel instead of `Place` - remove `eigen_device` interface in base class `DeviceContext` - remove `GetEigenDevice` interface in `ExecutionContext` and base class `DeviceContext` - remove unused `platform::EigenDeviceConverter` - rename `REGISTER_OP_GPU_KERNEL` to `REGISTER_OP_CUDA_KERNEL` - rename `USE_GPU_ONLY_OP` to `USE_CUDA_ONLY_OP` 7 years ago			`math::SetConstant<platform::CPUDeviceContext, T> functor;`
			`functor(ctx.template device_context<platform::CPUDeviceContext>(), dx, 0);`
fix backward op. 7 years ago
support sparse output for lookup table grad op (#5145) * add sparse support for sum op * typo fix * fix gpu build error * fix unittest error * typo fix * infer var type and shape in op_test * follow comments * fix build error * bypass some unittests depend on NetOp * support sparse output for lookup table grad op * refine codes * fix gpu build error * fix lookup table grad gpu kernel * fix ci * fix ci * fix ci * fix bug in lookup_table_grad op * fix bug in test_word2vec * register double kernel for some operators * set is_sparse=True in test_word2vec * fix lookup table grad op CUDA kernel bug * disable test_modified_huber_loss_op temporarily * disable test_lstm_unit_op temporarily 7 years ago			`for (int64_t i = 0; i < batch_size; ++i) {`
Add soft-label support for cross-entropy operator. 8 years ago			`PADDLE_ASSERT(label_data[i] >= 0 \|\| label_data[i] < class_num);`
support sparse output for lookup table grad op (#5145) * add sparse support for sum op * typo fix * fix gpu build error * fix unittest error * typo fix * infer var type and shape in op_test * follow comments * fix build error * bypass some unittests depend on NetOp * support sparse output for lookup table grad op * refine codes * fix gpu build error * fix lookup table grad gpu kernel * fix ci * fix ci * fix ci * fix bug in lookup_table_grad op * fix bug in test_word2vec * register double kernel for some operators * set is_sparse=True in test_word2vec * fix lookup table grad op CUDA kernel bug * disable test_modified_huber_loss_op temporarily * disable test_lstm_unit_op temporarily 7 years ago			`int64_t index = i * class_num + label_data[i];`
Add soft-label support for cross-entropy operator. 8 years ago			`dx_data[index] = -dy_data[i] / x_data[index];`
			`}`
add cross-entropy-op (#2965) * add cross-entropy-op * add infershape and compute * implement Infershape and compute of onehotcrossentropy op 8 years ago			`}`
			`}`
			`};`

			`} // namespace operators`
			`} // namespace paddle`