/* Copyright (c) 2016 PaddlePaddle Authors. All Rights Reserved.

Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

    http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License. */

#pragma once

#include "paddle/fluid/framework/eigen.h"
#include "paddle/fluid/framework/op_registry.h"
#include "paddle/fluid/operators/math.h"
#include "paddle/fluid/operators/math/cross_entropy.h"
#include "paddle/fluid/operators/math/math_function.h"
#include "paddle/fluid/platform/for_range.h"

namespace paddle {
namespace operators {

using Tensor = framework::Tensor;
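
// Forward kernel for the cross entropy op. X, Label and Y are viewed as 2-D
// matrices whose last dimension is the class axis; the actual computation
// (soft-label: Y[i] = -sum_j Label[i, j] * log(X[i, j]); hard-label:
// Y[i] = -log(X[i, Label[i]])) is delegated to math::CrossEntropyFunctor.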
template <typename DeviceContext, typename T>
class CrossEntropyOpKernel : public framework::OpKernel<T> {
 public:
  void Compute(const framework::ExecutionContext& ctx) const override {
    auto* x = ctx.Input<Tensor>("X");
    auto* labels = ctx.Input<Tensor>("Label");
    auto* y = ctx.Output<Tensor>("Y");
    y->mutable_data<T>(ctx.GetPlace());

    int rank = x->dims().size();
    Tensor x_2d = framework::ReshapeToMatrix(*x, rank - 1);
    Tensor labels_2d = framework::ReshapeToMatrix(*labels, rank - 1);
    Tensor y_2d = framework::ReshapeToMatrix(*y, rank - 1);

    int axis_dim = x->dims()[rank - 1];
    math::CrossEntropyFunctor<DeviceContext, T>()(
        ctx.template device_context<DeviceContext>(), &y_2d, &x_2d, &labels_2d,
        ctx.Attr<bool>("soft_label"), ctx.Attr<int>("ignore_index"), axis_dim);
  }
};
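
// Gradient functor for the soft-label case: each element of dX is
// dX[i, j] = -Label[i, j] * dY[i] / X[i, j], where i indexes the sample (row)
// and j the class. Invoked once per element of dX.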
template <typename T>
class XeSoftlabelGradFunctor {
 public:
  XeSoftlabelGradFunctor(T* dx,
                         const T* dy,     // NOLINT
                         const T* x,      // NOLINT
                         const T* label,  // NOLINT
                         size_t num_classes)
      : dx_(dx), dy_(dy), x_(x), label_(label), num_classes_(num_classes) {}

  HOSTDEVICE void operator()(size_t i) {
    auto row_ids = i / num_classes_;
    dx_[i] = -label_[i] * dy_[row_ids] / x_[i];
  }

 private:
  T* dx_;
  const T* dy_;
  const T* x_;
  const T* label_;
  size_t num_classes_;
};
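
// Gradient functor for the hard-label case: for each sample the gradient is
// -dY[i] / X[i, label[i]] at the ground-truth class and 0 elsewhere; samples
// whose label equals ignore_index get an all-zero gradient row. Invoked once
// per sample.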
template <typename T>
class XeGradFunctor {
 public:
  XeGradFunctor(T* dx,
                const T* dy,           // NOLINT
                const T* x,            // NOLINT
                const int64_t* label,  // NOLINT
                size_t num_classes, size_t ignore_index)
      : dx_(dx),
        dy_(dy),
        x_(x),
        label_(label),
        num_classes_(num_classes),
        ignore_index_(ignore_index) {}

  HOSTDEVICE void operator()(size_t sample_id) {
    auto x_is_true_offset = sample_id * num_classes_ + label_[sample_id];
    for (size_t x_offset = sample_id * num_classes_;
         x_offset < (sample_id + 1) * num_classes_; ++x_offset) {
      dx_[x_offset] =
          (x_offset != x_is_true_offset ||
           label_[sample_id] == static_cast<int64_t>(ignore_index_))
              ? static_cast<T>(0)
              : -dy_[sample_id] / x_[x_offset];
    }
  }

 private:
  T* dx_;
  const T* dy_;
  const T* x_;
  const int64_t* label_;
  size_t num_classes_;
  size_t ignore_index_;
};
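
// Backward kernel for the cross entropy op: picks the soft- or hard-label
// gradient functor based on the "soft_label" attribute and applies it with
// platform::ForRange, once per element of dX (soft label) or once per sample
// (hard label, ranging over dY->numel()).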
template <typename DeviceContext, typename T>
class CrossEntropyGradientOpKernel : public framework::OpKernel<T> {
 public:
  void Compute(const framework::ExecutionContext& ctx) const override {
    auto* x = ctx.Input<Tensor>("X");
    auto* dy = ctx.Input<Tensor>(framework::GradVarName("Y"));
    auto* label = ctx.Input<Tensor>("Label");
    auto* dx = ctx.Output<Tensor>(framework::GradVarName("X"));
    T* dx_data = dx->mutable_data<T>(ctx.GetPlace());

    // Following computation only depends on the last dimension size. So it's
    // unnecessary to convert tensors to 2-D views.
    int rank = x->dims().size();
    int64_t class_num = x->dims()[rank - 1];
    int64_t ignore_index = ctx.Attr<int>("ignore_index");
    if (ctx.Attr<bool>("soft_label")) {
      XeSoftlabelGradFunctor<T> functor(dx_data, dy->data<T>(), x->data<T>(),
                                        label->data<T>(),
                                        static_cast<size_t>(class_num));
      platform::ForRange<DeviceContext> for_range(
          ctx.template device_context<DeviceContext>(),
          static_cast<size_t>(dx->numel()));
      for_range(functor);
    } else {
      XeGradFunctor<T> functor(
          dx_data, dy->data<T>(), x->data<T>(), label->data<int64_t>(),
          static_cast<size_t>(class_num), static_cast<size_t>(ignore_index));
      platform::ForRange<DeviceContext> for_range(
          ctx.template device_context<DeviceContext>(),
          static_cast<size_t>(dy->numel()));
      for_range(functor);
    }
  }
};
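
// Forward functor for the hard-label CrossEntropyOpKernel2 below. Besides
// computing Y[i] = -log(X[i, label[i]]), it records the matched probability
// in MatchX so the backward pass can reuse it instead of re-reading X.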
template <typename T>
struct HardLabelCrossEntropyForwardFunctor {
  HardLabelCrossEntropyForwardFunctor(const T* x, T* y, T* match_x,
                                      const int64_t* label,
                                      int64_t ignore_index,
                                      int64_t feature_size)
      : x_(x),
        y_(y),
        match_x_(match_x),
        label_(label),
        ignore_index_(ignore_index),
        feature_size_(feature_size) {}

  HOSTDEVICE void operator()(int64_t idx) const {
    auto label = label_[idx];
    if (label != ignore_index_) {
      PADDLE_ASSERT_MSG(label >= 0 && label < feature_size_,
                        "Variable value (label) of "
                        "OP(fluid.layers.cross_entropy) expected >= 0 "
                        "and < %ld, but got %ld. Please check label value.",
                        feature_size_, label);
      auto match_x = x_[idx * feature_size_ + label];
      y_[idx] = -math::TolerableValue<T>()(real_log(match_x));
      match_x_[idx] = match_x;
    } else {
      y_[idx] = 0;
      match_x_[idx] = 0;  // any value is ok
    }
  }

  const T* x_;
  T* y_;
  T* match_x_;
  const int64_t* label_;
  int64_t ignore_index_;
  int64_t feature_size_;
};
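
// Backward functor paired with the forward functor above:
// dX[i, j] = -dY[i] / MatchX[i] when j == label[i] and the label is not
// ignore_index, otherwise 0. Invoked once per element of dX.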
template <typename T>
struct HardLabelCrossEntropyBackwardFunctor {
  HardLabelCrossEntropyBackwardFunctor(T* dx, const T* dy, const T* match_x,
                                       const int64_t* label,
                                       int64_t ignore_index,
                                       int64_t feature_size)
      : dx_(dx),
        dy_(dy),
        match_x_(match_x),
        label_(label),
        ignore_index_(ignore_index),
        feature_size_(feature_size) {}

  HOSTDEVICE void operator()(int64_t idx) const {
    auto row_idx = idx / feature_size_;
    auto col_idx = idx % feature_size_;
    auto label = label_[row_idx];
    if (label == col_idx && label != ignore_index_) {
      dx_[idx] = -dy_[row_idx] / match_x_[row_idx];
    } else {
      dx_[idx] = 0;
    }
  }

  T* dx_;
  const T* dy_;
  const T* match_x_;
  const int64_t* label_;
  int64_t ignore_index_;
  int64_t feature_size_;
};
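
// Forward kernel of the hard-label variant: treats X as a
// (batch_size, feature_size) matrix, where feature_size is the size of the
// last dimension, and runs HardLabelCrossEntropyForwardFunctor once per
// sample, producing both Y and MatchX.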
template <typename DeviceContext, typename T>
class CrossEntropyOpKernel2 : public framework::OpKernel<T> {
 public:
  void Compute(const framework::ExecutionContext& ctx) const override {
    auto* x = ctx.Input<Tensor>("X");
    auto* label = ctx.Input<Tensor>("Label");
    auto* y = ctx.Output<Tensor>("Y");
    auto* match_x = ctx.Output<Tensor>("MatchX");

    auto& x_dims = x->dims();
    auto feature_size = x_dims[x_dims.size() - 1];
    auto batch_size = framework::product(x->dims()) / feature_size;

    auto* p_x = x->data<T>();
    auto* p_label = label->data<int64_t>();
    auto* p_y = y->mutable_data<T>(ctx.GetPlace());
    auto* p_match_x = match_x->mutable_data<T>(ctx.GetPlace());

    auto ignore_index = ctx.Attr<int>("ignore_index");

    platform::ForRange<DeviceContext> for_range(
        ctx.template device_context<DeviceContext>(), batch_size);
    for_range(HardLabelCrossEntropyForwardFunctor<T>(
        p_x, p_y, p_match_x, p_label, ignore_index, feature_size));
  }
};
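
// Gradient kernel matching CrossEntropyOpKernel2: runs
// HardLabelCrossEntropyBackwardFunctor once per element of dX, using the
// MatchX values saved by the forward pass.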
template <typename DeviceContext, typename T>
class CrossEntropyGradientOpKernel2 : public framework::OpKernel<T> {
 public:
  void Compute(const framework::ExecutionContext& ctx) const override {
    auto* dx = ctx.Output<Tensor>(framework::GradVarName("X"));
    auto* dy = ctx.Input<Tensor>(framework::GradVarName("Y"));
    auto* match_x = ctx.Input<Tensor>("MatchX");
    auto* label = ctx.Input<Tensor>("Label");

    auto* p_dx = dx->mutable_data<T>(ctx.GetPlace());
    auto* p_dy = dy->data<T>();
    auto* p_match_x = match_x->data<T>();
    auto* p_label = label->data<int64_t>();

    int64_t ignore_index = ctx.Attr<int>("ignore_index");
    int rank = dx->dims().size();
    int64_t feature_size = dx->dims()[rank - 1];
    int64_t batch_size = framework::product(dx->dims()) / feature_size;

    platform::ForRange<DeviceContext> for_range(
        ctx.template device_context<DeviceContext>(),
        batch_size * feature_size);
    for_range(HardLabelCrossEntropyBackwardFunctor<T>(
        p_dx, p_dy, p_match_x, p_label, ignore_index, feature_size));
  }
};

}  // namespace operators
}  // namespace paddle
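
// These kernels are header-only and are instantiated for concrete device
// contexts and element types elsewhere. A minimal sketch of a CPU
// registration, assuming the usual "cross_entropy" op name and the
// REGISTER_OP_CPU_KERNEL macro from op_registry.h (the actual registration
// lives in the corresponding .cc/.cu files):
//
//   namespace ops = paddle::operators;
//   using CPUCtx = paddle::platform::CPUDeviceContext;
//   REGISTER_OP_CPU_KERNEL(cross_entropy,
//                          ops::CrossEntropyOpKernel<CPUCtx, float>,
//                          ops::CrossEntropyOpKernel<CPUCtx, double>);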