Paddle/paddle/fluid/operators/softmax_op.h

/* Copyright (c) 2016 PaddlePaddle Authors. All Rights Reserved.

Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

    http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License. */

#pragma once
#include "paddle/fluid/framework/op_registry.h"
#include "paddle/fluid/operators/math/softmax.h"

namespace paddle {
namespace operators {

// Short local names for the framework tensor and dimension types that the
// helpers and kernels below refer to.
using Tensor = framework::Tensor;
using DDim = framework::DDim;

// Converts a possibly negative axis index into its non-negative form.
//
// A negative `axis` is shifted up by `rank`; a non-negative `axis` is returned
// as is. No bounds checking is done here, so an `axis` outside [-rank, rank)
// yields a value outside [0, rank).
static inline int CanonicalAxis(const int axis, const int rank) {
  return (axis < 0) ? (axis + rank) : axis;
}

static inline int SizeToAxis(const int axis, DDim dims) {
  int size = 1;
  for (int i = 0; i < axis; i++) {
    size *= dims[i];
  }
  return size;
}

static inline int SizeFromAxis(const int axis, DDim dims) {
  int size = 1;
  for (int i = axis; i < dims.size(); i++) {
    size *= dims[i];
  }
  return size;
}

// Forward kernel of the softmax operator.
//
// Reads the input tensor "X" and the integer attribute "axis", allocates the
// output tensor "Out", views both tensors as 2-D with shape {rows, cols}
// (rows = product of extents before `axis`, cols = product of extents from
// `axis` onwards) and hands them to math::SoftmaxFunctor together with the
// extent of the softmax axis.
template <typename DeviceContext, typename T>
class SoftmaxKernel : public framework::OpKernel<T> {
 public:
  void Compute(const framework::ExecutionContext& context) const override {
    auto* in = context.Input<Tensor>("X");
    auto* out = context.Output<Tensor>("Out");

    // Resolve the (possibly negative) axis attribute against the input rank.
    const DDim& in_dims = in->dims();
    const int rank = in_dims.size();
    const int axis = CanonicalAxis(context.Attr<int>("axis"), rank);
    const int axis_dim = in_dims[axis];

    // Make sure the output has storage on the place this kernel runs on
    // before its buffer is shared with the 2-D view below.
    out->mutable_data<T>(context.GetPlace());

    // Flatten input and output into {rows, cols} views over the same data.
    const int rows = SizeToAxis(axis, in_dims);
    const int cols = SizeFromAxis(axis, in_dims);
    Tensor in_2d;
    in_2d.ShareDataWith(*in).Resize({rows, cols});
    Tensor out_2d;
    out_2d.ShareDataWith(*out).Resize({rows, cols});

    // The third functor template argument is true only when the build defines
    // PADDLE_ON_INFERENCE.
#ifdef PADDLE_ON_INFERENCE
    constexpr bool kInferenceBuild = true;
#else
    constexpr bool kInferenceBuild = false;
#endif
    math::SoftmaxFunctor<DeviceContext, T, kInferenceBuild>()(
        context.template device_context<DeviceContext>(), axis_dim, &in_2d,
        &out_2d);
  }
};

// Backward kernel of the softmax operator.
//
// Reads the forward output "Out" and the gradient of "Out", allocates the
// gradient of "X", views all three tensors as 2-D with shape {rows, cols}
// (rows = product of extents before `axis`, cols = product of extents from
// `axis` onwards, both taken from the shape of the gradient of "X") and hands
// them to math::SoftmaxGradFunctor together with the extent of the softmax
// axis.
template <typename DeviceContext, typename T>
class SoftmaxGradKernel : public framework::OpKernel<T> {
 public:
  void Compute(const framework::ExecutionContext& context) const override {
    auto* out = context.Input<Tensor>("Out");
    auto* out_grad = context.Input<Tensor>(framework::GradVarName("Out"));
    auto* in_grad = context.Output<Tensor>(framework::GradVarName("X"));

    // Resolve the (possibly negative) axis attribute against the rank of the
    // input gradient.
    const DDim& grad_dims = in_grad->dims();
    const int rank = grad_dims.size();
    const int axis = CanonicalAxis(context.Attr<int>("axis"), rank);
    const int axis_dim = grad_dims[axis];

    // Make sure the input gradient has storage on the place this kernel runs
    // on before its buffer is shared with the 2-D view below.
    in_grad->mutable_data<T>(context.GetPlace());

    // Flatten every tensor into a {rows, cols} view over the same data.
    const int rows = SizeToAxis(axis, grad_dims);
    const int cols = SizeFromAxis(axis, grad_dims);
    Tensor in_grad_2d;
    in_grad_2d.ShareDataWith(*in_grad).Resize({rows, cols});
    Tensor out_2d;
    out_2d.ShareDataWith(*out).Resize({rows, cols});
    Tensor out_grad_2d;
    out_grad_2d.ShareDataWith(*out_grad).Resize({rows, cols});

    math::SoftmaxGradFunctor<DeviceContext, T>()(
        context.template device_context<DeviceContext>(), axis_dim, &out_2d,
        &out_grad_2d, &in_grad_2d);
  }
};

}  // namespace operators
}  // namespace paddle
Fix the grammar in copyright. (#8403) 7 years ago			`/* Copyright (c) 2016 PaddlePaddle Authors. All Rights Reserved.`
Add skeletons of `mul`, `rowwise_add`, `sigmoid`, `softmax` ops * Implement InferShape and register them, give a stub Kernel method by LOG(INFO) 8 years ago
Softmax grad op (#3164) * init softmax grad op * add compute code * export Backward to python * update test ,export op.type to python * update python test, fix compute bug * update unit test * use eigen * optimize eigen code * add gpu test * register softmax_grad GPU kernel and fix test bug * typo * follow comments 8 years ago			`Licensed under the Apache License, Version 2.0 (the "License");`
			`you may not use this file except in compliance with the License.`
			`You may obtain a copy of the License at`
Add skeletons of `mul`, `rowwise_add`, `sigmoid`, `softmax` ops * Implement InferShape and register them, give a stub Kernel method by LOG(INFO) 8 years ago
Softmax grad op (#3164) * init softmax grad op * add compute code * export Backward to python * update test ,export op.type to python * update python test, fix compute bug * update unit test * use eigen * optimize eigen code * add gpu test * register softmax_grad GPU kernel and fix test bug * typo * follow comments 8 years ago			`http://www.apache.org/licenses/LICENSE-2.0`
Add skeletons of `mul`, `rowwise_add`, `sigmoid`, `softmax` ops * Implement InferShape and register them, give a stub Kernel method by LOG(INFO) 8 years ago
Softmax grad op (#3164) * init softmax grad op * add compute code * export Backward to python * update test ,export op.type to python * update python test, fix compute bug * update unit test * use eigen * optimize eigen code * add gpu test * register softmax_grad GPU kernel and fix test bug * typo * follow comments 8 years ago			`Unless required by applicable law or agreed to in writing, software`
			`distributed under the License is distributed on an "AS IS" BASIS,`
			`WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.`
			`See the License for the specific language governing permissions and`
			`limitations under the License. */`
Add skeletons of `mul`, `rowwise_add`, `sigmoid`, `softmax` ops * Implement InferShape and register them, give a stub Kernel method by LOG(INFO) 8 years ago
			`#pragma once`
Correct #include path 7 years ago			`#include "paddle/fluid/framework/op_registry.h"`
			`#include "paddle/fluid/operators/math/softmax.h"`
Add skeletons of `mul`, `rowwise_add`, `sigmoid`, `softmax` ops * Implement InferShape and register them, give a stub Kernel method by LOG(INFO) 8 years ago
			`namespace paddle {`
			`namespace operators {`

"remove a lot alias" 8 years ago			`using Tensor = framework::Tensor;`
refine softmax kernel. test=develop 6 years ago			`using DDim = framework::DDim;`
"remove a lot alias" 8 years ago
refine softmax kernel. test=develop 6 years ago			`static inline int CanonicalAxis(const int axis, const int rank) {`
			`if (axis < 0) {`
			`return axis + rank;`
			`}`
			`return axis;`
			`}`
add softmax_axis CPU kernel. test=develop 6 years ago
refine softmax kernel. test=develop 6 years ago			`static inline int SizeToAxis(const int axis, DDim dims) {`
			`int size = 1;`
			`for (int i = 0; i < axis; i++) {`
			`size *= dims[i];`
add softmax_axis CPU kernel. test=develop 6 years ago			`}`
refine softmax kernel. test=develop 6 years ago			`return size;`
			`}`
add softmax_axis CPU kernel. test=develop 6 years ago
refine softmax kernel. test=develop 6 years ago			`static inline int SizeFromAxis(const int axis, DDim dims) {`
			`int size = 1;`
			`for (int i = axis; i < dims.size(); i++) {`
			`size *= dims[i];`
add softmax_axis CPU kernel. test=develop 6 years ago			`}`
refine softmax kernel. test=develop 6 years ago			`return size;`
add softmax_axis CPU kernel. test=develop 6 years ago			`}`

Refine device context (#6433) There are mainly following fixes: - take `DeviceContext` as the template parameter of math functors and OpKernel instead of `Place` - remove `eigen_device` interface in base class `DeviceContext` - remove `GetEigenDevice` interface in `ExecutionContext` and base class `DeviceContext` - remove unused `platform::EigenDeviceConverter` - rename `REGISTER_OP_GPU_KERNEL` to `REGISTER_OP_CUDA_KERNEL` - rename `USE_GPU_ONLY_OP` to `USE_CUDA_ONLY_OP` 7 years ago			`template <typename DeviceContext, typename T>`
Add Skeleton of Double support 7 years ago			`class SoftmaxKernel : public framework::OpKernel<T> {`
Reformat paddle/operators/* strictly following Google Style Guide 8 years ago			`public:`
"remove a lot alias" 8 years ago			`void Compute(const framework::ExecutionContext& context) const override {`
Add SoftmaxGradFunctor, and use SoftmaxGradFunctor in softmax_op instead. 7 years ago			`auto* X = context.Input<Tensor>("X");`
Change softmax 7 years ago			`auto* Out = context.Output<Tensor>("Out");`
refine softmax kernel. test=develop 6 years ago			`const int rank = X->dims().size();`
			`const int axis = CanonicalAxis(context.Attr<int>("axis"), rank);`
			`int axis_dim = X->dims()[axis];`
implement some basic OpKernel 8 years ago
softmax as function. 8 years ago			`// allocate memory on device.`
Change softmax 7 years ago			`Out->mutable_data<T>(context.GetPlace());`
implement some basic OpKernel 8 years ago
refine softmax kernel. test=develop 6 years ago			`const int n = SizeToAxis(axis, X->dims());`
			`const int d = SizeFromAxis(axis, X->dims());`
add cudnn support. test=develop 6 years ago			`Tensor X_2d, Out_2d;`
refine softmax kernel. test=develop 6 years ago			`X_2d.ShareDataWith(*X).Resize({n, d});`
			`Out_2d.ShareDataWith(*Out).Resize({n, d});`
add softmax_axis CPU kernel. test=develop 6 years ago
Squashing MKL based softmax for inference test=develop - Added profiling to softmax functors - MKL based softmax inference op - Fix to softmax compuation via MKL - cleaning - Cosmetic fixes to softmax MKL - Fix to ON_INFER lack of propagation 6 years ago			`#ifdef PADDLE_ON_INFERENCE`
- ASUM MKL integration 6 years ago			`math::SoftmaxFunctor<DeviceContext, T, true>()(`
fix format. test=develop 6 years ago			`context.template device_context<DeviceContext>(), axis_dim, &X_2d,`
			`&Out_2d);`
- Softmax for Inference is enabled when ON_INFER is set test=develop 6 years ago			`#else`
			`math::SoftmaxFunctor<DeviceContext, T, false>()(`
fix format. test=develop 6 years ago			`context.template device_context<DeviceContext>(), axis_dim, &X_2d,`
			`&Out_2d);`
- Softmax for Inference is enabled when ON_INFER is set test=develop 6 years ago			`#endif`
Add skeletons of `mul`, `rowwise_add`, `sigmoid`, `softmax` ops * Implement InferShape and register them, give a stub Kernel method by LOG(INFO) 8 years ago			`}`
			`};`
Softmax grad op (#3164) * init softmax grad op * add compute code * export Backward to python * update test ,export op.type to python * update python test, fix compute bug * update unit test * use eigen * optimize eigen code * add gpu test * register softmax_grad GPU kernel and fix test bug * typo * follow comments 8 years ago
Refine device context (#6433) There are mainly following fixes: - take `DeviceContext` as the template parameter of math functors and OpKernel instead of `Place` - remove `eigen_device` interface in base class `DeviceContext` - remove `GetEigenDevice` interface in `ExecutionContext` and base class `DeviceContext` - remove unused `platform::EigenDeviceConverter` - rename `REGISTER_OP_GPU_KERNEL` to `REGISTER_OP_CUDA_KERNEL` - rename `USE_GPU_ONLY_OP` to `USE_CUDA_ONLY_OP` 7 years ago			`template <typename DeviceContext, typename T>`
Add Skeleton of Double support 7 years ago			`class SoftmaxGradKernel : public framework::OpKernel<T> {`
Reformat paddle/operators/* strictly following Google Style Guide 8 years ago			`public:`
"remove type alias header file" 8 years ago			`void Compute(const framework::ExecutionContext& context) const override {`
Change softmax 7 years ago			`auto* Out = context.Input<Tensor>("Out");`
			`auto* dOut = context.Input<Tensor>(framework::GradVarName("Out"));`
Add SoftmaxGradFunctor, and use SoftmaxGradFunctor in softmax_op instead. 7 years ago			`auto* dX = context.Output<Tensor>(framework::GradVarName("X"));`
refine softmax kernel. test=develop 6 years ago			`const int rank = dX->dims().size();`
			`const int axis = CanonicalAxis(context.Attr<int>("axis"), rank);`
			`int axis_dim = dX->dims()[axis];`
Softmax grad op (#3164) * init softmax grad op * add compute code * export Backward to python * update test ,export op.type to python * update python test, fix compute bug * update unit test * use eigen * optimize eigen code * add gpu test * register softmax_grad GPU kernel and fix test bug * typo * follow comments 8 years ago
Add SoftmaxGradFunctor, and use SoftmaxGradFunctor in softmax_op instead. 7 years ago			`// allocate memory on device.`
			`dX->mutable_data<T>(context.GetPlace());`
Softmax grad op (#3164) * init softmax grad op * add compute code * export Backward to python * update test ,export op.type to python * update python test, fix compute bug * update unit test * use eigen * optimize eigen code * add gpu test * register softmax_grad GPU kernel and fix test bug * typo * follow comments 8 years ago
refine softmax kernel. test=develop 6 years ago			`const int n = SizeToAxis(axis, dX->dims());`
			`const int d = SizeFromAxis(axis, dX->dims());`
add cudnn support. test=develop 6 years ago			`Tensor dX_2d, Out_2d, dOut_2d;`
refine softmax kernel. test=develop 6 years ago			`dX_2d.ShareDataWith(*dX).Resize({n, d});`
			`Out_2d.ShareDataWith(*Out).Resize({n, d});`
			`dOut_2d.ShareDataWith(*dOut).Resize({n, d});`
make softmax supporting tensors 7 years ago
Refine device context (#6433) There are mainly following fixes: - take `DeviceContext` as the template parameter of math functors and OpKernel instead of `Place` - remove `eigen_device` interface in base class `DeviceContext` - remove `GetEigenDevice` interface in `ExecutionContext` and base class `DeviceContext` - remove unused `platform::EigenDeviceConverter` - rename `REGISTER_OP_GPU_KERNEL` to `REGISTER_OP_CUDA_KERNEL` - rename `USE_GPU_ONLY_OP` to `USE_CUDA_ONLY_OP` 7 years ago			`math::SoftmaxGradFunctor<DeviceContext, T>()(`
fix format. test=develop 6 years ago			`context.template device_context<DeviceContext>(), axis_dim, &Out_2d,`
			`&dOut_2d, &dX_2d);`
Softmax grad op (#3164) * init softmax grad op * add compute code * export Backward to python * update test ,export op.type to python * update python test, fix compute bug * update unit test * use eigen * optimize eigen code * add gpu test * register softmax_grad GPU kernel and fix test bug * typo * follow comments 8 years ago			`}`
			`};`

Add skeletons of `mul`, `rowwise_add`, `sigmoid`, `softmax` ops * Implement InferShape and register them, give a stub Kernel method by LOG(INFO) 8 years ago			`} // namespace operators`
			`} // namespace paddle`