Paddle/paddle/fluid/operators/prelu_op.cc

/* Copyright (c) 2016 PaddlePaddle Authors. All Rights Reserved.
Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at
    http://www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License. */

#include "paddle/fluid/operators/prelu_op.h"
#include <string>

namespace paddle {
namespace operators {

// Forward PRelu operator.
//
// Validates the presence of Input(X), Input(Alpha) and Output(Out), checks
// that the number of elements in Alpha matches the weight-sharing `mode`
// attribute ("all", "channel" or "element"), and makes Out share the
// dimensions and LoD of X.
class PReluOp : public framework::OperatorWithKernel {
 public:
  PReluOp(const std::string &type, const framework::VariableNameMap &inputs,
          const framework::VariableNameMap &outputs,
          const framework::AttributeMap &attrs)
      : OperatorWithKernel(type, inputs, outputs, attrs) {}

  // Infers the shape of Out from X and validates Alpha against `mode`.
  //
  // Raises (via PADDLE_ENFORCE / PADDLE_THROW) when an input/output is
  // missing, when the size of Alpha does not fit the selected mode, or when
  // the mode string is not one of the supported values.
  void InferShape(framework::InferShapeContext *ctx) const override {
    // Presence checks must run before any dimension is queried; otherwise a
    // missing variable fails inside GetInputDim and these messages are never
    // reported.
    PADDLE_ENFORCE(ctx->HasInput("X"),
                   "Input(X) of PreluOp should not be null");
    PADDLE_ENFORCE(ctx->HasInput("Alpha"),
                   "Input(Alpha) of PreluOp should not be null");
    PADDLE_ENFORCE(ctx->HasOutput("Out"),
                   "Output(Out) of PreluOp should not be null");

    const std::string &mode = ctx->Attrs().Get<std::string>("mode");
    const auto x_dim = ctx->GetInputDim("X");
    // Total number of weights stored in Alpha, whatever its shape is.
    const auto alpha_size = product(ctx->GetInputDim("Alpha"));

    if (mode == "all") {
      // A single weight is shared by every element of X.
      PADDLE_ENFORCE(alpha_size == 1,
                     "For mode 'all', size of weight Alpha must be one.");
    } else if (mode == "channel") {
      // The channel count is read from dimension 1 of X, so X needs at least
      // two dimensions for that index to be valid.
      PADDLE_ENFORCE(x_dim.size() >= 2,
                     "For channel-wise mode, rank of Input(X) must be at "
                     "least 2, but received %d",
                     x_dim.size());
      PADDLE_ENFORCE(alpha_size == x_dim[1],
                     "For channel-wise mode, size of weight Alpha must be "
                     "equal to the number of channels, should be %d",
                     x_dim[1]);
    } else if (mode == "element") {
      // One weight per element of X.
      PADDLE_ENFORCE(alpha_size == product(x_dim),
                     "For element-wise mode, size of weight Alpha must be "
                     "equal to the number of input, should be %d",
                     product(x_dim));
    } else {
      PADDLE_THROW("Unknown mode %s", mode);
    }
    ctx->ShareDim("X", /*->*/ "Out");
    ctx->ShareLoD("X", /*->*/ "Out");
  }

 protected:
  // The kernel data type is taken from Input(X); the device comes from the
  // execution context.
  framework::OpKernelType GetExpectedKernelType(
      const framework::ExecutionContext &ctx) const override {
    return framework::OpKernelType(
        OperatorWithKernel::IndicateVarDataType(ctx, "X"),
        ctx.device_context());
  }
};

// Declares the proto of the prelu operator: two inputs (X, Alpha), one
// output (Out), the user-facing documentation string, and the string
// attribute `mode`, which defaults to "all".
class PReluOpMaker : public framework::OpProtoAndCheckerMaker {
 public:
  void Make() override {
    // Inputs and output; the names here are the ones looked up by
    // PReluOp::InferShape ("X", "Alpha", "Out").
    AddInput("X", "The input tensor of prelu operator.");
    AddInput("Alpha", "The alpha weight of prelu operator.");
    AddOutput("Out", "The output tensor of prelu operator.");
    // Operator-level documentation (raw string, emitted verbatim).
    AddComment(R"DOC(
PRelu Operator.
The equation is:
$$
f(x) =
\begin{cases}
\alpha * x, \quad  \text{if} \ x < 0 \\
x,         \qquad  \text{if} \ x >= 0
\end{cases}
$$
The input `X` can carry the LoD (Level of Details) information,
or not. And the output shares the LoD information with input `X`.
There are modes:
  all: all elements share same weight
  channel: elements in a channel share same weight
  element: each element has a weight
)DOC");
    // Weight-sharing mode. PReluOp::InferShape accepts "all", "channel" and
    // "element" and throws on any other value.
    AddAttr<std::string>("mode", "The mode for inputs to share weights.")
        .SetDefault("all");
  }
};

// The operator to calculate gradients of a prelu operator.
//
// Requires Input(X) and Input(Out@GRAD). For each gradient output that is
// present (X@GRAD and/or Alpha@GRAD), the output takes the dimensions of the
// corresponding forward input.
class PReluGradOp : public framework::OperatorWithKernel {
 public:
  using framework::OperatorWithKernel::OperatorWithKernel;

  // Sets the dimensions of the gradient outputs that exist.
  //
  // Raises (via PADDLE_ENFORCE) when Input(X) or Input(Out@GRAD) is missing,
  // or when Alpha@GRAD is requested but Input(Alpha) is missing.
  void InferShape(framework::InferShapeContext *ctx) const override {
    PADDLE_ENFORCE(ctx->HasInput("X"), "Input(X) must not be null.");
    PADDLE_ENFORCE(ctx->HasInput(framework::GradVarName("Out")),
                   "Input(Out@GRAD) should not be null");
    const auto x_grad_name = framework::GradVarName("X");
    const auto alpha_grad_name = framework::GradVarName("Alpha");

    if (ctx->HasOutput(x_grad_name)) {
      ctx->SetOutputDim(x_grad_name, ctx->GetInputDim("X"));
    }
    if (ctx->HasOutput(alpha_grad_name)) {
      // Alpha's dimensions are only needed on this path, so validate its
      // presence here before querying them.
      PADDLE_ENFORCE(ctx->HasInput("Alpha"),
                     "Input(Alpha) should not be null");
      ctx->SetOutputDim(alpha_grad_name, ctx->GetInputDim("Alpha"));
    }
  }

 protected:
  // The kernel data type is taken from Input(X); the device comes from the
  // execution context.
  framework::OpKernelType GetExpectedKernelType(
      const framework::ExecutionContext &ctx) const override {
    return framework::OpKernelType(
        OperatorWithKernel::IndicateVarDataType(ctx, "X"),
        ctx.device_context());
  }
};

}  // namespace operators
}  // namespace paddle

// Short alias used by the registration macros below.
namespace ops = paddle::operators;

// Forward operator "prelu": operator class, proto maker, and the default
// grad-op makers for both framework::OpDesc and imperative::OpBase.
// NOTE(review): the meaning of the `true` template argument is defined by
// DefaultGradOpMaker and is not visible in this file -- confirm there.
REGISTER_OPERATOR(
    prelu, ops::PReluOp, ops::PReluOpMaker,
    paddle::framework::DefaultGradOpMaker<paddle::framework::OpDesc, true>,
    paddle::framework::DefaultGradOpMaker<paddle::imperative::OpBase, true>);
// Backward operator "prelu_grad"; registered with the operator class only.
REGISTER_OPERATOR(prelu_grad, ops::PReluGradOp);
// CPU kernels. Only the `float` instantiation is registered in this file for
// both the forward and the backward kernel.
REGISTER_OP_CPU_KERNEL(
    prelu, ops::PReluKernel<paddle::platform::CPUDeviceContext, float>);
REGISTER_OP_CPU_KERNEL(
    prelu_grad,
    ops::PReluGradKernel<paddle::platform::CPUDeviceContext, float>);
Fix the grammar in copyright. (#8403) 7 years ago			`/* Copyright (c) 2016 PaddlePaddle Authors. All Rights Reserved.`
unify the indentation of license 7 years ago			`Licensed under the Apache License, Version 2.0 (the "License");`
			`you may not use this file except in compliance with the License.`
			`You may obtain a copy of the License at`
			`http://www.apache.org/licenses/LICENSE-2.0`
			`Unless required by applicable law or agreed to in writing, software`
			`distributed under the License is distributed on an "AS IS" BASIS,`
			`WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.`
			`See the License for the specific language governing permissions and`
			`limitations under the License. */`
prelu op 8 years ago
Correct #include path 7 years ago			`#include "paddle/fluid/operators/prelu_op.h"`
remove net op and cond_op (#9663) * remove net op and cond_op * fix cpplint * fix dependency * delete backward_test; fix compile * disable batch_norm backward * rm test_net.py * make batchnorm test independent of backward.cc * make test_layer_norm_op independent of backward.cc * make test_layer_norm_op independent of backward.cc * delete unused code * clean up 7 years ago			`#include <string>`
prelu op 8 years ago
			`namespace paddle {`
			`namespace operators {`

fix 8 years ago			`class PReluOp : public framework::OperatorWithKernel {`
prelu op 8 years ago			`public:`
fix 8 years ago			`PReluOp(const std::string &type, const framework::VariableNameMap &inputs,`
prelu op 8 years ago			`const framework::VariableNameMap &outputs,`
			`const framework::AttributeMap &attrs)`
			`: OperatorWithKernel(type, inputs, outputs, attrs) {}`

rename InferShapeContextBase to InferShapeContext 8 years ago			`void InferShape(framework::InferShapeContext *ctx) const override {`
Add three modes for prelu_op (#12630) * Add three modes for prelu_op. 7 years ago			`std::string mode = ctx->Attrs().Get<std::string>("mode");`

			`auto x_dim = ctx->GetInputDim("X");`
add error_info prelu_op 7 years ago			`PADDLE_ENFORCE(ctx->HasInput("X"),`
			`"Input(X) of PreluOp should not be null");`
			`PADDLE_ENFORCE(ctx->HasInput("Alpha"),`
			`"Input(Alpha) of PreluOp should not be null");`
Add three modes for prelu_op (#12630) * Add three modes for prelu_op. 7 years ago
add error_info prelu_op 7 years ago			`PADDLE_ENFORCE(ctx->HasOutput("Out"),`
			`"Output(Out) of PreluOp should not be null");`
Add three modes for prelu_op (#12630) * Add three modes for prelu_op. 7 years ago			`if (mode == "all") {`
			`PADDLE_ENFORCE(product(ctx->GetInputDim("Alpha")) == 1,`
			`"For mode 'all', size of weight Alpha must be one.");`
			`} else if (mode == "channel") {`
			`PADDLE_ENFORCE(product(ctx->GetInputDim("Alpha")) == x_dim[1],`
			`"For channel-wise mode, size of weight Alpha must be "`
			`"equal to the number of channels, should be %d",`
			`x_dim[1]);`
			`} else if (mode == "element") {`
			`PADDLE_ENFORCE(product(ctx->GetInputDim("Alpha")) == product(x_dim),`
			`"For element-wise mode, size of weight Alpha must be "`
			`"equal to the number of input, should be %d",`
			`product(x_dim));`
			`} else {`
			`PADDLE_THROW("Unkown mode %s", mode);`
			`}`
Set the right shape of selected_rows (#13723) * set the right shape of selected_rows test=develop * enhance check * fix activation_op * remove cast * use ShareDimInfo replace SetDim and ShareLod * use ShareDimAndLod test=develop * follow comment test=develop * check whether the input has lod test=develop * Split ShareDimAndLod test=develop * checkout clip.py test=develop 7 years ago			`ctx->ShareDim("X", /->/ "Out");`
Refactoring InferShape (#3946) * init Infershape * add static InferShape interface * refactor add-op infershape * add AttrReader * add all maker's infershape * add all InferShape * add python infer api * add VarDesc interface * add python VarDesc and OpDesc interface * update python code * use infershape function to do shape inference * clean code * do not use pointer * refine code of op_proto_maker * add get_dims to VarDesc * refine the code * remove the dependency from operator to op registry * remove OpProtoAndCheckerMaker from operator * restore complete_add_op * add shape_infer_impl.h * code optimization * remove const return value * add fake BlockDesc class * optimize code * remove infer function in op_info * move InferShapeContextImpl to operator.h * optimize the interface of InferShapeContextBase * add temperary interface of new infershape * change add_op, clip_op, conv2d_op and activation_op * change all operators InferShape * fix SetDim * update cos_sim_op * update crop_op * update lookup_table_op * allocate tensor when call GetDim in InferShapeContext * update modified_huber_loss_op * update rowwise_add_op * update mean_op * update sequence_avg_pool_op * typo * remove old InferShape interface * can compile * fix or unit test * clean code * clean code * remove const before InferShapeContext * change InferenceContextBase to pointer * rename RunTime to Runtime, code clean 8 years ago			`ctx->ShareLoD("X", /->/ "Out");`
prelu op 8 years ago			`}`
Add three modes for prelu_op (#12630) * Add three modes for prelu_op. 7 years ago
			`protected:`
			`framework::OpKernelType GetExpectedKernelType(`
			`const framework::ExecutionContext &ctx) const override {`
Replace risky GetInputType method with secure IndicateVarDataType interface (#20668) * replace part of the old implementation, test=develop * restore concat op, test=develop * update all ops implemention & delete GetDataTypeOfVar func, test=develop 5 years ago			`return framework::OpKernelType(`
			`OperatorWithKernel::IndicateVarDataType(ctx, "X"),`
			`ctx.device_context());`
Add three modes for prelu_op (#12630) * Add three modes for prelu_op. 7 years ago			`}`
prelu op 8 years ago			`};`

fix 8 years ago			`class PReluOpMaker : public framework::OpProtoAndCheckerMaker {`
prelu op 8 years ago			`public:`
Clean OpProtoAndCheckerMaker Do not use ctor * Reduce line of codes. * We can use virtual function for Maker now. * The implementation does not care what maker holds, it is easier to refactor later. 7 years ago			`void Make() override {`
prelu_op 8 years ago			`AddInput("X", "The input tensor of prelu operator.");`
Polish operator docs (n to p) (#5376) * polish p ops * fix precision_recall * fix linear_chain_crf_op * small fix 7 years ago			`AddInput("Alpha", "The alpha weight of prelu operator.");`
			`AddOutput("Out", "The output tensor of prelu operator.");`
			`AddComment(R"DOC(`
			`PRelu Operator.`
prelu op 8 years ago			`The equation is:`
Polish operator docs (n to p) (#5376) * polish p ops * fix precision_recall * fix linear_chain_crf_op * small fix 7 years ago			`$$`
			`f(x) =`
			`\begin{cases}`
			`\alpha * x, \quad \text{if} \ x < 0 \\`
			`x, \qquad \text{if} \ x >= 0`
			`\end{cases}`
			`$$`
Share LoD between input and output of each opeators. 8 years ago			The input `X` can carry the LoD (Level of Details) information,
Polish operator docs (n to p) (#5376) * polish p ops * fix precision_recall * fix linear_chain_crf_op * small fix 7 years ago			or not. And the output shares the LoD information with input `X`.
Add cuda implementation for `prelu` backward pass (#18633) * Add GPU implementation for `prelu` backward pass test=develop * Fix logic error in `prelu` GPU backward and simplify a bit test=develop * Fix `prelu` backward CUDA implementation test=develop CPU version was not used actually, so test passed 6 years ago			`There are modes:`
Add three modes for prelu_op (#12630) * Add three modes for prelu_op. 7 years ago			`all: all elements share same weight`
			`channel: elements in a channel share same weight`
Add cuda implementation for `prelu` backward pass (#18633) * Add GPU implementation for `prelu` backward pass test=develop * Fix logic error in `prelu` GPU backward and simplify a bit test=develop * Fix `prelu` backward CUDA implementation test=develop CPU version was not used actually, so test passed 6 years ago			`element: each element has a weight`
prelu op 8 years ago			`)DOC");`
Add three modes for prelu_op (#12630) * Add three modes for prelu_op. 7 years ago			`AddAttr<std::string>("mode", "The mode for inputs to share weights.")`
			`.SetDefault("all");`
prelu op 8 years ago			`}`
			`};`

			`// The operator to calculate gradients of a prelu operator.`
fix 8 years ago			`class PReluGradOp : public framework::OperatorWithKernel {`
prelu op 8 years ago			`public:`
			`using framework::OperatorWithKernel::OperatorWithKernel;`

rename InferShapeContextBase to InferShapeContext 8 years ago			`void InferShape(framework::InferShapeContext *ctx) const override {`
Refactoring InferShape (#3946) * init Infershape * add static InferShape interface * refactor add-op infershape * add AttrReader * add all maker's infershape * add all InferShape * add python infer api * add VarDesc interface * add python VarDesc and OpDesc interface * update python code * use infershape function to do shape inference * clean code * do not use pointer * refine code of op_proto_maker * add get_dims to VarDesc * refine the code * remove the dependency from operator to op registry * remove OpProtoAndCheckerMaker from operator * restore complete_add_op * add shape_infer_impl.h * code optimization * remove const return value * add fake BlockDesc class * optimize code * remove infer function in op_info * move InferShapeContextImpl to operator.h * optimize the interface of InferShapeContextBase * add temperary interface of new infershape * change add_op, clip_op, conv2d_op and activation_op * change all operators InferShape * fix SetDim * update cos_sim_op * update crop_op * update lookup_table_op * allocate tensor when call GetDim in InferShapeContext * update modified_huber_loss_op * update rowwise_add_op * update mean_op * update sequence_avg_pool_op * typo * remove old InferShape interface * can compile * fix or unit test * clean code * clean code * remove const before InferShapeContext * change InferenceContextBase to pointer * rename RunTime to Runtime, code clean 8 years ago			`PADDLE_ENFORCE(ctx->HasInput("X"), "Input(X) must not be null.");`
			`PADDLE_ENFORCE(ctx->HasInput(framework::GradVarName("Out")),`
			`"Input(Out@GRAD) should not be null");`
Add three modes for prelu_op (#12630) * Add three modes for prelu_op. 7 years ago			`auto x_grad_name = framework::GradVarName("X");`
			`auto alpha_grad_name = framework::GradVarName("Alpha");`

			`if (ctx->HasOutput(x_grad_name)) {`
			`ctx->SetOutputDim(x_grad_name, ctx->GetInputDim("X"));`
			`}`
			`if (ctx->HasOutput(alpha_grad_name)) {`
			`ctx->SetOutputDim(alpha_grad_name, ctx->GetInputDim("Alpha"));`
			`}`
			`}`

			`protected:`
			`framework::OpKernelType GetExpectedKernelType(`
			`const framework::ExecutionContext &ctx) const override {`
Replace risky GetInputType method with secure IndicateVarDataType interface (#20668) * replace part of the old implementation, test=develop * restore concat op, test=develop * update all ops implemention & delete GetDataTypeOfVar func, test=develop 5 years ago			`return framework::OpKernelType(`
			`OperatorWithKernel::IndicateVarDataType(ctx, "X"),`
			`ctx.device_context());`
prelu op 8 years ago			`}`
			`};`

			`} // namespace operators`
			`} // namespace paddle`

			`namespace ops = paddle::operators;`

GradMaker for dygraph (#19706) * refactor dygraph,test=develop * fix failed unittest,test=develop * polish code,test=develop * check windows ci error,test=develop try to fix windows ci error by np.allclose,test=develop * polish vlog and profiler, test=develop * try to fix preceding ops order,test=develop * test transformer in windows ci, test=develop * use python c-api to speed up tracer.trace,test=develop * test=develop, fix docker with paddle nccl problem * test=develop, add ut for debug string and gradient_accumulator * test=develop, add tests for layer/gradient_accumulator/prepared_op * test=develop, fix complie error for test_prepared_op * test=develop, add more ut for dygraph * test=develop, create API.spec for dygraph api change * optimize grad maker; test=develop * optimize grad maker * test * grad make optim; test=develop * fix unittest bugs; test=develop * add dygraph grad op maker and split_op * grad op maker refactor; test=develop * add dygraph grad maker; test=develop * fix op deformable_conv_v1_op bug; test=develop * fix deformable_conv prroi pool bugs; * fix new op grad op maker bug; test=develop * fix split by ref bug; test=develop * fix dygraph auto prune bug; test=develop * fix test_trace bug; test=develop * fix fused emb seq pool bug; test=develop * remove useless code in op_desc file; test=develop * remove useless code, StrVarBaseNode; test=develop * fix review issues; test=develop * fix rank_loss grad maker; test=develop * remove flag in VarBase; test=develop * fix distributed_notify_op compile bug ; test=develop * fix reshape op double grad; test=develop * fix expand as op; test=develop * add impertive type_defs.h for demo_train; test=develop * fix inference lib cmake; test=develop * fix inference lib; test=develop * fix infernce_lib; test=develop * fix inference cmake; test=develop * fix inference lib; test=develop * fix inference lib; test=develop * remove condition dygraph grad maker, modify local name; test=develop * fix split grad maker 
bug; test=develop * fix pyramid_op bug; test=develop * change travis time out limit; test=develop * restore travis; test=develop * change timeout limit; test=develop 5 years ago			`REGISTER_OPERATOR(`
			`prelu, ops::PReluOp, ops::PReluOpMaker,`
			`paddle::framework::DefaultGradOpMaker<paddle::framework::OpDesc, true>,`
			`paddle::framework::DefaultGradOpMaker<paddle::imperative::OpBase, true>);`
add semicolon to op registry (#10034) * script to add semicolon * fix typo 7 years ago			`REGISTER_OPERATOR(prelu_grad, ops::PReluGradOp);`
Refine device context (#6433) There are mainly following fixes: - take `DeviceContext` as the template parameter of math functors and OpKernel instead of `Place` - remove `eigen_device` interface in base class `DeviceContext` - remove `GetEigenDevice` interface in `ExecutionContext` and base class `DeviceContext` - remove unused `platform::EigenDeviceConverter` - rename `REGISTER_OP_GPU_KERNEL` to `REGISTER_OP_CUDA_KERNEL` - rename `USE_GPU_ONLY_OP` to `USE_CUDA_ONLY_OP` 7 years ago			`REGISTER_OP_CPU_KERNEL(`
			`prelu, ops::PReluKernel<paddle::platform::CPUDeviceContext, float>);`
			`REGISTER_OP_CPU_KERNEL(`
			`prelu_grad,`
			`ops::PReluGradKernel<paddle::platform::CPUDeviceContext, float>);`