Paddle/paddle/fluid/operators/average_accumulates_op.cc

/* Copyright (c) 2018 PaddlePaddle Authors. All Rights Reserved.

Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

    http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License. */

#include "paddle/fluid/operators/average_accumulates_op.h"

namespace paddle {
namespace operators {

// CPU specialization of GetAccumulators.
//
// Looks up the three counter inputs ("in_old_num_accumulates",
// "in_num_accumulates", "in_num_updates") on the execution context and copies
// the first int64_t element of each into the matching out-parameter.
template <>
void GetAccumulators<paddle::platform::CPUDeviceContext>(
    const framework::ExecutionContext& ctx, int64_t* num_updates,
    int64_t* num_accumulates, int64_t* old_num_accumulates) {
  // Resolve all input tensors first, then read their leading element.
  auto* old_accumulates_tensor = ctx.Input<Tensor>("in_old_num_accumulates");
  auto* accumulates_tensor = ctx.Input<Tensor>("in_num_accumulates");
  auto* updates_tensor = ctx.Input<Tensor>("in_num_updates");

  *old_num_accumulates = *old_accumulates_tensor->data<int64_t>();
  *num_accumulates = *accumulates_tensor->data<int64_t>();
  *num_updates = *updates_tensor->data<int64_t>();
}

// CPU specialization of SetAccumulators.
//
// Looks up the three counter outputs ("out_old_num_accumulates",
// "out_num_accumulates", "out_num_updates") on the execution context and
// stores the given values into the first int64_t element of each.
template <>
void SetAccumulators<paddle::platform::CPUDeviceContext>(
    const framework::ExecutionContext& ctx, int64_t num_updates,
    int64_t num_accumulates, int64_t old_num_accumulates) {
  // Resolve all output tensors first, then write their leading element.
  auto* old_accumulates_tensor = ctx.Output<Tensor>("out_old_num_accumulates");
  auto* accumulates_tensor = ctx.Output<Tensor>("out_num_accumulates");
  auto* updates_tensor = ctx.Output<Tensor>("out_num_updates");

  *old_accumulates_tensor->data<int64_t>() = old_num_accumulates;
  *accumulates_tensor->data<int64_t>() = num_accumulates;
  *updates_tensor->data<int64_t>() = num_updates;
}

// Operator definition for `average_accumulates`.
//
// InferShape verifies that every input and output slot is present and then
// derives the output shapes: the three sum outputs take the shape of "param",
// and the three counter outputs are given shape {1}.
class AverageAccumulatesOp : public framework::OperatorWithKernel {
 public:
  using framework::OperatorWithKernel::OperatorWithKernel;

  void InferShape(framework::InferShapeContext* ctx) const override {
    // Each message names the exact slot being checked so that a failure can
    // be matched directly against the op's declared inputs and outputs.
    PADDLE_ENFORCE(
        ctx->HasInput("param"),
        "Input (param) of average_accumulates op should not be null.");
    PADDLE_ENFORCE(
        ctx->HasInput("in_sum_1"),
        "Input (in_sum_1) of average_accumulates op should not be null.");
    PADDLE_ENFORCE(
        ctx->HasInput("in_sum_2"),
        "Input (in_sum_2) of average_accumulates op should not be null.");
    PADDLE_ENFORCE(
        ctx->HasInput("in_sum_3"),
        "Input (in_sum_3) of average_accumulates op should not be null.");
    PADDLE_ENFORCE(
        ctx->HasInput("in_num_accumulates"),
        "Input (in_num_accumulates) of average_accumulates op should "
        "not be null.");
    PADDLE_ENFORCE(ctx->HasInput("in_old_num_accumulates"),
                   "Input (in_old_num_accumulates) of average_accumulates op "
                   "should not be null.");
    PADDLE_ENFORCE(
        ctx->HasInput("in_num_updates"),
        "Input (in_num_updates) of average_accumulates op should not be "
        "null.");

    PADDLE_ENFORCE(
        ctx->HasOutput("out_sum_1"),
        "Output (out_sum_1) of average_accumulates op should not be null.");
    PADDLE_ENFORCE(
        ctx->HasOutput("out_sum_2"),
        "Output (out_sum_2) of average_accumulates op should not be null.");
    PADDLE_ENFORCE(
        ctx->HasOutput("out_sum_3"),
        "Output (out_sum_3) of average_accumulates op should not be null.");
    PADDLE_ENFORCE(ctx->HasOutput("out_num_accumulates"),
                   "Output (out_num_accumulates) of average_accumulates op "
                   "should not be null.");
    PADDLE_ENFORCE(ctx->HasOutput("out_old_num_accumulates"),
                   "Output (out_old_num_accumulates) of average_accumulates "
                   "op should not be null.");
    PADDLE_ENFORCE(
        ctx->HasOutput("out_num_updates"),
        "Output (out_num_updates) of average_accumulates op should not be "
        "null.");

    auto in_dim = ctx->GetInputDim("param");

    // The sum accumulators mirror the parameter's shape.
    ctx->SetOutputDim("out_sum_1", in_dim);
    ctx->SetOutputDim("out_sum_2", in_dim);
    ctx->SetOutputDim("out_sum_3", in_dim);
    // The counters are single-element tensors.
    ctx->SetOutputDim("out_num_accumulates", {1});
    ctx->SetOutputDim("out_old_num_accumulates", {1});
    ctx->SetOutputDim("out_num_updates", {1});
  }

 protected:
  // The kernel's data type is taken from the "param" input; the place is the
  // one reported by the execution context.
  framework::OpKernelType GetExpectedKernelType(
      const framework::ExecutionContext& ctx) const override {
    return framework::OpKernelType(
        OperatorWithKernel::IndicateVarDataType(ctx, "param"), ctx.GetPlace());
  }
};

// Declares the inputs, outputs, attributes and documentation of the
// `average_accumulates` operator.
//
// Every accumulator appears twice, as an `in_*` input and an `out_*` output.
// Attributes: `average_window` (float, default 0), `max_average_window`
// (int64_t, no default set here) and `min_average_window` (int64_t, default
// 10000).
class AverageAccumulatesOpMaker : public framework::OpProtoAndCheckerMaker {
 public:
  void Make() override {
    AddInput("param", "(Tensor), The parameter to be accumulated.");
    AddInput("in_sum_1",
             "(Tensor), A tensor used to store the parameter "
             "sums with the same shape as input(param).");
    AddInput("in_sum_2",
             "(Tensor), An auxiliary tensor to help "
             "accumulating sums of parameter values with the same shape as "
             "input(param). It is used to avoid loss of precision due to too "
             "many sums.");
    AddInput("in_sum_3",
             "(Tensor), An auxiliary tensor to help "
             "accumulating sums of parameter values with the same shape as "
             "input(param).");
    AddInput("in_num_accumulates",
             "(Tensor<int64_t>), The accumulating times of current window with "
             "shape [1].");
    AddInput(
        "in_old_num_accumulates",
        "(Tensor<int64_t>), The accumulating times of previous window with "
        "shape [1].");
    AddInput("in_num_updates",
             "(Tensor<int64_t>), The total number of batches used by training "
             "before this batch with shape [1].");

    AddOutput("out_sum_1",
              "(Tensor), A tensor used to store the "
              "parameter sums with the same shape as input(param).");
    AddOutput("out_sum_2",
              "(Tensor), An auxiliary tensor to help "
              "accumulating sums of parameter values with the same shape as "
              "input(param). It is used to avoid loss of precision due to too "
              "many sums.");
    AddOutput("out_sum_3",
              "(Tensor), An auxiliary tensor to help "
              "accumulating sums of parameter values with the same shape as "
              "input(param).");
    AddOutput(
        "out_num_accumulates",
        "(Tensor<int64_t>), The accumulating times of current window with "
        "shape [1].");
    AddOutput(
        "out_old_num_accumulates",
        "(Tensor<int64_t>), The accumulating times of previous window with "
        "shape [1].");
    AddOutput("out_num_updates",
              "(Tensor<int64_t>), The total number of batches used by training "
              "before this batch with shape [1].");

    AddAttr<float>("average_window",
                   "(float, default 0) "
                   "The rate of average window size relative to num_updates.")
        .SetDefault(0);
    // No default is set for max_average_window in this maker.
    AddAttr<int64_t>("max_average_window",
                     "(int64_t) "
                     "Maximum size of average window. It suggests that the "
                     "number of mini-batches "
                     "in one pass is an appropriate value to set.");
    AddAttr<int64_t>("min_average_window",
                     "(int64_t, default 10000L) "
                     "Minimum size of average window.")
        .SetDefault(10000L);

    AddComment(R"DOC(
AverageAccumulates Operator.
Accumulate the sum of parameter within sliding window. The size of sliding window is
determined by 'average_window', 'max_average_window' and 'min_average_window'.
Memory was shared by Input(in_sum_1) and Output(out_sum_1) which acts as an accumulator 'sum_1'.
'sum_2', 'sum_3', 'num_accumulates', 'old_num_accumulates' and 'num_updates' were the same as 'sum_1'.

All the accumulators were inited to zero before training.

And for a mini-batch in training, accumulators were computed as below steps:
    num_updates += 1
    num_accumulates += 1
    sum_1 += param
    if num_updates % kMaxNumAccumulates == 0:
        sum_2 += sum_1
        sum_1 = 0
    if num_accumulates >= min_average_window && num_accumulates >= min(max_average_window, num_updates * average_window):
        sum_3 = sum_1 + sum_2
        sum_1 = 0
        sum_2 = 0
        old_num_accumulates = num_accumulates
        num_accumulates = 0

)DOC");
  }
};

}  // namespace operators
}  // namespace paddle

// Short alias for the operator namespace, used by the registration macros
// below.
namespace ops = paddle::operators;
// Register the `average_accumulates` operator with its definition class
// (AverageAccumulatesOp) and its proto maker (AverageAccumulatesOpMaker).
// EmptyGradOpMaker is supplied for both framework::OpDesc and
// imperative::OpBase.
// NOTE(review): presumably this means the op has no gradient op -- confirm
// against the EmptyGradOpMaker definition.
REGISTER_OPERATOR(
    average_accumulates, ops::AverageAccumulatesOp,
    ops::AverageAccumulatesOpMaker,
    paddle::framework::EmptyGradOpMaker<paddle::framework::OpDesc>,
    paddle::framework::EmptyGradOpMaker<paddle::imperative::OpBase>);
// Register the CPU kernels for `average_accumulates`, instantiated for float
// and double element types.
REGISTER_OP_CPU_KERNEL(
    average_accumulates,
    ops::AverageAccumulatesKernel<paddle::platform::CPUDeviceContext, float>,
    ops::AverageAccumulatesKernel<paddle::platform::CPUDeviceContext, double>);
Refine average accumulates op 1. Rename inputs and outputs 2. Add some comments 7 years ago			`/* Copyright (c) 2018 PaddlePaddle Authors. All Rights Reserved.`
Add sum accumulator with window for model average 7 years ago
			`Licensed under the Apache License, Version 2.0 (the "License");`
			`you may not use this file except in compliance with the License.`
			`You may obtain a copy of the License at`

			`http://www.apache.org/licenses/LICENSE-2.0`

			`Unless required by applicable law or agreed to in writing, software`
			`distributed under the License is distributed on an "AS IS" BASIS,`
			`WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.`
			`See the License for the specific language governing permissions and`
			`limitations under the License. */`

			`#include "paddle/fluid/operators/average_accumulates_op.h"`

			`namespace paddle {`
			`namespace operators {`

			`template <>`
Refine sum_accumulates_op. 7 years ago			`void GetAccumulators<paddle::platform::CPUDeviceContext>(`
small AverageOptimizer enhance. (#11761) * small AverageOptimizer enhance. * clean * clean 7 years ago			`const framework::ExecutionContext& ctx, int64_t* num_updates,`
			`int64_t* num_accumulates, int64_t* old_num_accumulates) {`
Refine average accumulates op 1. Rename inputs and outputs 2. Add some comments 7 years ago			`auto* in_old_num_accumulates = ctx.Input<Tensor>("in_old_num_accumulates");`
			`auto* in_num_accumulates = ctx.Input<Tensor>("in_num_accumulates");`
			`auto* in_num_updates = ctx.Input<Tensor>("in_num_updates");`
Add sum accumulator with window for model average 7 years ago
small AverageOptimizer enhance. (#11761) * small AverageOptimizer enhance. * clean * clean 7 years ago			`*old_num_accumulates = in_old_num_accumulates->data<int64_t>()[0];`
			`*num_accumulates = in_num_accumulates->data<int64_t>()[0];`
			`*num_updates = in_num_updates->data<int64_t>()[0];`
Add sum accumulator with window for model average 7 years ago			`}`

			`template <>`
Refine sum_accumulates_op. 7 years ago			`void SetAccumulators<paddle::platform::CPUDeviceContext>(`
small AverageOptimizer enhance. (#11761) * small AverageOptimizer enhance. * clean * clean 7 years ago			`const framework::ExecutionContext& ctx, int64_t num_updates,`
			`int64_t num_accumulates, int64_t old_num_accumulates) {`
Refine average accumulates op 1. Rename inputs and outputs 2. Add some comments 7 years ago			`auto* out_old_num_accumulates = ctx.Output<Tensor>("out_old_num_accumulates");`
			`auto* out_num_accumulates = ctx.Output<Tensor>("out_num_accumulates");`
			`auto* out_num_updates = ctx.Output<Tensor>("out_num_updates");`
Add sum accumulator with window for model average 7 years ago
small AverageOptimizer enhance. (#11761) * small AverageOptimizer enhance. * clean * clean 7 years ago			`out_old_num_accumulates->data<int64_t>()[0] = old_num_accumulates;`
			`out_num_accumulates->data<int64_t>()[0] = num_accumulates;`
			`out_num_updates->data<int64_t>()[0] = num_updates;`
Add sum accumulator with window for model average 7 years ago			`}`

			`class AverageAccumulatesOp : public framework::OperatorWithKernel {`
			`public:`
			`using framework::OperatorWithKernel::OperatorWithKernel;`

			`void InferShape(framework::InferShapeContext* ctx) const override {`
			`PADDLE_ENFORCE(`
Refine average accumulates op 1. Rename inputs and outputs 2. Add some comments 7 years ago			`ctx->HasInput("param"),`
			`"Input (param) of average_accumulates op should not be null.");`
Add sum accumulator with window for model average 7 years ago			`PADDLE_ENFORCE(`
Refine average accumulates op 1. Rename inputs and outputs 2. Add some comments 7 years ago			`ctx->HasInput("in_sum_1"),`
Add sum accumulator with window for model average 7 years ago			`"Input (sum_1) of average_accumulates op should not be null.");`
			`PADDLE_ENFORCE(`
Refine average accumulates op 1. Rename inputs and outputs 2. Add some comments 7 years ago			`ctx->HasInput("in_sum_2"),`
Add sum accumulator with window for model average 7 years ago			`"Input (sum_2) of average_accumulates op should not be null.");`
			`PADDLE_ENFORCE(`
Refine average accumulates op 1. Rename inputs and outputs 2. Add some comments 7 years ago			`ctx->HasInput("in_sum_3"),`
Add sum accumulator with window for model average 7 years ago			`"Input (sum_3) of average_accumulates op should not be null.");`
Refine average accumulates op 1. Rename inputs and outputs 2. Add some comments 7 years ago			`PADDLE_ENFORCE(`
			`ctx->HasInput("in_num_accumulates"),`
			`"Input (in_num_accumulates) of average_accumulates op should "`
			`"not be null.");`
			`PADDLE_ENFORCE(ctx->HasInput("in_old_num_accumulates"),`
Add sum accumulator with window for model average 7 years ago			`"Input (old_num_accumulates) of average_accumulates op "`
			`"should not be null.");`
			`PADDLE_ENFORCE(`
Refine average accumulates op 1. Rename inputs and outputs 2. Add some comments 7 years ago			`ctx->HasInput("in_num_updates"),`
Add sum accumulator with window for model average 7 years ago			`"Input (num_updates) of average_accumulates op should not be null.");`

			`PADDLE_ENFORCE(`
Refine average accumulates op 1. Rename inputs and outputs 2. Add some comments 7 years ago			`ctx->HasOutput("out_sum_1"),`
Add sum accumulator with window for model average 7 years ago			`"Output (sum_1) of average_accumulates op should not be null.");`
			`PADDLE_ENFORCE(`
Refine average accumulates op 1. Rename inputs and outputs 2. Add some comments 7 years ago			`ctx->HasOutput("out_sum_2"),`
Add sum accumulator with window for model average 7 years ago			`"Output (sum_2) of average_accumulates op should not be null.");`
			`PADDLE_ENFORCE(`
Refine average accumulates op 1. Rename inputs and outputs 2. Add some comments 7 years ago			`ctx->HasOutput("out_sum_3"),`
Add sum accumulator with window for model average 7 years ago			`"Output (sum_3) of average_accumulates op should not be null.");`
Refine average accumulates op 1. Rename inputs and outputs 2. Add some comments 7 years ago			`PADDLE_ENFORCE(ctx->HasOutput("out_num_accumulates"),`
Add sum accumulator with window for model average 7 years ago			`"Output (num_accumulates) of average_accumulates op should "`
			`"not be null.");`
Refine average accumulates op 1. Rename inputs and outputs 2. Add some comments 7 years ago			`PADDLE_ENFORCE(ctx->HasOutput("out_old_num_accumulates"),`
Add sum accumulator with window for model average 7 years ago			`"Output (old_num_accumulates) of average_accumulates op "`
			`"should not be null.");`
			`PADDLE_ENFORCE(`
Refine average accumulates op 1. Rename inputs and outputs 2. Add some comments 7 years ago			`ctx->HasOutput("out_num_updates"),`
Add sum accumulator with window for model average 7 years ago			`"Output (num_updates) of average_accumulates op should not be null.");`

Refine average accumulates op 1. Rename inputs and outputs 2. Add some comments 7 years ago			`auto in_dim = ctx->GetInputDim("param");`
Add sum accumulator with window for model average 7 years ago
Refine average accumulates op 1. Rename inputs and outputs 2. Add some comments 7 years ago			`ctx->SetOutputDim("out_sum_1", in_dim);`
			`ctx->SetOutputDim("out_sum_2", in_dim);`
			`ctx->SetOutputDim("out_sum_3", in_dim);`
			`ctx->SetOutputDim("out_num_accumulates", {1});`
			`ctx->SetOutputDim("out_old_num_accumulates", {1});`
			`ctx->SetOutputDim("out_num_updates", {1});`
Add sum accumulator with window for model average 7 years ago			`}`

			`protected:`
			`framework::OpKernelType GetExpectedKernelType(`
			`const framework::ExecutionContext& ctx) const override {`
Replace risky GetInputType method with secure IndicateVarDataType interface (#20668) * replace part of the old implementation, test=develop * restore concat op, test=develop * update all ops implemention & delete GetDataTypeOfVar func, test=develop 5 years ago			`return framework::OpKernelType(`
			`OperatorWithKernel::IndicateVarDataType(ctx, "param"), ctx.GetPlace());`
Add sum accumulator with window for model average 7 years ago			`}`
			`};`

			`class AverageAccumulatesOpMaker : public framework::OpProtoAndCheckerMaker {`
			`public:`
Clean OpProtoAndCheckerMaker Do not use ctor * Reduce line of codes. * We can use virtual function for Maker now. * The implementation does not care what maker holds, it is easier to refactor later. 7 years ago			`void Make() override {`
Refine sum_accumulates_op. 7 years ago			`AddInput("param", "(Tensor), The parameter to be accumulated.");`
Refine average accumulates op 1. Rename inputs and outputs 2. Add some comments 7 years ago			`AddInput("in_sum_1",`
Refine sum_accumulates_op. 7 years ago			`"(Tensor), A tensor used to store the parameter "`
Refine average accumulates op 1. Rename inputs and outputs 2. Add some comments 7 years ago			`"sums with the same shape as input(param).");`
			`AddInput("in_sum_2",`
Refine sum_accumulates_op. 7 years ago			`"(Tensor), A auxiliary tensor to help "`
Refine average accumulates op 1. Rename inputs and outputs 2. Add some comments 7 years ago			`"accumulating sums of parameter values with the same shape as "`
			`"input(param). It is used to avoid loss of precision due to too "`
			`"many sums.");`
			`AddInput("in_sum_3",`
Refine sum_accumulates_op. 7 years ago			`"(Tensor), A auxiliary tensor to help "`
Refine average accumulates op 1. Rename inputs and outputs 2. Add some comments 7 years ago			`"accumulating sums of parameter values with the same shape as "`
			`"input(param).");`
			`AddInput("in_num_accumulates",`
Refine sum_accumulates_op. 7 years ago			`"(Tensor<int64_t>), The accumulating times of current window with "`
Refine average accumulates op 1. Rename inputs and outputs 2. Add some comments 7 years ago			`"shape [1].");`
Refine sum_accumulates_op. 7 years ago			`AddInput(`
			`"in_old_num_accumulates",`
			`"(Tensor<int64_t>), The accumulating times of previous window with "`
			`"shape [1].");`
Refine average accumulates op 1. Rename inputs and outputs 2. Add some comments 7 years ago			`AddInput("in_num_updates",`
fix typo words (#22653) 5 years ago			`"(Tensor<int64_t>), The total number of batches used by training "`
Refine average accumulates op 1. Rename inputs and outputs 2. Add some comments 7 years ago			`"before this batch with shape [1].");`

			`AddOutput("out_sum_1",`
Refine sum_accumulates_op. 7 years ago			`"(Tensor), A tensor used to store the "`
Refine average accumulates op 1. Rename inputs and outputs 2. Add some comments 7 years ago			`"parameter sums with the same shape as input(param).");`
			`AddOutput("out_sum_2",`
Refine sum_accumulates_op. 7 years ago			`"(Tensor), A auxiliary tensor to help "`
Refine average accumulates op 1. Rename inputs and outputs 2. Add some comments 7 years ago			`"accumulating sums of parameter values with the same shape as "`
			`"input(param). It is used to avoid loss of precision due to too "`
			`"many sums.");`
			`AddOutput("out_sum_3",`
Refine sum_accumulates_op. 7 years ago			`"(Tensor), A auxiliary tensor to help "`
Refine average accumulates op 1. Rename inputs and outputs 2. Add some comments 7 years ago			`"accumulating sums of parameter values with the same shape as "`
			`"input(param).");`
Refine sum_accumulates_op. 7 years ago			`AddOutput(`
			`"out_num_accumulates",`
			`"(Tensor<int64_t>), The accumulating times of current window with "`
			`"shape [1].");`
			`AddOutput(`
			`"out_old_num_accumulates",`
			`"(Tensor<int64_t>) The accumulating times of previous window with "`
			`"shape [1].");`
fix typo words (#22653) 5 years ago			`AddOutput("out_num_updates",`
			`"(Tensor<int64_t>), The total number of batches used by training "`
			`"before this batch with shape [1].");`
Refine average accumulates op 1. Rename inputs and outputs 2. Add some comments 7 years ago
			`AddAttr<float>("average_window",`
Refine sum_accumulates_op. 7 years ago			`"(float, default 0) "`
			`"The rate of average window size relative to num_updates.")`
			`.SetDefault(0);`
			`AddAttr<int64_t>("max_average_window",`
			`"(int64_t) "`
			`"Maximum size of average window. It suggests that the "`
			`"number of mini-batches "`
			`"in one pass is appropriate value to set.");`
			`AddAttr<int64_t>("min_average_window",`
			`"(int64_t, default 10000L) "`
			`"Minimu size of average window.")`
			`.SetDefault(10000L);`
Add sum accumulator with window for model average 7 years ago
			`AddComment(R"DOC(`
			`AverageAccumulates Operator.`
small AverageOptimizer enhance. (#11761) * small AverageOptimizer enhance. * clean * clean 7 years ago			`Accumulate the sum of parameter within sliding window. The size of sliding window is`
Refine sum_accumulates_op. 7 years ago			`determined by 'average_window', 'max_average_window' and 'min_average_window'.`
			`Memory was shared by Input(in_sum_1) and Output(out_sum_1) which acts as an accumulator 'sum_1'.`
			`'sum_2', 'sum_3', 'num_accumulates', 'old_num_accumulates' and 'num_updates' were the same as 'sum_1'.`

			`All the accumulators were inited to zero before training.`

			`And for a mini-batch in training, accumulators were computed as below steps:`
			`num_updates += 1`
			`num_accumulates += 1`
			`sum_1 += param`
			`if num_updates % kMaxNumAccumulates == 0:`
			`sum_2 += sum_1`
			`sum_1 = 0`
			`if num_accumulates >= min_average_window && num_accumulates >= min(max_average_window, num_updates * average_window):`
			`sum_3 = sum_1 + sum_2`
			`sum_1 = 0`
			`sum_2 = 0`
			`old_num_accumulates = num_accumulates`
			`num_accumulates = 0`

Add sum accumulator with window for model average 7 years ago			`)DOC");`
			`}`
			`};`

			`} // namespace operators`
			`} // namespace paddle`

			`namespace ops = paddle::operators;`
GradMaker for dygraph (#19706) * refactor dygraph,test=develop * fix failed unittest,test=develop * polish code,test=develop * check windows ci error,test=develop try to fix windows ci error by np.allclose,test=develop * polish vlog and profiler, test=develop * try to fix preceding ops order,test=develop * test transformer in windows ci, test=develop * use python c-api to speed up tracer.trace,test=develop * test=develop, fix docker with paddle nccl problem * test=develop, add ut for debug string and gradient_accumulator * test=develop, add tests for layer/gradient_accumulator/prepared_op * test=develop, fix complie error for test_prepared_op * test=develop, add more ut for dygraph * test=develop, create API.spec for dygraph api change * optimize grad maker; test=develop * optimize grad maker * test * grad make optim; test=develop * fix unittest bugs; test=develop * add dygraph grad op maker and split_op * grad op maker refactor; test=develop * add dygraph grad maker; test=develop * fix op deformable_conv_v1_op bug; test=develop * fix deformable_conv prroi pool bugs; * fix new op grad op maker bug; test=develop * fix split by ref bug; test=develop * fix dygraph auto prune bug; test=develop * fix test_trace bug; test=develop * fix fused emb seq pool bug; test=develop * remove useless code in op_desc file; test=develop * remove useless code, StrVarBaseNode; test=develop * fix review issues; test=develop * fix rank_loss grad maker; test=develop * remove flag in VarBase; test=develop * fix distributed_notify_op compile bug ; test=develop * fix reshape op double grad; test=develop * fix expand as op; test=develop * add impertive type_defs.h for demo_train; test=develop * fix inference lib cmake; test=develop * fix inference lib; test=develop * fix infernce_lib; test=develop * fix inference cmake; test=develop * fix inference lib; test=develop * fix inference lib; test=develop * remove condition dygraph grad maker, modify local name; test=develop * fix split grad maker 
bug; test=develop * fix pyramid_op bug; test=develop * change travis time out limit; test=develop * restore travis; test=develop * change timeout limit; test=develop 5 years ago			`REGISTER_OPERATOR(`
			`average_accumulates, ops::AverageAccumulatesOp,`
			`ops::AverageAccumulatesOpMaker,`
			`paddle::framework::EmptyGradOpMaker<paddle::framework::OpDesc>,`
			`paddle::framework::EmptyGradOpMaker<paddle::imperative::OpBase>);`
Add sum accumulator with window for model average 7 years ago			`REGISTER_OP_CPU_KERNEL(`
Refine average accumulates op 1. Rename inputs and outputs 2. Add some comments 7 years ago			`average_accumulates,`
Add sum accumulator with window for model average 7 years ago			`ops::AverageAccumulatesKernel<paddle::platform::CPUDeviceContext, float>,`
			`ops::AverageAccumulatesKernel<paddle::platform::CPUDeviceContext, double>);`