Paddle/paddle/fluid/imperative/layer.cc

// Copyright (c) 2018 PaddlePaddle Authors. All Rights Reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

#include "paddle/fluid/imperative/layer.h"

#include <deque>
#include <limits>
#include <map>
#include <memory>
#include <random>
#include <string>
#include <unordered_set>
#include <utility>
#include <vector>

#include "paddle/fluid/framework/lod_tensor.h"
#include "paddle/fluid/framework/op_registry.h"
#include "paddle/fluid/framework/operator.h"
#include "paddle/fluid/framework/tensor_util.h"
#include "paddle/fluid/operators/math/blas.h"
#include "paddle/fluid/platform/device_context.h"
#include "paddle/fluid/string/printf.h"

namespace paddle {
namespace imperative {

// Registry of Python callables keyed by integer function id. Entries are
// written by PyLayer::RegisterFunc and looked up by PyLayer::Apply and
// PyLayer::ApplyGrad below.
std::map<int, py::object> py_funcs_;

using framework::Variable;

namespace detail {

// Place visitor that accumulates one buffer into another: y += x over
// `numel` elements of type T, using the BLAS AXPY routine of the device
// context that belongs to the visited place.
//
// Intended to be dispatched with boost::apply_visitor over a
// platform::Place. Places for which no BLAS backend is available throw.
template <typename T>
class TensorAddToFunctor : public boost::static_visitor<> {
 public:
  // numel: number of elements in both buffers.
  // x:     source buffer (read only).
  // y:     destination buffer, updated in place.
  TensorAddToFunctor(int64_t numel, const T* x, T* y)
      : numel_(numel), x_(x), y_(y) {}

  void operator()(const platform::CPUPlace& place) {
    platform::CPUDeviceContext* ctx = dynamic_cast<platform::CPUDeviceContext*>(
        platform::DeviceContextPool::Instance().Get(place));
    PADDLE_ENFORCE_NOT_NULL(ctx, "device context of place is not a CPU one");
    // Use the functor's own element type so that instantiations other than
    // float pick the matching BLAS routines.
    auto blas = operators::math::GetBlas<platform::CPUDeviceContext, T>(*ctx);
    blas.AXPY(numel_, static_cast<T>(1), x_, y_);
  }

#ifdef PADDLE_WITH_CUDA
  void operator()(const platform::CUDAPlace& place) {
    platform::CUDADeviceContext* ctx =
        dynamic_cast<platform::CUDADeviceContext*>(
            platform::DeviceContextPool::Instance().Get(place));
    PADDLE_ENFORCE_NOT_NULL(ctx, "device context of place is not a CUDA one");
    auto blas = operators::math::GetBlas<platform::CUDADeviceContext, T>(*ctx);
    blas.AXPY(numel_, static_cast<T>(1), x_, y_);
  }
#else
  // Built without CUDA: a CUDA place cannot be served.
  void operator()(const platform::CUDAPlace& place) {
    PADDLE_THROW("Do NOT support gradient merge in place %s", place);
  }
#endif

  // there is NO blas in CUDAPinnedPlace
  void operator()(const platform::CUDAPinnedPlace& place) {
    PADDLE_THROW("Do NOT support gradient merge in place %s", place);
  }

 private:
  int64_t numel_;
  const T* x_;
  T* y_;
};

}  // namespace detail

// Accumulates the float gradient stored in `src` into `dst` (dst += src) on
// `place`. Both variables are accessed as LoDTensors. An empty `src` is
// ignored; otherwise both tensors must have the same number of elements.
void AddGradTo(Variable* src, Variable* dst, platform::Place place) {
  framework::Tensor* accumulated = dst->GetMutable<framework::LoDTensor>();
  framework::Tensor* incoming = src->GetMutable<framework::LoDTensor>();

  // FIXME(minqiyang): loss_grad op will pass a zero grad of label
  // ugly fix for it
  const auto incoming_numel = incoming->numel();
  if (incoming_numel == 0) {
    return;
  }

  PADDLE_ENFORCE(accumulated->numel() == incoming_numel,
                 "dst_numel %lld vs. src_numel %lld", accumulated->numel(),
                 incoming_numel);

  const float* incoming_data = incoming->data<float>();
  float* accumulated_data = accumulated->mutable_data<float>(place);

  // Dispatch on the concrete place type to pick the right BLAS backend.
  detail::TensorAddToFunctor<float> add_to(incoming_numel, incoming_data,
                                           accumulated_data);
  boost::apply_visitor(add_to, place);
}

// Walks the graph of recorded ops backwards from a variable and invokes
// OpBase::ApplyGrad on each op once every op that consumes its outputs has
// been processed.
//
// The order is derived from a dependency count per op (see
// ComputeDepCounts): each processed op decrements the count of the ops that
// produced its inputs, and an op is scheduled when its count reaches zero.
class Autograd {
 public:
  Autograd() {}

  // Runs the backward pass starting at the op that produced `var`.
  // Does nothing when `var` has stop_gradient_ set or has no producing op.
  void RunBackward(VarBase* var) {
    if (var->stop_gradient_) {
      return;
    }
    // Without a producing op there is nothing to traverse; bail out instead
    // of dereferencing a null op below.
    if (!var->pre_op_) {
      return;
    }
    VLOG(3) << "start autograd";

    std::deque<OpBase*> ready;
    ready.push_back(var->pre_op_);

    std::map<OpBase*, int> dep_counts = ComputeDepCounts(var->pre_op_);

    while (!ready.empty()) {
      OpBase* ready_op = ready.front();
      ready.pop_front();
      const std::map<std::string, std::vector<VarBase*>> input_grads =
          ready_op->ApplyGrad();

      // Iterate by reference: each entry holds a string and a vector.
      for (const auto& it : input_grads) {
        const std::vector<VarBase*>& ingrads = it.second;
        for (size_t i = 0; i < ingrads.size(); ++i) {
          if (!ingrads[i]) continue;
          if (ready_op->input_vars_[it.first][i]->stop_gradient_) {
            continue;
          }
          OpBase* pre_op = ready_op->pre_ops_[it.first][i];
          if (!pre_op) continue;

          // Single lookup; the reference stays valid because std::map does
          // not relocate its nodes.
          int& pending = dep_counts[pre_op];
          pending -= 1;
          PADDLE_ENFORCE(pending >= 0);
          if (pending == 0) {
            ready.push_back(pre_op);
          }
        }
      }
    }
  }

 private:
  // Breadth-first walk over pre_ops_ starting at `op`. For every reachable
  // op, counts how many pre_ops_ entries of visited ops refer to it. The
  // starting op itself gets no entry unless another reachable op refers to
  // it.
  std::map<OpBase*, int> ComputeDepCounts(OpBase* op) {
    std::map<OpBase*, int> ret;

    std::deque<OpBase*> queue;
    queue.push_back(op);
    std::unordered_set<OpBase*> visited;
    visited.insert(op);
    while (!queue.empty()) {
      OpBase* candidate = queue.front();
      queue.pop_front();
      for (const auto& it : candidate->pre_ops_) {
        for (OpBase* pre_op : it.second) {
          if (!pre_op) continue;
          // insert() reports whether the op was newly seen, so one call
          // replaces the find-then-insert pair.
          if (visited.insert(pre_op).second) {
            queue.push_back(pre_op);
          }
          ret[pre_op] += 1;
        }
      }
    }
    return ret;
  }
};

// Returns a mutable reference to the LoDTensor held by this variable's
// gradient (grads_->var_), logging the variable name at verbosity 3.
framework::LoDTensor& VarBase::GradValue() {
  VLOG(3) << "get var grad " << var_desc_->Name();
  auto* grad_tensor = grads_->var_->GetMutable<framework::LoDTensor>();
  return *grad_tensor;
}

std::map<std::string, std::vector<VarBase*>> OpBase::ApplyGrad() {
  if (!grad_op_desc_ && backward_id_ <= 0) {
    LOG(WARNING) << "op with no grad: " << op_desc_->Type();
    return {};
  }

  std::map<std::string, std::vector<framework::Variable*>> grad_outputs;
  if (backward_id_ > 0) {
    VLOG(3) << "py_layer_grad";
    grad_outputs["Out@GRAD"] =
        PyLayer::ApplyGrad(backward_id_, grad_input_vars_["X@GRAD"]);
  } else {
    VLOG(3) << "op grad " << grad_op_desc_->Type();
    for (auto it : grad_output_vars_) {
      auto& outputs = grad_outputs[it.first];
      for (size_t i = 0; i < it.second.size(); ++i) {
        // Allocate a new variable
        Variable* tmp_var = new framework::Variable();
        tmp_var->GetMutable<framework::LoDTensor>();
        outputs.push_back(tmp_var);
      }
    }

    framework::RuntimeContext ctx(grad_input_vars_, grad_outputs);

    // No need to do compile time infer shape here.
    // grad_op_desc_->InferShape(*block_);
    grad_op_desc_->InferVarType(block_);

    std::unique_ptr<framework::OperatorBase> opbase =
        framework::OpRegistry::CreateOp(*grad_op_desc_);
    framework::OperatorWithKernel* op_kernel =
        dynamic_cast<framework::OperatorWithKernel*>(opbase.get());
    PADDLE_ENFORCE_NOT_NULL(op_kernel, "only support op with kernel");

    framework::Scope scope;
    platform::Place place = expected_place_;
    PreparedOp p = PreparedOp::Prepare(ctx, *op_kernel, place);
    p.op.RuntimeInferShape(scope, place, ctx);
    p.func(framework::ExecutionContext(p.op, scope, *p.dev_ctx, p.ctx));
  }

  for (auto it : grad_output_vars_) {
    auto& outputs = grad_outputs[it.first];
    auto& origin_outputs = it.second;
    PADDLE_ENFORCE_EQ(outputs.size(), origin_outputs.size());

    for (size_t i = 0; i < outputs.size(); ++i) {
      framework::Variable* grad = outputs[i];
      framework::Variable* orig_grad = origin_outputs[i];
      AddGradTo(grad, orig_grad, expected_place_);
      delete grad;
    }
  }
  return input_vars_;
}

void VarBase::RunBackward() {
  if (!pre_op_) return;

  VLOG(3) << "start backward";
  auto grads_t = grads_->var_->GetMutable<framework::LoDTensor>();
  operators::math::set_constant(
      *(platform::DeviceContextPool::Instance().Get(
          var_->GetMutable<framework::LoDTensor>()->place())),
      grads_t, 1.0);

  PADDLE_ENFORCE(
      grads_ ==
      pre_op_->output_vars_[pre_op_out_name_][pre_op_out_idx_]->grads_);
  Autograd().RunBackward(this);
}

// Stores `py_func` under `func_id`, replacing any callable previously
// registered with the same id.
void PyLayer::RegisterFunc(int func_id, const py::object& py_func) {
  py::object& slot = py_funcs_[func_id];
  slot = py_func;
}

// Number of Python callables currently registered.
int PyLayer::NumFuncs() {
  const auto registered = py_funcs_.size();
  return static_cast<int>(registered);
}

std::vector<VarBase*> PyLayer::Apply(int func_id,
                                     const std::vector<VarBase*>& inputs) {
  std::vector<framework::Variable*> invars;
  for (const VarBase* in : inputs) {
    invars.push_back(in->var_);
  }
  PADDLE_ENFORCE(py_funcs_.find(func_id) != py_funcs_.end());
  std::vector<Variable*> outvars = CallPythonFunc(py_funcs_[func_id], invars);
  std::vector<VarBase*> ret;
  for (Variable* v : outvars) {
    ret.push_back(new VarBase(v, new VarBase(true)));
  }
  return ret;
}

std::vector<Variable*> PyLayer::ApplyGrad(
    int func_id, const std::vector<framework::Variable*>& inputs) {
  PADDLE_ENFORCE(py_funcs_.find(func_id) != py_funcs_.end());
  return CallPythonFunc(py_funcs_[func_id], inputs);
}

// Invokes `callable` with the LoDTensors held by `ins` and converts its
// result into newly allocated Variables.
//
// The GIL is held for the duration of the call. The inputs are packed into
// one tuple that is passed as a single argument; an input whose tensor is
// not initialized is passed as a cast nullptr. The result is cast to a
// tuple, and every element must be castable to a non-null LoDTensor*,
// otherwise the function throws. Each output Variable shares data with, and
// copies the LoD of, the tensor returned from Python.
//
// The returned raw pointers are handed to the caller. While the outputs are
// being built they are held by unique_ptr, so a failure on a later element
// does not leak the Variables created for earlier ones.
std::vector<framework::Variable*> PyLayer::CallPythonFunc(
    const py::object& callable, const std::vector<framework::Variable*>& ins) {
  py::gil_scoped_acquire guard;
  py::tuple in_args(ins.size());
  for (size_t i = 0; i < ins.size(); ++i) {
    const framework::LoDTensor& t = ins[i]->Get<framework::LoDTensor>();
    in_args[i] = t.IsInitialized() ? py::cast(t) : py::cast(nullptr);
  }
  VLOG(3) << "pyfunc in " << py::len(in_args);

  // TODO(panyx0718): Who owns the returned LoDTensor.
  auto ret = callable(in_args);
  auto ret_tuple = py::cast<py::tuple>(ret);
  size_t ret_num = py::len(ret_tuple);
  VLOG(3) << "pyfunc out " << ret_num;

  std::vector<std::unique_ptr<framework::Variable>> owned_outs;
  owned_outs.reserve(ret_num);
  for (size_t i = 0; i < ret_num; ++i) {
    try {
      auto* py_out_tensor = py::cast<framework::LoDTensor*>(ret_tuple[i]);
      PADDLE_ENFORCE_NOT_NULL(py_out_tensor,
                              "Output tensor %d should not be nullptr", i);
      std::unique_ptr<framework::Variable> var(new framework::Variable());
      auto* tensor = var->GetMutable<framework::LoDTensor>();
      tensor->ShareDataWith(*py_out_tensor);
      tensor->set_lod(py_out_tensor->lod());
      owned_outs.push_back(std::move(var));
    } catch (const py::cast_error&) {
      PADDLE_THROW("The %d-th output must be LoDTensor", i);
    }
  }

  // Everything succeeded: release ownership to the caller.
  std::vector<framework::Variable*> outs;
  outs.reserve(owned_outs.size());
  for (auto& owned : owned_outs) {
    outs.push_back(owned.release());
  }
  return outs;
}

}  // namespace imperative
}  // namespace paddle
Revert "Merge pull request #14798 from PaddlePaddle/revert-14786-revert-14782-revert-14398-imperative" This reverts commit b1d3a1c8b41fdb4cfcb58ec2d4fb938b09dac057, reversing changes made to f1fb64b17fb0290e7e1f110069de19b0ea0d0474. 6 years ago			`// Copyright (c) 2018 PaddlePaddle Authors. All Rights Reserved.`
			`//`
			`// Licensed under the Apache License, Version 2.0 (the "License");`
			`// you may not use this file except in compliance with the License.`
			`// You may obtain a copy of the License at`
			`//`
			`// http://www.apache.org/licenses/LICENSE-2.0`
			`//`
			`// Unless required by applicable law or agreed to in writing, software`
			`// distributed under the License is distributed on an "AS IS" BASIS,`
			`// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.`
			`// See the License for the specific language governing permissions and`
			`// limitations under the License.`

			`#include "paddle/fluid/imperative/layer.h"`
Add single GPU support to imperative 6 years ago
Revert "Merge pull request #14798 from PaddlePaddle/revert-14786-revert-14782-revert-14398-imperative" This reverts commit b1d3a1c8b41fdb4cfcb58ec2d4fb938b09dac057, reversing changes made to f1fb64b17fb0290e7e1f110069de19b0ea0d0474. 6 years ago			`#include <deque>`
			`#include <limits>`
			`#include <map>`
			`#include <random>`
			`#include <utility>`

			`#include "paddle/fluid/framework/lod_tensor.h"`
			`#include "paddle/fluid/framework/op_registry.h"`
Support stop_gradients var in imperative backward test=develop 6 years ago			`#include "paddle/fluid/framework/operator.h"`
Add single GPU support to imperative 6 years ago			`#include "paddle/fluid/framework/tensor_util.h"`
			`#include "paddle/fluid/operators/math/blas.h"`
			`#include "paddle/fluid/platform/device_context.h"`
Revert "Merge pull request #14798 from PaddlePaddle/revert-14786-revert-14782-revert-14398-imperative" This reverts commit b1d3a1c8b41fdb4cfcb58ec2d4fb938b09dac057, reversing changes made to f1fb64b17fb0290e7e1f110069de19b0ea0d0474. 6 years ago			`#include "paddle/fluid/string/printf.h"`

			`namespace paddle {`
			`namespace imperative {`

checkpoint test=develop 6 years ago			`std::map<int, py::object> py_funcs_;`

Revert "Merge pull request #14798 from PaddlePaddle/revert-14786-revert-14782-revert-14398-imperative" This reverts commit b1d3a1c8b41fdb4cfcb58ec2d4fb938b09dac057, reversing changes made to f1fb64b17fb0290e7e1f110069de19b0ea0d0474. 6 years ago			`using framework::Variable;`

Add single GPU support to imperative 6 years ago			`namespace detail {`

			`template <typename T>`
			`class TensorAddToFunctor : public boost::static_visitor<> {`
			`public:`
			`TensorAddToFunctor(int64_t numel, const T* x, T* y)`
			`: numel_(numel), x_(x), y_(y) {}`

			`void operator()(const platform::CPUPlace& place) {`
			`platform::CPUDeviceContext* ctx = dynamic_cast<platform::CPUDeviceContext*>(`
			`platform::DeviceContextPool::Instance().Get(place));`
			`auto blas =`
			`operators::math::GetBlas<platform::CPUDeviceContext, float>(*ctx);`
			`blas.AXPY(numel_, 1., x_, y_);`
			`}`

			`#ifdef PADDLE_WITH_CUDA`
			`void operator()(const platform::CUDAPlace& place) {`
			`platform::CUDADeviceContext* ctx =`
			`dynamic_cast<platform::CUDADeviceContext*>(`
			`platform::DeviceContextPool::Instance().Get(place));`
			`auto blas =`
			`operators::math::GetBlas<platform::CUDADeviceContext, float>(*ctx);`
			`blas.AXPY(numel_, 1., x_, y_);`
			`}`
			`#else`
			`void operator()(const platform::CUDAPlace& place) {`
			`PADDLE_THROW("Do NOT support gradient merge in place %s", place);`
			`}`
			`#endif`

			`// there is NO blas in CUDAPinnedPlace`
			`void operator()(const platform::CUDAPinnedPlace& place) {`
			`PADDLE_THROW("Do NOT support gradient merge in place %s", place);`
			`}`

			`private:`
			`int64_t numel_;`
			`const T* x_;`
			`T* y_;`
			`};`

			`} // namespace detail`

			`void AddGradTo(Variable* src, Variable* dst, platform::Place place) {`
			`framework::Tensor* dst_tensor = dst->GetMutable<framework::LoDTensor>();`
			`framework::Tensor* src_tensor = src->GetMutable<framework::LoDTensor>();`

Polish code test=develop 6 years ago			`// FIXME(minqiyang): loss_grad op will pass a zero grad of label`
			`// ugly fix for it`
			`if (src_tensor->numel() == 0) {`
			`return;`
			`}`
Add single GPU support to imperative 6 years ago
Support stop_gradients var in imperative backward test=develop 6 years ago			`PADDLE_ENFORCE(dst_tensor->numel() == src_tensor->numel(),`
			`"dst_numel %lld vs. src_numel %lld", dst_tensor->numel(),`
			`src_tensor->numel());`
Add single GPU support to imperative 6 years ago
			`detail::TensorAddToFunctor<float> func(`
			`src_tensor->numel(), src_tensor->data<float>(),`
			`dst_tensor->mutable_data<float>(place));`
			`boost::apply_visitor(func, place);`
Revert "Merge pull request #14798 from PaddlePaddle/revert-14786-revert-14782-revert-14398-imperative" This reverts commit b1d3a1c8b41fdb4cfcb58ec2d4fb938b09dac057, reversing changes made to f1fb64b17fb0290e7e1f110069de19b0ea0d0474. 6 years ago			`}`

			`class Autograd {`
			`public:`
refactor to avoid scope. test=develop 6 years ago			`Autograd() {}`
Revert "Merge pull request #14798 from PaddlePaddle/revert-14786-revert-14782-revert-14398-imperative" This reverts commit b1d3a1c8b41fdb4cfcb58ec2d4fb938b09dac057, reversing changes made to f1fb64b17fb0290e7e1f110069de19b0ea0d0474. 6 years ago
			`void RunBackward(VarBase* var) {`
Merge branch 'develop' of https://github.com/PaddlePaddle/Paddle into imperative_mnist test=develop 6 years ago			`if (var->stop_gradient_) {`
			`return;`
			`}`
forward and backward test=develop 6 years ago			`VLOG(3) << "start autograd";`
Revert "Merge pull request #14798 from PaddlePaddle/revert-14786-revert-14782-revert-14398-imperative" This reverts commit b1d3a1c8b41fdb4cfcb58ec2d4fb938b09dac057, reversing changes made to f1fb64b17fb0290e7e1f110069de19b0ea0d0474. 6 years ago
			`std::deque<OpBase*> ready;`
			`ready.push_back(var->pre_op_);`

			`std::map<OpBase*, int> dep_counts = ComputeDepCounts(var->pre_op_);`

			`while (!ready.empty()) {`
			`OpBase* ready_op = ready.front();`
			`ready.pop_front();`
refactor to avoid scope. test=develop 6 years ago			`std::map<std::string, std::vector<VarBase*>> input_grads =`
			`ready_op->ApplyGrad();`

			`for (auto it : input_grads) {`
			`const std::vector<VarBase*>& ingrads = it.second;`
			`for (size_t i = 0; i < ingrads.size(); ++i) {`
			`if (!ingrads[i]) continue;`
Merge branch 'develop' of https://github.com/PaddlePaddle/Paddle into imperative_mnist test=develop 6 years ago			`if (ready_op->input_vars_[it.first][i]->stop_gradient_) {`
			`continue;`
			`}`
call kernel 6 years ago			`OpBase* pre_op = ready_op->pre_ops_[it.first][i];`
refactor to avoid scope. test=develop 6 years ago			`if (!pre_op) continue;`

			`dep_counts[pre_op] -= 1;`
			`PADDLE_ENFORCE(dep_counts[pre_op] >= 0);`
			`bool pre_op_ready = dep_counts[pre_op] == 0;`
			`if (pre_op_ready) {`
			`ready.push_back(pre_op);`
			`}`
Revert "Merge pull request #14798 from PaddlePaddle/revert-14786-revert-14782-revert-14398-imperative" This reverts commit b1d3a1c8b41fdb4cfcb58ec2d4fb938b09dac057, reversing changes made to f1fb64b17fb0290e7e1f110069de19b0ea0d0474. 6 years ago			`}`
			`}`
			`}`
			`}`

			`private:`
			`std::map<OpBase*, int> ComputeDepCounts(OpBase* op) {`
			`std::map<OpBase*, int> ret;`

			`std::deque<OpBase*> queue;`
			`queue.push_back(op);`
			`std::unordered_set<OpBase*> visited;`
			`visited.insert(op);`
			`while (!queue.empty()) {`
			`OpBase* candidate = queue.front();`
			`queue.pop_front();`
call kernel 6 years ago			`for (auto it : candidate->pre_ops_) {`
refactor to avoid scope. test=develop 6 years ago			`for (OpBase* pre_op : it.second) {`
			`if (!pre_op) continue;`
			`if (visited.find(pre_op) == visited.end()) {`
			`visited.insert(pre_op);`
			`queue.push_back(pre_op);`
			`}`
			`ret[pre_op] += 1;`
Revert "Merge pull request #14798 from PaddlePaddle/revert-14786-revert-14782-revert-14398-imperative" This reverts commit b1d3a1c8b41fdb4cfcb58ec2d4fb938b09dac057, reversing changes made to f1fb64b17fb0290e7e1f110069de19b0ea0d0474. 6 years ago			`}`
			`}`
			`}`
			`return ret;`
			`}`
			`};`

Change var_ and grad_ to shared_ptr 6 years ago			`framework::LoDTensor& VarBase::GradValue() {`
Revert "Merge pull request #14798 from PaddlePaddle/revert-14786-revert-14782-revert-14398-imperative" This reverts commit b1d3a1c8b41fdb4cfcb58ec2d4fb938b09dac057, reversing changes made to f1fb64b17fb0290e7e1f110069de19b0ea0d0474. 6 years ago			`VLOG(3) << "get var grad " << var_desc_->Name();`
Change grads to VarBase 6 years ago			`return *(grads_->var_->GetMutable<framework::LoDTensor>());`
Revert "Merge pull request #14798 from PaddlePaddle/revert-14786-revert-14782-revert-14398-imperative" This reverts commit b1d3a1c8b41fdb4cfcb58ec2d4fb938b09dac057, reversing changes made to f1fb64b17fb0290e7e1f110069de19b0ea0d0474. 6 years ago			`}`

refactor to avoid scope. test=develop 6 years ago			`std::map<std::string, std::vector<VarBase*>> OpBase::ApplyGrad() {`
forward and backward test=develop 6 years ago			`if (!grad_op_desc_ && backward_id_ <= 0) {`
Support stop_gradients var in imperative backward test=develop 6 years ago			`LOG(WARNING) << "op with no grad: " << op_desc_->Type();`
refactor to avoid scope. test=develop 6 years ago			`return {};`
Revert "Merge pull request #14798 from PaddlePaddle/revert-14786-revert-14782-revert-14398-imperative" This reverts commit b1d3a1c8b41fdb4cfcb58ec2d4fb938b09dac057, reversing changes made to f1fb64b17fb0290e7e1f110069de19b0ea0d0474. 6 years ago			`}`

refactor to avoid scope. test=develop 6 years ago			`std::map<std::string, std::vector<framework::Variable*>> grad_outputs;`
forward and backward test=develop 6 years ago			`if (backward_id_ > 0) {`
			`VLOG(3) << "py_layer_grad";`
polish test=develop 6 years ago			`grad_outputs["Out@GRAD"] =`
			`PyLayer::ApplyGrad(backward_id_, grad_input_vars_["X@GRAD"]);`
forward and backward test=develop 6 years ago			`} else {`
			`VLOG(3) << "op grad " << grad_op_desc_->Type();`
polish test=develop 6 years ago			`for (auto it : grad_output_vars_) {`
			`auto& outputs = grad_outputs[it.first];`
			`for (size_t i = 0; i < it.second.size(); ++i) {`
			`// Allocate a new variable`
			`Variable* tmp_var = new framework::Variable();`
			`tmp_var->GetMutable<framework::LoDTensor>();`
			`outputs.push_back(tmp_var);`
			`}`
Revert "Merge pull request #14798 from PaddlePaddle/revert-14786-revert-14782-revert-14398-imperative" This reverts commit b1d3a1c8b41fdb4cfcb58ec2d4fb938b09dac057, reversing changes made to f1fb64b17fb0290e7e1f110069de19b0ea0d0474. 6 years ago			`}`

forward and backward test=develop 6 years ago			`framework::RuntimeContext ctx(grad_input_vars_, grad_outputs);`
Add stop_gradient to VarBase to support loss function test=develop 6 years ago
forward and backward test=develop 6 years ago			`// No need to do compile time infer shape here.`
			`// grad_op_desc_->InferShape(*block_);`
			`grad_op_desc_->InferVarType(block_);`
refactor to avoid scope. test=develop 6 years ago
forward and backward test=develop 6 years ago			`std::unique_ptr<framework::OperatorBase> opbase =`
			`framework::OpRegistry::CreateOp(*grad_op_desc_);`
			`framework::OperatorWithKernel* op_kernel =`
			`dynamic_cast<framework::OperatorWithKernel*>(opbase.get());`
			`PADDLE_ENFORCE_NOT_NULL(op_kernel, "only support op with kernel");`
call kernel 6 years ago
forward and backward test=develop 6 years ago			`framework::Scope scope;`
Add single GPU support to imperative 6 years ago			`platform::Place place = expected_place_;`
forward and backward test=develop 6 years ago			`PreparedOp p = PreparedOp::Prepare(ctx, *op_kernel, place);`
			`p.op.RuntimeInferShape(scope, place, ctx);`
			`p.func(framework::ExecutionContext(p.op, scope, *p.dev_ctx, p.ctx));`
			`}`
refactor to avoid scope. test=develop 6 years ago
			`for (auto it : grad_output_vars_) {`
			`auto& outputs = grad_outputs[it.first];`
			`auto& origin_outputs = it.second;`
polish test=develop 6 years ago			`PADDLE_ENFORCE_EQ(outputs.size(), origin_outputs.size());`
Support stop_gradients var in imperative backward test=develop 6 years ago
refactor to avoid scope. test=develop 6 years ago			`for (size_t i = 0; i < outputs.size(); ++i) {`
polish test=develop 6 years ago			`framework::Variable* grad = outputs[i];`
Polish code test=develop 6 years ago			`framework::Variable* orig_grad = origin_outputs[i];`
Add single GPU support to imperative 6 years ago			`AddGradTo(grad, orig_grad, expected_place_);`
polish test=develop 6 years ago			`delete grad;`
Revert "Merge pull request #14798 from PaddlePaddle/revert-14786-revert-14782-revert-14398-imperative" This reverts commit b1d3a1c8b41fdb4cfcb58ec2d4fb938b09dac057, reversing changes made to f1fb64b17fb0290e7e1f110069de19b0ea0d0474. 6 years ago			`}`
			`}`
refactor to avoid scope. test=develop 6 years ago			`return input_vars_;`
Revert "Merge pull request #14798 from PaddlePaddle/revert-14786-revert-14782-revert-14398-imperative" This reverts commit b1d3a1c8b41fdb4cfcb58ec2d4fb938b09dac057, reversing changes made to f1fb64b17fb0290e7e1f110069de19b0ea0d0474. 6 years ago			`}`

refactor to avoid scope. test=develop 6 years ago			`void VarBase::RunBackward() {`
Revert "Merge pull request #14798 from PaddlePaddle/revert-14786-revert-14782-revert-14398-imperative" This reverts commit b1d3a1c8b41fdb4cfcb58ec2d4fb938b09dac057, reversing changes made to f1fb64b17fb0290e7e1f110069de19b0ea0d0474. 6 years ago			`if (!pre_op_) return;`
call kernel 6 years ago
forward and backward test=develop 6 years ago			`VLOG(3) << "start backward";`
Change grads to VarBase 6 years ago			`auto grads_t = grads_->var_->GetMutable<framework::LoDTensor>();`
Add single GPU support to imperative 6 years ago			`operators::math::set_constant(`
			`*(platform::DeviceContextPool::Instance().Get(`
			`var_->GetMutable<framework::LoDTensor>()->place())),`
			`grads_t, 1.0);`
refactor to avoid scope. test=develop 6 years ago
call kernel 6 years ago			`PADDLE_ENFORCE(`
			`grads_ ==`
			`pre_op_->output_vars_[pre_op_out_name_][pre_op_out_idx_]->grads_);`
refactor to avoid scope. test=develop 6 years ago			`Autograd().RunBackward(this);`
Revert "Merge pull request #14798 from PaddlePaddle/revert-14786-revert-14782-revert-14398-imperative" This reverts commit b1d3a1c8b41fdb4cfcb58ec2d4fb938b09dac057, reversing changes made to f1fb64b17fb0290e7e1f110069de19b0ea0d0474. 6 years ago			`}`

checkpoint test=develop 6 years ago			`void PyLayer::RegisterFunc(int func_id, const py::object& py_func) {`
			`py_funcs_[func_id] = py_func;`
			`}`

polish test=develop 6 years ago			`int PyLayer::NumFuncs() { return py_funcs_.size(); }`

checkpoint test=develop 6 years ago			`std::vector<VarBase*> PyLayer::Apply(int func_id,`
forward and backward test=develop 6 years ago			`const std::vector<VarBase*>& inputs) {`
polish test=develop 6 years ago			`std::vector<framework::Variable*> invars;`
forward and backward test=develop 6 years ago			`for (const VarBase* in : inputs) {`
polish test=develop 6 years ago			`invars.push_back(in->var_);`
checkpoint test=develop 6 years ago			`}`
			`PADDLE_ENFORCE(py_funcs_.find(func_id) != py_funcs_.end());`
polish test=develop 6 years ago			`std::vector<Variable*> outvars = CallPythonFunc(py_funcs_[func_id], invars);`
			`std::vector<VarBase*> ret;`
			`for (Variable* v : outvars) {`
Merge branch 'develop' of https://github.com/PaddlePaddle/Paddle into imperative_shared_ptr test=develop 6 years ago			`ret.push_back(new VarBase(v, new VarBase(true)));`
polish test=develop 6 years ago			`}`
checkpoint test=develop 6 years ago			`return ret;`
			`}`

polish test=develop 6 years ago			`std::vector<Variable*> PyLayer::ApplyGrad(`
			`int func_id, const std::vector<framework::Variable*>& inputs) {`
			`PADDLE_ENFORCE(py_funcs_.find(func_id) != py_funcs_.end());`
			`return CallPythonFunc(py_funcs_[func_id], inputs);`
			`}`
forward and backward test=develop 6 years ago
polish test=develop 6 years ago			`std::vector<framework::Variable*> PyLayer::CallPythonFunc(`
			`const py::object& callable, const std::vector<framework::Variable*>& ins) {`
			`py::gil_scoped_acquire guard;`
			`py::tuple in_args(ins.size());`
			`for (size_t i = 0; i < ins.size(); ++i) {`
			`const framework::LoDTensor& t = ins[i]->Get<framework::LoDTensor>();`
			`in_args[i] = t.IsInitialized() ? py::cast(t) : py::cast(nullptr);`
forward and backward test=develop 6 years ago			`}`
polish test=develop 6 years ago			`VLOG(3) << "pyfunc in " << py::len(in_args);`

			`// TODO(panyx0718): Who owns the returned LoDTensor.`
			`auto ret = callable(in_args);`
			`auto ret_tuple = py::cast<py::tuple>(ret);`
			`size_t ret_num = py::len(ret_tuple);`
			`std::vector<framework::Variable*> outs;`
			`VLOG(3) << "pyfunc out " << ret_num;`
			`for (size_t i = 0; i < ret_num; ++i) {`
			`try {`
			`auto* py_out_tensor = py::cast<framework::LoDTensor*>(ret_tuple[i]);`
			`PADDLE_ENFORCE_NOT_NULL(py_out_tensor,`
			`"Output tensor %d should not be nullptr", i);`
			`auto* var = new framework::Variable();`
			`auto* tensor = var->GetMutable<framework::LoDTensor>();`
			`tensor->ShareDataWith(*py_out_tensor);`
			`tensor->set_lod(py_out_tensor->lod());`
			`outs.push_back(var);`
			`} catch (py::cast_error&) {`
			`PADDLE_THROW("The %d-th output must be LoDTensor", i);`
			`}`
			`}`
			`return outs;`
forward and backward test=develop 6 years ago			`}`

Revert "Merge pull request #14798 from PaddlePaddle/revert-14786-revert-14782-revert-14398-imperative" This reverts commit b1d3a1c8b41fdb4cfcb58ec2d4fb938b09dac057, reversing changes made to f1fb64b17fb0290e7e1f110069de19b0ea0d0474. 6 years ago			`} // namespace imperative`
			`} // namespace paddle`