|
|
|
@ -23,57 +23,56 @@ class AdamOp : public framework::OperatorWithKernel {
|
|
|
|
|
// Inherit every constructor of the kernel-based operator base class;
// AdamOp adds no construction logic of its own.
using framework::OperatorWithKernel::OperatorWithKernel;
|
|
|
|
|
|
|
|
|
|
// Shape inference for the Adam update op.
//
// Validates that every input/output the Adam kernel needs is wired up,
// that the scalar hyper-parameter tensors (learning rate and the two
// beta power accumulators) each hold exactly one element, and that the
// moment tensors (and, for dense gradients, the gradient itself) match
// the parameter's shape. Finally propagates the parameter's shape to
// all three outputs.
//
// NOTE(review): the previous revision carried a full commented-out
// duplicate of every check below; the dead copies have been removed.
void InferShape(framework::InferShapeContext *ctx) const override {
  // Required inputs.
  PADDLE_ENFORCE(ctx->HasInput("Param"),
                 "Input(Param) of AdamOp should not be null.");
  PADDLE_ENFORCE(ctx->HasInput("Grad"),
                 "Input(Grad) of AdamOp should not be null.");
  PADDLE_ENFORCE(ctx->HasInput("Moment1"),
                 "Input(Moment1) of AdamOp should not be null.");
  PADDLE_ENFORCE(ctx->HasInput("Moment2"),
                 "Input(Moment2) of AdamOp should not be null.");
  PADDLE_ENFORCE(ctx->HasInput("LearningRate"),
                 "Input(LearningRate) of AdamOp should not be null.");
  PADDLE_ENFORCE(ctx->HasInput("Beta1Pow"),
                 "Input(Beta1Pow) of AdamOp should not be null.");
  PADDLE_ENFORCE(ctx->HasInput("Beta2Pow"),
                 "Input(Beta2Pow) of AdamOp should not be null.");

  // Required outputs.
  PADDLE_ENFORCE(ctx->HasOutput("ParamOut"),
                 "Output(ParamOut) of AdamOp should not be null.");
  PADDLE_ENFORCE(ctx->HasOutput("Moment1Out"),
                 "Output(Moment1Out) of AdamOp should not be null.");
  PADDLE_ENFORCE(ctx->HasOutput("Moment2Out"),
                 "Output(Moment2Out) of AdamOp should not be null.");

  // The learning rate and both beta power accumulators are scalars:
  // the product of their dims must be exactly 1.
  auto lr_dims = ctx->GetInputDim("LearningRate");
  PADDLE_ENFORCE_EQ(framework::product(lr_dims), 1,
                    "Learning rate should have 1 dimension");
  auto beta1_pow_dims = ctx->GetInputDim("Beta1Pow");
  PADDLE_ENFORCE_EQ(framework::product(beta1_pow_dims), 1,
                    "Beta1 power accumulator should have 1 dimension");
  auto beta2_pow_dims = ctx->GetInputDim("Beta2Pow");
  PADDLE_ENFORCE_EQ(framework::product(beta2_pow_dims), 1,
                    "Beta2 power accumulator should have 1 dimension");

  auto param_dims = ctx->GetInputDim("Param");
  // Only dense (LoD tensor) gradients must match the parameter's shape;
  // a sparse gradient variable is deliberately exempt from this check.
  if (ctx->GetInputsVarType("Grad")[0] ==
      framework::proto::VarType::LOD_TENSOR) {
    PADDLE_ENFORCE_EQ(
        param_dims, ctx->GetInputDim("Grad"),
        "Param and Grad input of AdamOp should have same dimension");
  }
  // Moment accumulators always track the parameter element-for-element.
  PADDLE_ENFORCE_EQ(
      param_dims, ctx->GetInputDim("Moment1"),
      "Param and Moment1 input of AdamOp should have same dimension");
  PADDLE_ENFORCE_EQ(
      param_dims, ctx->GetInputDim("Moment2"),
      "Param and Moment2 input of AdamOp should have same dimension");

  // All outputs are updated in place conceptually: same shape as Param.
  ctx->SetOutputDim("ParamOut", param_dims);
  ctx->SetOutputDim("Moment1Out", param_dims);
  ctx->SetOutputDim("Moment2Out", param_dims);
}
|
|
|
|
|
|
|
|
|
|
framework::OpKernelType GetExpectedKernelType(
|
|
|
|
|
const framework::ExecutionContext &ctx) const override {
|
|
|
|
|
auto input_data_type =
|
|
|
|
|