helinwang-patch-1
Yu Yang 7 years ago
parent 3da4159f88
commit 4137bb4eda

@ -813,7 +813,7 @@ void ParallelExecutor::Run(const std::vector<std::string> &fetch_tensors,
fetch_ops.clear();
*member_->global_scope_->Var(fetched_var_name)->GetMutable<LoDTensorArray>() =
fetched_data->tensors_;
VLOG(3) << "Before Wait";
// FIXME:
// This could be optimized by using multiple events in an operator.
// Until then, computation is synchronized manually during each iteration.
@ -824,6 +824,7 @@ void ParallelExecutor::Run(const std::vector<std::string> &fetch_tensors,
for (auto &p : member_->places_) {
platform::DeviceContextPool::Instance().Get(p)->Wait();
}
VLOG(3) << "Done wait";
}
void ParallelExecutor::RunOp(

Loading…
Cancel
Save