|
|
|
@ -12,14 +12,35 @@ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
|
See the License for the specific language governing permissions and
|
|
|
|
|
limitations under the License. */
|
|
|
|
|
|
|
|
|
|
#include <algorithm>
|
|
|
|
|
#include <unordered_set>
|
|
|
|
|
|
|
|
|
|
#include "paddle/fluid/framework/ir/graph.h"
|
|
|
|
|
#include "paddle/fluid/framework/op_proto_maker.h"
|
|
|
|
|
#include "paddle/fluid/framework/program_desc.h"
|
|
|
|
|
#include "paddle/fluid/framework/var_desc.h"
|
|
|
|
|
|
|
|
|
|
namespace paddle {
|
|
|
|
|
namespace framework {
|
|
|
|
|
namespace {
|
|
|
|
|
void SortHelper(
|
|
|
|
|
const std::map<ir::Node *, std::unordered_set<ir::Node *>> &adj_list,
|
|
|
|
|
ir::Node *node, std::unordered_set<ir::Node *> *visited,
|
|
|
|
|
std::vector<ir::Node *> *ret) {
|
|
|
|
|
visited->insert(node);
|
|
|
|
|
|
|
|
|
|
for (auto adj : adj_list.at(node)) {
|
|
|
|
|
if (visited->find(adj) == visited->end()) {
|
|
|
|
|
SortHelper(adj_list, adj, visited, ret);
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
VLOG(3) << "topology sort insert: " << node->Name()
|
|
|
|
|
<< reinterpret_cast<void *>(node) << " input " << node->inputs.size();
|
|
|
|
|
ret->push_back(node);
|
|
|
|
|
}
|
|
|
|
|
} // namespace
|
|
|
|
|
|
|
|
|
|
// NOTE(paddle-dev): This graph contains circle.
|
|
|
|
|
Graph::Graph(const ProgramDesc &program) : program_(program) {
|
|
|
|
|
VLOG(3) << "block in program:" << program_.Size();
|
|
|
|
|
std::unordered_map<std::string, VarDesc *> all_vars;
|
|
|
|
@ -27,40 +48,128 @@ Graph::Graph(const ProgramDesc &program) : program_(program) {
|
|
|
|
|
all_vars.emplace(var->Name(), var);
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
std::map<std::string, ir::Node *> var_nodes;
|
|
|
|
|
ir::Node *last_backward = nullptr;
|
|
|
|
|
std::vector<ir::Node *> optimize_ops;
|
|
|
|
|
std::map<std::string, std::vector<ir::Node *>> var_nodes;
|
|
|
|
|
for (auto *op : program.Block(0).AllOps()) {
|
|
|
|
|
ir::Node *node = CreateOpNode(op);
|
|
|
|
|
if (boost::get<int>(
|
|
|
|
|
op->GetAttr(OpProtoAndCheckerMaker::OpRoleAttrName())) ==
|
|
|
|
|
static_cast<int>(OpRole::kBackward)) {
|
|
|
|
|
last_backward = node;
|
|
|
|
|
} else if (boost::get<int>(
|
|
|
|
|
op->GetAttr(OpProtoAndCheckerMaker::OpRoleAttrName())) ==
|
|
|
|
|
static_cast<int>(OpRole::kOptimize)) {
|
|
|
|
|
optimize_ops.push_back(node);
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
for (auto &each_var_name : op->InputArgumentNames()) {
|
|
|
|
|
ir::Node *var = nullptr;
|
|
|
|
|
if (var_nodes.find(each_var_name) != var_nodes.end()) {
|
|
|
|
|
var = var_nodes.at(each_var_name);
|
|
|
|
|
var = var_nodes.at(each_var_name).back();
|
|
|
|
|
} else if (all_vars.count(each_var_name) != 0) {
|
|
|
|
|
var = CreateVarNode(all_vars.at(each_var_name));
|
|
|
|
|
var_nodes[each_var_name] = var;
|
|
|
|
|
var_nodes[each_var_name].push_back(var);
|
|
|
|
|
} else {
|
|
|
|
|
// TODO(paddle-dev): Seems some assumption doesn't hold?
|
|
|
|
|
VLOG(3) << op->Type()
|
|
|
|
|
<< " input var not in all_var list: " << each_var_name;
|
|
|
|
|
var = CreateEmptyNode(each_var_name, ir::Node::Type::kVariable);
|
|
|
|
|
var_nodes[each_var_name] = var;
|
|
|
|
|
var_nodes[each_var_name].push_back(var);
|
|
|
|
|
}
|
|
|
|
|
node->inputs.push_back(var);
|
|
|
|
|
var->outputs.push_back(node);
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
for (auto &each_var_name : op->OutputArgumentNames()) {
|
|
|
|
|
ir::Node *var = nullptr;
|
|
|
|
|
if (var_nodes.find(each_var_name) != var_nodes.end()) {
|
|
|
|
|
var = var_nodes.at(each_var_name);
|
|
|
|
|
} else {
|
|
|
|
|
var = CreateVarNode(all_vars.at(each_var_name));
|
|
|
|
|
var_nodes[each_var_name] = var;
|
|
|
|
|
}
|
|
|
|
|
ir::Node *var = CreateVarNode(all_vars.at(each_var_name));
|
|
|
|
|
var_nodes[each_var_name].push_back(var);
|
|
|
|
|
node->outputs.push_back(var);
|
|
|
|
|
var->inputs.push_back(node);
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
for (auto &var : var_nodes) {
|
|
|
|
|
auto &versions = var.second;
|
|
|
|
|
if (versions.size() <= 1) continue;
|
|
|
|
|
|
|
|
|
|
auto it_new = versions.rbegin();
|
|
|
|
|
auto it_old = versions.rbegin();
|
|
|
|
|
++it_old;
|
|
|
|
|
for (; it_old != versions.rend(); it_new = it_old, ++it_old) {
|
|
|
|
|
ir::Node *write_op =
|
|
|
|
|
(*it_new)->inputs.empty() ? nullptr : (*it_new)->inputs[0];
|
|
|
|
|
const auto &read_ops = (*it_old)->outputs;
|
|
|
|
|
|
|
|
|
|
for (auto *read_op : read_ops) {
|
|
|
|
|
// Manually add a dependency var from read_op to write_op;
|
|
|
|
|
if (read_op == write_op) {
|
|
|
|
|
// Read Write is the same op.
|
|
|
|
|
continue;
|
|
|
|
|
}
|
|
|
|
|
ir::Node *dep_var = CreateEmptyNode("dummy", ir::Node::Type::kVariable);
|
|
|
|
|
read_op->outputs.push_back(dep_var);
|
|
|
|
|
dep_var->inputs.push_back(read_op);
|
|
|
|
|
write_op->inputs.push_back(dep_var);
|
|
|
|
|
dep_var->outputs.push_back(write_op);
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
if (last_backward) {
|
|
|
|
|
for (ir::Node *opt_node : optimize_ops) {
|
|
|
|
|
ir::Node *dep_var = CreateEmptyNode("dummy", ir::Node::Type::kVariable);
|
|
|
|
|
last_backward->outputs.push_back(dep_var);
|
|
|
|
|
dep_var->inputs.push_back(last_backward);
|
|
|
|
|
opt_node->inputs.push_back(dep_var);
|
|
|
|
|
dep_var->outputs.push_back(opt_node);
|
|
|
|
|
VLOG(3) << "appending connect: " << last_backward->Name()
|
|
|
|
|
<< reinterpret_cast<void *>(last_backward) << "->"
|
|
|
|
|
<< opt_node->Name() << reinterpret_cast<void *>(opt_node);
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
std::vector<ir::Node *> TopologySortOperationFromInToOut(
|
|
|
|
|
const std::vector<std::unique_ptr<ir::Node>> &nodes) {
|
|
|
|
|
std::map<ir::Node *, std::unordered_set<ir::Node *>> adj_list;
|
|
|
|
|
std::unordered_set<ir::Node *> visited;
|
|
|
|
|
std::vector<ir::Node *> ret;
|
|
|
|
|
|
|
|
|
|
for (auto &n : nodes) {
|
|
|
|
|
if (n->NodeType() != ir::Node::Type::kOperation) continue;
|
|
|
|
|
if (adj_list.find(n.get()) == adj_list.end()) {
|
|
|
|
|
adj_list[n.get()] = std::unordered_set<ir::Node *>();
|
|
|
|
|
}
|
|
|
|
|
for (auto &var : n->inputs) {
|
|
|
|
|
for (auto &adj_n : var->inputs) {
|
|
|
|
|
PADDLE_ENFORCE(adj_n->NodeType() == ir::Node::Type::kOperation);
|
|
|
|
|
adj_list[n.get()].insert(adj_n);
|
|
|
|
|
LOG(ERROR) << "adj " << adj_n->Name() << reinterpret_cast<void *>(adj_n)
|
|
|
|
|
<< " -> " << n->Name() << reinterpret_cast<void *>(n.get())
|
|
|
|
|
<< " via " << var->Name() << reinterpret_cast<void *>(var);
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
for (auto adj : adj_list) {
|
|
|
|
|
if (visited.find(adj.first) == visited.end()) {
|
|
|
|
|
SortHelper(adj_list, adj.first, &visited, &ret);
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
for (ir::Node *n : ret) {
|
|
|
|
|
std::unordered_set<ir::Node *> dummy;
|
|
|
|
|
n->inputs.erase(
|
|
|
|
|
std::remove_if(n->inputs.begin(), n->inputs.end(),
|
|
|
|
|
[n](ir::Node *t) { return t->Name() == "dummy"; }),
|
|
|
|
|
n->inputs.end());
|
|
|
|
|
n->outputs.erase(
|
|
|
|
|
std::remove_if(n->outputs.begin(), n->outputs.end(),
|
|
|
|
|
[n](ir::Node *t) { return t->Name() == "dummy"; }),
|
|
|
|
|
n->outputs.end());
|
|
|
|
|
}
|
|
|
|
|
return ret;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
} // namespace framework
|
|
|
|
|
} // namespace paddle
|
|
|
|
|