mirror of
https://github.com/KhronosGroup/SPIRV-Tools
synced 2024-12-29 03:01:08 +00:00
731d1899b1
- Add generic depth first iterator - Update the dominator tree to use this iterator instead of "randomly" iterate over the nodes
392 lines
14 KiB
C++
392 lines
14 KiB
C++
// Copyright (c) 2017 Google Inc.
|
|
//
|
|
// Licensed under the Apache License, Version 2.0 (the "License");
|
|
// you may not use this file except in compliance with the License.
|
|
// You may obtain a copy of the License at
|
|
//
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
//
|
|
// Unless required by applicable law or agreed to in writing, software
|
|
// distributed under the License is distributed on an "AS IS" BASIS,
|
|
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
// See the License for the specific language governing permissions and
|
|
// limitations under the License.
|
|
|
|
#include <iostream>
|
|
#include <memory>
|
|
#include <set>
|
|
|
|
#include "cfa.h"
|
|
#include "dominator_tree.h"
|
|
|
|
using namespace spvtools;
|
|
using namespace spvtools::opt;
|
|
|
|
// Calculates the dominator or postdominator tree for a given function.
|
|
// 1 - Compute the successors and predecessors for each BasicBlock. We add a
|
|
// dummy node for the start node or for postdominators the exit. This node will
|
|
// point to all entry or all exit nodes.
|
|
// 2 - Using the CFA::DepthFirstTraversal get a depth first postordered list of
|
|
// all BasicBlocks. Using the successors (or for postdominator, predecessors)
|
|
// calculated in step 1 to traverse the tree.
|
|
// 3 - Pass the list calculated in step 2 to the CFA::CalculateDominators using
|
|
// the predecessors list (or for postdominator, successors). This will give us a
|
|
// vector of BB pairs. Each BB and its immediate dominator.
|
|
// 4 - Using the list from 3 use those edges to build a tree of
|
|
// DominatorTreeNodes. Each node containing a link to the parent dominator and
|
|
// children which are dominated.
|
|
// 5 - Using the tree from 4, perform a depth first traversal to calculate the
|
|
// preorder and postorder index of each node. We use these indexes to compare
|
|
// nodes against each other for domination checks.
|
|
|
|
namespace {
|
|
|
|
// Wrapper around CFA::DepthFirstTraversal to provide an interface to perform
|
|
// depth first search on generic BasicBlock types. Will call post and pre order
|
|
// user defined functions during traversal
|
|
//
|
|
// BBType - BasicBlock type. Will either be ir::BasicBlock or DominatorTreeNode
|
|
// SuccessorLambda - Lamdba matching the signature of 'const
|
|
// std::vector<BBType>*(const BBType *A)'. Will return a vector of the nodes
|
|
// succeding BasicBlock A.
|
|
// PostLambda - Lamdba matching the signature of 'void (const BBType*)' will be
|
|
// called on each node traversed AFTER their children.
|
|
// PreLambda - Lamdba matching the signature of 'void (const BBType*)' will be
|
|
// called on each node traversed BEFORE their children.
|
|
template <typename BBType, typename SuccessorLambda, typename PreLambda,
|
|
typename PostLambda>
|
|
static void DepthFirstSearch(const BBType* bb, SuccessorLambda successors,
|
|
PreLambda pre, PostLambda post) {
|
|
// Ignore backedge operation.
|
|
auto nop_backedge = [](const BBType*, const BBType*) {};
|
|
CFA<BBType>::DepthFirstTraversal(bb, successors, pre, post, nop_backedge);
|
|
}
|
|
|
|
// Wrapper around CFA::DepthFirstTraversal to provide an interface to perform
|
|
// depth first search on generic BasicBlock types. This overload is for only
|
|
// performing user defined post order.
|
|
//
|
|
// BBType - BasicBlock type. Will either be ir::BasicBlock or DominatorTreeNode
|
|
// SuccessorLambda - Lamdba matching the signature of 'const
|
|
// std::vector<BBType>*(const BBType *A)'. Will return a vector of the nodes
|
|
// succeding BasicBlock A.
|
|
// PostLambda - Lamdba matching the signature of 'void (const BBType*)' will be
|
|
// called on each node traversed after their children.
|
|
template <typename BBType, typename SuccessorLambda, typename PostLambda>
|
|
static void DepthFirstSearchPostOrder(const BBType* bb,
|
|
SuccessorLambda successors,
|
|
PostLambda post) {
|
|
// Ignore preorder operation.
|
|
auto nop_preorder = [](const BBType*) {};
|
|
DepthFirstSearch(bb, successors, nop_preorder, post);
|
|
}
|
|
|
|
// Small type trait to get the function class type.
|
|
template <typename BBType>
|
|
struct GetFunctionClass {
|
|
using FunctionType = ir::Function;
|
|
};
|
|
|
|
// Helper class to compute predecessors and successors for each Basic Block in a
|
|
// function. Through GetPredFunctor and GetSuccessorFunctor it provides an
|
|
// interface to get the successor and predecessor lists for each basic
|
|
// block. This is required by the DepthFirstTraversal and ComputeDominator
|
|
// functions which take as parameter an std::function returning the successors
|
|
// and predecessors respectively.
|
|
//
|
|
// When computing the post-dominator tree, all edges are inverted. So successors
|
|
// returned by this class will be predecessors in the original CFG.
|
|
template <typename BBType>
|
|
class BasicBlockSuccessorHelper {
|
|
// This should eventually become const ir::BasicBlock.
|
|
using BasicBlock = BBType;
|
|
using Function = typename GetFunctionClass<BBType>::FunctionType;
|
|
|
|
using BasicBlockListTy = std::vector<BasicBlock*>;
|
|
using BasicBlockMapTy = std::map<const BasicBlock*, BasicBlockListTy>;
|
|
|
|
public:
|
|
// For compliance with the dominance tree computation, entry nodes are
|
|
// connected to a single dummy node.
|
|
BasicBlockSuccessorHelper(Function& func, const BasicBlock* dummy_start_node,
|
|
bool post);
|
|
|
|
// CFA::CalculateDominators requires std::vector<BasicBlock*>.
|
|
using GetBlocksFunction =
|
|
std::function<const std::vector<BasicBlock*>*(const BasicBlock*)>;
|
|
|
|
// Returns the list of predecessor functions.
|
|
GetBlocksFunction GetPredFunctor() {
|
|
return [this](const BasicBlock* bb) {
|
|
BasicBlockListTy* v = &this->predecessors_[bb];
|
|
return v;
|
|
};
|
|
}
|
|
|
|
// Returns a vector of the list of successor nodes from a given node.
|
|
GetBlocksFunction GetSuccessorFunctor() {
|
|
return [this](const BasicBlock* bb) {
|
|
BasicBlockListTy* v = &this->successors_[bb];
|
|
return v;
|
|
};
|
|
}
|
|
|
|
private:
|
|
bool invert_graph_;
|
|
BasicBlockMapTy successors_;
|
|
BasicBlockMapTy predecessors_;
|
|
|
|
// Build the successors and predecessors map for each basic blocks |f|.
|
|
// If |invert_graph_| is true, all edges are reversed (successors becomes
|
|
// predecessors and vice versa).
|
|
// For convenience, the start of the graph is |dummy_start_node|.
|
|
// The dominator tree construction requires a unique entry node, which cannot
|
|
// be guaranteed for the postdominator graph. The |dummy_start_node| BB is
|
|
// here to gather all entry nodes.
|
|
void CreateSuccessorMap(Function& f, const BasicBlock* dummy_start_node);
|
|
};
|
|
|
|
template <typename BBType>
|
|
BasicBlockSuccessorHelper<BBType>::BasicBlockSuccessorHelper(
|
|
Function& func, const BasicBlock* dummy_start_node, bool invert)
|
|
: invert_graph_(invert) {
|
|
CreateSuccessorMap(func, dummy_start_node);
|
|
}
|
|
|
|
template <typename BBType>
|
|
void BasicBlockSuccessorHelper<BBType>::CreateSuccessorMap(
|
|
Function& f, const BasicBlock* dummy_start_node) {
|
|
std::map<uint32_t, BasicBlock*> id_to_BB_map;
|
|
auto GetSuccessorBasicBlock = [&f, &id_to_BB_map](uint32_t successor_id) {
|
|
BasicBlock*& Succ = id_to_BB_map[successor_id];
|
|
if (!Succ) {
|
|
for (BasicBlock& BBIt : f) {
|
|
if (successor_id == BBIt.id()) {
|
|
Succ = &BBIt;
|
|
break;
|
|
}
|
|
}
|
|
}
|
|
return Succ;
|
|
};
|
|
|
|
if (invert_graph_) {
|
|
// For the post dominator tree, we see the inverted graph.
|
|
// successors_ in the inverted graph are the predecessors in the CFG.
|
|
// The tree construction requires 1 entry point, so we add a dummy node
|
|
// that is connected to all function exiting basic blocks.
|
|
// An exiting basic block is a block with an OpKill, OpUnreachable,
|
|
// OpReturn or OpReturnValue as terminator instruction.
|
|
for (BasicBlock& bb : f) {
|
|
if (bb.hasSuccessor()) {
|
|
BasicBlockListTy& pred_list = predecessors_[&bb];
|
|
bb.ForEachSuccessorLabel(
|
|
[this, &pred_list, &bb,
|
|
&GetSuccessorBasicBlock](const uint32_t successor_id) {
|
|
BasicBlock* succ = GetSuccessorBasicBlock(successor_id);
|
|
// Inverted graph: our successors in the CFG
|
|
// are our predecessors in the inverted graph.
|
|
this->successors_[succ].push_back(&bb);
|
|
pred_list.push_back(succ);
|
|
});
|
|
} else {
|
|
successors_[dummy_start_node].push_back(&bb);
|
|
predecessors_[&bb].push_back(const_cast<BasicBlock*>(dummy_start_node));
|
|
}
|
|
}
|
|
} else {
|
|
// Technically, this is not needed, but it unifies
|
|
// the handling of dominator and postdom tree later on.
|
|
successors_[dummy_start_node].push_back(f.entry().get());
|
|
predecessors_[f.entry().get()].push_back(
|
|
const_cast<BasicBlock*>(dummy_start_node));
|
|
for (BasicBlock& bb : f) {
|
|
BasicBlockListTy& succ_list = successors_[&bb];
|
|
|
|
bb.ForEachSuccessorLabel([&](const uint32_t successor_id) {
|
|
BasicBlock* succ = GetSuccessorBasicBlock(successor_id);
|
|
succ_list.push_back(succ);
|
|
predecessors_[succ].push_back(&bb);
|
|
});
|
|
}
|
|
}
|
|
}
|
|
|
|
} // namespace
|
|
|
|
namespace spvtools {
|
|
namespace opt {
|
|
|
|
bool DominatorTree::StrictlyDominates(uint32_t a, uint32_t b) const {
|
|
if (a == b) return false;
|
|
return Dominates(a, b);
|
|
}
|
|
|
|
bool DominatorTree::StrictlyDominates(const ir::BasicBlock* a,
|
|
const ir::BasicBlock* b) const {
|
|
return DominatorTree::StrictlyDominates(a->id(), b->id());
|
|
}
|
|
|
|
bool DominatorTree::Dominates(uint32_t a, uint32_t b) const {
|
|
// Check that both of the inputs are actual nodes.
|
|
auto a_itr = nodes_.find(a);
|
|
auto b_itr = nodes_.find(b);
|
|
if (a_itr == nodes_.end() || b_itr == nodes_.end()) return false;
|
|
|
|
// Node A dominates node B if they are the same.
|
|
if (a == b) return true;
|
|
const DominatorTreeNode* nodeA = &a_itr->second;
|
|
const DominatorTreeNode* nodeB = &b_itr->second;
|
|
|
|
if (nodeA->dfs_num_pre_ < nodeB->dfs_num_pre_ &&
|
|
nodeA->dfs_num_post_ > nodeB->dfs_num_post_) {
|
|
return true;
|
|
}
|
|
|
|
return false;
|
|
}
|
|
|
|
bool DominatorTree::Dominates(const ir::BasicBlock* A,
|
|
const ir::BasicBlock* B) const {
|
|
return Dominates(A->id(), B->id());
|
|
}
|
|
|
|
ir::BasicBlock* DominatorTree::ImmediateDominator(
|
|
const ir::BasicBlock* A) const {
|
|
return ImmediateDominator(A->id());
|
|
}
|
|
|
|
ir::BasicBlock* DominatorTree::ImmediateDominator(uint32_t a) const {
|
|
// Check that A is a valid node in the tree.
|
|
auto a_itr = nodes_.find(a);
|
|
if (a_itr == nodes_.end()) return nullptr;
|
|
|
|
const DominatorTreeNode* node = &a_itr->second;
|
|
|
|
if (node->parent_ == nullptr) {
|
|
return nullptr;
|
|
}
|
|
|
|
return node->parent_->bb_;
|
|
}
|
|
|
|
DominatorTreeNode* DominatorTree::GetOrInsertNode(ir::BasicBlock* bb) {
|
|
DominatorTreeNode* dtn = nullptr;
|
|
|
|
std::map<uint32_t, DominatorTreeNode>::iterator node_iter =
|
|
nodes_.find(bb->id());
|
|
if (node_iter == nodes_.end()) {
|
|
dtn = &nodes_.emplace(std::make_pair(bb->id(), DominatorTreeNode{bb}))
|
|
.first->second;
|
|
} else
|
|
dtn = &node_iter->second;
|
|
|
|
return dtn;
|
|
}
|
|
|
|
void DominatorTree::GetDominatorEdges(
|
|
const ir::Function* f, const ir::BasicBlock* dummy_start_node,
|
|
std::vector<std::pair<ir::BasicBlock*, ir::BasicBlock*>>* edges) {
|
|
// Each time the depth first traversal calls the postorder callback
|
|
// std::function we push that node into the postorder vector to create our
|
|
// postorder list.
|
|
std::vector<const ir::BasicBlock*> postorder;
|
|
auto postorder_function = [&](const ir::BasicBlock* b) {
|
|
postorder.push_back(b);
|
|
};
|
|
|
|
// CFA::CalculateDominators requires std::vector<ir::BasicBlock*>
|
|
// BB are derived from F, so we need to const cast it at some point
|
|
// no modification is made on F.
|
|
BasicBlockSuccessorHelper<ir::BasicBlock> helper{
|
|
*const_cast<ir::Function*>(f), dummy_start_node, postdominator_};
|
|
|
|
// The successor function tells DepthFirstTraversal how to move to successive
|
|
// nodes by providing an interface to get a list of successor nodes from any
|
|
// given node.
|
|
auto successor_functor = helper.GetSuccessorFunctor();
|
|
|
|
// The predecessor functor does the same as the successor functor
|
|
// but for all nodes preceding a given node.
|
|
auto predecessor_functor = helper.GetPredFunctor();
|
|
|
|
// If we're building a post dominator tree we traverse the tree in reverse
|
|
// using the predecessor function in place of the successor function and vice
|
|
// versa.
|
|
DepthFirstSearchPostOrder(dummy_start_node, successor_functor,
|
|
postorder_function);
|
|
*edges =
|
|
CFA<ir::BasicBlock>::CalculateDominators(postorder, predecessor_functor);
|
|
}
|
|
|
|
void DominatorTree::InitializeTree(const ir::Function* f, const ir::CFG& cfg) {
|
|
ClearTree();
|
|
|
|
// Skip over empty functions.
|
|
if (f->cbegin() == f->cend()) {
|
|
return;
|
|
}
|
|
|
|
const ir::BasicBlock* dummy_start_node =
|
|
postdominator_ ? cfg.pseudo_exit_block() : cfg.pseudo_entry_block();
|
|
|
|
// Get the immediate dominator for each node.
|
|
std::vector<std::pair<ir::BasicBlock*, ir::BasicBlock*>> edges;
|
|
GetDominatorEdges(f, dummy_start_node, &edges);
|
|
|
|
// Transform the vector<pair> into the tree structure which we can use to
|
|
// efficiently query dominance.
|
|
for (auto edge : edges) {
|
|
DominatorTreeNode* first = GetOrInsertNode(edge.first);
|
|
|
|
if (edge.first == edge.second) {
|
|
if (std::find(roots_.begin(), roots_.end(), first) == roots_.end())
|
|
roots_.push_back(first);
|
|
continue;
|
|
}
|
|
|
|
DominatorTreeNode* second = GetOrInsertNode(edge.second);
|
|
|
|
first->parent_ = second;
|
|
second->children_.push_back(first);
|
|
}
|
|
|
|
int index = 0;
|
|
auto preFunc = [&index](const DominatorTreeNode* node) {
|
|
const_cast<DominatorTreeNode*>(node)->dfs_num_pre_ = ++index;
|
|
};
|
|
|
|
auto postFunc = [&index](const DominatorTreeNode* node) {
|
|
const_cast<DominatorTreeNode*>(node)->dfs_num_post_ = ++index;
|
|
};
|
|
|
|
auto getSucc = [](const DominatorTreeNode* node) { return &node->children_; };
|
|
|
|
for (auto root : roots_) DepthFirstSearch(root, getSucc, preFunc, postFunc);
|
|
}
|
|
|
|
void DominatorTree::DumpTreeAsDot(std::ostream& out_stream) const {
|
|
out_stream << "digraph {\n";
|
|
Visit([&out_stream](const DominatorTreeNode* node) {
|
|
// Print the node.
|
|
if (node->bb_) {
|
|
out_stream << node->bb_->id() << "[label=\"" << node->bb_->id()
|
|
<< "\"];\n";
|
|
}
|
|
|
|
// Print the arrow from the parent to this node. Entry nodes will not have
|
|
// parents so draw them as children from the dummy node.
|
|
if (node->parent_) {
|
|
out_stream << node->parent_->bb_->id() << " -> " << node->bb_->id()
|
|
<< ";\n";
|
|
}
|
|
|
|
// Return true to continue the traversal.
|
|
return true;
|
|
});
|
|
out_stream << "}\n";
|
|
}
|
|
|
|
} // namespace opt
|
|
} // namespace spvtools
|