| 1 | // Copyright (c) 2015-2016 The Khronos Group Inc. | 
|---|
| 2 | // | 
|---|
| 3 | // Licensed under the Apache License, Version 2.0 (the "License"); | 
|---|
| 4 | // you may not use this file except in compliance with the License. | 
|---|
| 5 | // You may obtain a copy of the License at | 
|---|
| 6 | // | 
|---|
| 7 | //     http://www.apache.org/licenses/LICENSE-2.0 | 
|---|
| 8 | // | 
|---|
| 9 | // Unless required by applicable law or agreed to in writing, software | 
|---|
| 10 | // distributed under the License is distributed on an "AS IS" BASIS, | 
|---|
| 11 | // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | 
|---|
| 12 | // See the License for the specific language governing permissions and | 
|---|
| 13 | // limitations under the License. | 
|---|
| 14 |  | 
|---|
| 15 | #ifndef SOURCE_CFA_H_ | 
|---|
| 16 | #define SOURCE_CFA_H_ | 
|---|
| 17 |  | 
|---|
| 18 | #include <algorithm> | 
|---|
| 19 | #include <cassert> | 
|---|
| 20 | #include <cstdint> | 
|---|
| 21 | #include <functional> | 
|---|
| 22 | #include <map> | 
|---|
| 23 | #include <unordered_map> | 
|---|
| 24 | #include <unordered_set> | 
|---|
| 25 | #include <utility> | 
|---|
| 26 | #include <vector> | 
|---|
| 27 |  | 
|---|
| 28 | namespace spvtools { | 
|---|
| 29 |  | 
|---|
| 30 | // Control Flow Analysis of control flow graphs of basic block nodes |BB|. | 
|---|
| 31 | template <class BB> | 
|---|
| 32 | class CFA { | 
|---|
| 33 | using bb_ptr = BB*; | 
|---|
| 34 | using cbb_ptr = const BB*; | 
|---|
| 35 | using bb_iter = typename std::vector<BB*>::const_iterator; | 
|---|
| 36 | using get_blocks_func = std::function<const std::vector<BB*>*(const BB*)>; | 
|---|
| 37 |  | 
|---|
| 38 | struct block_info { | 
|---|
| 39 | cbb_ptr block;  ///< pointer to the block | 
|---|
| 40 | bb_iter iter;   ///< Iterator to the current child node being processed | 
|---|
| 41 | }; | 
|---|
| 42 |  | 
|---|
| 43 | /// Returns true if a block with @p id is found in the @p work_list vector | 
|---|
| 44 | /// | 
|---|
| 45 | /// @param[in] work_list  Set of blocks visited in the the depth first | 
|---|
| 46 | /// traversal | 
|---|
| 47 | ///                       of the CFG | 
|---|
| 48 | /// @param[in] id         The ID of the block being checked | 
|---|
| 49 | /// | 
|---|
| 50 | /// @return true if the edge work_list.back().block->id() => id is a back-edge | 
|---|
| 51 | static bool FindInWorkList(const std::vector<block_info>& work_list, | 
|---|
| 52 | uint32_t id); | 
|---|
| 53 |  | 
|---|
| 54 | public: | 
|---|
| 55 | /// @brief Depth first traversal starting from the \p entry BasicBlock | 
|---|
| 56 | /// | 
|---|
| 57 | /// This function performs a depth first traversal from the \p entry | 
|---|
| 58 | /// BasicBlock and calls the pre/postorder functions when it needs to process | 
|---|
| 59 | /// the node in pre order, post order. It also calls the backedge function | 
|---|
| 60 | /// when a back edge is encountered. | 
|---|
| 61 | /// | 
|---|
| 62 | /// @param[in] entry      The root BasicBlock of a CFG | 
|---|
| 63 | /// @param[in] successor_func  A function which will return a pointer to the | 
|---|
| 64 | ///                            successor nodes | 
|---|
| 65 | /// @param[in] preorder   A function that will be called for every block in a | 
|---|
| 66 | ///                       CFG following preorder traversal semantics | 
|---|
| 67 | /// @param[in] postorder  A function that will be called for every block in a | 
|---|
| 68 | ///                       CFG following postorder traversal semantics | 
|---|
| 69 | /// @param[in] backedge   A function that will be called when a backedge is | 
|---|
| 70 | ///                       encountered during a traversal | 
|---|
| 71 | /// NOTE: The @p successor_func and predecessor_func each return a pointer to | 
|---|
| 72 | /// a | 
|---|
| 73 | /// collection such that iterators to that collection remain valid for the | 
|---|
| 74 | /// lifetime of the algorithm. | 
|---|
| 75 | static void DepthFirstTraversal( | 
|---|
| 76 | const BB* entry, get_blocks_func successor_func, | 
|---|
| 77 | std::function<void(cbb_ptr)> preorder, | 
|---|
| 78 | std::function<void(cbb_ptr)> postorder, | 
|---|
| 79 | std::function<void(cbb_ptr, cbb_ptr)> backedge); | 
|---|
| 80 |  | 
|---|
| 81 | /// @brief Calculates dominator edges for a set of blocks | 
|---|
| 82 | /// | 
|---|
| 83 | /// Computes dominators using the algorithm of Cooper, Harvey, and Kennedy | 
|---|
| 84 | /// "A Simple, Fast Dominance Algorithm", 2001. | 
|---|
| 85 | /// | 
|---|
| 86 | /// The algorithm assumes there is a unique root node (a node without | 
|---|
| 87 | /// predecessors), and it is therefore at the end of the postorder vector. | 
|---|
| 88 | /// | 
|---|
| 89 | /// This function calculates the dominator edges for a set of blocks in the | 
|---|
| 90 | /// CFG. | 
|---|
| 91 | /// Uses the dominator algorithm by Cooper et al. | 
|---|
| 92 | /// | 
|---|
| 93 | /// @param[in] postorder        A vector of blocks in post order traversal | 
|---|
| 94 | /// order | 
|---|
| 95 | ///                             in a CFG | 
|---|
| 96 | /// @param[in] predecessor_func Function used to get the predecessor nodes of | 
|---|
| 97 | /// a | 
|---|
| 98 | ///                             block | 
|---|
| 99 | /// | 
|---|
| 100 | /// @return the dominator tree of the graph, as a vector of pairs of nodes. | 
|---|
| 101 | /// The first node in the pair is a node in the graph. The second node in the | 
|---|
| 102 | /// pair is its immediate dominator in the sense of Cooper et.al., where a | 
|---|
| 103 | /// block | 
|---|
| 104 | /// without predecessors (such as the root node) is its own immediate | 
|---|
| 105 | /// dominator. | 
|---|
| 106 | static std::vector<std::pair<BB*, BB*>> CalculateDominators( | 
|---|
| 107 | const std::vector<cbb_ptr>& postorder, get_blocks_func predecessor_func); | 
|---|
| 108 |  | 
|---|
| 109 | // Computes a minimal set of root nodes required to traverse, in the forward | 
|---|
| 110 | // direction, the CFG represented by the given vector of blocks, and successor | 
|---|
| 111 | // and predecessor functions.  When considering adding two nodes, each having | 
|---|
| 112 | // predecessors, favour using the one that appears earlier on the input blocks | 
|---|
| 113 | // list. | 
|---|
| 114 | static std::vector<BB*> TraversalRoots(const std::vector<BB*>& blocks, | 
|---|
| 115 | get_blocks_func succ_func, | 
|---|
| 116 | get_blocks_func pred_func); | 
|---|
| 117 |  | 
|---|
| 118 | static void ComputeAugmentedCFG( | 
|---|
| 119 | std::vector<BB*>& ordered_blocks, BB* pseudo_entry_block, | 
|---|
| 120 | BB* pseudo_exit_block, | 
|---|
| 121 | std::unordered_map<const BB*, std::vector<BB*>>* augmented_successors_map, | 
|---|
| 122 | std::unordered_map<const BB*, std::vector<BB*>>* | 
|---|
| 123 | augmented_predecessors_map, | 
|---|
| 124 | get_blocks_func succ_func, get_blocks_func pred_func); | 
|---|
| 125 | }; | 
|---|
| 126 |  | 
|---|
| 127 | template <class BB> | 
|---|
| 128 | bool CFA<BB>::FindInWorkList(const std::vector<block_info>& work_list, | 
|---|
| 129 | uint32_t id) { | 
|---|
| 130 | for (const auto b : work_list) { | 
|---|
| 131 | if (b.block->id() == id) return true; | 
|---|
| 132 | } | 
|---|
| 133 | return false; | 
|---|
| 134 | } | 
|---|
| 135 |  | 
|---|
| 136 | template <class BB> | 
|---|
| 137 | void CFA<BB>::DepthFirstTraversal( | 
|---|
| 138 | const BB* entry, get_blocks_func successor_func, | 
|---|
| 139 | std::function<void(cbb_ptr)> preorder, | 
|---|
| 140 | std::function<void(cbb_ptr)> postorder, | 
|---|
| 141 | std::function<void(cbb_ptr, cbb_ptr)> backedge) { | 
|---|
| 142 | std::unordered_set<uint32_t> processed; | 
|---|
| 143 |  | 
|---|
| 144 | /// NOTE: work_list is the sequence of nodes from the root node to the node | 
|---|
| 145 | /// being processed in the traversal | 
|---|
| 146 | std::vector<block_info> work_list; | 
|---|
| 147 | work_list.reserve(10); | 
|---|
| 148 |  | 
|---|
| 149 | work_list.push_back({entry, std::begin(*successor_func(entry))}); | 
|---|
| 150 | preorder(entry); | 
|---|
| 151 | processed.insert(entry->id()); | 
|---|
| 152 |  | 
|---|
| 153 | while (!work_list.empty()) { | 
|---|
| 154 | block_info& top = work_list.back(); | 
|---|
| 155 | if (top.iter == end(*successor_func(top.block))) { | 
|---|
| 156 | postorder(top.block); | 
|---|
| 157 | work_list.pop_back(); | 
|---|
| 158 | } else { | 
|---|
| 159 | BB* child = *top.iter; | 
|---|
| 160 | top.iter++; | 
|---|
| 161 | if (FindInWorkList(work_list, child->id())) { | 
|---|
| 162 | backedge(top.block, child); | 
|---|
| 163 | } | 
|---|
| 164 | if (processed.count(child->id()) == 0) { | 
|---|
| 165 | preorder(child); | 
|---|
| 166 | work_list.emplace_back( | 
|---|
| 167 | block_info{child, std::begin(*successor_func(child))}); | 
|---|
| 168 | processed.insert(child->id()); | 
|---|
| 169 | } | 
|---|
| 170 | } | 
|---|
| 171 | } | 
|---|
| 172 | } | 
|---|
| 173 |  | 
|---|
| 174 | template <class BB> | 
|---|
| 175 | std::vector<std::pair<BB*, BB*>> CFA<BB>::CalculateDominators( | 
|---|
| 176 | const std::vector<cbb_ptr>& postorder, get_blocks_func predecessor_func) { | 
|---|
| 177 | struct block_detail { | 
|---|
| 178 | size_t dominator;  ///< The index of blocks's dominator in post order array | 
|---|
| 179 | size_t postorder_index;  ///< The index of the block in the post order array | 
|---|
| 180 | }; | 
|---|
| 181 | const size_t undefined_dom = postorder.size(); | 
|---|
| 182 |  | 
|---|
| 183 | std::unordered_map<cbb_ptr, block_detail> idoms; | 
|---|
| 184 | for (size_t i = 0; i < postorder.size(); i++) { | 
|---|
| 185 | idoms[postorder[i]] = {undefined_dom, i}; | 
|---|
| 186 | } | 
|---|
| 187 | idoms[postorder.back()].dominator = idoms[postorder.back()].postorder_index; | 
|---|
| 188 |  | 
|---|
| 189 | bool changed = true; | 
|---|
| 190 | while (changed) { | 
|---|
| 191 | changed = false; | 
|---|
| 192 | for (auto b = postorder.rbegin() + 1; b != postorder.rend(); ++b) { | 
|---|
| 193 | const std::vector<BB*>& predecessors = *predecessor_func(*b); | 
|---|
| 194 | // Find the first processed/reachable predecessor that is reachable | 
|---|
| 195 | // in the forward traversal. | 
|---|
| 196 | auto res = std::find_if(std::begin(predecessors), std::end(predecessors), | 
|---|
| 197 | [&idoms, undefined_dom](BB* pred) { | 
|---|
| 198 | return idoms.count(pred) && | 
|---|
| 199 | idoms[pred].dominator != undefined_dom; | 
|---|
| 200 | }); | 
|---|
| 201 | if (res == end(predecessors)) continue; | 
|---|
| 202 | const BB* idom = *res; | 
|---|
| 203 | size_t idom_idx = idoms[idom].postorder_index; | 
|---|
| 204 |  | 
|---|
| 205 | // all other predecessors | 
|---|
| 206 | for (const auto* p : predecessors) { | 
|---|
| 207 | if (idom == p) continue; | 
|---|
| 208 | // Only consider nodes reachable in the forward traversal. | 
|---|
| 209 | // Otherwise the intersection doesn't make sense and will never | 
|---|
| 210 | // terminate. | 
|---|
| 211 | if (!idoms.count(p)) continue; | 
|---|
| 212 | if (idoms[p].dominator != undefined_dom) { | 
|---|
| 213 | size_t finger1 = idoms[p].postorder_index; | 
|---|
| 214 | size_t finger2 = idom_idx; | 
|---|
| 215 | while (finger1 != finger2) { | 
|---|
| 216 | while (finger1 < finger2) { | 
|---|
| 217 | finger1 = idoms[postorder[finger1]].dominator; | 
|---|
| 218 | } | 
|---|
| 219 | while (finger2 < finger1) { | 
|---|
| 220 | finger2 = idoms[postorder[finger2]].dominator; | 
|---|
| 221 | } | 
|---|
| 222 | } | 
|---|
| 223 | idom_idx = finger1; | 
|---|
| 224 | } | 
|---|
| 225 | } | 
|---|
| 226 | if (idoms[*b].dominator != idom_idx) { | 
|---|
| 227 | idoms[*b].dominator = idom_idx; | 
|---|
| 228 | changed = true; | 
|---|
| 229 | } | 
|---|
| 230 | } | 
|---|
| 231 | } | 
|---|
| 232 |  | 
|---|
| 233 | std::vector<std::pair<bb_ptr, bb_ptr>> out; | 
|---|
| 234 | for (auto idom : idoms) { | 
|---|
| 235 | // NOTE: performing a const cast for convenient usage with | 
|---|
| 236 | // UpdateImmediateDominators | 
|---|
| 237 | out.push_back({const_cast<BB*>(std::get<0>(idom)), | 
|---|
| 238 | const_cast<BB*>(postorder[std::get<1>(idom).dominator])}); | 
|---|
| 239 | } | 
|---|
| 240 |  | 
|---|
| 241 | // Sort by postorder index to generate a deterministic ordering of edges. | 
|---|
| 242 | std::sort( | 
|---|
| 243 | out.begin(), out.end(), | 
|---|
| 244 | [&idoms](const std::pair<bb_ptr, bb_ptr>& lhs, | 
|---|
| 245 | const std::pair<bb_ptr, bb_ptr>& rhs) { | 
|---|
| 246 | assert(lhs.first); | 
|---|
| 247 | assert(lhs.second); | 
|---|
| 248 | assert(rhs.first); | 
|---|
| 249 | assert(rhs.second); | 
|---|
| 250 | auto lhs_indices = std::make_pair(idoms[lhs.first].postorder_index, | 
|---|
| 251 | idoms[lhs.second].postorder_index); | 
|---|
| 252 | auto rhs_indices = std::make_pair(idoms[rhs.first].postorder_index, | 
|---|
| 253 | idoms[rhs.second].postorder_index); | 
|---|
| 254 | return lhs_indices < rhs_indices; | 
|---|
| 255 | }); | 
|---|
| 256 | return out; | 
|---|
| 257 | } | 
|---|
| 258 |  | 
|---|
| 259 | template <class BB> | 
|---|
| 260 | std::vector<BB*> CFA<BB>::TraversalRoots(const std::vector<BB*>& blocks, | 
|---|
| 261 | get_blocks_func succ_func, | 
|---|
| 262 | get_blocks_func pred_func) { | 
|---|
| 263 | // The set of nodes which have been visited from any of the roots so far. | 
|---|
| 264 | std::unordered_set<const BB*> visited; | 
|---|
| 265 |  | 
|---|
| 266 | auto mark_visited = [&visited](const BB* b) { visited.insert(b); }; | 
|---|
| 267 | auto ignore_block = [](const BB*) {}; | 
|---|
| 268 | auto ignore_blocks = [](const BB*, const BB*) {}; | 
|---|
| 269 |  | 
|---|
| 270 | auto traverse_from_root = [&mark_visited, &succ_func, &ignore_block, | 
|---|
| 271 | &ignore_blocks](const BB* entry) { | 
|---|
| 272 | DepthFirstTraversal(entry, succ_func, mark_visited, ignore_block, | 
|---|
| 273 | ignore_blocks); | 
|---|
| 274 | }; | 
|---|
| 275 |  | 
|---|
| 276 | std::vector<BB*> result; | 
|---|
| 277 |  | 
|---|
| 278 | // First collect nodes without predecessors. | 
|---|
| 279 | for (auto block : blocks) { | 
|---|
| 280 | if (pred_func(block)->empty()) { | 
|---|
| 281 | assert(visited.count(block) == 0 && "Malformed graph!"); | 
|---|
| 282 | result.push_back(block); | 
|---|
| 283 | traverse_from_root(block); | 
|---|
| 284 | } | 
|---|
| 285 | } | 
|---|
| 286 |  | 
|---|
| 287 | // Now collect other stranded nodes.  These must be in unreachable cycles. | 
|---|
| 288 | for (auto block : blocks) { | 
|---|
| 289 | if (visited.count(block) == 0) { | 
|---|
| 290 | result.push_back(block); | 
|---|
| 291 | traverse_from_root(block); | 
|---|
| 292 | } | 
|---|
| 293 | } | 
|---|
| 294 |  | 
|---|
| 295 | return result; | 
|---|
| 296 | } | 
|---|
| 297 |  | 
|---|
| 298 | template <class BB> | 
|---|
| 299 | void CFA<BB>::ComputeAugmentedCFG( | 
|---|
| 300 | std::vector<BB*>& ordered_blocks, BB* pseudo_entry_block, | 
|---|
| 301 | BB* pseudo_exit_block, | 
|---|
| 302 | std::unordered_map<const BB*, std::vector<BB*>>* augmented_successors_map, | 
|---|
| 303 | std::unordered_map<const BB*, std::vector<BB*>>* augmented_predecessors_map, | 
|---|
| 304 | get_blocks_func succ_func, get_blocks_func pred_func) { | 
|---|
| 305 | // Compute the successors of the pseudo-entry block, and | 
|---|
| 306 | // the predecessors of the pseudo exit block. | 
|---|
| 307 | auto sources = TraversalRoots(ordered_blocks, succ_func, pred_func); | 
|---|
| 308 |  | 
|---|
| 309 | // For the predecessor traversals, reverse the order of blocks.  This | 
|---|
| 310 | // will affect the post-dominance calculation as follows: | 
|---|
| 311 | //  - Suppose you have blocks A and B, with A appearing before B in | 
|---|
| 312 | //    the list of blocks. | 
|---|
| 313 | //  - Also, A branches only to B, and B branches only to A. | 
|---|
| 314 | //  - We want to compute A as dominating B, and B as post-dominating B. | 
|---|
| 315 | // By using reversed blocks for predecessor traversal roots discovery, | 
|---|
| 316 | // we'll add an edge from B to the pseudo-exit node, rather than from A. | 
|---|
| 317 | // All this is needed to correctly process the dominance/post-dominance | 
|---|
| 318 | // constraint when A is a loop header that points to itself as its | 
|---|
| 319 | // own continue target, and B is the latch block for the loop. | 
|---|
| 320 | std::vector<BB*> reversed_blocks(ordered_blocks.rbegin(), | 
|---|
| 321 | ordered_blocks.rend()); | 
|---|
| 322 | auto sinks = TraversalRoots(reversed_blocks, pred_func, succ_func); | 
|---|
| 323 |  | 
|---|
| 324 | // Wire up the pseudo entry block. | 
|---|
| 325 | (*augmented_successors_map)[pseudo_entry_block] = sources; | 
|---|
| 326 | for (auto block : sources) { | 
|---|
| 327 | auto& augmented_preds = (*augmented_predecessors_map)[block]; | 
|---|
| 328 | const auto preds = pred_func(block); | 
|---|
| 329 | augmented_preds.reserve(1 + preds->size()); | 
|---|
| 330 | augmented_preds.push_back(pseudo_entry_block); | 
|---|
| 331 | augmented_preds.insert(augmented_preds.end(), preds->begin(), preds->end()); | 
|---|
| 332 | } | 
|---|
| 333 |  | 
|---|
| 334 | // Wire up the pseudo exit block. | 
|---|
| 335 | (*augmented_predecessors_map)[pseudo_exit_block] = sinks; | 
|---|
| 336 | for (auto block : sinks) { | 
|---|
| 337 | auto& augmented_succ = (*augmented_successors_map)[block]; | 
|---|
| 338 | const auto succ = succ_func(block); | 
|---|
| 339 | augmented_succ.reserve(1 + succ->size()); | 
|---|
| 340 | augmented_succ.push_back(pseudo_exit_block); | 
|---|
| 341 | augmented_succ.insert(augmented_succ.end(), succ->begin(), succ->end()); | 
|---|
| 342 | } | 
|---|
| 343 | } | 
|---|
| 344 |  | 
|---|
| 345 | }  // namespace spvtools | 
|---|
| 346 |  | 
|---|
| 347 | #endif  // SOURCE_CFA_H_ | 
|---|
| 348 |  | 
|---|