cfa.h source code [Skia/third_party/externals/spirv-tools/source/cfa.h]

1	// Copyright (c) 2015-2016 The Khronos Group Inc.
2	//
3	// Licensed under the Apache License, Version 2.0 (the "License");
4	// you may not use this file except in compliance with the License.
5	// You may obtain a copy of the License at
6	//
7	// http://www.apache.org/licenses/LICENSE-2.0
8	//
9	// Unless required by applicable law or agreed to in writing, software
10	// distributed under the License is distributed on an "AS IS" BASIS,
11	// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12	// See the License for the specific language governing permissions and
13	// limitations under the License.
14
15	#ifndef SOURCE_CFA_H_
16	#define SOURCE_CFA_H_
17
18	#include <algorithm>
19	#include <cassert>
20	#include <cstdint>
21	#include <functional>
22	#include <map>
23	#include <unordered_map>
24	#include <unordered_set>
25	#include <utility>
26	#include <vector>
27
28	namespace spvtools {
29
30	// Control Flow Analysis of control flow graphs of basic block nodes \|BB\|.
31	template <class BB>
32	class CFA {
33	using bb_ptr = BB*;
34	using cbb_ptr = const BB*;
35	using bb_iter = typename std::vector<BB*>::const_iterator;
36	using get_blocks_func = std::function<const std::vector<BB>(const BB*)>;
37
38	struct block_info {
39	cbb_ptr block; ///< pointer to the block
40	bb_iter iter; ///< Iterator to the current child node being processed
41	};
42
43	/// Returns true if a block with @p id is found in the @p work_list vector
44	///
45	/// @param[in] work_list Set of blocks visited in the the depth first
46	/// traversal
47	/// of the CFG
48	/// @param[in] id The ID of the block being checked
49	///
50	/// @return true if the edge work_list.back().block->id() => id is a back-edge
51	static bool FindInWorkList(const std::vector<block_info>& work_list,
52	uint32_t id);
53
54	public:
55	/// @brief Depth first traversal starting from the \p entry BasicBlock
56	///
57	/// This function performs a depth first traversal from the \p entry
58	/// BasicBlock and calls the pre/postorder functions when it needs to process
59	/// the node in pre order, post order. It also calls the backedge function
60	/// when a back edge is encountered.
61	///
62	/// @param[in] entry The root BasicBlock of a CFG
63	/// @param[in] successor_func A function which will return a pointer to the
64	/// successor nodes
65	/// @param[in] preorder A function that will be called for every block in a
66	/// CFG following preorder traversal semantics
67	/// @param[in] postorder A function that will be called for every block in a
68	/// CFG following postorder traversal semantics
69	/// @param[in] backedge A function that will be called when a backedge is
70	/// encountered during a traversal
71	/// NOTE: The @p successor_func and predecessor_func each return a pointer to
72	/// a
73	/// collection such that iterators to that collection remain valid for the
74	/// lifetime of the algorithm.
75	static void DepthFirstTraversal(
76	const BB* entry, get_blocks_func successor_func,
77	std::function<void(cbb_ptr)> preorder,
78	std::function<void(cbb_ptr)> postorder,
79	std::function<void(cbb_ptr, cbb_ptr)> backedge);
80
81	/// @brief Calculates dominator edges for a set of blocks
82	///
83	/// Computes dominators using the algorithm of Cooper, Harvey, and Kennedy
84	/// "A Simple, Fast Dominance Algorithm", 2001.
85	///
86	/// The algorithm assumes there is a unique root node (a node without
87	/// predecessors), and it is therefore at the end of the postorder vector.
88	///
89	/// This function calculates the dominator edges for a set of blocks in the
90	/// CFG.
91	/// Uses the dominator algorithm by Cooper et al.
92	///
93	/// @param[in] postorder A vector of blocks in post order traversal
94	/// order
95	/// in a CFG
96	/// @param[in] predecessor_func Function used to get the predecessor nodes of
97	/// a
98	/// block
99	///
100	/// @return the dominator tree of the graph, as a vector of pairs of nodes.
101	/// The first node in the pair is a node in the graph. The second node in the
102	/// pair is its immediate dominator in the sense of Cooper et.al., where a
103	/// block
104	/// without predecessors (such as the root node) is its own immediate
105	/// dominator.
106	static std::vector<std::pair<BB, BB>> CalculateDominators(
107	const std::vector<cbb_ptr>& postorder, get_blocks_func predecessor_func);
108
109	// Computes a minimal set of root nodes required to traverse, in the forward
110	// direction, the CFG represented by the given vector of blocks, and successor
111	// and predecessor functions. When considering adding two nodes, each having
112	// predecessors, favour using the one that appears earlier on the input blocks
113	// list.
114	static std::vector<BB> TraversalRoots(const* std::vector<BB*>& blocks,
115	get_blocks_func succ_func,
116	get_blocks_func pred_func);
117
118	static void ComputeAugmentedCFG(
119	std::vector<BB>& ordered_blocks, BB pseudo_entry_block,
120	BB* pseudo_exit_block,
121	std::unordered_map<const BB, std::vector<BB>>* augmented_successors_map,
122	std::unordered_map<const BB, std::vector<BB>>*
123	augmented_predecessors_map,
124	get_blocks_func succ_func, get_blocks_func pred_func);
125	};
126
127	template <class BB>
128	bool CFA<BB>::FindInWorkList(const std::vector<block_info>& work_list,
129	uint32_t id) {
130	for (const auto b : work_list) {
131	if (b.block->id() == id) return true;
132	}
133	return false;
134	}
135
136	template <class BB>
137	void CFA<BB>::DepthFirstTraversal(
138	const BB* entry, get_blocks_func successor_func,
139	std::function<void(cbb_ptr)> preorder,
140	std::function<void(cbb_ptr)> postorder,
141	std::function<void(cbb_ptr, cbb_ptr)> backedge) {
142	std::unordered_set<uint32_t> processed;
143
144	/// NOTE: work_list is the sequence of nodes from the root node to the node
145	/// being processed in the traversal
146	std::vector<block_info> work_list;
147	work_list.reserve(`10`);
148
149	work_list.push_back({entry, std::begin(*successor_func(entry))});
150	preorder(entry);
151	processed.insert(entry->id());
152
153	while (!work_list.empty()) {
154	block_info& top = work_list.back();
155	if (top.iter == end(*successor_func(top.block))) {
156	postorder(top.block);
157	work_list.pop_back();
158	} else {
159	BB* child = *top.iter;
160	top.iter++;
161	if (FindInWorkList(work_list, child->id())) {
162	backedge(top.block, child);
163	}
164	if (processed.count(child->id()) == `0`) {
165	preorder(child);
166	work_list.emplace_back(
167	block_info{child, std::begin(*successor_func(child))});
168	processed.insert(child->id());
169	}
170	}
171	}
172	}
173
174	template <class BB>
175	std::vector<std::pair<BB, BB>> CFA<BB>::CalculateDominators(
176	const std::vector<cbb_ptr>& postorder, get_blocks_func predecessor_func) {
177	struct block_detail {
178	size_t dominator; ///< The index of blocks's dominator in post order array
179	size_t postorder_index; ///< The index of the block in the post order array
180	};
181	const size_t undefined_dom = postorder.size();
182
183	std::unordered_map<cbb_ptr, block_detail> idoms;
184	for (size_t i = `0`; i < postorder.size(); i++) {
185	idoms[postorder[i]] = {undefined_dom, i};
186	}
187	idoms[postorder.back()].dominator = idoms[postorder.back()].postorder_index;
188
189	bool changed = true;
190	while (changed) {
191	changed = false;
192	for (auto b = postorder.rbegin() + `1`; b != postorder.rend(); ++b) {
193	const std::vector<BB>& predecessors = predecessor_func(*b);
194	// Find the first processed/reachable predecessor that is reachable
195	// in the forward traversal.
196	auto res = std::find_if(std::begin(predecessors), std::end(predecessors),
197	[&idoms, undefined_dom](BB* pred) {
198	return idoms.count(pred) &&
199	idoms[pred].dominator != undefined_dom;
200	});
201	if (res == end(predecessors)) continue;
202	const BB* idom = *res;
203	size_t idom_idx = idoms[idom].postorder_index;
204
205	// all other predecessors
206	for (const auto* p : predecessors) {
207	if (idom == p) continue;
208	// Only consider nodes reachable in the forward traversal.
209	// Otherwise the intersection doesn't make sense and will never
210	// terminate.
211	if (!idoms.count(p)) continue;
212	if (idoms[p].dominator != undefined_dom) {
213	size_t finger1 = idoms[p].postorder_index;
214	size_t finger2 = idom_idx;
215	while (finger1 != finger2) {
216	while (finger1 < finger2) {
217	finger1 = idoms[postorder[finger1]].dominator;
218	}
219	while (finger2 < finger1) {
220	finger2 = idoms[postorder[finger2]].dominator;
221	}
222	}
223	idom_idx = finger1;
224	}
225	}
226	if (idoms[*b].dominator != idom_idx) {
227	idoms[*b].dominator = idom_idx;
228	changed = true;
229	}
230	}
231	}
232
233	std::vector<std::pair<bb_ptr, bb_ptr>> out;
234	for (auto idom : idoms) {
235	// NOTE: performing a const cast for convenient usage with
236	// UpdateImmediateDominators
237	out.push_back({const_cast<BB*>(std::get<`0`>(idom)),
238	const_cast<BB*>(postorder[std::get<`1`>(idom).dominator])});
239	}
240
241	// Sort by postorder index to generate a deterministic ordering of edges.
242	std::sort(
243	out.begin(), out.end(),
244	[&idoms](const std::pair<bb_ptr, bb_ptr>& lhs,
245	const std::pair<bb_ptr, bb_ptr>& rhs) {
246	assert(lhs.first);
247	assert(lhs.second);
248	assert(rhs.first);
249	assert(rhs.second);
250	auto lhs_indices = std::make_pair(idoms[lhs.first].postorder_index,
251	idoms[lhs.second].postorder_index);
252	auto rhs_indices = std::make_pair(idoms[rhs.first].postorder_index,
253	idoms[rhs.second].postorder_index);
254	return lhs_indices < rhs_indices;
255	});
256	return out;
257	}
258
259	template <class BB>
260	std::vector<BB> CFA<BB>::TraversalRoots(const* std::vector<BB*>& blocks,
261	get_blocks_func succ_func,
262	get_blocks_func pred_func) {
263	// The set of nodes which have been visited from any of the roots so far.
264	std::unordered_set<const BB*> visited;
265
266	auto mark_visited = [&visited](const BB* b) { visited.insert(b); };
267	auto ignore_block = [](const BB*) {};
268	auto ignore_blocks = [](const BB, const* BB*) {};
269
270	auto traverse_from_root = [&mark_visited, &succ_func, &ignore_block,
271	&ignore_blocks](const BB* entry) {
272	DepthFirstTraversal(entry, succ_func, mark_visited, ignore_block,
273	ignore_blocks);
274	};
275
276	std::vector<BB*> result;
277
278	// First collect nodes without predecessors.
279	for (auto block : blocks) {
280	if (pred_func(block)->empty()) {
281	assert(visited.count(block) == `0` && "Malformed graph!");
282	result.push_back(block);
283	traverse_from_root(block);
284	}
285	}
286
287	// Now collect other stranded nodes. These must be in unreachable cycles.
288	for (auto block : blocks) {
289	if (visited.count(block) == `0`) {
290	result.push_back(block);
291	traverse_from_root(block);
292	}
293	}
294
295	return result;
296	}
297
298	template <class BB>
299	void CFA<BB>::ComputeAugmentedCFG(
300	std::vector<BB>& ordered_blocks, BB pseudo_entry_block,
301	BB* pseudo_exit_block,
302	std::unordered_map<const BB, std::vector<BB>>* augmented_successors_map,
303	std::unordered_map<const BB, std::vector<BB>>* augmented_predecessors_map,
304	get_blocks_func succ_func, get_blocks_func pred_func) {
305	// Compute the successors of the pseudo-entry block, and
306	// the predecessors of the pseudo exit block.
307	auto sources = TraversalRoots(ordered_blocks, succ_func, pred_func);
308
309	// For the predecessor traversals, reverse the order of blocks. This
310	// will affect the post-dominance calculation as follows:
311	// - Suppose you have blocks A and B, with A appearing before B in
312	// the list of blocks.
313	// - Also, A branches only to B, and B branches only to A.
314	// - We want to compute A as dominating B, and B as post-dominating B.
315	// By using reversed blocks for predecessor traversal roots discovery,
316	// we'll add an edge from B to the pseudo-exit node, rather than from A.
317	// All this is needed to correctly process the dominance/post-dominance
318	// constraint when A is a loop header that points to itself as its
319	// own continue target, and B is the latch block for the loop.
320	std::vector<BB*> reversed_blocks(ordered_blocks.rbegin(),
321	ordered_blocks.rend());
322	auto sinks = TraversalRoots(reversed_blocks, pred_func, succ_func);
323
324	// Wire up the pseudo entry block.
325	(*augmented_successors_map)[pseudo_entry_block] = sources;
326	for (auto block : sources) {
327	auto& augmented_preds = (*augmented_predecessors_map)[block];
328	const auto preds = pred_func(block);
329	augmented_preds.reserve(`1` + preds->size());
330	augmented_preds.push_back(pseudo_entry_block);
331	augmented_preds.insert(augmented_preds.end(), preds->begin(), preds->end());
332	}
333
334	// Wire up the pseudo exit block.
335	(*augmented_predecessors_map)[pseudo_exit_block] = sinks;
336	for (auto block : sinks) {
337	auto& augmented_succ = (*augmented_successors_map)[block];
338	const auto succ = succ_func(block);
339	augmented_succ.reserve(`1` + succ->size());
340	augmented_succ.push_back(pseudo_exit_block);
341	augmented_succ.insert(augmented_succ.end(), succ->begin(), succ->end());
342	}
343	}
344
345	} // namespace spvtools
346
347	#endif // SOURCE_CFA_H_
348

Browse the source code of Skia/third_party/externals/spirv-tools/source/cfa.h