SimplifyCFGPass.cpp source code [llvm_projects/llvm/lib/Transforms/Scalar/SimplifyCFGPass.cpp]

//===- SimplifyCFGPass.cpp - CFG Simplification Pass ----------------------===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//
//
// This file implements dead code elimination and basic block merging, along
// with a collection of other peephole control flow optimizations. For example:
//
//   * Removes basic blocks with no predecessors.
//   * Merges a basic block into its predecessor if there is only one and the
//     predecessor only has one successor.
//   * Eliminates PHI nodes for basic blocks with a single predecessor.
//   * Eliminates a basic block that only contains an unconditional branch.
//   * Changes invoke instructions to nounwind functions to be calls.
//   * Changes things like "if (x) if (y)" into "if (x&y)".
//   * etc.
//
//===----------------------------------------------------------------------===//
22
23	#include "llvm/ADT/MapVector.h"
24	#include "llvm/ADT/SmallPtrSet.h"
25	#include "llvm/ADT/SmallVector.h"
26	#include "llvm/ADT/Statistic.h"
27	#include "llvm/Analysis/AssumptionCache.h"
28	#include "llvm/Analysis/CFG.h"
29	#include "llvm/Analysis/DomTreeUpdater.h"
30	#include "llvm/Analysis/GlobalsModRef.h"
31	#include "llvm/Analysis/TargetTransformInfo.h"
32	#include "llvm/IR/Attributes.h"
33	#include "llvm/IR/CFG.h"
34	#include "llvm/IR/Dominators.h"
35	#include "llvm/IR/Instructions.h"
36	#include "llvm/IR/ValueHandle.h"
37	#include "llvm/InitializePasses.h"
38	#include "llvm/Pass.h"
39	#include "llvm/Support/CommandLine.h"
40	#include "llvm/Transforms/Scalar.h"
41	#include "llvm/Transforms/Scalar/SimplifyCFG.h"
42	#include "llvm/Transforms/Utils/Local.h"
43	#include "llvm/Transforms/Utils/SimplifyCFGOptions.h"
44	#include <utility>
45	using namespace llvm;
46
47	#define DEBUG_TYPE "simplifycfg"
48
49	static cl::opt<unsigned> UserBonusInstThreshold(
50	"bonus-inst-threshold", cl::Hidden, cl::init(Val: `1`),
51	cl::desc ("Control the number of bonus instructions (default = 1)"));
52
53	static cl::opt<bool> UserKeepLoops(
54	"keep-loops", cl::Hidden, cl::init(Val: true),
55	cl::desc ("Preserve canonical loop structure (default = true)"));
56
57	static cl::opt<bool> UserSwitchRangeToICmp(
58	"switch-range-to-icmp", cl::Hidden, cl::init(Val: false),
59	cl::desc (
60	"Convert switches into an integer range comparison (default = false)"));
61
62	static cl::opt<bool> UserSwitchToLookup(
63	"switch-to-lookup", cl::Hidden, cl::init(Val: false),
64	cl::desc ("Convert switches to lookup tables (default = false)"));
65
66	static cl::opt<bool> UserForwardSwitchCond(
67	"forward-switch-cond", cl::Hidden, cl::init(Val: false),
68	cl::desc ("Forward switch condition to phi ops (default = false)"));
69
70	static cl::opt<bool> UserHoistCommonInsts(
71	"hoist-common-insts", cl::Hidden, cl::init(Val: false),
72	cl::desc ("hoist common instructions (default = false)"));
73
74	static cl::opt<bool> UserHoistLoadsStoresWithCondFaulting(
75	"hoist-loads-stores-with-cond-faulting", cl::Hidden, cl::init(Val: false),
76	cl::desc ("Hoist loads/stores if the target supports conditional faulting "
77	"(default = false)"));
78
79	static cl::opt<bool> UserSinkCommonInsts(
80	"sink-common-insts", cl::Hidden, cl::init(Val: false),
81	cl::desc ("Sink common instructions (default = false)"));
82
83	static cl::opt<bool> UserSpeculateUnpredictables(
84	"speculate-unpredictables", cl::Hidden, cl::init(Val: false),
85	cl::desc ("Speculate unpredictable branches (default = false)"));
86
87	STATISTIC(NumSimpl, "Number of blocks simplified");
88
89	static bool
90	performBlockTailMerging(Function &F, ArrayRef<BasicBlock *> BBs,
91	std::vector<DominatorTree::UpdateType> *Updates) {
92	SmallVector<PHINode *, `1`> NewOps;
93
94	// We don't want to change IR just because we can.
95	// Only do that if there are at least two blocks we'll tail-merge.
96	if (BBs.size() < `2`)
97	return false;
98
99	if (Updates)
100	Updates->reserve(n: Updates->size() + BBs.size());
101
102	BasicBlock *CanonicalBB;
103	Instruction *CanonicalTerm;
104	{
105	auto *Term = BBs [`0`]->getTerminator();
106
107	// Create a canonical block for this function terminator type now,
108	// placing it before* the first block that will branch to it.*
109	CanonicalBB = BasicBlock::Create(
110	Context&: F.getContext(), Name: Twine ("common.") + Term->getOpcodeName(), Parent: &F, InsertBefore: BBs [`0`]);
111	// We'll also need a PHI node per each operand of the terminator.
112	NewOps.resize(N: Term->getNumOperands());
113	for (auto I : zip(t: Term->operands(), u&: NewOps)) {
114	std::get<`1`>(t&: I) = PHINode::Create(Ty: std::get<`0`>(t&: I)->getType(),
115	/NumReservedValues=/BBs.size(),
116	NameStr: CanonicalBB->getName() + ".op");
117	std::get<`1`>(t&: I)->insertInto(ParentBB: CanonicalBB, It: CanonicalBB->end());
118	}
119	// Make it so that this canonical block actually has the right
120	// terminator.
121	CanonicalTerm = Term->clone();
122	CanonicalTerm->insertInto(ParentBB: CanonicalBB, It: CanonicalBB->end());
123	// If the canonical terminator has operands, rewrite it to take PHI's.
124	for (auto I : zip(t&: NewOps, u: CanonicalTerm->operands()))
125	std::get<`1`>(t&: I) = std::get<`0`>(t&: I);
126	}
127
128	// Now, go through each block (with the current terminator type)
129	// we've recorded, and rewrite it to branch to the new common block.
130	DebugLoc CommonDebugLoc;
131	for (BasicBlock *BB : BBs) {
132	auto *Term = BB->getTerminator();
133	assert(Term->getOpcode() == CanonicalTerm->getOpcode() &&
134	"All blocks to be tail-merged must be the same "
135	"(function-terminating) terminator type.");
136
137	// Aha, found a new non-canonical function terminator. If it has operands,
138	// forward them to the PHI nodes in the canonical block.
139	for (auto I : zip(t: Term->operands(), u&: NewOps))
140	std::get<`1`>(t&: I)->addIncoming(V: std::get<`0`>(t&: I), BB);
141
142	// Compute the debug location common to all the original terminators.
143	if (!CommonDebugLoc)
144	CommonDebugLoc = Term->getDebugLoc();
145	else
146	CommonDebugLoc =
147	DebugLoc::getMergedLocation(LocA: CommonDebugLoc, LocB: Term->getDebugLoc());
148
149	// And turn BB into a block that just unconditionally branches
150	// to the canonical block.
151	Instruction *BI = BranchInst::Create(IfTrue: CanonicalBB, InsertBefore: BB);
152	BI->setDebugLoc(Term->getDebugLoc());
153	Term->eraseFromParent();
154
155	if (Updates)
156	Updates->push_back(x: {DominatorTree::Insert, BB, CanonicalBB});
157	}
158
159	CanonicalTerm->setDebugLoc(CommonDebugLoc);
160
161	return true;
162	}
163
164	static bool tailMergeBlocksWithSimilarFunctionTerminators(Function &F,
165	DomTreeUpdater *DTU) {
166	SmallMapVector<unsigned /TerminatorOpcode/, SmallVector<BasicBlock *, `2`>, `4`>
167	Structure;
168
169	// Scan all the blocks in the function, record the interesting-ones.
170	for (BasicBlock &BB : F) {
171	if (DTU && DTU->isBBPendingDeletion(DelBB: &BB))
172	continue;
173
174	// We are only interested in function-terminating blocks.
175	if (!succ_empty(BB: &BB))
176	continue;
177
178	auto *Term = BB.getTerminator();
179
180	// Fow now only support `ret`/`resume` function terminators.
181	// FIXME: lift this restriction.
182	switch (Term->getOpcode()) {
183	case Instruction::Ret:
184	case Instruction::Resume:
185	break;
186	default:
187	continue;
188	}
189
190	// We can't tail-merge block that contains a musttail call.
191	if (BB.getTerminatingMustTailCall())
192	continue;
193
194	// Calls to experimental_deoptimize must be followed by a return
195	// of the value computed by experimental_deoptimize.
196	// I.e., we can not change `ret` to `br` for this block.
197	if (auto *CI =
198	dyn_cast_or_null<CallInst>(Val: Term->getPrevNonDebugInstruction())) {
199	if (Function *F = CI->getCalledFunction())
200	if (Intrinsic::ID ID = F->getIntrinsicID())
201	if (ID == Intrinsic::experimental_deoptimize)
202	continue;
203	}
204
205	// PHI nodes cannot have token type, so if the terminator has an operand
206	// with token type, we can not tail-merge this kind of function terminators.
207	if (any_of(Range: Term->operands(),
208	P: [](Value Op) { return* Op->getType()->isTokenTy(); }))
209	continue;
210
211	// Canonical blocks are uniqued based on the terminator type (opcode).
212	Structure [Term->getOpcode()].emplace_back(Args: &BB);
213	}
214
215	bool Changed = false;
216
217	std::vector<DominatorTree::UpdateType> Updates;
218
219	for (ArrayRef<BasicBlock *> BBs : make_second_range(c&: Structure))
220	Changed \|= performBlockTailMerging(F, BBs, Updates: DTU ? &Updates : nullptr);
221
222	if (DTU)
223	DTU->applyUpdates(Updates);
224
225	return Changed;
226	}
227
228	/// Call SimplifyCFG on all the blocks in the function,
229	/// iterating until no more changes are made.
230	static bool iterativelySimplifyCFG(Function &F, const TargetTransformInfo &TTI,
231	DomTreeUpdater *DTU,
232	const SimplifyCFGOptions &Options) {
233	bool Changed = false;
234	bool LocalChange = true;
235
236	SmallVector<std::pair<const BasicBlock , const* BasicBlock *>, `32`> Edges;
237	FindFunctionBackedges(F, Result&: Edges);
238	SmallPtrSet<BasicBlock *, `16`> UniqueLoopHeaders;
239	for (const auto &Edge : Edges)
240	UniqueLoopHeaders.insert(Ptr: const_cast<BasicBlock *>(Edge.second));
241
242	SmallVector<WeakVH, `16`> LoopHeaders(UniqueLoopHeaders.begin(),
243	UniqueLoopHeaders.end());
244
245	unsigned IterCnt = `0`;
246	(void)IterCnt;
247	while (LocalChange) {
248	assert(IterCnt++ < `1000` && "Iterative simplification didn't converge!");
249	LocalChange = false;
250
251	// Loop over all of the basic blocks and remove them if they are unneeded.
252	for (Function::iterator BBIt = F.begin(); BBIt != F.end(); ) {
253	BasicBlock &BB = *BBIt ++;
254	if (DTU) {
255	assert(
256	!DTU->isBBPendingDeletion(&BB) &&
257	"Should not end up trying to simplify blocks marked for removal.");
258	// Make sure that the advanced iterator does not point at the blocks
259	// that are marked for removal, skip over all such blocks.
260	while (BBIt != F.end() && DTU->isBBPendingDeletion(DelBB: &*BBIt))
261	++BBIt;
262	}
263	if (simplifyCFG(BB: &BB, TTI, DTU, Options, LoopHeaders)) {
264	LocalChange = true;
265	++NumSimpl;
266	}
267	}
268	Changed \|= LocalChange;
269	}
270	return Changed;
271	}
272
273	static bool simplifyFunctionCFGImpl(Function &F, const TargetTransformInfo &TTI,
274	DominatorTree *DT,
275	const SimplifyCFGOptions &Options) {
276	DomTreeUpdater DTU(DT, DomTreeUpdater::UpdateStrategy::Eager);
277
278	bool EverChanged = removeUnreachableBlocks(F, DTU: DT ? &DTU : nullptr);
279	EverChanged \|=
280	tailMergeBlocksWithSimilarFunctionTerminators(F, DTU: DT ? &DTU : nullptr);
281	EverChanged \|= iterativelySimplifyCFG(F, TTI, DTU: DT ? &DTU : nullptr, Options);
282
283	// If neither pass changed anything, we're done.
284	if (!EverChanged) return false;
285
286	// iterativelySimplifyCFG can (rarely) make some loops dead. If this happens,
287	// removeUnreachableBlocks is needed to nuke them, which means we should
288	// iterate between the two optimizations. We structure the code like this to
289	// avoid rerunning iterativelySimplifyCFG if the second pass of
290	// removeUnreachableBlocks doesn't do anything.
291	if (!removeUnreachableBlocks(F, DTU: DT ? &DTU : nullptr))
292	return true;
293
294	do {
295	EverChanged = iterativelySimplifyCFG(F, TTI, DTU: DT ? &DTU : nullptr, Options);
296	EverChanged \|= removeUnreachableBlocks(F, DTU: DT ? &DTU : nullptr);
297	} while (EverChanged);
298
299	return true;
300	}
301
302	static bool simplifyFunctionCFG(Function &F, const TargetTransformInfo &TTI,
303	DominatorTree *DT,
304	const SimplifyCFGOptions &Options) {
305	assert((!RequireAndPreserveDomTree \|\|
306	(DT && DT->verify(DominatorTree::VerificationLevel::Full))) &&
307	"Original domtree is invalid?");
308
309	bool Changed = simplifyFunctionCFGImpl(F, TTI, DT, Options);
310
311	assert((!RequireAndPreserveDomTree \|\|
312	(DT && DT->verify(DominatorTree::VerificationLevel::Full))) &&
313	"Failed to maintain validity of domtree!");
314
315	return Changed;
316	}
317
318	// Command-line settings override compile-time settings.
319	static void applyCommandLineOverridesToOptions(SimplifyCFGOptions &Options) {
320	if (UserBonusInstThreshold.getNumOccurrences())
321	Options.BonusInstThreshold = UserBonusInstThreshold;
322	if (UserForwardSwitchCond.getNumOccurrences())
323	Options.ForwardSwitchCondToPhi = UserForwardSwitchCond;
324	if (UserSwitchRangeToICmp.getNumOccurrences())
325	Options.ConvertSwitchRangeToICmp = UserSwitchRangeToICmp;
326	if (UserSwitchToLookup.getNumOccurrences())
327	Options.ConvertSwitchToLookupTable = UserSwitchToLookup;
328	if (UserKeepLoops.getNumOccurrences())
329	Options.NeedCanonicalLoop = UserKeepLoops;
330	if (UserHoistCommonInsts.getNumOccurrences())
331	Options.HoistCommonInsts = UserHoistCommonInsts;
332	if (UserHoistLoadsStoresWithCondFaulting.getNumOccurrences())
333	Options.HoistLoadsStoresWithCondFaulting =
334	UserHoistLoadsStoresWithCondFaulting;
335	if (UserSinkCommonInsts.getNumOccurrences())
336	Options.SinkCommonInsts = UserSinkCommonInsts;
337	if (UserSpeculateUnpredictables.getNumOccurrences())
338	Options.SpeculateUnpredictables = UserSpeculateUnpredictables;
339	}
340
341	SimplifyCFGPass::SimplifyCFGPass() {
342	applyCommandLineOverridesToOptions(Options);
343	}
344
345	SimplifyCFGPass::SimplifyCFGPass(const SimplifyCFGOptions &Opts)
346	: Options (Opts) {
347	applyCommandLineOverridesToOptions(Options);
348	}
349
350	void SimplifyCFGPass::printPipeline(
351	raw_ostream &OS, function_ref<StringRef(StringRef)> MapClassName2PassName) {
352	static_cast<PassInfoMixin<SimplifyCFGPass> >(this*)->printPipeline(
353	OS, MapClassName2PassName);
354	OS << `'<'`;
355	OS << "bonus-inst-threshold=" << Options.BonusInstThreshold << `';'`;
356	OS << (Options.ForwardSwitchCondToPhi ? "" : "no-") << "forward-switch-cond;";
357	OS << (Options.ConvertSwitchRangeToICmp ? "" : "no-")
358	<< "switch-range-to-icmp;";
359	OS << (Options.ConvertSwitchToLookupTable ? "" : "no-")
360	<< "switch-to-lookup;";
361	OS << (Options.NeedCanonicalLoop ? "" : "no-") << "keep-loops;";
362	OS << (Options.HoistCommonInsts ? "" : "no-") << "hoist-common-insts;";
363	OS << (Options.HoistLoadsStoresWithCondFaulting ? "" : "no-")
364	<< "hoist-loads-stores-with-cond-faulting;";
365	OS << (Options.SinkCommonInsts ? "" : "no-") << "sink-common-insts;";
366	OS << (Options.SpeculateBlocks ? "" : "no-") << "speculate-blocks;";
367	OS << (Options.SimplifyCondBranch ? "" : "no-") << "simplify-cond-branch;";
368	OS << (Options.SpeculateUnpredictables ? "" : "no-")
369	<< "speculate-unpredictables";
370	OS << `'>'`;
371	}
372
373	PreservedAnalyses SimplifyCFGPass::run(Function &F,
374	FunctionAnalysisManager &AM) {
375	auto &TTI = AM.getResult<TargetIRAnalysis>(IR&: F);
376	Options.AC = &AM.getResult<AssumptionAnalysis>(IR&: F);
377	DominatorTree DT = nullptr*;
378	if (RequireAndPreserveDomTree)
379	DT = &AM.getResult<DominatorTreeAnalysis>(IR&: F);
380	if (!simplifyFunctionCFG(F, TTI, DT, Options))
381	return PreservedAnalyses::all();
382	PreservedAnalyses PA;
383	if (RequireAndPreserveDomTree)
384	PA.preserve<DominatorTreeAnalysis>();
385	return PA;
386	}
387
388	namespace {
389	struct CFGSimplifyPass : public FunctionPass {
390	static char ID;
391	SimplifyCFGOptions Options;
392	std::function<bool(const Function &)> PredicateFtor;
393
394	CFGSimplifyPass(SimplifyCFGOptions Options_ = SimplifyCFGOptions (),
395	std::function<bool(const Function &)> Ftor = nullptr)
396	: FunctionPass (ID), Options (Options_), PredicateFtor (std::move(Ftor)) {
397
398	initializeCFGSimplifyPassPass(*PassRegistry::getPassRegistry());
399
400	// Check for command-line overrides of options for debug/customization.
401	applyCommandLineOverridesToOptions(Options);
402	}
403
404	bool runOnFunction(Function &F) override {
405	if (skipFunction(F) \|\| (PredicateFtor && !PredicateFtor (F)))
406	return false;
407
408	Options.AC = &getAnalysis<AssumptionCacheTracker>().getAssumptionCache(F);
409	DominatorTree DT = nullptr*;
410	if (RequireAndPreserveDomTree)
411	DT = &getAnalysis<DominatorTreeWrapperPass>().getDomTree();
412
413	auto &TTI = getAnalysis<TargetTransformInfoWrapperPass>().getTTI(F);
414	return simplifyFunctionCFG(F, TTI, DT, Options);
415	}
416	void getAnalysisUsage(AnalysisUsage &AU) const override {
417	AU.addRequired<AssumptionCacheTracker>();
418	if (RequireAndPreserveDomTree)
419	AU.addRequired<DominatorTreeWrapperPass>();
420	AU.addRequired<TargetTransformInfoWrapperPass>();
421	if (RequireAndPreserveDomTree)
422	AU.addPreserved<DominatorTreeWrapperPass>();
423	AU.addPreserved<GlobalsAAWrapperPass>();
424	}
425	};
426	}
427
428	char CFGSimplifyPass::ID = `0`;
429	INITIALIZE_PASS_BEGIN(CFGSimplifyPass, "simplifycfg", "Simplify the CFG", false,
430	false)
431	INITIALIZE_PASS_DEPENDENCY(TargetTransformInfoWrapperPass)
432	INITIALIZE_PASS_DEPENDENCY(AssumptionCacheTracker)
433	INITIALIZE_PASS_DEPENDENCY(DominatorTreeWrapperPass)
434	INITIALIZE_PASS_END(CFGSimplifyPass, "simplifycfg", "Simplify the CFG", false,
435	false)
436
437	// Public interface to the CFGSimplification pass
438	FunctionPass *
439	llvm::createCFGSimplificationPass(SimplifyCFGOptions Options,
440	std::function<bool(const Function &)> Ftor) {
441	return new CFGSimplifyPass (Options, std::move(Ftor));
442	}
443

Browse the source code of llvm_projects/llvm/lib/Transforms/Scalar/SimplifyCFGPass.cpp