UnifyLoopExits.cpp source code [llvm_projects/llvm/lib/Transforms/Utils/UnifyLoopExits.cpp]

1	//===- UnifyLoopExits.cpp - Redirect exiting edges to one block -- C++ --===//
2	//
3	// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4	// See https://llvm.org/LICENSE.txt for license information.
5	// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6	//
7	//===----------------------------------------------------------------------===//
8	//
9	// For each natural loop with multiple exit blocks, this pass creates a new
10	// block N such that all exiting blocks now branch to N, and then control flow
11	// is redistributed to all the original exit blocks.
12	//
13	// Limitation: This assumes that all terminators in the CFG are direct branches
14	// (the "br" instruction). The presence of any other control flow
15	// such as indirectbr, switch or callbr will cause an assert.
16	//
17	//===----------------------------------------------------------------------===//
18
19	#include "llvm/Transforms/Utils/UnifyLoopExits.h"
20	#include "llvm/ADT/MapVector.h"
21	#include "llvm/Analysis/DomTreeUpdater.h"
22	#include "llvm/Analysis/LoopInfo.h"
23	#include "llvm/IR/Constants.h"
24	#include "llvm/IR/Dominators.h"
25	#include "llvm/InitializePasses.h"
26	#include "llvm/Support/CommandLine.h"
27	#include "llvm/Transforms/Utils.h"
28	#include "llvm/Transforms/Utils/BasicBlockUtils.h"
29	#include "llvm/Transforms/Utils/ControlFlowUtils.h"
30
31	#define DEBUG_TYPE "unify-loop-exits"
32
33	using namespace llvm;
34
35	static cl::opt<unsigned> MaxBooleansInControlFlowHub(
36	"max-booleans-in-control-flow-hub", cl::init(Val: `32`), cl::Hidden,
37	cl::desc ("Set the maximum number of outgoing blocks for using a boolean "
38	"value to record the exiting block in the ControlFlowHub."));
39
40	namespace {
41	struct UnifyLoopExitsLegacyPass : public FunctionPass {
42	static char ID;
43	UnifyLoopExitsLegacyPass() : FunctionPass (ID) {
44	initializeUnifyLoopExitsLegacyPassPass(*PassRegistry::getPassRegistry());
45	}
46
47	void getAnalysisUsage(AnalysisUsage &AU) const override {
48	AU.addRequired<LoopInfoWrapperPass>();
49	AU.addRequired<DominatorTreeWrapperPass>();
50	AU.addPreserved<LoopInfoWrapperPass>();
51	AU.addPreserved<DominatorTreeWrapperPass>();
52	}
53
54	bool runOnFunction(Function &F) override;
55	};
56	} // namespace
57
58	char UnifyLoopExitsLegacyPass::ID = `0`;
59
60	FunctionPass *llvm::createUnifyLoopExitsPass() {
61	return new UnifyLoopExitsLegacyPass ();
62	}
63
64	INITIALIZE_PASS_BEGIN(UnifyLoopExitsLegacyPass, "unify-loop-exits",
65	"Fixup each natural loop to have a single exit block",
66	false / Only looks at CFG /, false / Analysis Pass /)
67	INITIALIZE_PASS_DEPENDENCY(DominatorTreeWrapperPass)
68	INITIALIZE_PASS_DEPENDENCY(LoopInfoWrapperPass)
69	INITIALIZE_PASS_END(UnifyLoopExitsLegacyPass, "unify-loop-exits",
70	"Fixup each natural loop to have a single exit block",
71	false / Only looks at CFG /, false / Analysis Pass /)
72
73	// The current transform introduces new control flow paths which may break the
74	// SSA requirement that every def must dominate all its uses. For example,
75	// consider a value D defined inside the loop that is used by some instruction
76	// U outside the loop. It follows that D dominates U, since the original
77	// program has valid SSA form. After merging the exits, all paths from D to U
78	// now flow through the unified exit block. In addition, there may be other
79	// paths that do not pass through D, but now reach the unified exit
80	// block. Thus, D no longer dominates U.
81	//
82	// Restore the dominance by creating a phi for each such D at the new unified
83	// loop exit. But when doing this, ignore any uses U that are in the new unified
84	// loop exit, since those were introduced specially when the block was created.
85	//
86	// The use of SSAUpdater seems like overkill for this operation. The location
87	// for creating the new PHI is well-known, and also the set of incoming blocks
88	// to the new PHI.
89	static void restoreSSA(const DominatorTree &DT, const Loop *L,
90	SmallVectorImpl<BasicBlock *> &Incoming,
91	BasicBlock *LoopExitBlock) {
92	using InstVector = SmallVector<Instruction *, `8`>;
93	using IIMap = MapVector<Instruction *, InstVector>;
94	IIMap ExternalUsers;
95	for (auto *BB : L->blocks()) {
96	for (auto &I : *BB) {
97	for (auto &U : I.uses()) {
98	auto UserInst = cast<Instruction>(Val: U.getUser());
99	auto UserBlock = UserInst->getParent();
100	if (UserBlock == LoopExitBlock)
101	continue;
102	if (L->contains(BB: UserBlock))
103	continue;
104	LLVM_DEBUG(dbgs() << "added ext use for " << I.getName() << "("
105	<< BB->getName() << ")"
106	<< ": " << UserInst->getName() << "("
107	<< UserBlock->getName() << ")"
108	<< "\n");
109	ExternalUsers [&I].push_back(Elt: UserInst);
110	}
111	}
112	}
113
114	for (const auto &II : ExternalUsers) {
115	// For each Def used outside the loop, create NewPhi in
116	// LoopExitBlock. NewPhi receives Def only along exiting blocks that
117	// dominate it, while the remaining values are undefined since those paths
118	// didn't exist in the original CFG.
119	auto Def = II.first;
120	LLVM_DEBUG(dbgs() << "externally used: " << Def->getName() << "\n");
121	auto NewPhi =
122	PHINode::Create(Ty: Def->getType(), NumReservedValues: Incoming.size(),
123	NameStr: Def->getName() + ".moved", InsertBefore: LoopExitBlock->begin());
124	for (auto *In : Incoming) {
125	LLVM_DEBUG(dbgs() << "predecessor " << In->getName() << ": ");
126	if (Def->getParent() == In \|\| DT.dominates(Def, BB: In)) {
127	LLVM_DEBUG(dbgs() << "dominated\n");
128	NewPhi->addIncoming(V: Def, BB: In);
129	} else {
130	LLVM_DEBUG(dbgs() << "not dominated\n");
131	NewPhi->addIncoming(V: PoisonValue::get(T: Def->getType()), BB: In);
132	}
133	}
134
135	LLVM_DEBUG(dbgs() << "external users:");
136	for (auto *U : II.second) {
137	LLVM_DEBUG(dbgs() << " " << U->getName());
138	U->replaceUsesOfWith(From: Def, To: NewPhi);
139	}
140	LLVM_DEBUG(dbgs() << "\n");
141	}
142	}
143
144	static bool unifyLoopExits(DominatorTree &DT, LoopInfo &LI, Loop *L) {
145	// To unify the loop exits, we need a list of the exiting blocks as
146	// well as exit blocks. The functions for locating these lists both
147	// traverse the entire loop body. It is more efficient to first
148	// locate the exiting blocks and then examine their successors to
149	// locate the exit blocks.
150	SmallVector<BasicBlock *, `8`> ExitingBlocks;
151	L->getExitingBlocks(ExitingBlocks);
152
153	// Redirect exiting edges through a control flow hub.
154	ControlFlowHub CHub;
155	for (auto *BB : ExitingBlocks) {
156	auto *Branch = cast<BranchInst>(Val: BB->getTerminator());
157	BasicBlock *Succ0 = Branch->getSuccessor(i: `0`);
158	Succ0 = L->contains(BB: Succ0) ? nullptr : Succ0;
159
160	BasicBlock *Succ1 =
161	Branch->isUnconditional() ? nullptr : Branch->getSuccessor(i: `1`);
162	Succ1 = L->contains(BB: Succ1) ? nullptr : Succ1;
163	CHub.addBranch(BB, Succ0, Succ1);
164
165	LLVM_DEBUG(dbgs() << "Added exiting branch: " << BB->getName() << " -> {"
166	<< (Succ0 ? Succ0->getName() : "<none>") << ", "
167	<< (Succ1 ? Succ1->getName() : "<none>") << "}\n");
168	}
169
170	SmallVector<BasicBlock *, `8`> GuardBlocks;
171	DomTreeUpdater DTU(DT, DomTreeUpdater::UpdateStrategy::Eager);
172	BasicBlock *LoopExitBlock;
173	bool ChangedCFG;
174	std::tie(args&: LoopExitBlock, args&: ChangedCFG) = CHub.finalize(
175	DTU: &DTU, GuardBlocks, Prefix: "loop.exit", MaxControlFlowBooleans: MaxBooleansInControlFlowHub.getValue());
176	if (!ChangedCFG)
177	return false;
178
179	restoreSSA(DT, L, Incoming&: ExitingBlocks, LoopExitBlock);
180
181	#if defined(EXPENSIVE_CHECKS)
182	assert(DT.verify(DominatorTree::VerificationLevel::Full));
183	#else
184	assert(DT.verify(DominatorTree::VerificationLevel::Fast));
185	#endif // EXPENSIVE_CHECKS
186	L->verifyLoop();
187
188	// The guard blocks were created outside the loop, so they need to become
189	// members of the parent loop.
190	if (auto ParentLoop = L->getParentLoop()) {
191	for (auto *G : GuardBlocks) {
192	ParentLoop->addBasicBlockToLoop(NewBB: G, LI);
193	}
194	ParentLoop->verifyLoop();
195	}
196
197	#if defined(EXPENSIVE_CHECKS)
198	LI.verify(DT);
199	#endif // EXPENSIVE_CHECKS
200
201	return true;
202	}
203
204	static bool runImpl(LoopInfo &LI, DominatorTree &DT) {
205
206	bool Changed = false;
207	auto Loops = LI.getLoopsInPreorder();
208	for (auto *L : Loops) {
209	LLVM_DEBUG(dbgs() << "Processing loop:\n"; L->print(dbgs()));
210	Changed \|= unifyLoopExits(DT, LI, L);
211	}
212	return Changed;
213	}
214
215	bool UnifyLoopExitsLegacyPass::runOnFunction(Function &F) {
216	LLVM_DEBUG(dbgs() << "===== Unifying loop exits in function " << F.getName()
217	<< "\n");
218	auto &LI = getAnalysis<LoopInfoWrapperPass>().getLoopInfo();
219	auto &DT = getAnalysis<DominatorTreeWrapperPass>().getDomTree();
220
221	assert(hasOnlySimpleTerminator(F) && "Unsupported block terminator.");
222
223	return runImpl(LI, DT);
224	}
225
226	namespace llvm {
227
228	PreservedAnalyses UnifyLoopExitsPass::run(Function &F,
229	FunctionAnalysisManager &AM) {
230	LLVM_DEBUG(dbgs() << "===== Unifying loop exits in function " << F.getName()
231	<< "\n");
232	auto &LI = AM.getResult<LoopAnalysis>(IR&: F);
233	auto &DT = AM.getResult<DominatorTreeAnalysis>(IR&: F);
234
235	if (!runImpl(LI, DT))
236	return PreservedAnalyses::all();
237	PreservedAnalyses PA;
238	PA.preserve<LoopAnalysis>();
239	PA.preserve<DominatorTreeAnalysis>();
240	return PA;
241	}
242	} // namespace llvm
243

Browse the source code of llvm_projects/llvm/lib/Transforms/Utils/UnifyLoopExits.cpp