1//===- ObjCARCOpts.cpp - ObjC ARC Optimization ----------------------------===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8//
9/// \file
/// This file defines ObjC ARC optimizations. ARC stands for Automatic
/// Reference Counting and is a system for managing reference counts for
/// objects in Objective-C.
13///
14/// The optimizations performed include elimination of redundant, partially
15/// redundant, and inconsequential reference count operations, elimination of
16/// redundant weak pointer operations, and numerous minor simplifications.
17///
18/// WARNING: This file knows about certain library functions. It recognizes them
19/// by name, and hardwires knowledge of their semantics.
20///
21/// WARNING: This file knows about how certain Objective-C library functions are
22/// used. Naive LLVM IR transformations which would otherwise be
23/// behavior-preserving may break these assumptions.
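///
/// As an illustrative example (not an exhaustive description) of the kind of
/// redundancy eliminated here, a balanced pair such as
///
///   %0 = call ptr @llvm.objc.retain(ptr %p)
///   ... code that can neither release nor use %p ...
///   call void @llvm.objc.release(ptr %p)
///
/// can often be removed outright once the pairing is proven safe by the
/// dataflow analysis below.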
24//
25//===----------------------------------------------------------------------===//
26
27#include "ARCRuntimeEntryPoints.h"
28#include "BlotMapVector.h"
29#include "DependencyAnalysis.h"
30#include "ObjCARC.h"
31#include "ProvenanceAnalysis.h"
32#include "PtrState.h"
33#include "llvm/ADT/DenseMap.h"
34#include "llvm/ADT/STLExtras.h"
35#include "llvm/ADT/SmallPtrSet.h"
36#include "llvm/ADT/SmallVector.h"
37#include "llvm/ADT/Statistic.h"
38#include "llvm/Analysis/AliasAnalysis.h"
39#include "llvm/Analysis/ObjCARCAnalysisUtils.h"
40#include "llvm/Analysis/ObjCARCInstKind.h"
41#include "llvm/Analysis/ObjCARCUtil.h"
42#include "llvm/Analysis/OptimizationRemarkEmitter.h"
43#include "llvm/IR/BasicBlock.h"
44#include "llvm/IR/CFG.h"
45#include "llvm/IR/Constant.h"
46#include "llvm/IR/Constants.h"
47#include "llvm/IR/DerivedTypes.h"
48#include "llvm/IR/EHPersonalities.h"
49#include "llvm/IR/Function.h"
50#include "llvm/IR/GlobalVariable.h"
51#include "llvm/IR/InstIterator.h"
52#include "llvm/IR/InstrTypes.h"
53#include "llvm/IR/Instruction.h"
54#include "llvm/IR/Instructions.h"
55#include "llvm/IR/LLVMContext.h"
56#include "llvm/IR/Metadata.h"
57#include "llvm/IR/Type.h"
58#include "llvm/IR/User.h"
59#include "llvm/IR/Value.h"
60#include "llvm/Support/Casting.h"
61#include "llvm/Support/CommandLine.h"
62#include "llvm/Support/Compiler.h"
63#include "llvm/Support/Debug.h"
64#include "llvm/Support/ErrorHandling.h"
65#include "llvm/Support/raw_ostream.h"
66#include "llvm/Transforms/ObjCARC.h"
67#include <cassert>
68#include <iterator>
69#include <utility>
70
71using namespace llvm;
72using namespace llvm::objcarc;
73
74#define DEBUG_TYPE "objc-arc-opts"
75
static cl::opt<unsigned> MaxPtrStates(
    "arc-opt-max-ptr-states", cl::Hidden,
    cl::desc("Maximum number of ptr states the optimizer keeps track of"),
    cl::init(4095));
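
// Being a cl::opt, this limit can be adjusted when experimenting, e.g. with
// `opt -arc-opt-max-ptr-states=<N>` (or via -mllvm when driving through
// clang).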
80
81/// \defgroup ARCUtilities Utility declarations/definitions specific to ARC.
82/// @{
83
84/// This is similar to GetRCIdentityRoot but it stops as soon
85/// as it finds a value with multiple uses.
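///
/// For example (illustratively), it looks through a single-use bitcast or an
/// all-zero-index GEP of an identified object, and through ARC forwarding
/// calls, but gives up as soon as a value has multiple non-trivial uses.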
86static const Value *FindSingleUseIdentifiedObject(const Value *Arg) {
  // ConstantData (like ConstantPointerNull and UndefValue) is uniqued and
  // shared, so it is never a single-use value.
89 if (isa<ConstantData>(Val: Arg))
90 return nullptr;
91
92 if (Arg->hasOneUse()) {
93 if (const BitCastInst *BC = dyn_cast<BitCastInst>(Val: Arg))
94 return FindSingleUseIdentifiedObject(Arg: BC->getOperand(i_nocapture: 0));
95 if (const GetElementPtrInst *GEP = dyn_cast<GetElementPtrInst>(Val: Arg))
96 if (GEP->hasAllZeroIndices())
97 return FindSingleUseIdentifiedObject(Arg: GEP->getPointerOperand());
98 if (IsForwarding(Class: GetBasicARCInstKind(V: Arg)))
99 return FindSingleUseIdentifiedObject(
100 Arg: cast<CallInst>(Val: Arg)->getArgOperand(i: 0));
101 if (!IsObjCIdentifiedObject(V: Arg))
102 return nullptr;
103 return Arg;
104 }
105
  // If we found an identifiable object that has multiple uses, but all of
  // those uses are trivial, we can still consider it a single-use value.
108 if (IsObjCIdentifiedObject(V: Arg)) {
109 for (const User *U : Arg->users())
110 if (!U->use_empty() || GetRCIdentityRoot(V: U) != Arg)
111 return nullptr;
112
113 return Arg;
114 }
115
116 return nullptr;
117}
118
119/// @}
120///
121/// \defgroup ARCOpt ARC Optimization.
122/// @{
123
124// TODO: On code like this:
125//
126// objc_retain(%x)
127// stuff_that_cannot_release()
128// objc_autorelease(%x)
129// stuff_that_cannot_release()
130// objc_retain(%x)
131// stuff_that_cannot_release()
132// objc_autorelease(%x)
133//
134// The second retain and autorelease can be deleted.
135
136// TODO: Autorelease calls followed by objc_autoreleasePoolPop calls (perhaps in
137// ObjC++ code after inlining) can be turned into plain release calls.
138
// TODO: Critical-edge splitting. If the optimal insertion point is
140// a critical edge, the current algorithm has to fail, because it doesn't
141// know how to split edges. It should be possible to make the optimizer
142// think in terms of edges, rather than blocks, and then split critical
143// edges on demand.
144
// TODO: OptimizeSequences could be generalized to be interprocedural.
146
147// TODO: Recognize that a bunch of other objc runtime calls have
148// non-escaping arguments and non-releasing arguments, and may be
149// non-autoreleasing.
150
151// TODO: Sink autorelease calls as far as possible. Unfortunately we
152// usually can't sink them past other calls, which would be the main
153// case where it would be useful.
154
155// TODO: The pointer returned from objc_loadWeakRetained is retained.
156
157// TODO: Delete release+retain pairs (rare).
158
159STATISTIC(NumNoops, "Number of no-op objc calls eliminated");
160STATISTIC(NumPartialNoops, "Number of partially no-op objc calls eliminated");
STATISTIC(NumAutoreleases, "Number of autoreleases converted to releases");
162STATISTIC(NumRets, "Number of return value forwarding "
163 "retain+autoreleases eliminated");
164STATISTIC(NumRRs, "Number of retain+release paths eliminated");
165STATISTIC(NumPeeps, "Number of calls peephole-optimized");
166#ifndef NDEBUG
167STATISTIC(NumRetainsBeforeOpt,
168 "Number of retains before optimization");
169STATISTIC(NumReleasesBeforeOpt,
170 "Number of releases before optimization");
171STATISTIC(NumRetainsAfterOpt,
172 "Number of retains after optimization");
173STATISTIC(NumReleasesAfterOpt,
174 "Number of releases after optimization");
175#endif
176
177namespace {
178
179 /// Per-BasicBlock state.
180 class BBState {
181 /// The number of unique control paths from the entry which can reach this
182 /// block.
183 unsigned TopDownPathCount = 0;
184
185 /// The number of unique control paths to exits from this block.
186 unsigned BottomUpPathCount = 0;
187
188 /// The top-down traversal uses this to record information known about a
189 /// pointer at the bottom of each block.
190 BlotMapVector<const Value *, TopDownPtrState> PerPtrTopDown;
191
192 /// The bottom-up traversal uses this to record information known about a
193 /// pointer at the top of each block.
194 BlotMapVector<const Value *, BottomUpPtrState> PerPtrBottomUp;
195
196 /// Effective predecessors of the current block ignoring ignorable edges and
197 /// ignored backedges.
198 SmallVector<BasicBlock *, 2> Preds;
199
200 /// Effective successors of the current block ignoring ignorable edges and
201 /// ignored backedges.
202 SmallVector<BasicBlock *, 2> Succs;
203
204 public:
205 static const unsigned OverflowOccurredValue;
206
207 BBState() = default;
208
209 using top_down_ptr_iterator = decltype(PerPtrTopDown)::iterator;
210 using const_top_down_ptr_iterator = decltype(PerPtrTopDown)::const_iterator;
211
212 top_down_ptr_iterator top_down_ptr_begin() { return PerPtrTopDown.begin(); }
213 top_down_ptr_iterator top_down_ptr_end() { return PerPtrTopDown.end(); }
214 const_top_down_ptr_iterator top_down_ptr_begin() const {
215 return PerPtrTopDown.begin();
216 }
217 const_top_down_ptr_iterator top_down_ptr_end() const {
218 return PerPtrTopDown.end();
219 }
220 bool hasTopDownPtrs() const {
221 return !PerPtrTopDown.empty();
222 }
223
224 unsigned top_down_ptr_list_size() const {
225 return std::distance(first: top_down_ptr_begin(), last: top_down_ptr_end());
226 }
227
228 using bottom_up_ptr_iterator = decltype(PerPtrBottomUp)::iterator;
229 using const_bottom_up_ptr_iterator =
230 decltype(PerPtrBottomUp)::const_iterator;
231
232 bottom_up_ptr_iterator bottom_up_ptr_begin() {
233 return PerPtrBottomUp.begin();
234 }
235 bottom_up_ptr_iterator bottom_up_ptr_end() { return PerPtrBottomUp.end(); }
236 const_bottom_up_ptr_iterator bottom_up_ptr_begin() const {
237 return PerPtrBottomUp.begin();
238 }
239 const_bottom_up_ptr_iterator bottom_up_ptr_end() const {
240 return PerPtrBottomUp.end();
241 }
242 bool hasBottomUpPtrs() const {
243 return !PerPtrBottomUp.empty();
244 }
245
246 unsigned bottom_up_ptr_list_size() const {
247 return std::distance(first: bottom_up_ptr_begin(), last: bottom_up_ptr_end());
248 }
249
250 /// Mark this block as being an entry block, which has one path from the
251 /// entry by definition.
252 void SetAsEntry() { TopDownPathCount = 1; }
253
254 /// Mark this block as being an exit block, which has one path to an exit by
255 /// definition.
256 void SetAsExit() { BottomUpPathCount = 1; }
257
258 /// Attempt to find the PtrState object describing the top down state for
259 /// pointer Arg. Return a new initialized PtrState describing the top down
260 /// state for Arg if we do not find one.
261 TopDownPtrState &getPtrTopDownState(const Value *Arg) {
262 return PerPtrTopDown[Arg];
263 }
264
265 /// Attempt to find the PtrState object describing the bottom up state for
266 /// pointer Arg. Return a new initialized PtrState describing the bottom up
267 /// state for Arg if we do not find one.
268 BottomUpPtrState &getPtrBottomUpState(const Value *Arg) {
269 return PerPtrBottomUp[Arg];
270 }
271
272 /// Attempt to find the PtrState object describing the bottom up state for
273 /// pointer Arg.
274 bottom_up_ptr_iterator findPtrBottomUpState(const Value *Arg) {
275 return PerPtrBottomUp.find(Key: Arg);
276 }
277
278 void clearBottomUpPointers() {
279 PerPtrBottomUp.clear();
280 }
281
282 void clearTopDownPointers() {
283 PerPtrTopDown.clear();
284 }
285
286 void InitFromPred(const BBState &Other);
287 void InitFromSucc(const BBState &Other);
288 void MergePred(const BBState &Other);
289 void MergeSucc(const BBState &Other);
290
291 /// Compute the number of possible unique paths from an entry to an exit
292 /// which pass through this block. This is only valid after both the
293 /// top-down and bottom-up traversals are complete.
294 ///
295 /// Returns true if overflow occurred. Returns false if overflow did not
296 /// occur.
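    ///
    /// For example, if 3 distinct paths reach this block from the entry and 2
    /// distinct paths lead from it to exits, then 3 * 2 == 6 entry-to-exit
    /// paths pass through it, so PathCount is set to 6 and false is returned.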
297 bool GetAllPathCountWithOverflow(unsigned &PathCount) const {
298 if (TopDownPathCount == OverflowOccurredValue ||
299 BottomUpPathCount == OverflowOccurredValue)
300 return true;
301 unsigned long long Product =
302 (unsigned long long)TopDownPathCount*BottomUpPathCount;
      // Overflow occurred if any of the upper 32 bits of Product are set, or
      // if the lower 32 bits of Product are all set (i.e. PathCount would
      // equal OverflowOccurredValue).
305 return (Product >> 32) ||
306 ((PathCount = Product) == OverflowOccurredValue);
307 }
308
309 // Specialized CFG utilities.
310 using edge_iterator = SmallVectorImpl<BasicBlock *>::const_iterator;
311
312 edge_iterator pred_begin() const { return Preds.begin(); }
313 edge_iterator pred_end() const { return Preds.end(); }
314 edge_iterator succ_begin() const { return Succs.begin(); }
315 edge_iterator succ_end() const { return Succs.end(); }
316
317 void addSucc(BasicBlock *Succ) { Succs.push_back(Elt: Succ); }
318 void addPred(BasicBlock *Pred) { Preds.push_back(Elt: Pred); }
319
320 bool isExit() const { return Succs.empty(); }
321 };
322
323} // end anonymous namespace
324
325const unsigned BBState::OverflowOccurredValue = 0xffffffff;
326
327namespace llvm {
328
329[[maybe_unused]] raw_ostream &operator<<(raw_ostream &OS, BBState &BBState);
330
331} // end namespace llvm
332
333void BBState::InitFromPred(const BBState &Other) {
334 PerPtrTopDown = Other.PerPtrTopDown;
335 TopDownPathCount = Other.TopDownPathCount;
336}
337
338void BBState::InitFromSucc(const BBState &Other) {
339 PerPtrBottomUp = Other.PerPtrBottomUp;
340 BottomUpPathCount = Other.BottomUpPathCount;
341}
342
343/// The top-down traversal uses this to merge information about predecessors to
344/// form the initial state for a new block.
345void BBState::MergePred(const BBState &Other) {
346 if (TopDownPathCount == OverflowOccurredValue)
347 return;
348
349 // Other.TopDownPathCount can be 0, in which case it is either dead or a
350 // loop backedge. Loop backedges are special.
351 TopDownPathCount += Other.TopDownPathCount;
352
  // To stay consistent, clear the top-down pointers if the addition made
  // TopDownPathCount equal to OverflowOccurredValue, even though "true"
  // overflow has not occurred.
356 if (TopDownPathCount == OverflowOccurredValue) {
357 clearTopDownPointers();
358 return;
359 }
360
361 // Check for overflow. If we have overflow, fall back to conservative
362 // behavior.
363 if (TopDownPathCount < Other.TopDownPathCount) {
364 TopDownPathCount = OverflowOccurredValue;
365 clearTopDownPointers();
366 return;
367 }
368
369 // For each entry in the other set, if our set has an entry with the same key,
370 // merge the entries. Otherwise, copy the entry and merge it with an empty
371 // entry.
372 for (auto MI = Other.top_down_ptr_begin(), ME = Other.top_down_ptr_end();
373 MI != ME; ++MI) {
374 auto Pair = PerPtrTopDown.insert(InsertPair: *MI);
375 Pair.first->second.Merge(Other: Pair.second ? TopDownPtrState() : MI->second,
376 /*TopDown=*/true);
377 }
378
379 // For each entry in our set, if the other set doesn't have an entry with the
380 // same key, force it to merge with an empty entry.
381 for (auto MI = top_down_ptr_begin(), ME = top_down_ptr_end(); MI != ME; ++MI)
382 if (Other.PerPtrTopDown.find(Key: MI->first) == Other.PerPtrTopDown.end())
383 MI->second.Merge(Other: TopDownPtrState(), /*TopDown=*/true);
384}
385
386/// The bottom-up traversal uses this to merge information about successors to
387/// form the initial state for a new block.
388void BBState::MergeSucc(const BBState &Other) {
389 if (BottomUpPathCount == OverflowOccurredValue)
390 return;
391
392 // Other.BottomUpPathCount can be 0, in which case it is either dead or a
393 // loop backedge. Loop backedges are special.
394 BottomUpPathCount += Other.BottomUpPathCount;
395
  // To stay consistent, clear the bottom-up pointers if the addition made
  // BottomUpPathCount equal to OverflowOccurredValue, even though "true"
  // overflow has not occurred.
399 if (BottomUpPathCount == OverflowOccurredValue) {
400 clearBottomUpPointers();
401 return;
402 }
403
404 // Check for overflow. If we have overflow, fall back to conservative
405 // behavior.
406 if (BottomUpPathCount < Other.BottomUpPathCount) {
407 BottomUpPathCount = OverflowOccurredValue;
408 clearBottomUpPointers();
409 return;
410 }
411
412 // For each entry in the other set, if our set has an entry with the
413 // same key, merge the entries. Otherwise, copy the entry and merge
414 // it with an empty entry.
415 for (auto MI = Other.bottom_up_ptr_begin(), ME = Other.bottom_up_ptr_end();
416 MI != ME; ++MI) {
417 auto Pair = PerPtrBottomUp.insert(InsertPair: *MI);
418 Pair.first->second.Merge(Other: Pair.second ? BottomUpPtrState() : MI->second,
419 /*TopDown=*/false);
420 }
421
422 // For each entry in our set, if the other set doesn't have an entry
423 // with the same key, force it to merge with an empty entry.
424 for (auto MI = bottom_up_ptr_begin(), ME = bottom_up_ptr_end(); MI != ME;
425 ++MI)
426 if (Other.PerPtrBottomUp.find(Key: MI->first) == Other.PerPtrBottomUp.end())
427 MI->second.Merge(Other: BottomUpPtrState(), /*TopDown=*/false);
428}
429
430raw_ostream &llvm::operator<<(raw_ostream &OS, BBState &BBInfo) {
431 // Dump the pointers we are tracking.
432 OS << " TopDown State:\n";
433 if (!BBInfo.hasTopDownPtrs()) {
434 LLVM_DEBUG(dbgs() << " NONE!\n");
435 } else {
436 for (auto I = BBInfo.top_down_ptr_begin(), E = BBInfo.top_down_ptr_end();
437 I != E; ++I) {
438 const PtrState &P = I->second;
439 OS << " Ptr: " << *I->first
440 << "\n KnownSafe: " << (P.IsKnownSafe()?"true":"false")
441 << "\n ImpreciseRelease: "
442 << (P.IsTrackingImpreciseReleases()?"true":"false") << "\n"
443 << " HasCFGHazards: "
444 << (P.IsCFGHazardAfflicted()?"true":"false") << "\n"
445 << " KnownPositive: "
446 << (P.HasKnownPositiveRefCount()?"true":"false") << "\n"
447 << " Seq: "
448 << P.GetSeq() << "\n";
449 }
450 }
451
452 OS << " BottomUp State:\n";
453 if (!BBInfo.hasBottomUpPtrs()) {
454 LLVM_DEBUG(dbgs() << " NONE!\n");
455 } else {
456 for (auto I = BBInfo.bottom_up_ptr_begin(), E = BBInfo.bottom_up_ptr_end();
457 I != E; ++I) {
458 const PtrState &P = I->second;
459 OS << " Ptr: " << *I->first
460 << "\n KnownSafe: " << (P.IsKnownSafe()?"true":"false")
461 << "\n ImpreciseRelease: "
462 << (P.IsTrackingImpreciseReleases()?"true":"false") << "\n"
463 << " HasCFGHazards: "
464 << (P.IsCFGHazardAfflicted()?"true":"false") << "\n"
465 << " KnownPositive: "
466 << (P.HasKnownPositiveRefCount()?"true":"false") << "\n"
467 << " Seq: "
468 << P.GetSeq() << "\n";
469 }
470 }
471
472 return OS;
473}
474
475namespace {
476
477 /// The main ARC optimization pass.
478class ObjCARCOpt {
479 bool Changed = false;
480 bool CFGChanged = false;
481 ProvenanceAnalysis PA;
482
483 /// A cache of references to runtime entry point constants.
484 ARCRuntimeEntryPoints EP;
485
486 /// A cache of MDKinds that can be passed into other functions to propagate
487 /// MDKind identifiers.
488 ARCMDKindCache MDKindCache;
489
490 BundledRetainClaimRVs *BundledInsts = nullptr;
491
492 /// A flag indicating whether the optimization that removes or moves
493 /// retain/release pairs should be performed.
494 bool DisableRetainReleasePairing = false;
495
496 /// Flags which determine whether each of the interesting runtime functions
497 /// is in fact used in the current function.
498 unsigned UsedInThisFunction;
499
500 DenseMap<BasicBlock *, ColorVector> BlockEHColors;
501
502 bool OptimizeRetainRVCall(Function &F, Instruction *RetainRV);
503 void OptimizeAutoreleaseRVCall(Function &F, Instruction *AutoreleaseRV,
504 ARCInstKind &Class);
505 void OptimizeIndividualCalls(Function &F);
506
507 /// Optimize an individual call, optionally passing the
508 /// GetArgRCIdentityRoot if it has already been computed.
509 void OptimizeIndividualCallImpl(Function &F, Instruction *Inst,
510 ARCInstKind Class, const Value *Arg);
511
512 /// Try to optimize an AutoreleaseRV with a RetainRV or UnsafeClaimRV. If the
513 /// optimization occurs, returns true to indicate that the caller should
514 /// assume the instructions are dead.
515 bool OptimizeInlinedAutoreleaseRVCall(Function &F, Instruction *Inst,
516 const Value *&Arg, ARCInstKind Class,
517 Instruction *AutoreleaseRV,
518 const Value *&AutoreleaseRVArg);
519
520 void CheckForCFGHazards(const BasicBlock *BB,
521 DenseMap<const BasicBlock *, BBState> &BBStates,
522 BBState &MyStates) const;
523 bool VisitInstructionBottomUp(Instruction *Inst, BasicBlock *BB,
524 BlotMapVector<Value *, RRInfo> &Retains,
525 BBState &MyStates);
526 bool VisitBottomUp(BasicBlock *BB,
527 DenseMap<const BasicBlock *, BBState> &BBStates,
528 BlotMapVector<Value *, RRInfo> &Retains);
529 bool VisitInstructionTopDown(
530 Instruction *Inst, DenseMap<Value *, RRInfo> &Releases, BBState &MyStates,
531 const DenseMap<const Instruction *, SmallPtrSet<const Value *, 2>>
532 &ReleaseInsertPtToRCIdentityRoots);
533 bool VisitTopDown(
534 BasicBlock *BB, DenseMap<const BasicBlock *, BBState> &BBStates,
535 DenseMap<Value *, RRInfo> &Releases,
536 const DenseMap<const Instruction *, SmallPtrSet<const Value *, 2>>
537 &ReleaseInsertPtToRCIdentityRoots);
538 bool Visit(Function &F, DenseMap<const BasicBlock *, BBState> &BBStates,
539 BlotMapVector<Value *, RRInfo> &Retains,
540 DenseMap<Value *, RRInfo> &Releases);
541
542 void MoveCalls(Value *Arg, RRInfo &RetainsToMove, RRInfo &ReleasesToMove,
543 BlotMapVector<Value *, RRInfo> &Retains,
544 DenseMap<Value *, RRInfo> &Releases,
545 SmallVectorImpl<Instruction *> &DeadInsts, Module *M);
546
547 bool PairUpRetainsAndReleases(DenseMap<const BasicBlock *, BBState> &BBStates,
548 BlotMapVector<Value *, RRInfo> &Retains,
549 DenseMap<Value *, RRInfo> &Releases, Module *M,
550 Instruction *Retain,
551 SmallVectorImpl<Instruction *> &DeadInsts,
552 RRInfo &RetainsToMove, RRInfo &ReleasesToMove,
553 Value *Arg, bool KnownSafe,
554 bool &AnyPairsCompletelyEliminated);
555
556 bool PerformCodePlacement(DenseMap<const BasicBlock *, BBState> &BBStates,
557 BlotMapVector<Value *, RRInfo> &Retains,
558 DenseMap<Value *, RRInfo> &Releases, Module *M);
559
560 void OptimizeWeakCalls(Function &F);
561
562 bool OptimizeSequences(Function &F);
563
564 void OptimizeReturns(Function &F);
565
566 void OptimizeAutoreleasePools(Function &F);
567
568 template <typename PredicateT>
569 static void cloneOpBundlesIf(CallBase *CI,
570 SmallVectorImpl<OperandBundleDef> &OpBundles,
571 PredicateT Predicate) {
572 for (unsigned I = 0, E = CI->getNumOperandBundles(); I != E; ++I) {
573 OperandBundleUse B = CI->getOperandBundleAt(Index: I);
574 if (Predicate(B))
575 OpBundles.emplace_back(Args&: B);
576 }
577 }
578
579 void addOpBundleForFunclet(BasicBlock *BB,
580 SmallVectorImpl<OperandBundleDef> &OpBundles) {
581 if (!BlockEHColors.empty()) {
582 const ColorVector &CV = BlockEHColors.find(Val: BB)->second;
583 assert(CV.size() > 0 && "Uncolored block");
584 for (BasicBlock *EHPadBB : CV)
585 if (auto *EHPad =
586 dyn_cast<FuncletPadInst>(Val: EHPadBB->getFirstNonPHIIt())) {
587 OpBundles.emplace_back(Args: "funclet", Args&: EHPad);
588 return;
589 }
590 }
591 }
592
593#ifndef NDEBUG
594 void GatherStatistics(Function &F, bool AfterOptimization = false);
595#endif
596
597 public:
598 void init(Function &F);
599 bool run(Function &F, AAResults &AA);
600 bool hasCFGChanged() const { return CFGChanged; }
601};
602} // end anonymous namespace
603
604/// Turn objc_retainAutoreleasedReturnValue into objc_retain if the operand is
605/// not a return value.
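///
/// Illustrative IR (names are placeholders):
///
///   %p = call ptr @foo()
///   ...                      ; something other than no-op instructions here
///   %r = call ptr @llvm.objc.retainAutoreleasedReturnValue(ptr %p)
///
/// Since the retainRV does not immediately follow the call producing its
/// operand, it is rewritten to a plain call to @llvm.objc.retain.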
606bool
607ObjCARCOpt::OptimizeRetainRVCall(Function &F, Instruction *RetainRV) {
608 // Check for the argument being from an immediately preceding call or invoke.
609 const Value *Arg = GetArgRCIdentityRoot(Inst: RetainRV);
610 if (const Instruction *Call = dyn_cast<CallBase>(Val: Arg)) {
611 if (Call->getParent() == RetainRV->getParent()) {
612 BasicBlock::const_iterator I(Call);
613 ++I;
614 while (IsNoopInstruction(I: &*I))
615 ++I;
616 if (&*I == RetainRV)
617 return false;
618 } else if (const InvokeInst *II = dyn_cast<InvokeInst>(Val: Call)) {
619 BasicBlock *RetainRVParent = RetainRV->getParent();
620 if (II->getNormalDest() == RetainRVParent) {
621 BasicBlock::const_iterator I = RetainRVParent->begin();
622 while (IsNoopInstruction(I: &*I))
623 ++I;
624 if (&*I == RetainRV)
625 return false;
626 }
627 }
628 }
629
630 assert(!BundledInsts->contains(RetainRV) &&
631 "a bundled retainRV's argument should be a call");
632
633 // Turn it to a plain objc_retain.
634 Changed = true;
635 ++NumPeeps;
636
637 LLVM_DEBUG(dbgs() << "Transforming objc_retainAutoreleasedReturnValue => "
638 "objc_retain since the operand is not a return value.\n"
639 "Old = "
640 << *RetainRV << "\n");
641
642 Function *NewDecl = EP.get(kind: ARCRuntimeEntryPointKind::Retain);
643 cast<CallInst>(Val: RetainRV)->setCalledFunction(NewDecl);
644
645 LLVM_DEBUG(dbgs() << "New = " << *RetainRV << "\n");
646
647 return false;
648}
649
650bool ObjCARCOpt::OptimizeInlinedAutoreleaseRVCall(
651 Function &F, Instruction *Inst, const Value *&Arg, ARCInstKind Class,
652 Instruction *AutoreleaseRV, const Value *&AutoreleaseRVArg) {
653 if (BundledInsts->contains(I: Inst))
654 return false;
655
656 // Must be in the same basic block.
657 assert(Inst->getParent() == AutoreleaseRV->getParent());
658
659 // Must operate on the same root.
660 Arg = GetArgRCIdentityRoot(Inst);
661 AutoreleaseRVArg = GetArgRCIdentityRoot(Inst: AutoreleaseRV);
662 if (Arg != AutoreleaseRVArg) {
663 // If there isn't an exact match, check if we have equivalent PHIs.
664 const PHINode *PN = dyn_cast<PHINode>(Val: Arg);
665 if (!PN)
666 return false;
667
668 SmallVector<const Value *, 4> ArgUsers;
669 getEquivalentPHIs(PN: *PN, PHIList&: ArgUsers);
670 if (!llvm::is_contained(Range&: ArgUsers, Element: AutoreleaseRVArg))
671 return false;
672 }
673
674 // Okay, this is a match. Merge them.
675 ++NumPeeps;
676 LLVM_DEBUG(dbgs() << "Found inlined objc_autoreleaseReturnValue '"
677 << *AutoreleaseRV << "' paired with '" << *Inst << "'\n");
678
679 // Delete the RV pair, starting with the AutoreleaseRV.
680 AutoreleaseRV->replaceAllUsesWith(
681 V: cast<CallInst>(Val: AutoreleaseRV)->getArgOperand(i: 0));
682 Changed = true;
683 EraseInstruction(CI: AutoreleaseRV);
684 if (Class == ARCInstKind::RetainRV) {
685 // AutoreleaseRV and RetainRV cancel out. Delete the RetainRV.
686 Inst->replaceAllUsesWith(V: cast<CallInst>(Val: Inst)->getArgOperand(i: 0));
687 EraseInstruction(CI: Inst);
688 return true;
689 }
690
691 // UnsafeClaimRV is a frontend peephole for RetainRV + Release. Since the
692 // AutoreleaseRV and RetainRV cancel out, replace UnsafeClaimRV with Release.
693 assert(Class == ARCInstKind::UnsafeClaimRV);
694 Value *CallArg = cast<CallInst>(Val: Inst)->getArgOperand(i: 0);
695 CallInst *Release =
696 CallInst::Create(Func: EP.get(kind: ARCRuntimeEntryPointKind::Release), Args: CallArg, NameStr: "",
697 InsertBefore: Inst->getIterator());
698 assert(IsAlwaysTail(ARCInstKind::UnsafeClaimRV) &&
699 "Expected UnsafeClaimRV to be safe to tail call");
700 Release->setTailCall();
701 Inst->replaceAllUsesWith(V: CallArg);
702 EraseInstruction(CI: Inst);
703
704 // Run the normal optimizations on Release.
705 OptimizeIndividualCallImpl(F, Inst: Release, Class: ARCInstKind::Release, Arg);
706 return true;
707}
708
709/// Turn objc_autoreleaseReturnValue into objc_autorelease if the result is not
710/// used as a return value.
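///
/// Illustrative IR (names are placeholders):
///
///   %v = call ptr @llvm.objc.autoreleaseReturnValue(ptr %p)
///   store ptr %v, ptr %slot        ; %p is never used as a return value
///
/// Here the call is rewritten to @llvm.objc.autorelease, and its tail marker
/// is dropped since objc_autorelease is never tail called.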
711void ObjCARCOpt::OptimizeAutoreleaseRVCall(Function &F,
712 Instruction *AutoreleaseRV,
713 ARCInstKind &Class) {
714 // Check for a return of the pointer value.
715 const Value *Ptr = GetArgRCIdentityRoot(Inst: AutoreleaseRV);
716
717 // If the argument is ConstantPointerNull or UndefValue, its other users
718 // aren't actually interesting to look at.
719 if (isa<ConstantData>(Val: Ptr))
720 return;
721
722 SmallVector<const Value *, 2> Users;
723 Users.push_back(Elt: Ptr);
724
725 // Add PHIs that are equivalent to Ptr to Users.
726 if (const PHINode *PN = dyn_cast<PHINode>(Val: Ptr))
727 getEquivalentPHIs(PN: *PN, PHIList&: Users);
728
729 do {
730 Ptr = Users.pop_back_val();
731 for (const User *U : Ptr->users()) {
732 if (isa<ReturnInst>(Val: U) || GetBasicARCInstKind(V: U) == ARCInstKind::RetainRV)
733 return;
734 if (isa<BitCastInst>(Val: U))
735 Users.push_back(Elt: U);
736 }
737 } while (!Users.empty());
738
739 Changed = true;
740 ++NumPeeps;
741
742 LLVM_DEBUG(
743 dbgs() << "Transforming objc_autoreleaseReturnValue => "
744 "objc_autorelease since its operand is not used as a return "
745 "value.\n"
746 "Old = "
747 << *AutoreleaseRV << "\n");
748
749 CallInst *AutoreleaseRVCI = cast<CallInst>(Val: AutoreleaseRV);
750 Function *NewDecl = EP.get(kind: ARCRuntimeEntryPointKind::Autorelease);
751 AutoreleaseRVCI->setCalledFunction(NewDecl);
752 AutoreleaseRVCI->setTailCall(false); // Never tail call objc_autorelease.
753 Class = ARCInstKind::Autorelease;
754
755 LLVM_DEBUG(dbgs() << "New: " << *AutoreleaseRV << "\n");
756}
757
758/// Visit each call, one at a time, and make simplifications without doing any
759/// additional analysis.
760void ObjCARCOpt::OptimizeIndividualCalls(Function &F) {
761 LLVM_DEBUG(dbgs() << "\n== ObjCARCOpt::OptimizeIndividualCalls ==\n");
762 // Reset all the flags in preparation for recomputing them.
763 UsedInThisFunction = 0;
764
765 // Store any delayed AutoreleaseRV intrinsics, so they can be easily paired
766 // with RetainRV and UnsafeClaimRV.
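  //
  // Illustrative shape of the pattern being matched, typically exposed by
  // inlining (names are placeholders):
  //
  //   %r = call ptr @llvm.objc.autoreleaseReturnValue(ptr %p)
  //   ... a few intervening non-ARC instructions ...
  //   %s = call ptr @llvm.objc.retainAutoreleasedReturnValue(ptr %r)
  //
  // The two calls cancel out and can both be removed; with
  // objc_unsafeClaimAutoreleasedReturnValue in place of the retainRV, the
  // pair instead reduces to a plain objc_release.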
767 Instruction *DelayedAutoreleaseRV = nullptr;
768 const Value *DelayedAutoreleaseRVArg = nullptr;
769 auto setDelayedAutoreleaseRV = [&](Instruction *AutoreleaseRV) {
770 assert(!DelayedAutoreleaseRV || !AutoreleaseRV);
771 DelayedAutoreleaseRV = AutoreleaseRV;
772 DelayedAutoreleaseRVArg = nullptr;
773 };
774 auto optimizeDelayedAutoreleaseRV = [&]() {
775 if (!DelayedAutoreleaseRV)
776 return;
777 OptimizeIndividualCallImpl(F, Inst: DelayedAutoreleaseRV,
778 Class: ARCInstKind::AutoreleaseRV,
779 Arg: DelayedAutoreleaseRVArg);
780 setDelayedAutoreleaseRV(nullptr);
781 };
782 auto shouldDelayAutoreleaseRV = [&](Instruction *NonARCInst) {
783 // Nothing to delay, but we may as well skip the logic below.
784 if (!DelayedAutoreleaseRV)
785 return true;
786
787 // If we hit the end of the basic block we're not going to find an RV-pair.
788 // Stop delaying.
789 if (NonARCInst->isTerminator())
790 return false;
791
792 // Given the frontend rules for emitting AutoreleaseRV, RetainRV, and
793 // UnsafeClaimRV, it's probably safe to skip over even opaque function calls
794 // here since OptimizeInlinedAutoreleaseRVCall will confirm that they
795 // have the same RCIdentityRoot. However, what really matters is
796 // skipping instructions or intrinsics that the inliner could leave behind;
797 // be conservative for now and don't skip over opaque calls, which could
798 // potentially include other ARC calls.
799 auto *CB = dyn_cast<CallBase>(Val: NonARCInst);
800 if (!CB)
801 return true;
802 return CB->getIntrinsicID() != Intrinsic::not_intrinsic;
803 };
804
805 // Visit all objc_* calls in F.
806 for (inst_iterator I = inst_begin(F: &F), E = inst_end(F: &F); I != E; ) {
807 Instruction *Inst = &*I++;
808
809 if (auto *CI = dyn_cast<CallInst>(Val: Inst))
810 if (objcarc::hasAttachedCallOpBundle(CB: CI)) {
811 BundledInsts->insertRVCall(InsertPt: I->getIterator(), AnnotatedCall: CI);
812 Changed = true;
813 }
814
815 ARCInstKind Class = GetBasicARCInstKind(V: Inst);
816
    // Skip the rest of this loop iteration if the instruction isn't itself an
    // ARC intrinsic.
818 const Value *Arg = nullptr;
819 switch (Class) {
820 default:
821 optimizeDelayedAutoreleaseRV();
822 break;
823 case ARCInstKind::CallOrUser:
824 case ARCInstKind::User:
825 case ARCInstKind::None:
826 // This is a non-ARC instruction. If we're delaying an AutoreleaseRV,
827 // check if it's safe to skip over it; if not, optimize the AutoreleaseRV
828 // now.
829 if (!shouldDelayAutoreleaseRV(Inst))
830 optimizeDelayedAutoreleaseRV();
831 continue;
832 case ARCInstKind::AutoreleaseRV:
833 optimizeDelayedAutoreleaseRV();
834 setDelayedAutoreleaseRV(Inst);
835 continue;
836 case ARCInstKind::RetainRV:
837 case ARCInstKind::UnsafeClaimRV:
838 if (DelayedAutoreleaseRV) {
839 // We have a potential RV pair. Check if they cancel out.
840 if (OptimizeInlinedAutoreleaseRVCall(F, Inst, Arg, Class,
841 AutoreleaseRV: DelayedAutoreleaseRV,
842 AutoreleaseRVArg&: DelayedAutoreleaseRVArg)) {
843 setDelayedAutoreleaseRV(nullptr);
844 continue;
845 }
846 optimizeDelayedAutoreleaseRV();
847 }
848 break;
849 }
850
851 OptimizeIndividualCallImpl(F, Inst, Class, Arg);
852 }
853
854 // Catch the final delayed AutoreleaseRV.
855 optimizeDelayedAutoreleaseRV();
856}
857
858/// This function returns true if the value is inert. An ObjC ARC runtime call
859/// taking an inert operand can be safely deleted.
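///
/// Examples of inert values, per the checks below: a null or undef pointer, a
/// global variable carrying the "objc_arc_inert" attribute, or a phi whose
/// incoming values are all themselves inert.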
860static bool isInertARCValue(Value *V, SmallPtrSet<Value *, 1> &VisitedPhis) {
861 V = V->stripPointerCasts();
862
863 if (IsNullOrUndef(V))
864 return true;
865
866 // See if this is a global attribute annotated with an 'objc_arc_inert'.
867 if (auto *GV = dyn_cast<GlobalVariable>(Val: V))
868 if (GV->hasAttribute(Kind: "objc_arc_inert"))
869 return true;
870
871 if (auto PN = dyn_cast<PHINode>(Val: V)) {
872 // Ignore this phi if it has already been discovered.
873 if (!VisitedPhis.insert(Ptr: PN).second)
874 return true;
875 // Look through phis's operands.
876 for (Value *Opnd : PN->incoming_values())
877 if (!isInertARCValue(V: Opnd, VisitedPhis))
878 return false;
879 return true;
880 }
881
882 return false;
883}
884
885void ObjCARCOpt::OptimizeIndividualCallImpl(Function &F, Instruction *Inst,
886 ARCInstKind Class,
887 const Value *Arg) {
888 LLVM_DEBUG(dbgs() << "Visiting: Class: " << Class << "; " << *Inst << "\n");
889
890 // We can delete this call if it takes an inert value.
891 SmallPtrSet<Value *, 1> VisitedPhis;
892
893 if (BundledInsts->contains(I: Inst)) {
894 UsedInThisFunction |= 1 << unsigned(Class);
895 return;
896 }
897
898 if (IsNoopOnGlobal(Class))
899 if (isInertARCValue(V: Inst->getOperand(i: 0), VisitedPhis)) {
900 if (!Inst->getType()->isVoidTy())
901 Inst->replaceAllUsesWith(V: Inst->getOperand(i: 0));
902 Inst->eraseFromParent();
903 Changed = true;
904 return;
905 }
906
907 switch (Class) {
908 default:
909 break;
910
911 // Delete no-op casts. These function calls have special semantics, but
912 // the semantics are entirely implemented via lowering in the front-end,
913 // so by the time they reach the optimizer, they are just no-op calls
914 // which return their argument.
915 //
916 // There are gray areas here, as the ability to cast reference-counted
917 // pointers to raw void* and back allows code to break ARC assumptions,
918 // however these are currently considered to be unimportant.
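  //
  // (Illustratively, these are calls such as objc_retainedObject,
  // objc_unretainedObject, and objc_unretainedPointer, which simply return
  // their argument.)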
919 case ARCInstKind::NoopCast:
920 Changed = true;
921 ++NumNoops;
922 LLVM_DEBUG(dbgs() << "Erasing no-op cast: " << *Inst << "\n");
923 EraseInstruction(CI: Inst);
924 return;
925
926 // If the pointer-to-weak-pointer is null, it's undefined behavior.
927 case ARCInstKind::StoreWeak:
928 case ARCInstKind::LoadWeak:
929 case ARCInstKind::LoadWeakRetained:
930 case ARCInstKind::InitWeak:
931 case ARCInstKind::DestroyWeak: {
932 CallInst *CI = cast<CallInst>(Val: Inst);
933 if (IsNullOrUndef(V: CI->getArgOperand(i: 0))) {
934 Changed = true;
935 new StoreInst(ConstantInt::getTrue(Context&: CI->getContext()),
936 PoisonValue::get(T: PointerType::getUnqual(C&: CI->getContext())),
937 CI->getIterator());
938 Value *NewValue = PoisonValue::get(T: CI->getType());
939 LLVM_DEBUG(
940 dbgs() << "A null pointer-to-weak-pointer is undefined behavior."
941 "\nOld = "
942 << *CI << "\nNew = " << *NewValue << "\n");
943 CI->replaceAllUsesWith(V: NewValue);
944 CI->eraseFromParent();
945 return;
946 }
947 break;
948 }
949 case ARCInstKind::CopyWeak:
950 case ARCInstKind::MoveWeak: {
951 CallInst *CI = cast<CallInst>(Val: Inst);
952 if (IsNullOrUndef(V: CI->getArgOperand(i: 0)) ||
953 IsNullOrUndef(V: CI->getArgOperand(i: 1))) {
954 Changed = true;
955 new StoreInst(ConstantInt::getTrue(Context&: CI->getContext()),
956 PoisonValue::get(T: PointerType::getUnqual(C&: CI->getContext())),
957 CI->getIterator());
958
959 Value *NewValue = PoisonValue::get(T: CI->getType());
960 LLVM_DEBUG(
961 dbgs() << "A null pointer-to-weak-pointer is undefined behavior."
962 "\nOld = "
963 << *CI << "\nNew = " << *NewValue << "\n");
964
965 CI->replaceAllUsesWith(V: NewValue);
966 CI->eraseFromParent();
967 return;
968 }
969 break;
970 }
971 case ARCInstKind::RetainRV:
972 if (OptimizeRetainRVCall(F, RetainRV: Inst))
973 return;
974 break;
975 case ARCInstKind::AutoreleaseRV:
976 OptimizeAutoreleaseRVCall(F, AutoreleaseRV: Inst, Class);
977 break;
978 }
979
980 // objc_autorelease(x) -> objc_release(x) if x is otherwise unused.
981 if (IsAutorelease(Class) && Inst->use_empty()) {
982 CallInst *Call = cast<CallInst>(Val: Inst);
983 const Value *Arg = Call->getArgOperand(i: 0);
984 Arg = FindSingleUseIdentifiedObject(Arg);
985 if (Arg) {
986 Changed = true;
987 ++NumAutoreleases;
988
989 // Create the declaration lazily.
990 LLVMContext &C = Inst->getContext();
991
992 Function *Decl = EP.get(kind: ARCRuntimeEntryPointKind::Release);
993 CallInst *NewCall = CallInst::Create(Func: Decl, Args: Call->getArgOperand(i: 0), NameStr: "",
994 InsertBefore: Call->getIterator());
995 NewCall->setMetadata(KindID: MDKindCache.get(ID: ARCMDKindID::ImpreciseRelease),
996 Node: MDNode::get(Context&: C, MDs: {}));
997
998 LLVM_DEBUG(dbgs() << "Replacing autorelease{,RV}(x) with objc_release(x) "
999 "since x is otherwise unused.\nOld: "
1000 << *Call << "\nNew: " << *NewCall << "\n");
1001
1002 EraseInstruction(CI: Call);
1003 Inst = NewCall;
1004 Class = ARCInstKind::Release;
1005 }
1006 }
1007
1008 // For functions which can never be passed stack arguments, add
1009 // a tail keyword.
1010 if (IsAlwaysTail(Class) && !cast<CallInst>(Val: Inst)->isNoTailCall()) {
1011 Changed = true;
1012 LLVM_DEBUG(
1013 dbgs() << "Adding tail keyword to function since it can never be "
1014 "passed stack args: "
1015 << *Inst << "\n");
1016 cast<CallInst>(Val: Inst)->setTailCall();
1017 }
1018
1019 // Ensure that functions that can never have a "tail" keyword due to the
1020 // semantics of ARC truly do not do so.
1021 if (IsNeverTail(Class)) {
1022 Changed = true;
1023 LLVM_DEBUG(dbgs() << "Removing tail keyword from function: " << *Inst
1024 << "\n");
1025 cast<CallInst>(Val: Inst)->setTailCall(false);
1026 }
1027
1028 // Set nounwind as needed.
1029 if (IsNoThrow(Class)) {
1030 Changed = true;
1031 LLVM_DEBUG(dbgs() << "Found no throw class. Setting nounwind on: " << *Inst
1032 << "\n");
1033 cast<CallInst>(Val: Inst)->setDoesNotThrow();
1034 }
1035
1036 // Note: This catches instructions unrelated to ARC.
1037 if (!IsNoopOnNull(Class)) {
1038 UsedInThisFunction |= 1 << unsigned(Class);
1039 return;
1040 }
1041
1042 // If we haven't already looked up the root, look it up now.
1043 if (!Arg)
1044 Arg = GetArgRCIdentityRoot(Inst);
1045
1046 // ARC calls with null are no-ops. Delete them.
1047 if (IsNullOrUndef(V: Arg)) {
1048 Changed = true;
1049 ++NumNoops;
1050 LLVM_DEBUG(dbgs() << "ARC calls with null are no-ops. Erasing: " << *Inst
1051 << "\n");
1052 EraseInstruction(CI: Inst);
1053 return;
1054 }
1055
1056 // Keep track of which of retain, release, autorelease, and retain_block
1057 // are actually present in this function.
1058 UsedInThisFunction |= 1 << unsigned(Class);
1059
  // If Arg is a PHI whose incoming values include null, the call is
  // control-equivalent to the PHI, there are no relevant side effects between
  // the PHI and the call, and the call is either not a release or is a
  // release carrying the clang.imprecise_release tag, then the call could be
  // pushed up onto just those paths with non-null incoming values. For now,
  // don't bother splitting critical edges for this.
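  //
  // Illustrative sketch (names are placeholders): given
  //
  //   %phi = phi ptr [ null, %bb1 ], [ %obj, %bb2 ]
  //   call void @llvm.objc.release(ptr %phi)   ; has clang.imprecise_release
  //
  // the release is a no-op along the %bb1 path, so a clone operating on %obj
  // can be placed at the end of %bb2 and the original call deleted.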
1066 if (Class == ARCInstKind::Release &&
1067 !Inst->getMetadata(KindID: MDKindCache.get(ID: ARCMDKindID::ImpreciseRelease)))
1068 return;
1069
1070 SmallVector<std::pair<Instruction *, const Value *>, 4> Worklist;
1071 Worklist.push_back(Elt: std::make_pair(x&: Inst, y&: Arg));
1072 do {
1073 std::pair<Instruction *, const Value *> Pair = Worklist.pop_back_val();
1074 Inst = Pair.first;
1075 Arg = Pair.second;
1076
1077 const PHINode *PN = dyn_cast<PHINode>(Val: Arg);
1078 if (!PN)
1079 continue;
1080
1081 // Determine if the PHI has any null operands, or any incoming
1082 // critical edges.
1083 bool HasNull = false;
1084 bool HasCriticalEdges = false;
1085 for (unsigned i = 0, e = PN->getNumIncomingValues(); i != e; ++i) {
1086 Value *Incoming = GetRCIdentityRoot(V: PN->getIncomingValue(i));
1087 if (IsNullOrUndef(V: Incoming))
1088 HasNull = true;
1089 else if (PN->getIncomingBlock(i)->getTerminator()->getNumSuccessors() !=
1090 1) {
1091 HasCriticalEdges = true;
1092 break;
1093 }
1094 }
1095 // If we have null operands and no critical edges, optimize.
1096 if (HasCriticalEdges)
1097 continue;
1098 if (!HasNull)
1099 continue;
1100
1101 Instruction *DepInst = nullptr;
1102
1103 // Check that there is nothing that cares about the reference
1104 // count between the call and the phi.
1105 switch (Class) {
1106 case ARCInstKind::Retain:
1107 case ARCInstKind::RetainBlock:
1108 // These can always be moved up.
1109 break;
1110 case ARCInstKind::Release:
1111 // These can't be moved across things that care about the retain
1112 // count.
1113 DepInst = findSingleDependency(Flavor: NeedsPositiveRetainCount, Arg,
1114 StartBB: Inst->getParent(), StartInst: Inst, PA);
1115 break;
1116 case ARCInstKind::Autorelease:
1117 // These can't be moved across autorelease pool scope boundaries.
1118 DepInst = findSingleDependency(Flavor: AutoreleasePoolBoundary, Arg,
1119 StartBB: Inst->getParent(), StartInst: Inst, PA);
1120 break;
1121 case ARCInstKind::UnsafeClaimRV:
1122 case ARCInstKind::RetainRV:
1123 case ARCInstKind::AutoreleaseRV:
1124 // Don't move these; the RV optimization depends on the autoreleaseRV
1125 // being tail called, and the retainRV being immediately after a call
1126 // (which might still happen if we get lucky with codegen layout, but
1127 // it's not worth taking the chance).
1128 continue;
1129 default:
1130 llvm_unreachable("Invalid dependence flavor");
1131 }
1132
1133 if (DepInst != PN)
1134 continue;
1135
1136 Changed = true;
1137 ++NumPartialNoops;
1138 // Clone the call into each predecessor that has a non-null value.
1139 CallInst *CInst = cast<CallInst>(Val: Inst);
1140 Type *ParamTy = CInst->getArgOperand(i: 0)->getType();
1141 for (unsigned i = 0, e = PN->getNumIncomingValues(); i != e; ++i) {
1142 Value *Incoming = GetRCIdentityRoot(V: PN->getIncomingValue(i));
1143 if (IsNullOrUndef(V: Incoming))
1144 continue;
1145 Value *Op = PN->getIncomingValue(i);
1146 BasicBlock::iterator InsertPos =
1147 PN->getIncomingBlock(i)->back().getIterator();
1148 SmallVector<OperandBundleDef, 1> OpBundles;
1149 cloneOpBundlesIf(CI: CInst, OpBundles, Predicate: [](const OperandBundleUse &B) {
1150 return B.getTagID() != LLVMContext::OB_funclet;
1151 });
1152 addOpBundleForFunclet(BB: InsertPos->getParent(), OpBundles);
1153 CallInst *Clone = CallInst::Create(CI: CInst, Bundles: OpBundles);
1154 if (Op->getType() != ParamTy)
1155 Op = new BitCastInst(Op, ParamTy, "", InsertPos);
1156 Clone->setArgOperand(i: 0, v: Op);
1157 Clone->insertBefore(BB&: *InsertPos->getParent(), InsertPos);
1158
1159 LLVM_DEBUG(dbgs() << "Cloning " << *CInst << "\n"
1160 "And inserting clone at "
1161 << *InsertPos << "\n");
1162 Worklist.push_back(Elt: std::make_pair(x&: Clone, y&: Incoming));
1163 }
1164 // Erase the original call.
1165 LLVM_DEBUG(dbgs() << "Erasing: " << *CInst << "\n");
1166 EraseInstruction(CI: CInst);
1167 } while (!Worklist.empty());
1168}
1169
1170/// If we have a top down pointer in the S_Use state, make sure that there are
1171/// no CFG hazards by checking the states of various bottom up pointers.
1172static void CheckForUseCFGHazard(const Sequence SuccSSeq,
1173 const bool SuccSRRIKnownSafe,
1174 TopDownPtrState &S,
1175 bool &SomeSuccHasSame,
1176 bool &AllSuccsHaveSame,
1177 bool &NotAllSeqEqualButKnownSafe,
1178 bool &ShouldContinue) {
1179 switch (SuccSSeq) {
1180 case S_CanRelease: {
1181 if (!S.IsKnownSafe() && !SuccSRRIKnownSafe) {
1182 S.ClearSequenceProgress();
1183 break;
1184 }
1185 S.SetCFGHazardAfflicted(true);
1186 ShouldContinue = true;
1187 break;
1188 }
1189 case S_Use:
1190 SomeSuccHasSame = true;
1191 break;
1192 case S_Stop:
1193 case S_MovableRelease:
1194 if (!S.IsKnownSafe() && !SuccSRRIKnownSafe)
1195 AllSuccsHaveSame = false;
1196 else
1197 NotAllSeqEqualButKnownSafe = true;
1198 break;
1199 case S_Retain:
1200 llvm_unreachable("bottom-up pointer in retain state!");
1201 case S_None:
1202 llvm_unreachable("This should have been handled earlier.");
1203 }
1204}
1205
1206/// If we have a Top Down pointer in the S_CanRelease state, make sure that
1207/// there are no CFG hazards by checking the states of various bottom up
1208/// pointers.
1209static void CheckForCanReleaseCFGHazard(const Sequence SuccSSeq,
1210 const bool SuccSRRIKnownSafe,
1211 TopDownPtrState &S,
1212 bool &SomeSuccHasSame,
1213 bool &AllSuccsHaveSame,
1214 bool &NotAllSeqEqualButKnownSafe) {
1215 switch (SuccSSeq) {
1216 case S_CanRelease:
1217 SomeSuccHasSame = true;
1218 break;
1219 case S_Stop:
1220 case S_MovableRelease:
1221 case S_Use:
1222 if (!S.IsKnownSafe() && !SuccSRRIKnownSafe)
1223 AllSuccsHaveSame = false;
1224 else
1225 NotAllSeqEqualButKnownSafe = true;
1226 break;
1227 case S_Retain:
1228 llvm_unreachable("bottom-up pointer in retain state!");
1229 case S_None:
1230 llvm_unreachable("This should have been handled earlier.");
1231 }
1232}
1233
1234/// Check for critical edges, loop boundaries, irreducible control flow, or
1235/// other CFG structures where moving code across the edge would result in it
1236/// being executed more.
1237void
1238ObjCARCOpt::CheckForCFGHazards(const BasicBlock *BB,
1239 DenseMap<const BasicBlock *, BBState> &BBStates,
1240 BBState &MyStates) const {
  // If any top-down local-use or possible-decrement state has a successor
  // whose state is earlier in the sequence, forget it.
1243 for (auto I = MyStates.top_down_ptr_begin(), E = MyStates.top_down_ptr_end();
1244 I != E; ++I) {
1245 TopDownPtrState &S = I->second;
1246 const Sequence Seq = I->second.GetSeq();
1247
1248 // We only care about S_Retain, S_CanRelease, and S_Use.
1249 if (Seq == S_None)
1250 continue;
1251
    // Make sure that, if extra top-down states are added in the future, this
    // code is updated to handle them.
1254 assert((Seq == S_Retain || Seq == S_CanRelease || Seq == S_Use) &&
1255 "Unknown top down sequence state.");
1256
1257 const Value *Arg = I->first;
1258 bool SomeSuccHasSame = false;
1259 bool AllSuccsHaveSame = true;
1260 bool NotAllSeqEqualButKnownSafe = false;
1261
1262 for (const BasicBlock *Succ : successors(BB)) {
1263 // If VisitBottomUp has pointer information for this successor, take
1264 // what we know about it.
1265 const DenseMap<const BasicBlock *, BBState>::iterator BBI =
1266 BBStates.find(Val: Succ);
1267 assert(BBI != BBStates.end());
1268 const BottomUpPtrState &SuccS = BBI->second.getPtrBottomUpState(Arg);
1269 const Sequence SuccSSeq = SuccS.GetSeq();
1270
      // If, bottom-up, the pointer is in an S_None state, clear the sequence
      // progress: the bottom-up sequence has already finished, which suggests
      // a mismatch between retains and releases. This is true for all three
      // cases we are handling here: S_Retain, S_Use, and S_CanRelease.
1276 if (SuccSSeq == S_None) {
1277 S.ClearSequenceProgress();
1278 continue;
1279 }
1280
      // If we have S_Use or S_CanRelease, perform the CFG hazard checks
      // below.
1283 const bool SuccSRRIKnownSafe = SuccS.IsKnownSafe();
1284
1285 // *NOTE* We do not use Seq from above here since we are allowing for
1286 // S.GetSeq() to change while we are visiting basic blocks.
1287 switch(S.GetSeq()) {
1288 case S_Use: {
1289 bool ShouldContinue = false;
1290 CheckForUseCFGHazard(SuccSSeq, SuccSRRIKnownSafe, S, SomeSuccHasSame,
1291 AllSuccsHaveSame, NotAllSeqEqualButKnownSafe,
1292 ShouldContinue);
1293 if (ShouldContinue)
1294 continue;
1295 break;
1296 }
1297 case S_CanRelease:
1298 CheckForCanReleaseCFGHazard(SuccSSeq, SuccSRRIKnownSafe, S,
1299 SomeSuccHasSame, AllSuccsHaveSame,
1300 NotAllSeqEqualButKnownSafe);
1301 break;
1302 case S_Retain:
1303 case S_None:
1304 case S_Stop:
1305 case S_MovableRelease:
1306 break;
1307 }
1308 }
1309
1310 // If the state at the other end of any of the successor edges
1311 // matches the current state, require all edges to match. This
1312 // guards against loops in the middle of a sequence.
1313 if (SomeSuccHasSame && !AllSuccsHaveSame) {
1314 S.ClearSequenceProgress();
1315 } else if (NotAllSeqEqualButKnownSafe) {
      // If we would have cleared the state were it not for the fact that we
      // are known safe, stop code motion. Whether it is safe to remove RR
      // pairs via KnownSafe is orthogonal to whether we are allowed to
      // perform code motion.
1320 S.SetCFGHazardAfflicted(true);
1321 }
1322 }
1323}
1324
1325bool ObjCARCOpt::VisitInstructionBottomUp(
1326 Instruction *Inst, BasicBlock *BB, BlotMapVector<Value *, RRInfo> &Retains,
1327 BBState &MyStates) {
1328 bool NestingDetected = false;
1329 ARCInstKind Class = GetARCInstKind(V: Inst);
1330 const Value *Arg = nullptr;
1331
1332 LLVM_DEBUG(dbgs() << " Class: " << Class << "\n");
1333
1334 switch (Class) {
1335 case ARCInstKind::Release: {
1336 Arg = GetArgRCIdentityRoot(Inst);
1337
1338 BottomUpPtrState &S = MyStates.getPtrBottomUpState(Arg);
1339 NestingDetected |= S.InitBottomUp(Cache&: MDKindCache, I: Inst);
1340 break;
1341 }
1342 case ARCInstKind::RetainBlock:
1343 // In OptimizeIndividualCalls, we have strength reduced all optimizable
1344 // objc_retainBlocks to objc_retains. Thus at this point any
1345 // objc_retainBlocks that we see are not optimizable.
1346 break;
1347 case ARCInstKind::Retain:
1348 case ARCInstKind::RetainRV: {
1349 Arg = GetArgRCIdentityRoot(Inst);
1350 BottomUpPtrState &S = MyStates.getPtrBottomUpState(Arg);
1351 if (S.MatchWithRetain()) {
1352 // Don't do retain+release tracking for ARCInstKind::RetainRV, because
1353 // it's better to let it remain as the first instruction after a call.
1354 if (Class != ARCInstKind::RetainRV) {
1355 LLVM_DEBUG(dbgs() << " Matching with: " << *Inst << "\n");
1356 Retains[Inst] = S.GetRRInfo();
1357 }
1358 S.ClearSequenceProgress();
1359 }
1360 // A retain moving bottom up can be a use.
1361 break;
1362 }
1363 case ARCInstKind::AutoreleasepoolPop:
1364 // Conservatively, clear MyStates for all known pointers.
1365 MyStates.clearBottomUpPointers();
1366 return NestingDetected;
1367 case ARCInstKind::AutoreleasepoolPush:
1368 case ARCInstKind::None:
1369 // These are irrelevant.
1370 return NestingDetected;
1371 default:
1372 break;
1373 }
1374
1375 // Consider any other possible effects of this instruction on each
1376 // pointer being tracked.
1377 for (auto MI = MyStates.bottom_up_ptr_begin(),
1378 ME = MyStates.bottom_up_ptr_end();
1379 MI != ME; ++MI) {
1380 const Value *Ptr = MI->first;
1381 if (Ptr == Arg)
1382 continue; // Handled above.
1383 BottomUpPtrState &S = MI->second;
1384
1385 if (S.HandlePotentialAlterRefCount(Inst, Ptr, PA, Class))
1386 continue;
1387
1388 S.HandlePotentialUse(BB, Inst, Ptr, PA, Class);
1389 }
1390
1391 return NestingDetected;
1392}
1393
1394bool ObjCARCOpt::VisitBottomUp(BasicBlock *BB,
1395 DenseMap<const BasicBlock *, BBState> &BBStates,
1396 BlotMapVector<Value *, RRInfo> &Retains) {
1397 LLVM_DEBUG(dbgs() << "\n== ObjCARCOpt::VisitBottomUp ==\n");
1398
1399 bool NestingDetected = false;
1400 BBState &MyStates = BBStates[BB];
1401
1402 // Merge the states from each successor to compute the initial state
1403 // for the current block.
1404 BBState::edge_iterator SI(MyStates.succ_begin()),
1405 SE(MyStates.succ_end());
1406 if (SI != SE) {
1407 const BasicBlock *Succ = *SI;
1408 DenseMap<const BasicBlock *, BBState>::iterator I = BBStates.find(Val: Succ);
1409 assert(I != BBStates.end());
1410 MyStates.InitFromSucc(Other: I->second);
1411 ++SI;
1412 for (; SI != SE; ++SI) {
1413 Succ = *SI;
1414 I = BBStates.find(Val: Succ);
1415 assert(I != BBStates.end());
1416 MyStates.MergeSucc(Other: I->second);
1417 }
1418 }
1419
1420 LLVM_DEBUG(dbgs() << "Before:\n"
1421 << BBStates[BB] << "\n"
1422 << "Performing Dataflow:\n");
1423
1424 // Visit all the instructions, bottom-up.
1425 for (BasicBlock::iterator I = BB->end(), E = BB->begin(); I != E; --I) {
1426 Instruction *Inst = &*std::prev(x: I);
1427
1428 // Invoke instructions are visited as part of their successors (below).
1429 if (isa<InvokeInst>(Val: Inst))
1430 continue;
1431
1432 LLVM_DEBUG(dbgs() << " Visiting " << *Inst << "\n");
1433
1434 NestingDetected |= VisitInstructionBottomUp(Inst, BB, Retains, MyStates);
1435
1436 // Bail out if the number of pointers being tracked becomes too large so
1437 // that this pass can complete in a reasonable amount of time.
1438 if (MyStates.bottom_up_ptr_list_size() > MaxPtrStates) {
1439 DisableRetainReleasePairing = true;
1440 return false;
1441 }
1442 }
1443
1444 // If there's a predecessor with an invoke, visit the invoke as if it were
1445 // part of this block, since we can't insert code after an invoke in its own
1446 // block, and we don't want to split critical edges.
1447 for (BBState::edge_iterator PI(MyStates.pred_begin()),
1448 PE(MyStates.pred_end()); PI != PE; ++PI) {
1449 BasicBlock *Pred = *PI;
1450 if (InvokeInst *II = dyn_cast<InvokeInst>(Val: &Pred->back()))
1451 NestingDetected |= VisitInstructionBottomUp(Inst: II, BB, Retains, MyStates);
1452 }
1453
1454 LLVM_DEBUG(dbgs() << "\nFinal State:\n" << BBStates[BB] << "\n");
1455
1456 return NestingDetected;
1457}
1458
1459// Fill ReleaseInsertPtToRCIdentityRoots, which is a map from insertion points
1460// to the set of RC identity roots that would be released by the release calls
1461// moved to the insertion points.
1462static void collectReleaseInsertPts(
1463 const BlotMapVector<Value *, RRInfo> &Retains,
1464 DenseMap<const Instruction *, SmallPtrSet<const Value *, 2>>
1465 &ReleaseInsertPtToRCIdentityRoots) {
1466 for (const auto &P : Retains) {
1467 // Retains is a map from an objc_retain call to a RRInfo of the RC identity
1468 // root of the call. Get the RC identity root of the objc_retain call.
1469 Instruction *Retain = cast<Instruction>(Val: P.first);
1470 Value *Root = GetRCIdentityRoot(V: Retain->getOperand(i: 0));
1471 // Collect all the insertion points of the objc_release calls that release
1472 // the RC identity root of the objc_retain call.
1473 for (const Instruction *InsertPt : P.second.ReverseInsertPts)
1474 ReleaseInsertPtToRCIdentityRoots[InsertPt].insert(Ptr: Root);
1475 }
1476}
1477
1478// Get the RC identity roots from an insertion point of an objc_release call.
1479// Return nullptr if the passed instruction isn't an insertion point.
1480static const SmallPtrSet<const Value *, 2> *
1481getRCIdentityRootsFromReleaseInsertPt(
1482 const Instruction *InsertPt,
1483 const DenseMap<const Instruction *, SmallPtrSet<const Value *, 2>>
1484 &ReleaseInsertPtToRCIdentityRoots) {
1485 auto I = ReleaseInsertPtToRCIdentityRoots.find(Val: InsertPt);
1486 if (I == ReleaseInsertPtToRCIdentityRoots.end())
1487 return nullptr;
1488 return &I->second;
1489}
1490
1491bool ObjCARCOpt::VisitInstructionTopDown(
1492 Instruction *Inst, DenseMap<Value *, RRInfo> &Releases, BBState &MyStates,
1493 const DenseMap<const Instruction *, SmallPtrSet<const Value *, 2>>
1494 &ReleaseInsertPtToRCIdentityRoots) {
1495 bool NestingDetected = false;
1496 ARCInstKind Class = GetARCInstKind(V: Inst);
1497 const Value *Arg = nullptr;
1498
1499 // Make sure a call to objc_retain isn't moved past insertion points of calls
1500 // to objc_release.
1501 if (const SmallPtrSet<const Value *, 2> *Roots =
1502 getRCIdentityRootsFromReleaseInsertPt(
1503 InsertPt: Inst, ReleaseInsertPtToRCIdentityRoots))
1504 for (const auto *Root : *Roots) {
1505 TopDownPtrState &S = MyStates.getPtrTopDownState(Arg: Root);
1506 // Disable code motion if the current position is S_Retain to prevent
1507 // moving the objc_retain call past objc_release calls. If it's
1508 // S_CanRelease or larger, it's not necessary to disable code motion as
1509 // the insertion points that prevent the objc_retain call from moving down
1510 // should have been set already.
1511 if (S.GetSeq() == S_Retain)
1512 S.SetCFGHazardAfflicted(true);
1513 }
1514
1515 LLVM_DEBUG(dbgs() << " Class: " << Class << "\n");
1516
1517 switch (Class) {
1518 case ARCInstKind::RetainBlock:
1519 // In OptimizeIndividualCalls, we have strength reduced all optimizable
1520 // objc_retainBlocks to objc_retains. Thus at this point any
1521 // objc_retainBlocks that we see are not optimizable. We need to break since
1522 // a retain can be a potential use.
1523 break;
1524 case ARCInstKind::Retain:
1525 case ARCInstKind::RetainRV: {
1526 Arg = GetArgRCIdentityRoot(Inst);
1527 TopDownPtrState &S = MyStates.getPtrTopDownState(Arg);
1528 NestingDetected |= S.InitTopDown(Kind: Class, I: Inst);
1529 // A retain can be a potential use; proceed to the generic checking
1530 // code below.
1531 break;
1532 }
1533 case ARCInstKind::Release: {
1534 Arg = GetArgRCIdentityRoot(Inst);
1535 TopDownPtrState &S = MyStates.getPtrTopDownState(Arg);
1536 // Try to form a tentative pair in between this release instruction and the
1537 // top down pointers that we are tracking.
1538 if (S.MatchWithRelease(Cache&: MDKindCache, Release: Inst)) {
1539 // If we succeed, copy S's RRInfo into the Release -> {Retain Set
1540 // Map}. Then we clear S.
1541 LLVM_DEBUG(dbgs() << " Matching with: " << *Inst << "\n");
1542 Releases[Inst] = S.GetRRInfo();
1543 S.ClearSequenceProgress();
1544 }
1545 break;
1546 }
1547 case ARCInstKind::AutoreleasepoolPop:
1548 // Conservatively, clear MyStates for all known pointers.
1549 MyStates.clearTopDownPointers();
1550 return false;
1551 case ARCInstKind::AutoreleasepoolPush:
1552 case ARCInstKind::None:
    // These cannot be uses of any pointer we are tracking.
1554 return false;
1555 default:
1556 break;
1557 }
1558
1559 // Consider any other possible effects of this instruction on each
1560 // pointer being tracked.
1561 for (auto MI = MyStates.top_down_ptr_begin(),
1562 ME = MyStates.top_down_ptr_end();
1563 MI != ME; ++MI) {
1564 const Value *Ptr = MI->first;
1565 if (Ptr == Arg)
1566 continue; // Handled above.
1567 TopDownPtrState &S = MI->second;
1568 if (S.HandlePotentialAlterRefCount(Inst, Ptr, PA, Class, BundledRVs: *BundledInsts))
1569 continue;
1570
1571 S.HandlePotentialUse(Inst, Ptr, PA, Class);
1572 }
1573
1574 return NestingDetected;
1575}
1576
1577bool ObjCARCOpt::VisitTopDown(
1578 BasicBlock *BB, DenseMap<const BasicBlock *, BBState> &BBStates,
1579 DenseMap<Value *, RRInfo> &Releases,
1580 const DenseMap<const Instruction *, SmallPtrSet<const Value *, 2>>
1581 &ReleaseInsertPtToRCIdentityRoots) {
1582 LLVM_DEBUG(dbgs() << "\n== ObjCARCOpt::VisitTopDown ==\n");
1583 bool NestingDetected = false;
1584 BBState &MyStates = BBStates[BB];
1585
1586 // Merge the states from each predecessor to compute the initial state
1587 // for the current block.
1588 BBState::edge_iterator PI(MyStates.pred_begin()),
1589 PE(MyStates.pred_end());
1590 if (PI != PE) {
1591 const BasicBlock *Pred = *PI;
1592 DenseMap<const BasicBlock *, BBState>::iterator I = BBStates.find(Val: Pred);
1593 assert(I != BBStates.end());
1594 MyStates.InitFromPred(Other: I->second);
1595 ++PI;
1596 for (; PI != PE; ++PI) {
1597 Pred = *PI;
1598 I = BBStates.find(Val: Pred);
1599 assert(I != BBStates.end());
1600 MyStates.MergePred(Other: I->second);
1601 }
1602 }
1603
1604 // Check that BB and MyStates have the same number of predecessors. This
1605 // prevents retain calls that live outside a loop from being moved into the
1606 // loop.
1607 if (!BB->hasNPredecessors(N: MyStates.pred_end() - MyStates.pred_begin()))
1608 for (auto I = MyStates.top_down_ptr_begin(),
1609 E = MyStates.top_down_ptr_end();
1610 I != E; ++I)
1611 I->second.SetCFGHazardAfflicted(true);
1612
1613 LLVM_DEBUG(dbgs() << "Before:\n"
1614 << BBStates[BB] << "\n"
1615 << "Performing Dataflow:\n");
1616
1617 // Visit all the instructions, top-down.
1618 for (Instruction &Inst : *BB) {
1619 LLVM_DEBUG(dbgs() << " Visiting " << Inst << "\n");
1620
1621 NestingDetected |= VisitInstructionTopDown(
1622 Inst: &Inst, Releases, MyStates, ReleaseInsertPtToRCIdentityRoots);
1623
1624 // Bail out if the number of pointers being tracked becomes too large so
1625 // that this pass can complete in a reasonable amount of time.
1626 if (MyStates.top_down_ptr_list_size() > MaxPtrStates) {
1627 DisableRetainReleasePairing = true;
1628 return false;
1629 }
1630 }
1631
1632 LLVM_DEBUG(dbgs() << "\nState Before Checking for CFG Hazards:\n"
1633 << BBStates[BB] << "\n\n");
1634 CheckForCFGHazards(BB, BBStates, MyStates);
1635 LLVM_DEBUG(dbgs() << "Final State:\n" << BBStates[BB] << "\n");
1636 return NestingDetected;
1637}
1638
1639static void
1640ComputePostOrders(Function &F,
1641 SmallVectorImpl<BasicBlock *> &PostOrder,
1642 SmallVectorImpl<BasicBlock *> &ReverseCFGPostOrder,
1643 unsigned NoObjCARCExceptionsMDKind,
1644 DenseMap<const BasicBlock *, BBState> &BBStates) {
1645 /// The visited set, for doing DFS walks.
1646 SmallPtrSet<BasicBlock *, 16> Visited;
1647
1648 // Do DFS, computing the PostOrder.
1649 SmallPtrSet<BasicBlock *, 16> OnStack;
1650 SmallVector<std::pair<BasicBlock *, succ_iterator>, 16> SuccStack;
1651
1652 // Functions always have exactly one entry block, and we don't have
1653 // any other block that we treat like an entry block.
1654 BasicBlock *EntryBB = &F.getEntryBlock();
1655 BBState &MyStates = BBStates[EntryBB];
1656 MyStates.SetAsEntry();
1657 Instruction *EntryTI = EntryBB->getTerminator();
1658 SuccStack.push_back(Elt: std::make_pair(x&: EntryBB, y: succ_iterator(EntryTI)));
1659 Visited.insert(Ptr: EntryBB);
1660 OnStack.insert(Ptr: EntryBB);
1661 do {
1662 dfs_next_succ:
1663 BasicBlock *CurrBB = SuccStack.back().first;
1664 succ_iterator SE(CurrBB->getTerminator(), false);
1665
1666 while (SuccStack.back().second != SE) {
1667 BasicBlock *SuccBB = *SuccStack.back().second++;
1668 if (Visited.insert(Ptr: SuccBB).second) {
1669 SuccStack.push_back(
1670 Elt: std::make_pair(x&: SuccBB, y: succ_iterator(SuccBB->getTerminator())));
1671 BBStates[CurrBB].addSucc(Succ: SuccBB);
1672 BBState &SuccStates = BBStates[SuccBB];
1673 SuccStates.addPred(Pred: CurrBB);
1674 OnStack.insert(Ptr: SuccBB);
1675 goto dfs_next_succ;
1676 }
1677
1678 if (!OnStack.count(Ptr: SuccBB)) {
1679 BBStates[CurrBB].addSucc(Succ: SuccBB);
1680 BBStates[SuccBB].addPred(Pred: CurrBB);
1681 }
1682 }
1683 OnStack.erase(Ptr: CurrBB);
1684 PostOrder.push_back(Elt: CurrBB);
1685 SuccStack.pop_back();
1686 } while (!SuccStack.empty());
1687
1688 Visited.clear();
1689
1690 // Do reverse-CFG DFS, computing the reverse-CFG PostOrder.
  // Functions may have many exits, and there are also blocks which we treat
  // as exits due to ignored edges.
1693 SmallVector<std::pair<BasicBlock *, BBState::edge_iterator>, 16> PredStack;
1694 for (BasicBlock &ExitBB : F) {
1695 BBState &MyStates = BBStates[&ExitBB];
1696 if (!MyStates.isExit())
1697 continue;
1698
1699 MyStates.SetAsExit();
1700
1701 PredStack.push_back(Elt: std::make_pair(x: &ExitBB, y: MyStates.pred_begin()));
1702 Visited.insert(Ptr: &ExitBB);
1703 while (!PredStack.empty()) {
1704 reverse_dfs_next_succ:
1705 BBState::edge_iterator PE = BBStates[PredStack.back().first].pred_end();
1706 while (PredStack.back().second != PE) {
1707 BasicBlock *BB = *PredStack.back().second++;
1708 if (Visited.insert(Ptr: BB).second) {
1709 PredStack.push_back(Elt: std::make_pair(x&: BB, y: BBStates[BB].pred_begin()));
1710 goto reverse_dfs_next_succ;
1711 }
1712 }
1713 ReverseCFGPostOrder.push_back(Elt: PredStack.pop_back_val().first);
1714 }
1715 }
1716}
1717
1718// Visit the function both top-down and bottom-up.
1719bool ObjCARCOpt::Visit(Function &F,
1720 DenseMap<const BasicBlock *, BBState> &BBStates,
1721 BlotMapVector<Value *, RRInfo> &Retains,
1722 DenseMap<Value *, RRInfo> &Releases) {
1723 // Use reverse-postorder traversals, because we magically know that loops
1724 // will be well behaved, i.e. they won't repeatedly call retain on a single
1725 // pointer without doing a release. We can't use the ReversePostOrderTraversal
1726 // class here because we want the reverse-CFG postorder to consider each
1727 // function exit point, and we want to ignore selected cycle edges.
1728 SmallVector<BasicBlock *, 16> PostOrder;
1729 SmallVector<BasicBlock *, 16> ReverseCFGPostOrder;
1730 ComputePostOrders(F, PostOrder, ReverseCFGPostOrder,
1731 NoObjCARCExceptionsMDKind: MDKindCache.get(ID: ARCMDKindID::NoObjCARCExceptions),
1732 BBStates);
1733
1734 // Use reverse-postorder on the reverse CFG for bottom-up.
1735 bool BottomUpNestingDetected = false;
1736 for (BasicBlock *BB : llvm::reverse(C&: ReverseCFGPostOrder)) {
1737 BottomUpNestingDetected |= VisitBottomUp(BB, BBStates, Retains);
1738 if (DisableRetainReleasePairing)
1739 return false;
1740 }
1741
1742 DenseMap<const Instruction *, SmallPtrSet<const Value *, 2>>
1743 ReleaseInsertPtToRCIdentityRoots;
1744 collectReleaseInsertPts(Retains, ReleaseInsertPtToRCIdentityRoots);
1745
1746 // Use reverse-postorder for top-down.
1747 bool TopDownNestingDetected = false;
1748 for (BasicBlock *BB : llvm::reverse(C&: PostOrder)) {
1749 TopDownNestingDetected |=
1750 VisitTopDown(BB, BBStates, Releases, ReleaseInsertPtToRCIdentityRoots);
1751 if (DisableRetainReleasePairing)
1752 return false;
1753 }
1754
1755 return TopDownNestingDetected && BottomUpNestingDetected;
1756}
1757
1758/// Move the calls in RetainsToMove and ReleasesToMove.
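///
/// Illustrative sketch (the values are hypothetical): for a pair such as
/// \code
///   %0 = call i8* @objc_retain(i8* %x)
///   ...
///   call void @objc_release(i8* %x)
/// \endcode
/// a new objc_retain is inserted at each point in
/// ReleasesToMove.ReverseInsertPts and a new objc_release at each point in
/// RetainsToMove.ReverseInsertPts, after which the original calls are
/// deleted. If both insertion-point sets are empty, the pair is simply
/// removed.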
1759void ObjCARCOpt::MoveCalls(Value *Arg, RRInfo &RetainsToMove,
1760 RRInfo &ReleasesToMove,
1761 BlotMapVector<Value *, RRInfo> &Retains,
1762 DenseMap<Value *, RRInfo> &Releases,
1763 SmallVectorImpl<Instruction *> &DeadInsts,
1764 Module *M) {
1765 LLVM_DEBUG(dbgs() << "== ObjCARCOpt::MoveCalls ==\n");
1766
1767 // Insert the new retain and release calls.
1768 for (Instruction *InsertPt : ReleasesToMove.ReverseInsertPts) {
1769 Function *Decl = EP.get(kind: ARCRuntimeEntryPointKind::Retain);
1770 SmallVector<OperandBundleDef, 1> BundleList;
1771 addOpBundleForFunclet(BB: InsertPt->getParent(), OpBundles&: BundleList);
1772 CallInst *Call =
1773 CallInst::Create(Func: Decl, Args: Arg, Bundles: BundleList, NameStr: "", InsertBefore: InsertPt->getIterator());
1774 Call->setDoesNotThrow();
1775 Call->setTailCall();
1776
1777 LLVM_DEBUG(dbgs() << "Inserting new Retain: " << *Call
1778 << "\n"
1779 "At insertion point: "
1780 << *InsertPt << "\n");
1781 }
1782 for (Instruction *InsertPt : RetainsToMove.ReverseInsertPts) {
1783 Function *Decl = EP.get(kind: ARCRuntimeEntryPointKind::Release);
1784 SmallVector<OperandBundleDef, 1> BundleList;
1785 addOpBundleForFunclet(BB: InsertPt->getParent(), OpBundles&: BundleList);
1786 CallInst *Call =
1787 CallInst::Create(Func: Decl, Args: Arg, Bundles: BundleList, NameStr: "", InsertBefore: InsertPt->getIterator());
1788 // Attach a clang.imprecise_release metadata tag, if appropriate.
1789 if (MDNode *M = ReleasesToMove.ReleaseMetadata)
1790 Call->setMetadata(KindID: MDKindCache.get(ID: ARCMDKindID::ImpreciseRelease), Node: M);
1791 Call->setDoesNotThrow();
1792 if (ReleasesToMove.IsTailCallRelease)
1793 Call->setTailCall();
1794
1795 LLVM_DEBUG(dbgs() << "Inserting new Release: " << *Call
1796 << "\n"
1797 "At insertion point: "
1798 << *InsertPt << "\n");
1799 }
1800
1801 // Delete the original retain and release calls.
1802 for (Instruction *OrigRetain : RetainsToMove.Calls) {
1803 Retains.blot(Key: OrigRetain);
1804 DeadInsts.push_back(Elt: OrigRetain);
1805 LLVM_DEBUG(dbgs() << "Deleting retain: " << *OrigRetain << "\n");
1806 }
1807 for (Instruction *OrigRelease : ReleasesToMove.Calls) {
1808 Releases.erase(Val: OrigRelease);
1809 DeadInsts.push_back(Elt: OrigRelease);
1810 LLVM_DEBUG(dbgs() << "Deleting release: " << *OrigRelease << "\n");
1811 }
1812}
1813
1814bool ObjCARCOpt::PairUpRetainsAndReleases(
1815 DenseMap<const BasicBlock *, BBState> &BBStates,
1816 BlotMapVector<Value *, RRInfo> &Retains,
1817 DenseMap<Value *, RRInfo> &Releases, Module *M,
1818 Instruction *Retain,
1819 SmallVectorImpl<Instruction *> &DeadInsts, RRInfo &RetainsToMove,
1820 RRInfo &ReleasesToMove, Value *Arg, bool KnownSafe,
1821 bool &AnyPairsCompletelyEliminated) {
1822 // If a pair happens in a region where it is known that the reference count
1823 // is already incremented, we can similarly ignore possible decrements unless
1824 // we are dealing with a retainable object with multiple provenance sources.
1825 bool KnownSafeTD = true, KnownSafeBU = true;
1826 bool CFGHazardAfflicted = false;
1827
1828 // Connect the dots between the top-down-collected RetainsToMove and
1829 // bottom-up-collected ReleasesToMove to form sets of related calls.
1830 // This is an iterative process so that we connect multiple releases
1831 // to multiple retains if needed.
1832 unsigned OldDelta = 0;
1833 unsigned NewDelta = 0;
1834 unsigned OldCount = 0;
1835 unsigned NewCount = 0;
1836 bool FirstRelease = true;
1837 for (SmallVector<Instruction *, 4> NewRetains{Retain};;) {
1838 SmallVector<Instruction *, 4> NewReleases;
1839 for (Instruction *NewRetain : NewRetains) {
1840 auto It = Retains.find(Key: NewRetain);
1841 assert(It != Retains.end());
1842 const RRInfo &NewRetainRRI = It->second;
1843 KnownSafeTD &= NewRetainRRI.KnownSafe;
1844 CFGHazardAfflicted |= NewRetainRRI.CFGHazardAfflicted;
1845 for (Instruction *NewRetainRelease : NewRetainRRI.Calls) {
1846 auto Jt = Releases.find(Val: NewRetainRelease);
1847 if (Jt == Releases.end())
1848 return false;
1849 const RRInfo &NewRetainReleaseRRI = Jt->second;
1850
1851 // If the release does not have a reference to the retain as well,
1852 // something happened which is unaccounted for. Do not do anything.
1853 //
1854 // This can happen if we catch an additive overflow during path count
1855 // merging.
1856 if (!NewRetainReleaseRRI.Calls.count(Ptr: NewRetain))
1857 return false;
1858
1859 if (ReleasesToMove.Calls.insert(Ptr: NewRetainRelease).second) {
1860 // If we overflow when we compute the path count, don't remove/move
1861 // anything.
1862 const BBState &NRRBBState = BBStates[NewRetainRelease->getParent()];
1863 unsigned PathCount = BBState::OverflowOccurredValue;
1864 if (NRRBBState.GetAllPathCountWithOverflow(PathCount))
1865 return false;
1866 assert(PathCount != BBState::OverflowOccurredValue &&
1867 "PathCount at this point can not be "
1868 "OverflowOccurredValue.");
1869 OldDelta -= PathCount;
1870
1871 // Merge the ReleaseMetadata and IsTailCallRelease values.
1872 if (FirstRelease) {
1873 ReleasesToMove.ReleaseMetadata =
1874 NewRetainReleaseRRI.ReleaseMetadata;
1875 ReleasesToMove.IsTailCallRelease =
1876 NewRetainReleaseRRI.IsTailCallRelease;
1877 FirstRelease = false;
1878 } else {
1879 if (ReleasesToMove.ReleaseMetadata !=
1880 NewRetainReleaseRRI.ReleaseMetadata)
1881 ReleasesToMove.ReleaseMetadata = nullptr;
1882 if (ReleasesToMove.IsTailCallRelease !=
1883 NewRetainReleaseRRI.IsTailCallRelease)
1884 ReleasesToMove.IsTailCallRelease = false;
1885 }
1886
1887 // Collect the optimal insertion points.
1888 if (!KnownSafe)
1889 for (Instruction *RIP : NewRetainReleaseRRI.ReverseInsertPts) {
1890 if (ReleasesToMove.ReverseInsertPts.insert(Ptr: RIP).second) {
1891 // If we overflow when we compute the path count, don't
1892 // remove/move anything.
1893 const BBState &RIPBBState = BBStates[RIP->getParent()];
1894 PathCount = BBState::OverflowOccurredValue;
1895 if (RIPBBState.GetAllPathCountWithOverflow(PathCount))
1896 return false;
1897 assert(PathCount != BBState::OverflowOccurredValue &&
1898 "PathCount at this point can not be "
1899 "OverflowOccurredValue.");
1900 NewDelta -= PathCount;
1901 }
1902 }
1903 NewReleases.push_back(Elt: NewRetainRelease);
1904 }
1905 }
1906 }
1907 NewRetains.clear();
1908 if (NewReleases.empty()) break;
1909
1910 // Back the other way.
1911 for (Instruction *NewRelease : NewReleases) {
1912 auto It = Releases.find(Val: NewRelease);
1913 assert(It != Releases.end());
1914 const RRInfo &NewReleaseRRI = It->second;
1915 KnownSafeBU &= NewReleaseRRI.KnownSafe;
1916 CFGHazardAfflicted |= NewReleaseRRI.CFGHazardAfflicted;
1917 for (Instruction *NewReleaseRetain : NewReleaseRRI.Calls) {
1918 auto Jt = Retains.find(Key: NewReleaseRetain);
1919 if (Jt == Retains.end())
1920 return false;
1921 const RRInfo &NewReleaseRetainRRI = Jt->second;
1922
1923 // If the retain does not have a reference to the release as well,
1924 // something happened which is unaccounted for. Do not do anything.
1925 //
1926 // This can happen if we catch an additive overflow during path count
1927 // merging.
1928 if (!NewReleaseRetainRRI.Calls.count(Ptr: NewRelease))
1929 return false;
1930
1931 if (RetainsToMove.Calls.insert(Ptr: NewReleaseRetain).second) {
1932 // If we overflow when we compute the path count, don't remove/move
1933 // anything.
1934 const BBState &NRRBBState = BBStates[NewReleaseRetain->getParent()];
1935 unsigned PathCount = BBState::OverflowOccurredValue;
1936 if (NRRBBState.GetAllPathCountWithOverflow(PathCount))
1937 return false;
1938 assert(PathCount != BBState::OverflowOccurredValue &&
1939 "PathCount at this point can not be "
1940 "OverflowOccurredValue.");
1941 OldDelta += PathCount;
1942 OldCount += PathCount;
1943
1944 // Collect the optimal insertion points.
1945 if (!KnownSafe)
1946 for (Instruction *RIP : NewReleaseRetainRRI.ReverseInsertPts) {
1947 if (RetainsToMove.ReverseInsertPts.insert(Ptr: RIP).second) {
1948 // If we overflow when we compute the path count, don't
1949 // remove/move anything.
1950 const BBState &RIPBBState = BBStates[RIP->getParent()];
1951
1952 PathCount = BBState::OverflowOccurredValue;
1953 if (RIPBBState.GetAllPathCountWithOverflow(PathCount))
1954 return false;
1955 assert(PathCount != BBState::OverflowOccurredValue &&
1956 "PathCount at this point can not be "
1957 "OverflowOccurredValue.");
1958 NewDelta += PathCount;
1959 NewCount += PathCount;
1960 }
1961 }
1962 NewRetains.push_back(Elt: NewReleaseRetain);
1963 }
1964 }
1965 }
1966 if (NewRetains.empty()) break;
1967 }
1968
1969 // We can only remove pointers if we are known safe in both directions.
1970 bool UnconditionallySafe = KnownSafeTD && KnownSafeBU;
1971 if (UnconditionallySafe) {
1972 RetainsToMove.ReverseInsertPts.clear();
1973 ReleasesToMove.ReverseInsertPts.clear();
1974 NewCount = 0;
1975 } else {
1976 // Determine whether the new insertion points we computed preserve the
1977 // balance of retain and release calls through the program.
1978 // TODO: If the fully aggressive solution isn't valid, try to find a
1979 // less aggressive solution which is.
1980 if (NewDelta != 0)
1981 return false;
1982
1983 // At this point, we are not going to remove any RR pairs, but we still are
1984 // able to move RR pairs. If one of our pointers is afflicted with
1985 // CFGHazards, we cannot perform such code motion so exit early.
1986 const bool WillPerformCodeMotion =
1987 !RetainsToMove.ReverseInsertPts.empty() ||
1988 !ReleasesToMove.ReverseInsertPts.empty();
1989 if (CFGHazardAfflicted && WillPerformCodeMotion)
1990 return false;
1991 }
1992
1993 // Determine whether the original call points are balanced in the retain and
1994 // release calls through the program. If not, conservatively don't touch
1995 // them.
1996 // TODO: It's theoretically possible to do code motion in this case, as
1997 // long as the existing imbalances are maintained.
1998 if (OldDelta != 0)
1999 return false;
2000
2001 Changed = true;
2002 assert(OldCount != 0 && "Unreachable code?");
2003 NumRRs += OldCount - NewCount;
2004 // Set to true if we completely removed any RR pairs.
2005 AnyPairsCompletelyEliminated = NewCount == 0;
2006
2007 // We can move calls!
2008 return true;
2009}
2010
2011/// Identify pairings between the retains and releases, and delete and/or move
2012/// them.
2013bool ObjCARCOpt::PerformCodePlacement(
2014 DenseMap<const BasicBlock *, BBState> &BBStates,
2015 BlotMapVector<Value *, RRInfo> &Retains,
2016 DenseMap<Value *, RRInfo> &Releases, Module *M) {
2017 LLVM_DEBUG(dbgs() << "\n== ObjCARCOpt::PerformCodePlacement ==\n");
2018
2019 bool AnyPairsCompletelyEliminated = false;
2020 SmallVector<Instruction *, 8> DeadInsts;
2021
2022 // Visit each retain.
2023 for (BlotMapVector<Value *, RRInfo>::const_iterator I = Retains.begin(),
2024 E = Retains.end();
2025 I != E; ++I) {
2026 Value *V = I->first;
2027 if (!V) continue; // blotted
2028
2029 Instruction *Retain = cast<Instruction>(Val: V);
2030
2031 LLVM_DEBUG(dbgs() << "Visiting: " << *Retain << "\n");
2032
2033 Value *Arg = GetArgRCIdentityRoot(Inst: Retain);
2034
2035 // If the object being released is in static or stack storage, we know it's
2036 // not being managed by ObjC reference counting, so we can delete pairs
2037 // regardless of what possible decrements or uses lie between them.
2038 bool KnownSafe = isa<Constant>(Val: Arg) || isa<AllocaInst>(Val: Arg);
2039
2040 // A constant pointer can't be pointing to an object on the heap. It may
2041 // be reference-counted, but it won't be deleted.
2042 if (const LoadInst *LI = dyn_cast<LoadInst>(Val: Arg))
2043 if (const GlobalVariable *GV =
2044 dyn_cast<GlobalVariable>(
2045 Val: GetRCIdentityRoot(V: LI->getPointerOperand())))
2046 if (GV->isConstant())
2047 KnownSafe = true;
2048
2049 // Connect the dots between the top-down-collected RetainsToMove and
2050 // bottom-up-collected ReleasesToMove to form sets of related calls.
2051 RRInfo RetainsToMove, ReleasesToMove;
2052
2053 bool PerformMoveCalls = PairUpRetainsAndReleases(
2054 BBStates, Retains, Releases, M, Retain, DeadInsts,
2055 RetainsToMove, ReleasesToMove, Arg, KnownSafe,
2056 AnyPairsCompletelyEliminated);
2057
2058 if (PerformMoveCalls) {
2059 // Ok, everything checks out and we're all set. Let's move/delete some
2060 // code!
2061 MoveCalls(Arg, RetainsToMove, ReleasesToMove,
2062 Retains, Releases, DeadInsts, M);
2063 }
2064 }
2065
2066 // Now that we're done moving everything, we can delete the newly dead
2067 // instructions, as we no longer need them as insert points.
2068 while (!DeadInsts.empty())
2069 EraseInstruction(CI: DeadInsts.pop_back_val());
2070
2071 return AnyPairsCompletelyEliminated;
2072}
2073
2074/// Weak pointer optimizations.
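///
/// Illustrative sketch (the values are hypothetical): when a later weak load
/// reads the same location as an earlier one, with nothing in between that
/// can modify the weak pointer, e.g.
/// \code
///   %1 = call i8* @objc_loadWeakRetained(i8** %p)
///   %2 = call i8* @objc_loadWeak(i8** %p)
/// \endcode
/// the second call is erased and its uses are rewritten to use %1 (with an
/// objc_retain of %1 inserted first if the redundant call was
/// objc_loadWeakRetained).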
2075void ObjCARCOpt::OptimizeWeakCalls(Function &F) {
2076 LLVM_DEBUG(dbgs() << "\n== ObjCARCOpt::OptimizeWeakCalls ==\n");
2077
  // First, do memdep-style RLE (redundant load elimination) and S2L
  // (store-to-load forwarding) optimizations. We can't use memdep itself
  // because it uses AliasAnalysis and we need to do provenance queries
  // instead.
2081 for (inst_iterator I = inst_begin(F: &F), E = inst_end(F: &F); I != E; ) {
2082 Instruction *Inst = &*I++;
2083
2084 LLVM_DEBUG(dbgs() << "Visiting: " << *Inst << "\n");
2085
2086 ARCInstKind Class = GetBasicARCInstKind(V: Inst);
2087 if (Class != ARCInstKind::LoadWeak &&
2088 Class != ARCInstKind::LoadWeakRetained)
2089 continue;
2090
2091 // Delete objc_loadWeak calls with no users.
2092 if (Class == ARCInstKind::LoadWeak && Inst->use_empty()) {
2093 Inst->eraseFromParent();
2094 Changed = true;
2095 continue;
2096 }
2097
2098 // TODO: For now, just look for an earlier available version of this value
2099 // within the same block. Theoretically, we could do memdep-style non-local
2100 // analysis too, but that would want caching. A better approach would be to
2101 // use the technique that EarlyCSE uses.
2102 inst_iterator Current = std::prev(x: I);
2103 BasicBlock *CurrentBB = &*Current.getBasicBlockIterator();
2104 for (BasicBlock::iterator B = CurrentBB->begin(),
2105 J = Current.getInstructionIterator();
2106 J != B; --J) {
2107 Instruction *EarlierInst = &*std::prev(x: J);
2108 ARCInstKind EarlierClass = GetARCInstKind(V: EarlierInst);
2109 switch (EarlierClass) {
2110 case ARCInstKind::LoadWeak:
2111 case ARCInstKind::LoadWeakRetained: {
2112 // If this is loading from the same pointer, replace this load's value
2113 // with that one.
2114 CallInst *Call = cast<CallInst>(Val: Inst);
2115 CallInst *EarlierCall = cast<CallInst>(Val: EarlierInst);
2116 Value *Arg = Call->getArgOperand(i: 0);
2117 Value *EarlierArg = EarlierCall->getArgOperand(i: 0);
2118 switch (PA.getAA()->alias(V1: Arg, V2: EarlierArg)) {
2119 case AliasResult::MustAlias:
2120 Changed = true;
2121 // If the load has a builtin retain, insert a plain retain for it.
2122 if (Class == ARCInstKind::LoadWeakRetained) {
2123 Function *Decl = EP.get(kind: ARCRuntimeEntryPointKind::Retain);
2124 CallInst *CI =
2125 CallInst::Create(Func: Decl, Args: EarlierCall, NameStr: "", InsertBefore: Call->getIterator());
2126 CI->setTailCall();
2127 }
2128 // Zap the fully redundant load.
2129 Call->replaceAllUsesWith(V: EarlierCall);
2130 Call->eraseFromParent();
2131 goto clobbered;
2132 case AliasResult::MayAlias:
2133 case AliasResult::PartialAlias:
2134 goto clobbered;
2135 case AliasResult::NoAlias:
2136 break;
2137 }
2138 break;
2139 }
2140 case ARCInstKind::StoreWeak:
2141 case ARCInstKind::InitWeak: {
        // If this is storing to the same pointer and has the same size etc.,
        // replace this load's value with the stored value.
2144 CallInst *Call = cast<CallInst>(Val: Inst);
2145 CallInst *EarlierCall = cast<CallInst>(Val: EarlierInst);
2146 Value *Arg = Call->getArgOperand(i: 0);
2147 Value *EarlierArg = EarlierCall->getArgOperand(i: 0);
2148 switch (PA.getAA()->alias(V1: Arg, V2: EarlierArg)) {
2149 case AliasResult::MustAlias:
2150 Changed = true;
2151 // If the load has a builtin retain, insert a plain retain for it.
2152 if (Class == ARCInstKind::LoadWeakRetained) {
2153 Function *Decl = EP.get(kind: ARCRuntimeEntryPointKind::Retain);
2154 CallInst *CI =
2155 CallInst::Create(Func: Decl, Args: EarlierCall, NameStr: "", InsertBefore: Call->getIterator());
2156 CI->setTailCall();
2157 }
2158 // Zap the fully redundant load.
2159 Call->replaceAllUsesWith(V: EarlierCall->getArgOperand(i: 1));
2160 Call->eraseFromParent();
2161 goto clobbered;
2162 case AliasResult::MayAlias:
2163 case AliasResult::PartialAlias:
2164 goto clobbered;
2165 case AliasResult::NoAlias:
2166 break;
2167 }
2168 break;
2169 }
2170 case ARCInstKind::MoveWeak:
2171 case ARCInstKind::CopyWeak:
        // TODO: Grab the copied value.
2173 goto clobbered;
2174 case ARCInstKind::AutoreleasepoolPush:
2175 case ARCInstKind::None:
2176 case ARCInstKind::IntrinsicUser:
2177 case ARCInstKind::User:
2178 // Weak pointers are only modified through the weak entry points
2179 // (and arbitrary calls, which could call the weak entry points).
2180 break;
2181 default:
2182 // Anything else could modify the weak pointer.
2183 goto clobbered;
2184 }
2185 }
2186 clobbered:;
2187 }
2188
2189 // Then, for each destroyWeak with an alloca operand, check to see if
2190 // the alloca and all its users can be zapped.
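  //
  // Illustrative sketch (the values are hypothetical): an alloca that is only
  // used through the weak entry points, e.g.
  //   %w = alloca i8*
  //   %0 = call i8* @objc_initWeak(i8** %w, i8* %obj)
  //   call void @objc_destroyWeak(i8** %w)
  // is deleted together with all of those calls, with any uses of the
  // objc_initWeak/objc_storeWeak results rewritten to their second argument.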
2191 for (Instruction &Inst : llvm::make_early_inc_range(Range: instructions(F))) {
2192 ARCInstKind Class = GetBasicARCInstKind(V: &Inst);
2193 if (Class != ARCInstKind::DestroyWeak)
2194 continue;
2195
2196 CallInst *Call = cast<CallInst>(Val: &Inst);
2197 Value *Arg = Call->getArgOperand(i: 0);
2198 if (AllocaInst *Alloca = dyn_cast<AllocaInst>(Val: Arg)) {
2199 for (User *U : Alloca->users()) {
2200 const Instruction *UserInst = cast<Instruction>(Val: U);
2201 switch (GetBasicARCInstKind(V: UserInst)) {
2202 case ARCInstKind::InitWeak:
2203 case ARCInstKind::StoreWeak:
2204 case ARCInstKind::DestroyWeak:
2205 continue;
2206 default:
2207 goto done;
2208 }
2209 }
2210 Changed = true;
2211 for (User *U : llvm::make_early_inc_range(Range: Alloca->users())) {
2212 CallInst *UserInst = cast<CallInst>(Val: U);
2213 switch (GetBasicARCInstKind(V: UserInst)) {
2214 case ARCInstKind::InitWeak:
2215 case ARCInstKind::StoreWeak:
2216 // These functions return their second argument.
2217 UserInst->replaceAllUsesWith(V: UserInst->getArgOperand(i: 1));
2218 break;
2219 case ARCInstKind::DestroyWeak:
2220 // No return value.
2221 break;
2222 default:
2223 llvm_unreachable("alloca really is used!");
2224 }
2225 UserInst->eraseFromParent();
2226 }
2227 Alloca->eraseFromParent();
2228 done:;
2229 }
2230 }
2231}
2232
2233/// Identify program paths which execute sequences of retains and releases which
2234/// can be eliminated.
2235bool ObjCARCOpt::OptimizeSequences(Function &F) {
2236 // Releases, Retains - These are used to store the results of the main flow
2237 // analysis. These use Value* as the key instead of Instruction* so that the
2238 // map stays valid when we get around to rewriting code and calls get
2239 // replaced by arguments.
2240 DenseMap<Value *, RRInfo> Releases;
2241 BlotMapVector<Value *, RRInfo> Retains;
2242
2243 // This is used during the traversal of the function to track the
2244 // states for each identified object at each block.
2245 DenseMap<const BasicBlock *, BBState> BBStates;
2246
2247 // Analyze the CFG of the function, and all instructions.
2248 bool NestingDetected = Visit(F, BBStates, Retains, Releases);
2249
2250 if (DisableRetainReleasePairing)
2251 return false;
2252
2253 // Transform.
2254 bool AnyPairsCompletelyEliminated = PerformCodePlacement(BBStates, Retains,
2255 Releases,
2256 M: F.getParent());
2257
2258 return AnyPairsCompletelyEliminated && NestingDetected;
2259}
2260
/// Look for an earlier call that produces Retain's argument, with nothing in
/// between the call and Retain that can affect the reference count of their
/// shared pointer argument. Returns the call, or null if none is found.
2264static CallInst *HasSafePathToPredecessorCall(const Value *Arg,
2265 Instruction *Retain,
2266 ProvenanceAnalysis &PA) {
2267 auto *Call = dyn_cast_or_null<CallInst>(Val: findSingleDependency(
2268 Flavor: CanChangeRetainCount, Arg, StartBB: Retain->getParent(), StartInst: Retain, PA));
2269
2270 // Check that the pointer is the return value of the call.
2271 if (!Call || Arg != Call)
2272 return nullptr;
2273
2274 // Check that the call is a regular call.
2275 ARCInstKind Class = GetBasicARCInstKind(V: Call);
2276 return Class == ARCInstKind::CallOrUser || Class == ARCInstKind::Call
2277 ? Call
2278 : nullptr;
2279}
2280
2281/// Find a dependent retain that precedes the given autorelease for which there
2282/// is nothing in between the two instructions that can affect the ref count of
2283/// Arg.
2284static CallInst *
2285FindPredecessorRetainWithSafePath(const Value *Arg, BasicBlock *BB,
2286 Instruction *Autorelease,
2287 ProvenanceAnalysis &PA) {
2288 auto *Retain = dyn_cast_or_null<CallInst>(
2289 Val: findSingleDependency(Flavor: CanChangeRetainCount, Arg, StartBB: BB, StartInst: Autorelease, PA));
2290
2291 // Check that we found a retain with the same argument.
2292 if (!Retain || !IsRetain(Class: GetBasicARCInstKind(V: Retain)) ||
2293 GetArgRCIdentityRoot(Inst: Retain) != Arg) {
2294 return nullptr;
2295 }
2296
2297 return Retain;
2298}
2299
2300/// Look for an ``autorelease'' instruction dependent on Arg such that there are
2301/// no instructions dependent on Arg that need a positive ref count in between
2302/// the autorelease and the ret.
2303static CallInst *FindPredecessorAutoreleaseWithSafePath(
2304 const Value *Arg, BasicBlock *BB, ReturnInst *Ret, ProvenanceAnalysis &PA) {
2305 auto *Autorelease = dyn_cast_or_null<CallInst>(
2306 Val: findSingleDependency(Flavor: NeedsPositiveRetainCount, Arg, StartBB: BB, StartInst: Ret, PA));
2307
2308 if (!Autorelease)
2309 return nullptr;
2310 ARCInstKind AutoreleaseClass = GetBasicARCInstKind(V: Autorelease);
2311 if (!IsAutorelease(Class: AutoreleaseClass))
2312 return nullptr;
2313 if (GetArgRCIdentityRoot(Inst: Autorelease) != Arg)
2314 return nullptr;
2315
2316 return Autorelease;
2317}
2318
2319/// Look for this pattern:
2320/// \code
2321/// %call = call i8* @something(...)
2322/// %2 = call i8* @objc_retain(i8* %call)
2323/// %3 = call i8* @objc_autorelease(i8* %2)
2324/// ret i8* %3
2325/// \endcode
2326/// And delete the retain and autorelease.
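/// After the transformation, the block returns the original call result
/// directly (illustrative):
/// \code
///   %call = call i8* @something(...)
///   ret i8* %call
/// \endcode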
2327void ObjCARCOpt::OptimizeReturns(Function &F) {
2328 if (!F.getReturnType()->isPointerTy())
2329 return;
2330
2331 LLVM_DEBUG(dbgs() << "\n== ObjCARCOpt::OptimizeReturns ==\n");
2332
2333 for (BasicBlock &BB: F) {
2334 ReturnInst *Ret = dyn_cast<ReturnInst>(Val: &BB.back());
2335 if (!Ret)
2336 continue;
2337
2338 LLVM_DEBUG(dbgs() << "Visiting: " << *Ret << "\n");
2339
2340 const Value *Arg = GetRCIdentityRoot(V: Ret->getOperand(i_nocapture: 0));
2341
2342 // Look for an ``autorelease'' instruction that is a predecessor of Ret and
2343 // dependent on Arg such that there are no instructions dependent on Arg
2344 // that need a positive ref count in between the autorelease and Ret.
2345 CallInst *Autorelease =
2346 FindPredecessorAutoreleaseWithSafePath(Arg, BB: &BB, Ret, PA);
2347
2348 if (!Autorelease)
2349 continue;
2350
2351 CallInst *Retain = FindPredecessorRetainWithSafePath(
2352 Arg, BB: Autorelease->getParent(), Autorelease, PA);
2353
2354 if (!Retain)
2355 continue;
2356
2357 // Check that there is nothing that can affect the reference count
2358 // between the retain and the call. Note that Retain need not be in BB.
2359 CallInst *Call = HasSafePathToPredecessorCall(Arg, Retain, PA);
2360
2361 // Don't remove retainRV/autoreleaseRV pairs if the call isn't a tail call.
2362 if (!Call ||
2363 (!Call->isTailCall() &&
2364 GetBasicARCInstKind(V: Retain) == ARCInstKind::RetainRV &&
2365 GetBasicARCInstKind(V: Autorelease) == ARCInstKind::AutoreleaseRV))
2366 continue;
2367
2368 // If so, we can zap the retain and autorelease.
2369 Changed = true;
2370 ++NumRets;
2371 LLVM_DEBUG(dbgs() << "Erasing: " << *Retain << "\nErasing: " << *Autorelease
2372 << "\n");
2373 BundledInsts->eraseInst(CI: Retain);
2374 EraseInstruction(CI: Autorelease);
2375 }
2376}
2377
2378#ifndef NDEBUG
2379void
2380ObjCARCOpt::GatherStatistics(Function &F, bool AfterOptimization) {
2381 Statistic &NumRetains =
2382 AfterOptimization ? NumRetainsAfterOpt : NumRetainsBeforeOpt;
2383 Statistic &NumReleases =
2384 AfterOptimization ? NumReleasesAfterOpt : NumReleasesBeforeOpt;
2385
2386 for (inst_iterator I = inst_begin(&F), E = inst_end(&F); I != E; ) {
2387 Instruction *Inst = &*I++;
2388 switch (GetBasicARCInstKind(Inst)) {
2389 default:
2390 break;
2391 case ARCInstKind::Retain:
2392 ++NumRetains;
2393 break;
2394 case ARCInstKind::Release:
2395 ++NumReleases;
2396 break;
2397 }
2398 }
2399}
2400#endif
2401
2402void ObjCARCOpt::init(Function &F) {
2403 if (!EnableARCOpts)
2404 return;
2405
  // Intuitively, objc_retain and others are nocapture; however, in practice
  // they are not, because they return their argument value. And objc_release
  // calls finalizers, which can have arbitrary side effects.
2409 MDKindCache.init(Mod: F.getParent());
2410
2411 // Initialize our runtime entry point cache.
2412 EP.init(M: F.getParent());
2413
2414 // Compute which blocks are in which funclet.
2415 if (F.hasPersonalityFn() &&
2416 isScopedEHPersonality(Pers: classifyEHPersonality(Pers: F.getPersonalityFn())))
2417 BlockEHColors = colorEHFunclets(F);
2418}
2419
2420bool ObjCARCOpt::run(Function &F, AAResults &AA) {
2421 if (!EnableARCOpts)
2422 return false;
2423
2424 Changed = CFGChanged = false;
2425 BundledRetainClaimRVs BRV(EP, /*ContractPass=*/false, /*UseClaimRV=*/false);
2426 BundledInsts = &BRV;
2427
2428 LLVM_DEBUG(dbgs() << "<<< ObjCARCOpt: Visiting Function: " << F.getName()
2429 << " >>>"
2430 "\n");
2431
2432 std::pair<bool, bool> R = BundledInsts->insertAfterInvokes(F, DT: nullptr);
2433 Changed |= R.first;
2434 CFGChanged |= R.second;
2435
2436 PA.setAA(&AA);
2437
2438#ifndef NDEBUG
2439 if (AreStatisticsEnabled()) {
2440 GatherStatistics(F, false);
2441 }
2442#endif
2443
2444 // This pass performs several distinct transformations. As a compile-time aid
2445 // when compiling code that isn't ObjC, skip these if the relevant ObjC
2446 // library functions aren't declared.
2447
2448 // Preliminary optimizations. This also computes UsedInThisFunction.
2449 OptimizeIndividualCalls(F);
2450
2451 // Optimizations for weak pointers.
2452 if (UsedInThisFunction & ((1 << unsigned(ARCInstKind::LoadWeak)) |
2453 (1 << unsigned(ARCInstKind::LoadWeakRetained)) |
2454 (1 << unsigned(ARCInstKind::StoreWeak)) |
2455 (1 << unsigned(ARCInstKind::InitWeak)) |
2456 (1 << unsigned(ARCInstKind::CopyWeak)) |
2457 (1 << unsigned(ARCInstKind::MoveWeak)) |
2458 (1 << unsigned(ARCInstKind::DestroyWeak))))
2459 OptimizeWeakCalls(F);
2460
2461 // Optimizations for retain+release pairs.
2462 if (UsedInThisFunction & ((1 << unsigned(ARCInstKind::Retain)) |
2463 (1 << unsigned(ARCInstKind::RetainRV)) |
2464 (1 << unsigned(ARCInstKind::RetainBlock))))
2465 if (UsedInThisFunction & (1 << unsigned(ARCInstKind::Release)))
2466 // Run OptimizeSequences until it either stops making changes or
2467 // no retain+release pair nesting is detected.
2468 while (OptimizeSequences(F)) {}
2469
2470 // Optimizations if objc_autorelease is used.
2471 if (UsedInThisFunction & ((1 << unsigned(ARCInstKind::Autorelease)) |
2472 (1 << unsigned(ARCInstKind::AutoreleaseRV))))
2473 OptimizeReturns(F);
2474
2475 // Optimizations for autorelease pools.
2476 if (UsedInThisFunction & ((1 << unsigned(ARCInstKind::AutoreleasepoolPush)) |
2477 (1 << unsigned(ARCInstKind::AutoreleasepoolPop))))
2478 OptimizeAutoreleasePools(F);
2479
2480 // Gather statistics after optimization.
2481#ifndef NDEBUG
2482 if (AreStatisticsEnabled()) {
2483 GatherStatistics(F, true);
2484 }
2485#endif
2486
2487 LLVM_DEBUG(dbgs() << "\n");
2488
2489 return Changed;
2490}
2491
2492/// Interprocedurally determine if calls made by the given call site can
2493/// possibly produce autoreleases.
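///
/// Illustrative sketch (the values are hypothetical): a callee whose exact
/// definition contains
/// \code
///   %1 = call i8* @objc_autorelease(i8* %obj)
/// \endcode
/// (or another autorelease-producing entry point) makes this return true,
/// while a callee without an exact definition is conservatively assumed to
/// autorelease.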
static bool MayAutorelease(const CallBase &CB, unsigned Depth = 0) {
2495 if (CB.onlyReadsMemory())
2496 return false;
2497
  // This recursion depth limit is arbitrary; it is just deep enough to cover
  // the known interesting test cases.
2500 if (Depth > 5)
2501 return true;
2502
2503 if (const Function *Callee = CB.getCalledFunction()) {
2504 if (!Callee->hasExactDefinition())
2505 return true;
2506 for (const BasicBlock &BB : *Callee) {
2507 for (const Instruction &I : BB) {
2508 // TODO: Ignore all instructions between autorelease pools
2509 ARCInstKind InstKind = GetBasicARCInstKind(V: &I);
2510 switch (InstKind) {
2511 case ARCInstKind::Autorelease:
2512 case ARCInstKind::AutoreleaseRV:
2513 case ARCInstKind::FusedRetainAutorelease:
2514 case ARCInstKind::FusedRetainAutoreleaseRV:
2515 case ARCInstKind::LoadWeak:
2516 // These may produce autoreleases
2517 return true;
2518
2519 case ARCInstKind::Retain:
2520 case ARCInstKind::RetainRV:
2521 case ARCInstKind::UnsafeClaimRV:
2522 case ARCInstKind::RetainBlock:
2523 case ARCInstKind::Release:
2524 case ARCInstKind::NoopCast:
2525 case ARCInstKind::LoadWeakRetained:
2526 case ARCInstKind::StoreWeak:
2527 case ARCInstKind::InitWeak:
2528 case ARCInstKind::MoveWeak:
2529 case ARCInstKind::CopyWeak:
2530 case ARCInstKind::DestroyWeak:
2531 case ARCInstKind::StoreStrong:
2532 case ARCInstKind::AutoreleasepoolPush:
2533 case ARCInstKind::AutoreleasepoolPop:
2534 // These ObjC runtime functions don't produce autoreleases
2535 break;
2536
2537 case ARCInstKind::CallOrUser:
2538 case ARCInstKind::Call:
2539 // For non-ObjC function calls, recursively analyze
2540 if (MayAutorelease(CB: cast<CallBase>(Val: I), Depth: Depth + 1))
2541 return true;
2542 break;
2543
2544 case ARCInstKind::IntrinsicUser:
2545 case ARCInstKind::User:
2546 case ARCInstKind::None:
2547 // These are not relevant for autorelease analysis
2548 break;
2549 }
2550 }
2551 }
2552 return false;
2553 }
2554
2555 return true;
2556}
2557
2558/// Optimize autorelease pools by eliminating empty push/pop pairs.
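///
/// Illustrative sketch (the values are hypothetical): a matched pair with no
/// autoreleases in its scope, such as
/// \code
///   %pool = call i8* @objc_autoreleasePoolPush()
///   ...
///   call void @objc_autoreleasePoolPop(i8* %pool)
/// \endcode
/// is deleted entirely; any autorelease (or call that may autorelease) inside
/// the scope keeps the pair alive.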
2559void ObjCARCOpt::OptimizeAutoreleasePools(Function &F) {
2560 LLVM_DEBUG(dbgs() << "\n== ObjCARCOpt::OptimizeAutoreleasePools ==\n");
2561
2562 OptimizationRemarkEmitter ORE(&F);
2563
2564 // Process each basic block independently.
2565 // TODO: Can we optimize inter-block autorelease pool pairs?
2566 // This would involve tracking autorelease pool state across blocks.
2567 for (BasicBlock &BB : F) {
2568 // Use a stack to track nested autorelease pools
2569 SmallVector<std::pair<CallInst *, bool>, 4>
2570 PoolStack; // {push_inst, has_autorelease_in_scope}
2571
2572 for (Instruction &Inst : llvm::make_early_inc_range(Range&: BB)) {
2573 ARCInstKind Class = GetBasicARCInstKind(V: &Inst);
2574
2575 switch (Class) {
2576 case ARCInstKind::AutoreleasepoolPush: {
2577 // Start tracking a new autorelease pool scope
2578 auto *Push = cast<CallInst>(Val: &Inst);
2579 PoolStack.push_back(
2580 Elt: {Push, false}); // {push_inst, has_autorelease_in_scope}
2581 LLVM_DEBUG(dbgs() << "Found autorelease pool push: " << *Push << "\n");
2582 break;
2583 }
2584
2585 case ARCInstKind::AutoreleasepoolPop: {
2586 auto *Pop = cast<CallInst>(Val: &Inst);
2587
2588 if (PoolStack.empty())
2589 break;
2590
2591 auto &TopPool = PoolStack.back();
2592 CallInst *PendingPush = TopPool.first;
2593 bool HasAutoreleaseInScope = TopPool.second;
2594
2595 // Pop the stack - remove this pool scope
2596 PoolStack.pop_back();
2597
2598 // Bail if this pop doesn't match the pending push
2599 if (Pop->getArgOperand(i: 0)->stripPointerCasts() != PendingPush)
2600 break;
2601
2602 // Bail if there were autoreleases in this scope
2603 if (HasAutoreleaseInScope)
2604 break;
2605
2606 // Optimize: eliminate this empty autorelease pool pair
2607 ORE.emit(RemarkBuilder: [&]() {
2608 return OptimizationRemark(DEBUG_TYPE, "AutoreleasePoolElimination",
2609 PendingPush)
2610 << "eliminated empty autorelease pool pair";
2611 });
2612
2613 // Replace all uses of push with poison before deletion
2614 PendingPush->replaceAllUsesWith(
2615 V: PoisonValue::get(T: PendingPush->getType()));
2616
2617 Pop->eraseFromParent();
2618 PendingPush->eraseFromParent();
2619
2620 Changed = true;
2621 ++NumNoops;
2622 break;
2623 }
2624 case ARCInstKind::CallOrUser:
2625 case ARCInstKind::Call:
2626 if (!MayAutorelease(CB: cast<CallBase>(Val&: Inst)))
2627 break;
2628 [[fallthrough]];
2629 case ARCInstKind::Autorelease:
2630 case ARCInstKind::AutoreleaseRV:
2631 case ARCInstKind::FusedRetainAutorelease:
2632 case ARCInstKind::FusedRetainAutoreleaseRV:
2633 case ARCInstKind::LoadWeak: {
2634 // Track that we have autorelease calls in the current pool scope
2635 if (!PoolStack.empty()) {
2636 PoolStack.back().second = true; // Set has_autorelease_in_scope = true
2637 LLVM_DEBUG(
2638 dbgs()
2639 << "Found autorelease or potential autorelease in pool scope: "
2640 << Inst << "\n");
2641 }
2642 break;
2643 }
2644
2645 // Enumerate all remaining ARCInstKind cases explicitly
2646 case ARCInstKind::Retain:
2647 case ARCInstKind::RetainRV:
2648 case ARCInstKind::UnsafeClaimRV:
2649 case ARCInstKind::RetainBlock:
2650 case ARCInstKind::Release:
2651 case ARCInstKind::NoopCast:
2652 case ARCInstKind::LoadWeakRetained:
2653 case ARCInstKind::StoreWeak:
2654 case ARCInstKind::InitWeak:
2655 case ARCInstKind::MoveWeak:
2656 case ARCInstKind::CopyWeak:
2657 case ARCInstKind::DestroyWeak:
2658 case ARCInstKind::StoreStrong:
2659 case ARCInstKind::IntrinsicUser:
2660 case ARCInstKind::User:
2661 case ARCInstKind::None:
2662 // These instruction kinds don't affect autorelease pool optimization
2663 break;
2664 }
2665 }
2666 }
2667}
2668
2669/// @}
2670///
2671
2672PreservedAnalyses ObjCARCOptPass::run(Function &F,
2673 FunctionAnalysisManager &AM) {
2674 ObjCARCOpt OCAO;
2675 OCAO.init(F);
2676
2677 bool Changed = OCAO.run(F, AA&: AM.getResult<AAManager>(IR&: F));
2678 bool CFGChanged = OCAO.hasCFGChanged();
2679 if (Changed) {
2680 PreservedAnalyses PA;
2681 if (!CFGChanged)
2682 PA.preserveSet<CFGAnalyses>();
2683 return PA;
2684 }
2685 return PreservedAnalyses::all();
2686}
2687