Delinearization.cpp source code [llvm_projects/llvm/lib/Analysis/Delinearization.cpp]

1	//===---- Delinearization.cpp - MultiDimensional Index Delinearization ----===//
2	//
3	// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4	// See https://llvm.org/LICENSE.txt for license information.
5	// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6	//
7	//===----------------------------------------------------------------------===//
8	//
9	// This implements an analysis pass that tries to delinearize all GEP
10	// instructions in all loops using the SCEV analysis functionality. This pass is
11	// only used for testing purposes: if your pass needs delinearization, please
12	// use the on-demand SCEVAddRecExpr::delinearize() function.
13	//
14	//===----------------------------------------------------------------------===//
15
16	#include "llvm/Analysis/Delinearization.h"
17	#include "llvm/Analysis/LoopInfo.h"
18	#include "llvm/Analysis/ScalarEvolution.h"
19	#include "llvm/Analysis/ScalarEvolutionDivision.h"
20	#include "llvm/Analysis/ScalarEvolutionExpressions.h"
21	#include "llvm/IR/Constants.h"
22	#include "llvm/IR/DerivedTypes.h"
23	#include "llvm/IR/Function.h"
24	#include "llvm/IR/InstIterator.h"
25	#include "llvm/IR/Instructions.h"
26	#include "llvm/IR/PassManager.h"
27	#include "llvm/Support/Debug.h"
28	#include "llvm/Support/raw_ostream.h"
29
30	using namespace llvm;
31
32	#define DL_NAME "delinearize"
33	#define DEBUG_TYPE DL_NAME
34
35	// Return true when S contains at least an undef value.
36	static inline bool containsUndefs(const SCEV *S) {
37	return SCEVExprContains(Root: S, Pred: [](const SCEV *S) {
38	if (const auto *SU = dyn_cast<SCEVUnknown>(Val: S))
39	return isa<UndefValue>(Val: SU->getValue());
40	return false;
41	});
42	}
43
44	namespace {
45
46	// Collect all steps of SCEV expressions.
47	struct SCEVCollectStrides {
48	ScalarEvolution &SE;
49	SmallVectorImpl<const SCEV *> &Strides;
50
51	SCEVCollectStrides(ScalarEvolution &SE, SmallVectorImpl<const SCEV *> &S)
52	: SE(SE), Strides(S) {}
53
54	bool follow(const SCEV *S) {
55	if (const SCEVAddRecExpr *AR = dyn_cast<SCEVAddRecExpr>(Val: S))
56	Strides.push_back(Elt: AR->getStepRecurrence(SE));
57	return true;
58	}
59
60	bool isDone() const { return false; }
61	};
62
63	// Collect all SCEVUnknown and SCEVMulExpr expressions.
64	struct SCEVCollectTerms {
65	SmallVectorImpl<const SCEV *> &Terms;
66
67	SCEVCollectTerms(SmallVectorImpl<const SCEV *> &T) : Terms(T) {}
68
69	bool follow(const SCEV *S) {
70	if (isa<SCEVUnknown>(Val: S) \|\| isa<SCEVMulExpr>(Val: S) \|\|
71	isa<SCEVSignExtendExpr>(Val: S)) {
72	if (!containsUndefs(S))
73	Terms.push_back(Elt: S);
74
75	// Stop recursion: once we collected a term, do not walk its operands.
76	return false;
77	}
78
79	// Keep looking.
80	return true;
81	}
82
83	bool isDone() const { return false; }
84	};
85
86	// Check if a SCEV contains an AddRecExpr.
87	struct SCEVHasAddRec {
88	bool &ContainsAddRec;
89
90	SCEVHasAddRec(bool &ContainsAddRec) : ContainsAddRec(ContainsAddRec) {
91	ContainsAddRec = false;
92	}
93
94	bool follow(const SCEV *S) {
95	if (isa<SCEVAddRecExpr>(Val: S)) {
96	ContainsAddRec = true;
97
98	// Stop recursion: once we collected a term, do not walk its operands.
99	return false;
100	}
101
102	// Keep looking.
103	return true;
104	}
105
106	bool isDone() const { return false; }
107	};
108
109	// Find factors that are multiplied with an expression that (possibly as a
110	// subexpression) contains an AddRecExpr. In the expression:
111	//
112	// 8 (100 + %p * %q * (%a + {0, +, 1}_loop))*
113	//
114	// "%p %q" are factors multiplied by the expression "(%a + {0, +, 1}_loop)"*
115	// that contains the AddRec {0, +, 1}_loop. %p %q are likely to be array size*
116	// parameters as they form a product with an induction variable.
117	//
118	// This collector expects all array size parameters to be in the same MulExpr.
119	// It might be necessary to later add support for collecting parameters that are
120	// spread over different nested MulExpr.
121	struct SCEVCollectAddRecMultiplies {
122	SmallVectorImpl<const SCEV *> &Terms;
123	ScalarEvolution &SE;
124
125	SCEVCollectAddRecMultiplies(SmallVectorImpl<const SCEV *> &T,
126	ScalarEvolution &SE)
127	: Terms(T), SE(SE) {}
128
129	bool follow(const SCEV *S) {
130	if (auto *Mul = dyn_cast<SCEVMulExpr>(Val: S)) {
131	bool HasAddRec = false;
132	SmallVector<const SCEV *, `0`> Operands;
133	for (const SCEV *Op : Mul->operands()) {
134	const SCEVUnknown *Unknown = dyn_cast<SCEVUnknown>(Val: Op);
135	if (Unknown && !isa<CallInst>(Val: Unknown->getValue())) {
136	Operands.push_back(Elt: Op);
137	} else if (Unknown) {
138	HasAddRec = true;
139	} else {
140	bool ContainsAddRec = false;
141	SCEVHasAddRec ContiansAddRec(ContainsAddRec);
142	visitAll(Root: Op, Visitor&: ContiansAddRec);
143	HasAddRec \|= ContainsAddRec;
144	}
145	}
146	if (Operands.size() == `0`)
147	return true;
148
149	if (!HasAddRec)
150	return false;
151
152	Terms.push_back(Elt: SE.getMulExpr(Ops&: Operands));
153	// Stop recursion: once we collected a term, do not walk its operands.
154	return false;
155	}
156
157	// Keep looking.
158	return true;
159	}
160
161	bool isDone() const { return false; }
162	};
163
164	} // end anonymous namespace
165
166	/// Find parametric terms in this SCEVAddRecExpr. We first for parameters in
167	/// two places:
168	/// 1) The strides of AddRec expressions.
169	/// 2) Unknowns that are multiplied with AddRec expressions.
170	void llvm::collectParametricTerms(ScalarEvolution &SE, const SCEV *Expr,
171	SmallVectorImpl<const SCEV *> &Terms) {
172	SmallVector<const SCEV *, `4`> Strides;
173	SCEVCollectStrides StrideCollector(SE, Strides);
174	visitAll(Root: Expr, Visitor&: StrideCollector);
175
176	LLVM_DEBUG({
177	dbgs() << "Strides:\n";
178	for (const SCEV *S : Strides)
179	dbgs() << *S << "\n";
180	});
181
182	for (const SCEV *S : Strides) {
183	SCEVCollectTerms TermCollector(Terms);
184	visitAll(Root: S, Visitor&: TermCollector);
185	}
186
187	LLVM_DEBUG({
188	dbgs() << "Terms:\n";
189	for (const SCEV *T : Terms)
190	dbgs() << *T << "\n";
191	});
192
193	SCEVCollectAddRecMultiplies MulCollector(Terms, SE);
194	visitAll(Root: Expr, Visitor&: MulCollector);
195	}
196
197	static bool findArrayDimensionsRec(ScalarEvolution &SE,
198	SmallVectorImpl<const SCEV *> &Terms,
199	SmallVectorImpl<const SCEV *> &Sizes) {
200	int Last = Terms.size() - `1`;
201	const SCEV *Step = Terms [Last];
202
203	// End of recursion.
204	if (Last == `0`) {
205	if (const SCEVMulExpr *M = dyn_cast<SCEVMulExpr>(Val: Step)) {
206	SmallVector<const SCEV *, `2`> Qs;
207	for (const SCEV *Op : M->operands())
208	if (!isa<SCEVConstant>(Val: Op))
209	Qs.push_back(Elt: Op);
210
211	Step = SE.getMulExpr(Ops&: Qs);
212	}
213
214	Sizes.push_back(Elt: Step);
215	return true;
216	}
217
218	for (const SCEV *&Term : Terms) {
219	// Normalize the terms before the next call to findArrayDimensionsRec.
220	const SCEV Q, R;
221	SCEVDivision::divide(SE, Numerator: Term, Denominator: Step, Quotient: &Q, Remainder: &R);
222
223	// Bail out when GCD does not evenly divide one of the terms.
224	if (!R->isZero())
225	return false;
226
227	Term = Q;
228	}
229
230	// Remove all SCEVConstants.
231	erase_if(C&: Terms, P: [](const SCEV E) { return* isa<SCEVConstant>(Val: E); });
232
233	if (Terms.size() > `0`)
234	if (!findArrayDimensionsRec(SE, Terms, Sizes))
235	return false;
236
237	Sizes.push_back(Elt: Step);
238	return true;
239	}
240
241	// Returns true when one of the SCEVs of Terms contains a SCEVUnknown parameter.
242	static inline bool containsParameters(SmallVectorImpl<const SCEV *> &Terms) {
243	for (const SCEV *T : Terms)
244	if (SCEVExprContains(Root: T, Pred: [](const SCEV S) { return* isa<SCEVUnknown>(Val: S); }))
245	return true;
246
247	return false;
248	}
249
250	// Return the number of product terms in S.
251	static inline int numberOfTerms(const SCEV *S) {
252	if (const SCEVMulExpr *Expr = dyn_cast<SCEVMulExpr>(Val: S))
253	return Expr->getNumOperands();
254	return `1`;
255	}
256
257	static const SCEV removeConstantFactors(ScalarEvolution &SE, const* SCEV *T) {
258	if (isa<SCEVConstant>(Val: T))
259	return nullptr;
260
261	if (isa<SCEVUnknown>(Val: T))
262	return T;
263
264	if (const SCEVMulExpr *M = dyn_cast<SCEVMulExpr>(Val: T)) {
265	SmallVector<const SCEV *, `2`> Factors;
266	for (const SCEV *Op : M->operands())
267	if (!isa<SCEVConstant>(Val: Op))
268	Factors.push_back(Elt: Op);
269
270	return SE.getMulExpr(Ops&: Factors);
271	}
272
273	return T;
274	}
275
276	void llvm::findArrayDimensions(ScalarEvolution &SE,
277	SmallVectorImpl<const SCEV *> &Terms,
278	SmallVectorImpl<const SCEV *> &Sizes,
279	const SCEV *ElementSize) {
280	if (Terms.size() < `1` \|\| !ElementSize)
281	return;
282
283	// Early return when Terms do not contain parameters: we do not delinearize
284	// non parametric SCEVs.
285	if (!containsParameters(Terms))
286	return;
287
288	LLVM_DEBUG({
289	dbgs() << "Terms:\n";
290	for (const SCEV *T : Terms)
291	dbgs() << *T << "\n";
292	});
293
294	// Remove duplicates.
295	array_pod_sort(Start: Terms.begin(), End: Terms.end());
296	Terms.erase(CS: llvm::unique(R&: Terms), CE: Terms.end());
297
298	// Put larger terms first.
299	llvm::sort(C&: Terms, Comp: [](const SCEV LHS, const* SCEV *RHS) {
300	return numberOfTerms(S: LHS) > numberOfTerms(S: RHS);
301	});
302
303	// Try to divide all terms by the element size. If term is not divisible by
304	// element size, proceed with the original term.
305	for (const SCEV *&Term : Terms) {
306	const SCEV Q, R;
307	SCEVDivision::divide(SE, Numerator: Term, Denominator: ElementSize, Quotient: &Q, Remainder: &R);
308	if (!Q->isZero())
309	Term = Q;
310	}
311
312	SmallVector<const SCEV *, `4`> NewTerms;
313
314	// Remove constant factors.
315	for (const SCEV *T : Terms)
316	if (const SCEV *NewT = removeConstantFactors(SE, T))
317	NewTerms.push_back(Elt: NewT);
318
319	LLVM_DEBUG({
320	dbgs() << "Terms after sorting:\n";
321	for (const SCEV *T : NewTerms)
322	dbgs() << *T << "\n";
323	});
324
325	if (NewTerms.empty() \|\| !findArrayDimensionsRec(SE, Terms&: NewTerms, Sizes)) {
326	Sizes.clear();
327	return;
328	}
329
330	// The last element to be pushed into Sizes is the size of an element.
331	Sizes.push_back(Elt: ElementSize);
332
333	LLVM_DEBUG({
334	dbgs() << "Sizes:\n";
335	for (const SCEV *S : Sizes)
336	dbgs() << *S << "\n";
337	});
338	}
339
340	void llvm::computeAccessFunctions(ScalarEvolution &SE, const SCEV *Expr,
341	SmallVectorImpl<const SCEV *> &Subscripts,
342	SmallVectorImpl<const SCEV *> &Sizes) {
343	// Early exit in case this SCEV is not an affine multivariate function.
344	if (Sizes.empty())
345	return;
346
347	if (auto *AR = dyn_cast<SCEVAddRecExpr>(Val: Expr))
348	if (!AR->isAffine())
349	return;
350
351	const SCEV *Res = Expr;
352	int Last = Sizes.size() - `1`;
353	for (int i = Last; i >= `0`; i--) {
354	const SCEV Q, R;
355	SCEVDivision::divide(SE, Numerator: Res, Denominator: Sizes [i], Quotient: &Q, Remainder: &R);
356
357	LLVM_DEBUG({
358	dbgs() << "Res: " << *Res << "\n";
359	dbgs() << "Sizes[i]: " << *Sizes[i] << "\n";
360	dbgs() << "Res divided by Sizes[i]:\n";
361	dbgs() << "Quotient: " << *Q << "\n";
362	dbgs() << "Remainder: " << *R << "\n";
363	});
364
365	Res = Q;
366
367	// Do not record the last subscript corresponding to the size of elements in
368	// the array.
369	if (i == Last) {
370
371	// Bail out if the byte offset is non-zero.
372	if (!R->isZero()) {
373	Subscripts.clear();
374	Sizes.clear();
375	return;
376	}
377
378	continue;
379	}
380
381	// Record the access function for the current subscript.
382	Subscripts.push_back(Elt: R);
383	}
384
385	// Also push in last position the remainder of the last division: it will be
386	// the access function of the innermost dimension.
387	Subscripts.push_back(Elt: Res);
388
389	std::reverse(first: Subscripts.begin(), last: Subscripts.end());
390
391	LLVM_DEBUG({
392	dbgs() << "Subscripts:\n";
393	for (const SCEV *S : Subscripts)
394	dbgs() << *S << "\n";
395	});
396	}
397
398	/// Splits the SCEV into two vectors of SCEVs representing the subscripts and
399	/// sizes of an array access. Returns the remainder of the delinearization that
400	/// is the offset start of the array. The SCEV->delinearize algorithm computes
401	/// the multiples of SCEV coefficients: that is a pattern matching of sub
402	/// expressions in the stride and base of a SCEV corresponding to the
403	/// computation of a GCD (greatest common divisor) of base and stride. When
404	/// SCEV->delinearize fails, it returns the SCEV unchanged.
405	///
406	/// For example: when analyzing the memory access A[i][j][k] in this loop nest
407	///
408	/// void foo(long n, long m, long o, double A[n][m][o]) {
409	///
410	/// for (long i = 0; i < n; i++)
411	/// for (long j = 0; j < m; j++)
412	/// for (long k = 0; k < o; k++)
413	/// A[i][j][k] = 1.0;
414	/// }
415	///
416	/// the delinearization input is the following AddRec SCEV:
417	///
418	/// AddRec: {{{%A,+,(8 %m * %o)}<%for.i>,+,(8 * %o)}<%for.j>,+,8}<%for.k>*
419	///
420	/// From this SCEV, we are able to say that the base offset of the access is %A
421	/// because it appears as an offset that does not divide any of the strides in
422	/// the loops:
423	///
424	/// CHECK: Base offset: %A
425	///
426	/// and then SCEV->delinearize determines the size of some of the dimensions of
427	/// the array as these are the multiples by which the strides are happening:
428	///
429	/// CHECK: ArrayDecl[UnknownSize][%m][%o] with elements of sizeof(double)
430	/// bytes.
431	///
432	/// Note that the outermost dimension remains of UnknownSize because there are
433	/// no strides that would help identifying the size of the last dimension: when
434	/// the array has been statically allocated, one could compute the size of that
435	/// dimension by dividing the overall size of the array by the size of the known
436	/// dimensions: %m %o * 8.*
437	///
438	/// Finally delinearize provides the access functions for the array reference
439	/// that does correspond to A[i][j][k] of the above C testcase:
440	///
441	/// CHECK: ArrayRef[{0,+,1}<%for.i>][{0,+,1}<%for.j>][{0,+,1}<%for.k>]
442	///
443	/// The testcases are checking the output of a function pass:
444	/// DelinearizationPass that walks through all loads and stores of a function
445	/// asking for the SCEV of the memory access with respect to all enclosing
446	/// loops, calling SCEV->delinearize on that and printing the results.
447	void llvm::delinearize(ScalarEvolution &SE, const SCEV *Expr,
448	SmallVectorImpl<const SCEV *> &Subscripts,
449	SmallVectorImpl<const SCEV *> &Sizes,
450	const SCEV *ElementSize) {
451	// First step: collect parametric terms.
452	SmallVector<const SCEV *, `4`> Terms;
453	collectParametricTerms(SE, Expr, Terms);
454
455	if (Terms.empty())
456	return;
457
458	// Second step: find subscript sizes.
459	findArrayDimensions(SE, Terms, Sizes, ElementSize);
460
461	if (Sizes.empty())
462	return;
463
464	// Third step: compute the access functions for each subscript.
465	computeAccessFunctions(SE, Expr, Subscripts, Sizes);
466
467	if (Subscripts.empty())
468	return;
469
470	LLVM_DEBUG({
471	dbgs() << "succeeded to delinearize " << *Expr << "\n";
472	dbgs() << "ArrayDecl[UnknownSize]";
473	for (const SCEV *S : Sizes)
474	dbgs() << "[" << *S << "]";
475
476	dbgs() << "\nArrayRef";
477	for (const SCEV *S : Subscripts)
478	dbgs() << "[" << *S << "]";
479	dbgs() << "\n";
480	});
481	}
482
483	bool llvm::getIndexExpressionsFromGEP(ScalarEvolution &SE,
484	const GetElementPtrInst *GEP,
485	SmallVectorImpl<const SCEV *> &Subscripts,
486	SmallVectorImpl<int> &Sizes) {
487	assert(Subscripts.empty() && Sizes.empty() &&
488	"Expected output lists to be empty on entry to this function.");
489	assert(GEP && "getIndexExpressionsFromGEP called with a null GEP");
490	Type Ty = nullptr*;
491	bool DroppedFirstDim = false;
492	for (unsigned i = `1`; i < GEP->getNumOperands(); i++) {
493	const SCEV *Expr = SE.getSCEV(V: GEP->getOperand(i_nocapture: i));
494	if (i == `1`) {
495	Ty = GEP->getSourceElementType();
496	if (auto *Const = dyn_cast<SCEVConstant>(Val: Expr))
497	if (Const->getValue()->isZero()) {
498	DroppedFirstDim = true;
499	continue;
500	}
501	Subscripts.push_back(Elt: Expr);
502	continue;
503	}
504
505	auto *ArrayTy = dyn_cast<ArrayType>(Val: Ty);
506	if (!ArrayTy) {
507	Subscripts.clear();
508	Sizes.clear();
509	return false;
510	}
511
512	Subscripts.push_back(Elt: Expr);
513	if (!(DroppedFirstDim && i == `2`))
514	Sizes.push_back(Elt: ArrayTy->getNumElements());
515
516	Ty = ArrayTy->getElementType();
517	}
518	return !Subscripts.empty();
519	}
520
521	bool llvm::tryDelinearizeFixedSizeImpl(
522	ScalarEvolution SE, Instruction Inst, const SCEV *AccessFn,
523	SmallVectorImpl<const SCEV > &Subscripts, SmallVectorImpl<int*> &Sizes) {
524	Value *SrcPtr = getLoadStorePointerOperand(V: Inst);
525
526	// Check the simple case where the array dimensions are fixed size.
527	auto *SrcGEP = dyn_cast<GetElementPtrInst>(Val: SrcPtr);
528	if (!SrcGEP)
529	return false;
530
531	getIndexExpressionsFromGEP(SE&: *SE, GEP: SrcGEP, Subscripts, Sizes);
532
533	// Check that the two size arrays are non-empty and equal in length and
534	// value.
535	// TODO: it would be better to let the caller to clear Subscripts, similar
536	// to how we handle Sizes.
537	if (Sizes.empty() \|\| Subscripts.size() <= `1`) {
538	Subscripts.clear();
539	return false;
540	}
541
542	// Check that for identical base pointers we do not miss index offsets
543	// that have been added before this GEP is applied.
544	Value *SrcBasePtr = SrcGEP->getOperand(i_nocapture: `0`)->stripPointerCasts();
545	const SCEVUnknown *SrcBase =
546	dyn_cast<SCEVUnknown>(Val: SE->getPointerBase(V: AccessFn));
547	if (!SrcBase \|\| SrcBasePtr != SrcBase->getValue()) {
548	Subscripts.clear();
549	return false;
550	}
551
552	assert(Subscripts.size() == Sizes.size() + `1` &&
553	"Expected equal number of entries in the list of size and "
554	"subscript.");
555
556	return true;
557	}
558
559	namespace {
560
561	void printDelinearization(raw_ostream &O, Function F, LoopInfo LI,
562	ScalarEvolution *SE) {
563	O << "Delinearization on function " << F->getName() << ":\n";
564	for (Instruction &Inst : instructions(F)) {
565	// Only analyze loads and stores.
566	if (!isa<StoreInst>(Val: &Inst) && !isa<LoadInst>(Val: &Inst) &&
567	!isa<GetElementPtrInst>(Val: &Inst))
568	continue;
569
570	const BasicBlock *BB = Inst.getParent();
571	// Delinearize the memory access as analyzed in all the surrounding loops.
572	// Do not analyze memory accesses outside loops.
573	for (Loop L = LI->getLoopFor(BB); L != nullptr*; L = L->getParentLoop()) {
574	const SCEV *AccessFn = SE->getSCEVAtScope(V: getPointerOperand(V: &Inst), L);
575
576	const SCEVUnknown *BasePointer =
577	dyn_cast<SCEVUnknown>(Val: SE->getPointerBase(V: AccessFn));
578	// Do not delinearize if we cannot find the base pointer.
579	if (!BasePointer)
580	break;
581	AccessFn = SE->getMinusSCEV(LHS: AccessFn, RHS: BasePointer);
582
583	O << "\n";
584	O << "Inst:" << Inst << "\n";
585	O << "In Loop with Header: " << L->getHeader()->getName() << "\n";
586	O << "AccessFunction: " << *AccessFn << "\n";
587
588	SmallVector<const SCEV *, `3`> Subscripts, Sizes;
589	delinearize(SE&: *SE, Expr: AccessFn, Subscripts, Sizes, ElementSize: SE->getElementSize(Inst: &Inst));
590	if (Subscripts.size() == `0` \|\| Sizes.size() == `0` \|\|
591	Subscripts.size() != Sizes.size()) {
592	O << "failed to delinearize\n";
593	continue;
594	}
595
596	O << "Base offset: " << *BasePointer << "\n";
597	O << "ArrayDecl[UnknownSize]";
598	int Size = Subscripts.size();
599	for (int i = `0`; i < Size - `1`; i++)
600	O << "[" << *Sizes [i] << "]";
601	O << " with elements of " << *Sizes [Size - `1`] << " bytes.\n";
602
603	O << "ArrayRef";
604	for (int i = `0`; i < Size; i++)
605	O << "[" << *Subscripts [i] << "]";
606	O << "\n";
607	}
608	}
609	}
610
611	} // end anonymous namespace
612
613	DelinearizationPrinterPass::DelinearizationPrinterPass(raw_ostream &OS)
614	: OS(OS) {}
615	PreservedAnalyses DelinearizationPrinterPass::run(Function &F,
616	FunctionAnalysisManager &AM) {
617	printDelinearization(O&: OS, F: &F, LI: &AM.getResult<LoopAnalysis>(IR&: F),
618	SE: &AM.getResult<ScalarEvolutionAnalysis>(IR&: F));
619	return PreservedAnalyses::all();
620	}
621

Browse the source code of llvm_projects/llvm/lib/Analysis/Delinearization.cpp