| 1 | //===- LoopVersioningLICM.cpp - LICM Loop Versioning ----------------------===// |
| 2 | // |
| 3 | // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. |
| 4 | // See https://llvm.org/LICENSE.txt for license information. |
| 5 | // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception |
| 6 | // |
| 7 | //===----------------------------------------------------------------------===// |
| 8 | // |
| 9 | // When alias analysis is uncertain about the aliasing between any two accesses, |
| 10 | // it will return MayAlias. This uncertainty from alias analysis restricts LICM |
| 11 | // from proceeding further. In cases where alias analysis is uncertain we might |
| 12 | // use loop versioning as an alternative. |
| 13 | // |
| 14 | // Loop Versioning will create a version of the loop with aggressive aliasing |
| 15 | // assumptions in addition to the original with conservative (default) aliasing |
| 16 | // assumptions. The version of the loop making aggressive aliasing assumptions |
| 17 | // will have all the memory accesses marked as no-alias. These two versions of |
| 18 | // loop will be preceded by a memory runtime check. This runtime check consists |
| 19 | // of bound checks for all unique memory accessed in loop, and it ensures the |
| 20 | // lack of memory aliasing. The result of the runtime check determines which of |
| 21 | // the loop versions is executed: If the runtime check detects any memory |
| 22 | // aliasing, then the original loop is executed. Otherwise, the version with |
| 23 | // aggressive aliasing assumptions is used. |
| 24 | // |
| 25 | // Following are the top level steps: |
| 26 | // |
| 27 | // a) Perform LoopVersioningLICM's feasibility check. |
| 28 | // b) If loop is a candidate for versioning then create a memory bound check, |
| 29 | // by considering all the memory accesses in loop body. |
| 30 | // c) Clone original loop and set all memory accesses as no-alias in new loop. |
| 31 | // d) Set original loop & versioned loop as a branch target of the runtime check |
| 32 | // result. |
| 33 | // |
| 34 | // It transforms loop as shown below: |
| 35 | // |
| 36 | // +----------------+ |
| 37 | // |Runtime Memcheck| |
| 38 | // +----------------+ |
| 39 | // | |
| 40 | // +----------+----------------+----------+ |
| 41 | // | | |
| 42 | // +---------+----------+ +-----------+----------+ |
| 43 | // |Orig Loop Preheader | |Cloned Loop Preheader | |
| 44 | // +--------------------+ +----------------------+ |
| 45 | // | | |
| 46 | // +--------------------+ +----------------------+ |
| 47 | // |Orig Loop Body | |Cloned Loop Body | |
| 48 | // +--------------------+ +----------------------+ |
| 49 | // | | |
| 50 | // +--------------------+ +----------------------+ |
| 51 | // |Orig Loop Exit Block| |Cloned Loop Exit Block| |
| 52 | // +--------------------+ +-----------+----------+ |
| 53 | // | | |
| 54 | // +----------+--------------+-----------+ |
| 55 | // | |
| 56 | // +-----+----+ |
| 57 | // |Join Block| |
| 58 | // +----------+ |
| 59 | // |
| 60 | //===----------------------------------------------------------------------===// |
| 61 | |
| 62 | #include "llvm/Transforms/Scalar/LoopVersioningLICM.h" |
| 63 | #include "llvm/ADT/SmallVector.h" |
| 64 | #include "llvm/ADT/StringRef.h" |
| 65 | #include "llvm/Analysis/AliasAnalysis.h" |
| 66 | #include "llvm/Analysis/AliasSetTracker.h" |
| 67 | #include "llvm/Analysis/GlobalsModRef.h" |
| 68 | #include "llvm/Analysis/LoopAccessAnalysis.h" |
| 69 | #include "llvm/Analysis/LoopInfo.h" |
| 70 | #include "llvm/Analysis/LoopPass.h" |
| 71 | #include "llvm/Analysis/OptimizationRemarkEmitter.h" |
| 72 | #include "llvm/Analysis/ScalarEvolution.h" |
| 73 | #include "llvm/IR/Dominators.h" |
| 74 | #include "llvm/IR/Instruction.h" |
| 75 | #include "llvm/IR/Instructions.h" |
| 76 | #include "llvm/IR/LLVMContext.h" |
| 77 | #include "llvm/IR/MDBuilder.h" |
| 78 | #include "llvm/IR/Metadata.h" |
| 79 | #include "llvm/IR/Value.h" |
| 80 | #include "llvm/Support/Casting.h" |
| 81 | #include "llvm/Support/CommandLine.h" |
| 82 | #include "llvm/Support/Debug.h" |
| 83 | #include "llvm/Support/raw_ostream.h" |
| 84 | #include "llvm/Transforms/Utils/LoopUtils.h" |
| 85 | #include "llvm/Transforms/Utils/LoopVersioning.h" |
| 86 | #include <cassert> |
| 87 | |
| 88 | using namespace llvm; |
| 89 | |
| 90 | #define DEBUG_TYPE "loop-versioning-licm" |
| 91 | |
| 92 | static const char *LICMVersioningMetaData = "llvm.loop.licm_versioning.disable" ; |
| 93 | |
| 94 | /// Threshold minimum allowed percentage for possible |
| 95 | /// invariant instructions in a loop. |
| 96 | static cl::opt<float> |
| 97 | LVInvarThreshold("licm-versioning-invariant-threshold" , |
| 98 | cl::desc("LoopVersioningLICM's minimum allowed percentage " |
| 99 | "of possible invariant instructions per loop" ), |
| 100 | cl::init(Val: 25), cl::Hidden); |
| 101 | |
| 102 | /// Threshold for maximum allowed loop nest/depth |
| 103 | static cl::opt<unsigned> LVLoopDepthThreshold( |
| 104 | "licm-versioning-max-depth-threshold" , |
| 105 | cl::desc( |
| 106 | "LoopVersioningLICM's threshold for maximum allowed loop nest/depth" ), |
| 107 | cl::init(Val: 2), cl::Hidden); |
| 108 | |
| 109 | namespace { |
| 110 | |
| 111 | struct LoopVersioningLICM { |
| 112 | // We don't explicitly pass in LoopAccessInfo to the constructor since the |
| 113 | // loop versioning might return early due to instructions that are not safe |
| 114 | // for versioning. By passing the proxy instead the construction of |
| 115 | // LoopAccessInfo will take place only when it's necessary. |
| 116 | (AliasAnalysis *AA, ScalarEvolution *SE, |
| 117 | OptimizationRemarkEmitter *ORE, |
| 118 | LoopAccessInfoManager &LAIs, LoopInfo &LI, |
| 119 | Loop *CurLoop) |
| 120 | : AA(AA), SE(SE), LAIs(LAIs), LI(LI), CurLoop(CurLoop), |
| 121 | LoopDepthThreshold(LVLoopDepthThreshold), |
| 122 | InvariantThreshold(LVInvarThreshold), ORE(ORE) {} |
| 123 | |
| 124 | bool run(DominatorTree *DT); |
| 125 | |
| 126 | private: |
| 127 | // Current AliasAnalysis information |
| 128 | AliasAnalysis *AA; |
| 129 | |
| 130 | // Current ScalarEvolution |
| 131 | ScalarEvolution *SE; |
| 132 | |
| 133 | // Current Loop's LoopAccessInfo |
| 134 | const LoopAccessInfo *LAI = nullptr; |
| 135 | |
| 136 | // Proxy for retrieving LoopAccessInfo. |
| 137 | LoopAccessInfoManager &LAIs; |
| 138 | |
| 139 | LoopInfo &LI; |
| 140 | |
| 141 | // The current loop we are working on. |
| 142 | Loop *CurLoop; |
| 143 | |
| 144 | // Maximum loop nest threshold |
| 145 | unsigned LoopDepthThreshold; |
| 146 | |
| 147 | // Minimum invariant threshold |
| 148 | float InvariantThreshold; |
| 149 | |
| 150 | // Counter to track num of load & store |
| 151 | unsigned LoadAndStoreCounter = 0; |
| 152 | |
| 153 | // Counter to track num of invariant |
| 154 | unsigned InvariantCounter = 0; |
| 155 | |
| 156 | // Read only loop marker. |
| 157 | bool IsReadOnlyLoop = true; |
| 158 | |
| 159 | // OptimizationRemarkEmitter |
| 160 | OptimizationRemarkEmitter *ORE; |
| 161 | |
| 162 | bool isLegalForVersioning(); |
| 163 | bool legalLoopStructure(); |
| 164 | bool legalLoopInstructions(); |
| 165 | bool legalLoopMemoryAccesses(); |
| 166 | bool isLoopAlreadyVisited(); |
| 167 | bool instructionSafeForVersioning(Instruction *I); |
| 168 | }; |
| 169 | |
| 170 | } // end anonymous namespace |
| 171 | |
| 172 | /// Check loop structure and confirms it's good for LoopVersioningLICM. |
| 173 | bool LoopVersioningLICM::legalLoopStructure() { |
| 174 | // Loop must be in loop simplify form. |
| 175 | if (!CurLoop->isLoopSimplifyForm()) { |
| 176 | LLVM_DEBUG(dbgs() << " loop is not in loop-simplify form.\n" ); |
| 177 | return false; |
| 178 | } |
| 179 | // Loop should be innermost loop, if not return false. |
| 180 | if (!CurLoop->getSubLoops().empty()) { |
| 181 | LLVM_DEBUG(dbgs() << " loop is not innermost\n" ); |
| 182 | return false; |
| 183 | } |
| 184 | // Loop should have a single backedge, if not return false. |
| 185 | if (CurLoop->getNumBackEdges() != 1) { |
| 186 | LLVM_DEBUG(dbgs() << " loop has multiple backedges\n" ); |
| 187 | return false; |
| 188 | } |
| 189 | // Loop must have a single exiting block, if not return false. |
| 190 | if (!CurLoop->getExitingBlock()) { |
| 191 | LLVM_DEBUG(dbgs() << " loop has multiple exiting block\n" ); |
| 192 | return false; |
| 193 | } |
| 194 | // We only handle bottom-tested loop, i.e. loop in which the condition is |
| 195 | // checked at the end of each iteration. With that we can assume that all |
| 196 | // instructions in the loop are executed the same number of times. |
| 197 | if (CurLoop->getExitingBlock() != CurLoop->getLoopLatch()) { |
| 198 | LLVM_DEBUG(dbgs() << " loop is not bottom tested\n" ); |
| 199 | return false; |
| 200 | } |
| 201 | // Parallel loops must not have aliasing loop-invariant memory accesses. |
| 202 | // Hence we don't need to version anything in this case. |
| 203 | if (CurLoop->isAnnotatedParallel()) { |
| 204 | LLVM_DEBUG(dbgs() << " Parallel loop is not worth versioning\n" ); |
| 205 | return false; |
| 206 | } |
| 207 | // Loop depth more then LoopDepthThreshold are not allowed |
| 208 | if (CurLoop->getLoopDepth() > LoopDepthThreshold) { |
| 209 | LLVM_DEBUG(dbgs() << " loop depth is more than threshold\n" ); |
| 210 | return false; |
| 211 | } |
| 212 | // We need to be able to compute the loop trip count in order |
| 213 | // to generate the bound checks. |
| 214 | const SCEV *ExitCount = SE->getBackedgeTakenCount(L: CurLoop); |
| 215 | if (isa<SCEVCouldNotCompute>(Val: ExitCount)) { |
| 216 | LLVM_DEBUG(dbgs() << " loop does not have trip count\n" ); |
| 217 | return false; |
| 218 | } |
| 219 | return true; |
| 220 | } |
| 221 | |
| 222 | /// Check memory accesses in loop and confirms it's good for |
| 223 | /// LoopVersioningLICM. |
| 224 | bool LoopVersioningLICM::legalLoopMemoryAccesses() { |
| 225 | // Loop over the body of this loop, construct AST. |
| 226 | BatchAAResults BAA(*AA); |
| 227 | AliasSetTracker AST(BAA); |
| 228 | for (auto *Block : CurLoop->getBlocks()) { |
| 229 | // Ignore blocks in subloops. |
| 230 | if (LI.getLoopFor(BB: Block) == CurLoop) |
| 231 | AST.add(BB&: *Block); |
| 232 | } |
| 233 | |
| 234 | // Memory check: |
| 235 | // Transform phase will generate a versioned loop and also a runtime check to |
| 236 | // ensure the pointers are independent and they don’t alias. |
| 237 | // In version variant of loop, alias meta data asserts that all access are |
| 238 | // mutually independent. |
| 239 | // |
| 240 | // Pointers aliasing in alias domain are avoided because with multiple |
| 241 | // aliasing domains we may not be able to hoist potential loop invariant |
| 242 | // access out of the loop. |
| 243 | // |
| 244 | // Iterate over alias tracker sets, and confirm AliasSets doesn't have any |
| 245 | // must alias set. |
| 246 | bool HasMayAlias = false; |
| 247 | bool TypeSafety = false; |
| 248 | bool HasMod = false; |
| 249 | for (const auto &I : AST) { |
| 250 | const AliasSet &AS = I; |
| 251 | // Skip Forward Alias Sets, as this should be ignored as part of |
| 252 | // the AliasSetTracker object. |
| 253 | if (AS.isForwardingAliasSet()) |
| 254 | continue; |
| 255 | // With MustAlias its not worth adding runtime bound check. |
| 256 | if (AS.isMustAlias()) |
| 257 | return false; |
| 258 | const Value *SomePtr = AS.begin()->Ptr; |
| 259 | bool TypeCheck = true; |
| 260 | // Check for Mod & MayAlias |
| 261 | HasMayAlias |= AS.isMayAlias(); |
| 262 | HasMod |= AS.isMod(); |
| 263 | for (const auto &MemLoc : AS) { |
| 264 | const Value *Ptr = MemLoc.Ptr; |
| 265 | // Alias tracker should have pointers of same data type. |
| 266 | // |
| 267 | // FIXME: check no longer effective since opaque pointers? |
| 268 | // If the intent is to check that the memory accesses use the |
| 269 | // same data type (such that LICM can promote them), then we |
| 270 | // can no longer see this from the pointer value types. |
| 271 | TypeCheck = (TypeCheck && (SomePtr->getType() == Ptr->getType())); |
| 272 | } |
| 273 | // At least one alias tracker should have pointers of same data type. |
| 274 | TypeSafety |= TypeCheck; |
| 275 | } |
| 276 | // Ensure types should be of same type. |
| 277 | if (!TypeSafety) { |
| 278 | LLVM_DEBUG(dbgs() << " Alias tracker type safety failed!\n" ); |
| 279 | return false; |
| 280 | } |
| 281 | // Ensure loop body shouldn't be read only. |
| 282 | if (!HasMod) { |
| 283 | LLVM_DEBUG(dbgs() << " No memory modified in loop body\n" ); |
| 284 | return false; |
| 285 | } |
| 286 | // Make sure alias set has may alias case. |
| 287 | // If there no alias memory ambiguity, return false. |
| 288 | if (!HasMayAlias) { |
| 289 | LLVM_DEBUG(dbgs() << " No ambiguity in memory access.\n" ); |
| 290 | return false; |
| 291 | } |
| 292 | return true; |
| 293 | } |
| 294 | |
| 295 | /// Check loop instructions safe for Loop versioning. |
| 296 | /// It returns true if it's safe else returns false. |
| 297 | /// Consider following: |
| 298 | /// 1) Check all load store in loop body are non atomic & non volatile. |
| 299 | /// 2) Check function call safety, by ensuring its not accessing memory. |
| 300 | /// 3) Loop body shouldn't have any may throw instruction. |
| 301 | /// 4) Loop body shouldn't have any convergent or noduplicate instructions. |
| 302 | bool LoopVersioningLICM::instructionSafeForVersioning(Instruction *I) { |
| 303 | assert(I != nullptr && "Null instruction found!" ); |
| 304 | // Check function call safety |
| 305 | if (auto *Call = dyn_cast<CallBase>(Val: I)) { |
| 306 | if (Call->isConvergent() || Call->cannotDuplicate()) { |
| 307 | LLVM_DEBUG(dbgs() << " Convergent call site found.\n" ); |
| 308 | return false; |
| 309 | } |
| 310 | |
| 311 | if (!AA->doesNotAccessMemory(Call)) { |
| 312 | LLVM_DEBUG(dbgs() << " Unsafe call site found.\n" ); |
| 313 | return false; |
| 314 | } |
| 315 | } |
| 316 | |
| 317 | // Avoid loops with possiblity of throw |
| 318 | if (I->mayThrow()) { |
| 319 | LLVM_DEBUG(dbgs() << " May throw instruction found in loop body\n" ); |
| 320 | return false; |
| 321 | } |
| 322 | // If current instruction is load instructions |
| 323 | // make sure it's a simple load (non atomic & non volatile) |
| 324 | if (I->mayReadFromMemory()) { |
| 325 | LoadInst *Ld = dyn_cast<LoadInst>(Val: I); |
| 326 | if (!Ld || !Ld->isSimple()) { |
| 327 | LLVM_DEBUG(dbgs() << " Found a non-simple load.\n" ); |
| 328 | return false; |
| 329 | } |
| 330 | LoadAndStoreCounter++; |
| 331 | Value *Ptr = Ld->getPointerOperand(); |
| 332 | // Check loop invariant. |
| 333 | if (SE->isLoopInvariant(S: SE->getSCEV(V: Ptr), L: CurLoop)) |
| 334 | InvariantCounter++; |
| 335 | } |
| 336 | // If current instruction is store instruction |
| 337 | // make sure it's a simple store (non atomic & non volatile) |
| 338 | else if (I->mayWriteToMemory()) { |
| 339 | StoreInst *St = dyn_cast<StoreInst>(Val: I); |
| 340 | if (!St || !St->isSimple()) { |
| 341 | LLVM_DEBUG(dbgs() << " Found a non-simple store.\n" ); |
| 342 | return false; |
| 343 | } |
| 344 | LoadAndStoreCounter++; |
| 345 | Value *Ptr = St->getPointerOperand(); |
| 346 | // Don't allow stores that we don't have runtime checks for, as we won't be |
| 347 | // able to mark them noalias meaning they would prevent any code motion. |
| 348 | auto &Pointers = LAI->getRuntimePointerChecking()->Pointers; |
| 349 | if (!any_of(Range: Pointers, P: [&](auto &P) { return P.PointerValue == Ptr; })) { |
| 350 | LLVM_DEBUG(dbgs() << " Found a store without a runtime check.\n" ); |
| 351 | return false; |
| 352 | } |
| 353 | // Check loop invariant. |
| 354 | if (SE->isLoopInvariant(S: SE->getSCEV(V: Ptr), L: CurLoop)) |
| 355 | InvariantCounter++; |
| 356 | |
| 357 | IsReadOnlyLoop = false; |
| 358 | } |
| 359 | return true; |
| 360 | } |
| 361 | |
| 362 | /// Check loop instructions and confirms it's good for |
| 363 | /// LoopVersioningLICM. |
| 364 | bool LoopVersioningLICM::legalLoopInstructions() { |
| 365 | // Resetting counters. |
| 366 | LoadAndStoreCounter = 0; |
| 367 | InvariantCounter = 0; |
| 368 | IsReadOnlyLoop = true; |
| 369 | using namespace ore; |
| 370 | // Get LoopAccessInfo from current loop via the proxy. |
| 371 | LAI = &LAIs.getInfo(L&: *CurLoop, /*AllowPartial=*/true); |
| 372 | // Check LoopAccessInfo for need of runtime check. |
| 373 | if (LAI->getRuntimePointerChecking()->getChecks().empty()) { |
| 374 | LLVM_DEBUG(dbgs() << " LAA: Runtime check not found !!\n" ); |
| 375 | return false; |
| 376 | } |
| 377 | // Iterate over loop blocks and instructions of each block and check |
| 378 | // instruction safety. |
| 379 | for (auto *Block : CurLoop->getBlocks()) |
| 380 | for (auto &Inst : *Block) { |
| 381 | // If instruction is unsafe just return false. |
| 382 | if (!instructionSafeForVersioning(I: &Inst)) { |
| 383 | ORE->emit(RemarkBuilder: [&]() { |
| 384 | return OptimizationRemarkMissed(DEBUG_TYPE, "IllegalLoopInst" , &Inst) |
| 385 | << " Unsafe Loop Instruction" ; |
| 386 | }); |
| 387 | return false; |
| 388 | } |
| 389 | } |
| 390 | // Number of runtime-checks should be less then RuntimeMemoryCheckThreshold |
| 391 | if (LAI->getNumRuntimePointerChecks() > |
| 392 | VectorizerParams::RuntimeMemoryCheckThreshold) { |
| 393 | LLVM_DEBUG( |
| 394 | dbgs() << " LAA: Runtime checks are more than threshold !!\n" ); |
| 395 | ORE->emit(RemarkBuilder: [&]() { |
| 396 | return OptimizationRemarkMissed(DEBUG_TYPE, "RuntimeCheck" , |
| 397 | CurLoop->getStartLoc(), |
| 398 | CurLoop->getHeader()) |
| 399 | << "Number of runtime checks " |
| 400 | << NV("RuntimeChecks" , LAI->getNumRuntimePointerChecks()) |
| 401 | << " exceeds threshold " |
| 402 | << NV("Threshold" , VectorizerParams::RuntimeMemoryCheckThreshold); |
| 403 | }); |
| 404 | return false; |
| 405 | } |
| 406 | // Loop should have at least one invariant load or store instruction. |
| 407 | if (!InvariantCounter) { |
| 408 | LLVM_DEBUG(dbgs() << " Invariant not found !!\n" ); |
| 409 | return false; |
| 410 | } |
| 411 | // Read only loop not allowed. |
| 412 | if (IsReadOnlyLoop) { |
| 413 | LLVM_DEBUG(dbgs() << " Found a read-only loop!\n" ); |
| 414 | return false; |
| 415 | } |
| 416 | // Profitablity check: |
| 417 | // Check invariant threshold, should be in limit. |
| 418 | if (InvariantCounter * 100 < InvariantThreshold * LoadAndStoreCounter) { |
| 419 | LLVM_DEBUG( |
| 420 | dbgs() |
| 421 | << " Invariant load & store are less then defined threshold\n" ); |
| 422 | LLVM_DEBUG(dbgs() << " Invariant loads & stores: " |
| 423 | << ((InvariantCounter * 100) / LoadAndStoreCounter) |
| 424 | << "%\n" ); |
| 425 | LLVM_DEBUG(dbgs() << " Invariant loads & store threshold: " |
| 426 | << InvariantThreshold << "%\n" ); |
| 427 | ORE->emit(RemarkBuilder: [&]() { |
| 428 | return OptimizationRemarkMissed(DEBUG_TYPE, "InvariantThreshold" , |
| 429 | CurLoop->getStartLoc(), |
| 430 | CurLoop->getHeader()) |
| 431 | << "Invariant load & store " |
| 432 | << NV("LoadAndStoreCounter" , |
| 433 | ((InvariantCounter * 100) / LoadAndStoreCounter)) |
| 434 | << " are less then defined threshold " |
| 435 | << NV("Threshold" , InvariantThreshold); |
| 436 | }); |
| 437 | return false; |
| 438 | } |
| 439 | return true; |
| 440 | } |
| 441 | |
| 442 | /// It checks loop is already visited or not. |
| 443 | /// check loop meta data, if loop revisited return true |
| 444 | /// else false. |
| 445 | bool LoopVersioningLICM::isLoopAlreadyVisited() { |
| 446 | // Check LoopVersioningLICM metadata into loop |
| 447 | if (findStringMetadataForLoop(TheLoop: CurLoop, Name: LICMVersioningMetaData)) { |
| 448 | return true; |
| 449 | } |
| 450 | return false; |
| 451 | } |
| 452 | |
| 453 | /// Checks legality for LoopVersioningLICM by considering following: |
| 454 | /// a) loop structure legality b) loop instruction legality |
| 455 | /// c) loop memory access legality. |
| 456 | /// Return true if legal else returns false. |
| 457 | bool LoopVersioningLICM::isLegalForVersioning() { |
| 458 | using namespace ore; |
| 459 | LLVM_DEBUG(dbgs() << "Loop: " << *CurLoop); |
| 460 | // Make sure not re-visiting same loop again. |
| 461 | if (isLoopAlreadyVisited()) { |
| 462 | LLVM_DEBUG( |
| 463 | dbgs() << " Revisiting loop in LoopVersioningLICM not allowed.\n\n" ); |
| 464 | return false; |
| 465 | } |
| 466 | // Check loop structure leagality. |
| 467 | if (!legalLoopStructure()) { |
| 468 | LLVM_DEBUG( |
| 469 | dbgs() << " Loop structure not suitable for LoopVersioningLICM\n\n" ); |
| 470 | ORE->emit(RemarkBuilder: [&]() { |
| 471 | return OptimizationRemarkMissed(DEBUG_TYPE, "IllegalLoopStruct" , |
| 472 | CurLoop->getStartLoc(), |
| 473 | CurLoop->getHeader()) |
| 474 | << " Unsafe Loop structure" ; |
| 475 | }); |
| 476 | return false; |
| 477 | } |
| 478 | // Check loop instruction leagality. |
| 479 | if (!legalLoopInstructions()) { |
| 480 | LLVM_DEBUG( |
| 481 | dbgs() |
| 482 | << " Loop instructions not suitable for LoopVersioningLICM\n\n" ); |
| 483 | return false; |
| 484 | } |
| 485 | // Check loop memory access leagality. |
| 486 | if (!legalLoopMemoryAccesses()) { |
| 487 | LLVM_DEBUG( |
| 488 | dbgs() |
| 489 | << " Loop memory access not suitable for LoopVersioningLICM\n\n" ); |
| 490 | ORE->emit(RemarkBuilder: [&]() { |
| 491 | return OptimizationRemarkMissed(DEBUG_TYPE, "IllegalLoopMemoryAccess" , |
| 492 | CurLoop->getStartLoc(), |
| 493 | CurLoop->getHeader()) |
| 494 | << " Unsafe Loop memory access" ; |
| 495 | }); |
| 496 | return false; |
| 497 | } |
| 498 | // Loop versioning is feasible, return true. |
| 499 | LLVM_DEBUG(dbgs() << " Loop Versioning found to be beneficial\n\n" ); |
| 500 | ORE->emit(RemarkBuilder: [&]() { |
| 501 | return OptimizationRemark(DEBUG_TYPE, "IsLegalForVersioning" , |
| 502 | CurLoop->getStartLoc(), CurLoop->getHeader()) |
| 503 | << " Versioned loop for LICM." |
| 504 | << " Number of runtime checks we had to insert " |
| 505 | << NV("RuntimeChecks" , LAI->getNumRuntimePointerChecks()); |
| 506 | }); |
| 507 | return true; |
| 508 | } |
| 509 | |
| 510 | bool LoopVersioningLICM::run(DominatorTree *DT) { |
| 511 | // Do not do the transformation if disabled by metadata. |
| 512 | if (hasLICMVersioningTransformation(L: CurLoop) & TM_Disable) |
| 513 | return false; |
| 514 | |
| 515 | bool Changed = false; |
| 516 | |
| 517 | // Check feasiblity of LoopVersioningLICM. |
| 518 | // If versioning found to be feasible and beneficial then proceed |
| 519 | // else simply return, by cleaning up memory. |
| 520 | if (isLegalForVersioning()) { |
| 521 | // Do loop versioning. |
| 522 | // Create memcheck for memory accessed inside loop. |
| 523 | // Clone original loop, and set blocks properly. |
| 524 | LoopVersioning LVer(*LAI, LAI->getRuntimePointerChecking()->getChecks(), |
| 525 | CurLoop, &LI, DT, SE); |
| 526 | LVer.versionLoop(); |
| 527 | // Set Loop Versioning metaData for original loop. |
| 528 | addStringMetadataToLoop(TheLoop: LVer.getNonVersionedLoop(), MDString: LICMVersioningMetaData); |
| 529 | // Set Loop Versioning metaData for version loop. |
| 530 | addStringMetadataToLoop(TheLoop: LVer.getVersionedLoop(), MDString: LICMVersioningMetaData); |
| 531 | // Set "llvm.mem.parallel_loop_access" metaData to versioned loop. |
| 532 | // FIXME: "llvm.mem.parallel_loop_access" annotates memory access |
| 533 | // instructions, not loops. |
| 534 | addStringMetadataToLoop(TheLoop: LVer.getVersionedLoop(), |
| 535 | MDString: "llvm.mem.parallel_loop_access" ); |
| 536 | // Update version loop with aggressive aliasing assumption. |
| 537 | LVer.annotateLoopWithNoAlias(); |
| 538 | Changed = true; |
| 539 | } |
| 540 | return Changed; |
| 541 | } |
| 542 | |
| 543 | namespace llvm { |
| 544 | |
| 545 | PreservedAnalyses LoopVersioningLICMPass::run(Loop &L, LoopAnalysisManager &AM, |
| 546 | LoopStandardAnalysisResults &LAR, |
| 547 | LPMUpdater &U) { |
| 548 | AliasAnalysis *AA = &LAR.AA; |
| 549 | ScalarEvolution *SE = &LAR.SE; |
| 550 | DominatorTree *DT = &LAR.DT; |
| 551 | const Function *F = L.getHeader()->getParent(); |
| 552 | OptimizationRemarkEmitter ORE(F); |
| 553 | |
| 554 | LoopAccessInfoManager LAIs(*SE, *AA, *DT, LAR.LI, nullptr, nullptr); |
| 555 | if (!LoopVersioningLICM(AA, SE, &ORE, LAIs, LAR.LI, &L).run(DT)) |
| 556 | return PreservedAnalyses::all(); |
| 557 | return getLoopPassPreservedAnalyses(); |
| 558 | } |
| 559 | } // namespace llvm |
| 560 | |