| 1 | //===- TargetPassConfig.cpp - Target independent code generation passes ---===// |
| 2 | // |
| 3 | // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. |
| 4 | // See https://llvm.org/LICENSE.txt for license information. |
| 5 | // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception |
| 6 | // |
| 7 | //===----------------------------------------------------------------------===// |
| 8 | // |
| 9 | // This file defines interfaces to access the target independent code |
| 10 | // generation passes provided by the LLVM backend. |
| 11 | // |
| 12 | //===---------------------------------------------------------------------===// |
| 13 | |
| 14 | #include "llvm/CodeGen/TargetPassConfig.h" |
| 15 | #include "llvm/ADT/DenseMap.h" |
| 16 | #include "llvm/ADT/SmallVector.h" |
| 17 | #include "llvm/ADT/StringRef.h" |
| 18 | #include "llvm/Analysis/BasicAliasAnalysis.h" |
| 19 | #include "llvm/Analysis/CallGraphSCCPass.h" |
| 20 | #include "llvm/Analysis/ScopedNoAliasAA.h" |
| 21 | #include "llvm/Analysis/TargetTransformInfo.h" |
| 22 | #include "llvm/Analysis/TypeBasedAliasAnalysis.h" |
| 23 | #include "llvm/CodeGen/BasicBlockSectionsProfileReader.h" |
| 24 | #include "llvm/CodeGen/CSEConfigBase.h" |
| 25 | #include "llvm/CodeGen/CodeGenTargetMachineImpl.h" |
| 26 | #include "llvm/CodeGen/MachineFunctionPass.h" |
| 27 | #include "llvm/CodeGen/MachinePassRegistry.h" |
| 28 | #include "llvm/CodeGen/Passes.h" |
| 29 | #include "llvm/CodeGen/RegAllocRegistry.h" |
| 30 | #include "llvm/IR/IRPrintingPasses.h" |
| 31 | #include "llvm/IR/LegacyPassManager.h" |
| 32 | #include "llvm/IR/PassInstrumentation.h" |
| 33 | #include "llvm/IR/Verifier.h" |
| 34 | #include "llvm/InitializePasses.h" |
| 35 | #include "llvm/MC/MCAsmInfo.h" |
| 36 | #include "llvm/MC/MCTargetOptions.h" |
| 37 | #include "llvm/Pass.h" |
| 38 | #include "llvm/Support/CodeGen.h" |
| 39 | #include "llvm/Support/CommandLine.h" |
| 40 | #include "llvm/Support/Compiler.h" |
| 41 | #include "llvm/Support/Debug.h" |
| 42 | #include "llvm/Support/Discriminator.h" |
| 43 | #include "llvm/Support/ErrorHandling.h" |
| 44 | #include "llvm/Support/SaveAndRestore.h" |
| 45 | #include "llvm/Support/Threading.h" |
| 46 | #include "llvm/Support/VirtualFileSystem.h" |
| 47 | #include "llvm/Support/WithColor.h" |
| 48 | #include "llvm/Target/CGPassBuilderOption.h" |
| 49 | #include "llvm/Target/TargetMachine.h" |
| 50 | #include "llvm/Transforms/ObjCARC.h" |
| 51 | #include "llvm/Transforms/Scalar.h" |
| 52 | #include "llvm/Transforms/Utils.h" |
| 53 | #include <cassert> |
| 54 | #include <optional> |
| 55 | #include <string> |
| 56 | |
| 57 | using namespace llvm; |
| 58 | |
| 59 | static cl::opt<bool> |
| 60 | EnableIPRA("enable-ipra" , cl::init(Val: false), cl::Hidden, |
| 61 | cl::desc("Enable interprocedural register allocation " |
| 62 | "to reduce load/store at procedure calls." )); |
| 63 | static cl::opt<bool> DisablePostRASched("disable-post-ra" , cl::Hidden, |
| 64 | cl::desc("Disable Post Regalloc Scheduler" )); |
| 65 | static cl::opt<bool> DisableBranchFold("disable-branch-fold" , cl::Hidden, |
| 66 | cl::desc("Disable branch folding" )); |
| 67 | static cl::opt<bool> DisableTailDuplicate("disable-tail-duplicate" , cl::Hidden, |
| 68 | cl::desc("Disable tail duplication" )); |
| 69 | static cl::opt<bool> DisableEarlyTailDup("disable-early-taildup" , cl::Hidden, |
| 70 | cl::desc("Disable pre-register allocation tail duplication" )); |
| 71 | static cl::opt<bool> DisableBlockPlacement("disable-block-placement" , |
| 72 | cl::Hidden, cl::desc("Disable probability-driven block placement" )); |
| 73 | static cl::opt<bool> EnableBlockPlacementStats("enable-block-placement-stats" , |
| 74 | cl::Hidden, cl::desc("Collect probability-driven block placement stats" )); |
| 75 | static cl::opt<bool> DisableSSC("disable-ssc" , cl::Hidden, |
| 76 | cl::desc("Disable Stack Slot Coloring" )); |
| 77 | static cl::opt<bool> DisableMachineDCE("disable-machine-dce" , cl::Hidden, |
| 78 | cl::desc("Disable Machine Dead Code Elimination" )); |
| 79 | static cl::opt<bool> DisableEarlyIfConversion("disable-early-ifcvt" , cl::Hidden, |
| 80 | cl::desc("Disable Early If-conversion" )); |
| 81 | static cl::opt<bool> DisableMachineLICM("disable-machine-licm" , cl::Hidden, |
| 82 | cl::desc("Disable Machine LICM" )); |
| 83 | static cl::opt<bool> DisableMachineCSE("disable-machine-cse" , cl::Hidden, |
| 84 | cl::desc("Disable Machine Common Subexpression Elimination" )); |
| 85 | static cl::opt<cl::boolOrDefault> OptimizeRegAlloc( |
| 86 | "optimize-regalloc" , cl::Hidden, |
| 87 | cl::desc("Enable optimized register allocation compilation path." )); |
| 88 | static cl::opt<bool> DisablePostRAMachineLICM("disable-postra-machine-licm" , |
| 89 | cl::Hidden, |
| 90 | cl::desc("Disable Machine LICM" )); |
| 91 | static cl::opt<bool> DisableMachineSink("disable-machine-sink" , cl::Hidden, |
| 92 | cl::desc("Disable Machine Sinking" )); |
| 93 | static cl::opt<bool> DisablePostRAMachineSink("disable-postra-machine-sink" , |
| 94 | cl::Hidden, |
| 95 | cl::desc("Disable PostRA Machine Sinking" )); |
| 96 | static cl::opt<bool> DisableLSR("disable-lsr" , cl::Hidden, |
| 97 | cl::desc("Disable Loop Strength Reduction Pass" )); |
| 98 | static cl::opt<bool> DisableConstantHoisting("disable-constant-hoisting" , |
| 99 | cl::Hidden, cl::desc("Disable ConstantHoisting" )); |
| 100 | static cl::opt<bool> DisableCGP("disable-cgp" , cl::Hidden, |
| 101 | cl::desc("Disable Codegen Prepare" )); |
| 102 | static cl::opt<bool> DisableCopyProp("disable-copyprop" , cl::Hidden, |
| 103 | cl::desc("Disable Copy Propagation pass" )); |
| 104 | static cl::opt<bool> DisablePartialLibcallInlining("disable-partial-libcall-inlining" , |
| 105 | cl::Hidden, cl::desc("Disable Partial Libcall Inlining" )); |
| 106 | static cl::opt<bool> DisableAtExitBasedGlobalDtorLowering( |
| 107 | "disable-atexit-based-global-dtor-lowering" , cl::Hidden, |
| 108 | cl::desc("For MachO, disable atexit()-based global destructor lowering" )); |
| 109 | static cl::opt<bool> EnableImplicitNullChecks( |
| 110 | "enable-implicit-null-checks" , |
| 111 | cl::desc("Fold null checks into faulting memory operations" ), |
| 112 | cl::init(Val: false), cl::Hidden); |
| 113 | static cl::opt<bool> DisableMergeICmps("disable-mergeicmps" , |
| 114 | cl::desc("Disable MergeICmps Pass" ), |
| 115 | cl::init(Val: false), cl::Hidden); |
| 116 | static cl::opt<bool> |
| 117 | PrintISelInput("print-isel-input" , cl::Hidden, |
| 118 | cl::desc("Print LLVM IR input to isel pass" )); |
| 119 | static cl::opt<cl::boolOrDefault> |
| 120 | VerifyMachineCode("verify-machineinstrs" , cl::Hidden, |
| 121 | cl::desc("Verify generated machine code" )); |
| 122 | static cl::opt<cl::boolOrDefault> |
| 123 | DebugifyAndStripAll("debugify-and-strip-all-safe" , cl::Hidden, |
| 124 | cl::desc("Debugify MIR before and Strip debug after " |
| 125 | "each pass except those known to be unsafe " |
| 126 | "when debug info is present" )); |
| 127 | static cl::opt<cl::boolOrDefault> DebugifyCheckAndStripAll( |
| 128 | "debugify-check-and-strip-all-safe" , cl::Hidden, |
| 129 | cl::desc( |
| 130 | "Debugify MIR before, by checking and stripping the debug info after, " |
| 131 | "each pass except those known to be unsafe when debug info is " |
| 132 | "present" )); |
| 133 | // Enable or disable the MachineOutliner. |
| 134 | static cl::opt<RunOutliner> EnableMachineOutliner( |
| 135 | "enable-machine-outliner" , cl::desc("Enable the machine outliner" ), |
| 136 | cl::Hidden, cl::ValueOptional, cl::init(Val: RunOutliner::TargetDefault), |
| 137 | cl::values(clEnumValN(RunOutliner::AlwaysOutline, "always" , |
| 138 | "Run on all functions guaranteed to be beneficial" ), |
| 139 | clEnumValN(RunOutliner::NeverOutline, "never" , |
| 140 | "Disable all outlining" ), |
| 141 | // Sentinel value for unspecified option. |
| 142 | clEnumValN(RunOutliner::AlwaysOutline, "" , "" ))); |
| 143 | static cl::opt<bool> EnableGlobalMergeFunc( |
| 144 | "enable-global-merge-func" , cl::Hidden, |
| 145 | cl::desc("Enable global merge functions that are based on hash function" )); |
| 146 | // Disable the pass to fix unwind information. Whether the pass is included in |
| 147 | // the pipeline is controlled via the target options, this option serves as |
| 148 | // manual override. |
| 149 | static cl::opt<bool> DisableCFIFixup("disable-cfi-fixup" , cl::Hidden, |
| 150 | cl::desc("Disable the CFI fixup pass" )); |
| 151 | // Enable or disable FastISel. Both options are needed, because |
| 152 | // FastISel is enabled by default with -fast, and we wish to be |
| 153 | // able to enable or disable fast-isel independently from -O0. |
| 154 | static cl::opt<cl::boolOrDefault> |
| 155 | EnableFastISelOption("fast-isel" , cl::Hidden, |
| 156 | cl::desc("Enable the \"fast\" instruction selector" )); |
| 157 | |
| 158 | static cl::opt<cl::boolOrDefault> EnableGlobalISelOption( |
| 159 | "global-isel" , cl::Hidden, |
| 160 | cl::desc("Enable the \"global\" instruction selector" )); |
| 161 | |
| 162 | // FIXME: remove this after switching to NPM or GlobalISel, whichever gets there |
| 163 | // first... |
| 164 | static cl::opt<bool> |
| 165 | PrintAfterISel("print-after-isel" , cl::init(Val: false), cl::Hidden, |
| 166 | cl::desc("Print machine instrs after ISel" )); |
| 167 | |
| 168 | static cl::opt<GlobalISelAbortMode> EnableGlobalISelAbort( |
| 169 | "global-isel-abort" , cl::Hidden, |
| 170 | cl::desc("Enable abort calls when \"global\" instruction selection " |
| 171 | "fails to lower/select an instruction" ), |
| 172 | cl::values( |
| 173 | clEnumValN(GlobalISelAbortMode::Disable, "0" , "Disable the abort" ), |
| 174 | clEnumValN(GlobalISelAbortMode::Enable, "1" , "Enable the abort" ), |
| 175 | clEnumValN(GlobalISelAbortMode::DisableWithDiag, "2" , |
| 176 | "Disable the abort but emit a diagnostic on failure" ))); |
| 177 | |
| 178 | // Disable MIRProfileLoader before RegAlloc. This is for for debugging and |
| 179 | // tuning purpose. |
| 180 | static cl::opt<bool> DisableRAFSProfileLoader( |
| 181 | "disable-ra-fsprofile-loader" , cl::init(Val: false), cl::Hidden, |
| 182 | cl::desc("Disable MIRProfileLoader before RegAlloc" )); |
| 183 | // Disable MIRProfileLoader before BloackPlacement. This is for for debugging |
| 184 | // and tuning purpose. |
| 185 | static cl::opt<bool> DisableLayoutFSProfileLoader( |
| 186 | "disable-layout-fsprofile-loader" , cl::init(Val: false), cl::Hidden, |
| 187 | cl::desc("Disable MIRProfileLoader before BlockPlacement" )); |
| 188 | // Specify FSProfile file name. |
| 189 | static cl::opt<std::string> |
| 190 | FSProfileFile("fs-profile-file" , cl::init(Val: "" ), cl::value_desc("filename" ), |
| 191 | cl::desc("Flow Sensitive profile file name." ), cl::Hidden); |
| 192 | // Specify Remapping file for FSProfile. |
| 193 | static cl::opt<std::string> FSRemappingFile( |
| 194 | "fs-remapping-file" , cl::init(Val: "" ), cl::value_desc("filename" ), |
| 195 | cl::desc("Flow Sensitive profile remapping file name." ), cl::Hidden); |
| 196 | |
| 197 | // Temporary option to allow experimenting with MachineScheduler as a post-RA |
| 198 | // scheduler. Targets can "properly" enable this with |
| 199 | // substitutePass(&PostRASchedulerID, &PostMachineSchedulerID). |
| 200 | // Targets can return true in targetSchedulesPostRAScheduling() and |
| 201 | // insert a PostRA scheduling pass wherever it wants. |
| 202 | static cl::opt<bool> MISchedPostRA( |
| 203 | "misched-postra" , cl::Hidden, |
| 204 | cl::desc( |
| 205 | "Run MachineScheduler post regalloc (independent of preRA sched)" )); |
| 206 | |
| 207 | // Experimental option to run live interval analysis early. |
| 208 | static cl::opt<bool> EarlyLiveIntervals("early-live-intervals" , cl::Hidden, |
| 209 | cl::desc("Run live interval analysis earlier in the pipeline" )); |
| 210 | |
| 211 | static cl::opt<bool> DisableReplaceWithVecLib( |
| 212 | "disable-replace-with-vec-lib" , cl::Hidden, |
| 213 | cl::desc("Disable replace with vector math call pass" )); |
| 214 | |
| 215 | /// Option names for limiting the codegen pipeline. |
| 216 | /// Those are used in error reporting and we didn't want |
| 217 | /// to duplicate their names all over the place. |
| 218 | static const char StartAfterOptName[] = "start-after" ; |
| 219 | static const char StartBeforeOptName[] = "start-before" ; |
| 220 | static const char StopAfterOptName[] = "stop-after" ; |
| 221 | static const char StopBeforeOptName[] = "stop-before" ; |
| 222 | |
| 223 | static cl::opt<std::string> |
| 224 | StartAfterOpt(StringRef(StartAfterOptName), |
| 225 | cl::desc("Resume compilation after a specific pass" ), |
| 226 | cl::value_desc("pass-name" ), cl::init(Val: "" ), cl::Hidden); |
| 227 | |
| 228 | static cl::opt<std::string> |
| 229 | StartBeforeOpt(StringRef(StartBeforeOptName), |
| 230 | cl::desc("Resume compilation before a specific pass" ), |
| 231 | cl::value_desc("pass-name" ), cl::init(Val: "" ), cl::Hidden); |
| 232 | |
| 233 | static cl::opt<std::string> |
| 234 | StopAfterOpt(StringRef(StopAfterOptName), |
| 235 | cl::desc("Stop compilation after a specific pass" ), |
| 236 | cl::value_desc("pass-name" ), cl::init(Val: "" ), cl::Hidden); |
| 237 | |
| 238 | static cl::opt<std::string> |
| 239 | StopBeforeOpt(StringRef(StopBeforeOptName), |
| 240 | cl::desc("Stop compilation before a specific pass" ), |
| 241 | cl::value_desc("pass-name" ), cl::init(Val: "" ), cl::Hidden); |
| 242 | |
| 243 | /// Enable the machine function splitter pass. |
| 244 | static cl::opt<bool> EnableMachineFunctionSplitter( |
| 245 | "enable-split-machine-functions" , cl::Hidden, |
| 246 | cl::desc("Split out cold blocks from machine functions based on profile " |
| 247 | "information." )); |
| 248 | |
| 249 | /// Disable the expand reductions pass for testing. |
| 250 | static cl::opt<bool> DisableExpandReductions( |
| 251 | "disable-expand-reductions" , cl::init(Val: false), cl::Hidden, |
| 252 | cl::desc("Disable the expand reduction intrinsics pass from running" )); |
| 253 | |
| 254 | /// Disable the select optimization pass. |
| 255 | static cl::opt<bool> DisableSelectOptimize( |
| 256 | "disable-select-optimize" , cl::init(Val: true), cl::Hidden, |
| 257 | cl::desc("Disable the select-optimization pass from running" )); |
| 258 | |
| 259 | /// Enable garbage-collecting empty basic blocks. |
| 260 | static cl::opt<bool> |
| 261 | GCEmptyBlocks("gc-empty-basic-blocks" , cl::init(Val: false), cl::Hidden, |
| 262 | cl::desc("Enable garbage-collecting empty basic blocks" )); |
| 263 | |
| 264 | static cl::opt<bool> |
| 265 | SplitStaticData("split-static-data" , cl::Hidden, cl::init(Val: false), |
| 266 | cl::desc("Split static data sections into hot and cold " |
| 267 | "sections using profile information" )); |
| 268 | |
| 269 | /// Allow standard passes to be disabled by command line options. This supports |
| 270 | /// simple binary flags that either suppress the pass or do nothing. |
| 271 | /// i.e. -disable-mypass=false has no effect. |
| 272 | /// These should be converted to boolOrDefault in order to use applyOverride. |
| 273 | static IdentifyingPassPtr applyDisable(IdentifyingPassPtr PassID, |
| 274 | bool Override) { |
| 275 | if (Override) |
| 276 | return IdentifyingPassPtr(); |
| 277 | return PassID; |
| 278 | } |
| 279 | |
| 280 | /// Allow standard passes to be disabled by the command line, regardless of who |
| 281 | /// is adding the pass. |
| 282 | /// |
| 283 | /// StandardID is the pass identified in the standard pass pipeline and provided |
| 284 | /// to addPass(). It may be a target-specific ID in the case that the target |
| 285 | /// directly adds its own pass, but in that case we harmlessly fall through. |
| 286 | /// |
| 287 | /// TargetID is the pass that the target has configured to override StandardID. |
| 288 | /// |
| 289 | /// StandardID may be a pseudo ID. In that case TargetID is the name of the real |
| 290 | /// pass to run. This allows multiple options to control a single pass depending |
| 291 | /// on where in the pipeline that pass is added. |
| 292 | static IdentifyingPassPtr overridePass(AnalysisID StandardID, |
| 293 | IdentifyingPassPtr TargetID) { |
| 294 | if (StandardID == &PostRASchedulerID) |
| 295 | return applyDisable(PassID: TargetID, Override: DisablePostRASched); |
| 296 | |
| 297 | if (StandardID == &BranchFolderPassID) |
| 298 | return applyDisable(PassID: TargetID, Override: DisableBranchFold); |
| 299 | |
| 300 | if (StandardID == &TailDuplicateLegacyID) |
| 301 | return applyDisable(PassID: TargetID, Override: DisableTailDuplicate); |
| 302 | |
| 303 | if (StandardID == &EarlyTailDuplicateLegacyID) |
| 304 | return applyDisable(PassID: TargetID, Override: DisableEarlyTailDup); |
| 305 | |
| 306 | if (StandardID == &MachineBlockPlacementID) |
| 307 | return applyDisable(PassID: TargetID, Override: DisableBlockPlacement); |
| 308 | |
| 309 | if (StandardID == &StackSlotColoringID) |
| 310 | return applyDisable(PassID: TargetID, Override: DisableSSC); |
| 311 | |
| 312 | if (StandardID == &DeadMachineInstructionElimID) |
| 313 | return applyDisable(PassID: TargetID, Override: DisableMachineDCE); |
| 314 | |
| 315 | if (StandardID == &EarlyIfConverterLegacyID) |
| 316 | return applyDisable(PassID: TargetID, Override: DisableEarlyIfConversion); |
| 317 | |
| 318 | if (StandardID == &EarlyMachineLICMID) |
| 319 | return applyDisable(PassID: TargetID, Override: DisableMachineLICM); |
| 320 | |
| 321 | if (StandardID == &MachineCSELegacyID) |
| 322 | return applyDisable(PassID: TargetID, Override: DisableMachineCSE); |
| 323 | |
| 324 | if (StandardID == &MachineLICMID) |
| 325 | return applyDisable(PassID: TargetID, Override: DisablePostRAMachineLICM); |
| 326 | |
| 327 | if (StandardID == &MachineSinkingLegacyID) |
| 328 | return applyDisable(PassID: TargetID, Override: DisableMachineSink); |
| 329 | |
| 330 | if (StandardID == &PostRAMachineSinkingID) |
| 331 | return applyDisable(PassID: TargetID, Override: DisablePostRAMachineSink); |
| 332 | |
| 333 | if (StandardID == &MachineCopyPropagationID) |
| 334 | return applyDisable(PassID: TargetID, Override: DisableCopyProp); |
| 335 | |
| 336 | return TargetID; |
| 337 | } |
| 338 | |
| 339 | // Find the FSProfile file name. The internal option takes the precedence |
| 340 | // before getting from TargetMachine. |
| 341 | static std::string getFSProfileFile(const TargetMachine *TM) { |
| 342 | if (!FSProfileFile.empty()) |
| 343 | return FSProfileFile.getValue(); |
| 344 | const std::optional<PGOOptions> &PGOOpt = TM->getPGOOption(); |
| 345 | if (PGOOpt == std::nullopt || PGOOpt->Action != PGOOptions::SampleUse) |
| 346 | return std::string(); |
| 347 | return PGOOpt->ProfileFile; |
| 348 | } |
| 349 | |
| 350 | // Find the Profile remapping file name. The internal option takes the |
| 351 | // precedence before getting from TargetMachine. |
| 352 | static std::string getFSRemappingFile(const TargetMachine *TM) { |
| 353 | if (!FSRemappingFile.empty()) |
| 354 | return FSRemappingFile.getValue(); |
| 355 | const std::optional<PGOOptions> &PGOOpt = TM->getPGOOption(); |
| 356 | if (PGOOpt == std::nullopt || PGOOpt->Action != PGOOptions::SampleUse) |
| 357 | return std::string(); |
| 358 | return PGOOpt->ProfileRemappingFile; |
| 359 | } |
| 360 | |
| 361 | //===---------------------------------------------------------------------===// |
| 362 | /// TargetPassConfig |
| 363 | //===---------------------------------------------------------------------===// |
| 364 | |
| 365 | INITIALIZE_PASS(TargetPassConfig, "targetpassconfig" , |
| 366 | "Target Pass Configuration" , false, false) |
| 367 | char TargetPassConfig::ID = 0; |
| 368 | |
| 369 | namespace { |
| 370 | |
| 371 | struct InsertedPass { |
| 372 | AnalysisID TargetPassID; |
| 373 | IdentifyingPassPtr InsertedPassID; |
| 374 | |
| 375 | InsertedPass(AnalysisID TargetPassID, IdentifyingPassPtr InsertedPassID) |
| 376 | : TargetPassID(TargetPassID), InsertedPassID(InsertedPassID) {} |
| 377 | |
| 378 | Pass *getInsertedPass() const { |
| 379 | assert(InsertedPassID.isValid() && "Illegal Pass ID!" ); |
| 380 | if (InsertedPassID.isInstance()) |
| 381 | return InsertedPassID.getInstance(); |
| 382 | Pass *NP = Pass::createPass(ID: InsertedPassID.getID()); |
| 383 | assert(NP && "Pass ID not registered" ); |
| 384 | return NP; |
| 385 | } |
| 386 | }; |
| 387 | |
| 388 | } // end anonymous namespace |
| 389 | |
| 390 | namespace llvm { |
| 391 | |
| 392 | extern cl::opt<bool> EnableFSDiscriminator; |
| 393 | |
| 394 | class PassConfigImpl { |
| 395 | public: |
| 396 | // List of passes explicitly substituted by this target. Normally this is |
| 397 | // empty, but it is a convenient way to suppress or replace specific passes |
| 398 | // that are part of a standard pass pipeline without overridding the entire |
| 399 | // pipeline. This mechanism allows target options to inherit a standard pass's |
| 400 | // user interface. For example, a target may disable a standard pass by |
| 401 | // default by substituting a pass ID of zero, and the user may still enable |
| 402 | // that standard pass with an explicit command line option. |
| 403 | DenseMap<AnalysisID,IdentifyingPassPtr> TargetPasses; |
| 404 | |
| 405 | /// Store the pairs of <AnalysisID, AnalysisID> of which the second pass |
| 406 | /// is inserted after each instance of the first one. |
| 407 | SmallVector<InsertedPass, 4> InsertedPasses; |
| 408 | }; |
| 409 | |
| 410 | } // end namespace llvm |
| 411 | |
| 412 | // Out of line virtual method. |
| 413 | TargetPassConfig::~TargetPassConfig() { |
| 414 | delete Impl; |
| 415 | } |
| 416 | |
| 417 | static const PassInfo *getPassInfo(StringRef PassName) { |
| 418 | if (PassName.empty()) |
| 419 | return nullptr; |
| 420 | |
| 421 | const PassRegistry &PR = *PassRegistry::getPassRegistry(); |
| 422 | const PassInfo *PI = PR.getPassInfo(Arg: PassName); |
| 423 | if (!PI) |
| 424 | reportFatalUsageError(reason: Twine('\"') + Twine(PassName) + |
| 425 | Twine("\" pass is not registered." )); |
| 426 | return PI; |
| 427 | } |
| 428 | |
| 429 | static AnalysisID getPassIDFromName(StringRef PassName) { |
| 430 | const PassInfo *PI = getPassInfo(PassName); |
| 431 | return PI ? PI->getTypeInfo() : nullptr; |
| 432 | } |
| 433 | |
| 434 | static std::pair<StringRef, unsigned> |
| 435 | getPassNameAndInstanceNum(StringRef PassName) { |
| 436 | StringRef Name, InstanceNumStr; |
| 437 | std::tie(args&: Name, args&: InstanceNumStr) = PassName.split(Separator: ','); |
| 438 | |
| 439 | unsigned InstanceNum = 0; |
| 440 | if (!InstanceNumStr.empty() && InstanceNumStr.getAsInteger(Radix: 10, Result&: InstanceNum)) |
| 441 | reportFatalUsageError(reason: "invalid pass instance specifier " + PassName); |
| 442 | |
| 443 | return std::make_pair(x&: Name, y&: InstanceNum); |
| 444 | } |
| 445 | |
| 446 | void TargetPassConfig::setStartStopPasses() { |
| 447 | StringRef StartBeforeName; |
| 448 | std::tie(args&: StartBeforeName, args&: StartBeforeInstanceNum) = |
| 449 | getPassNameAndInstanceNum(PassName: StartBeforeOpt); |
| 450 | |
| 451 | StringRef StartAfterName; |
| 452 | std::tie(args&: StartAfterName, args&: StartAfterInstanceNum) = |
| 453 | getPassNameAndInstanceNum(PassName: StartAfterOpt); |
| 454 | |
| 455 | StringRef StopBeforeName; |
| 456 | std::tie(args&: StopBeforeName, args&: StopBeforeInstanceNum) |
| 457 | = getPassNameAndInstanceNum(PassName: StopBeforeOpt); |
| 458 | |
| 459 | StringRef StopAfterName; |
| 460 | std::tie(args&: StopAfterName, args&: StopAfterInstanceNum) |
| 461 | = getPassNameAndInstanceNum(PassName: StopAfterOpt); |
| 462 | |
| 463 | StartBefore = getPassIDFromName(PassName: StartBeforeName); |
| 464 | StartAfter = getPassIDFromName(PassName: StartAfterName); |
| 465 | StopBefore = getPassIDFromName(PassName: StopBeforeName); |
| 466 | StopAfter = getPassIDFromName(PassName: StopAfterName); |
| 467 | if (StartBefore && StartAfter) |
| 468 | reportFatalUsageError(reason: Twine(StartBeforeOptName) + Twine(" and " ) + |
| 469 | Twine(StartAfterOptName) + Twine(" specified!" )); |
| 470 | if (StopBefore && StopAfter) |
| 471 | reportFatalUsageError(reason: Twine(StopBeforeOptName) + Twine(" and " ) + |
| 472 | Twine(StopAfterOptName) + Twine(" specified!" )); |
| 473 | Started = (StartAfter == nullptr) && (StartBefore == nullptr); |
| 474 | } |
| 475 | |
| 476 | CGPassBuilderOption llvm::getCGPassBuilderOption() { |
| 477 | CGPassBuilderOption Opt; |
| 478 | |
| 479 | #define SET_OPTION(Option) \ |
| 480 | if (Option.getNumOccurrences()) \ |
| 481 | Opt.Option = Option; |
| 482 | |
| 483 | SET_OPTION(EnableFastISelOption) |
| 484 | SET_OPTION(EnableGlobalISelAbort) |
| 485 | SET_OPTION(EnableGlobalISelOption) |
| 486 | SET_OPTION(EnableIPRA) |
| 487 | SET_OPTION(OptimizeRegAlloc) |
| 488 | SET_OPTION(VerifyMachineCode) |
| 489 | SET_OPTION(DisableAtExitBasedGlobalDtorLowering) |
| 490 | SET_OPTION(DisableExpandReductions) |
| 491 | SET_OPTION(PrintAfterISel) |
| 492 | SET_OPTION(FSProfileFile) |
| 493 | SET_OPTION(GCEmptyBlocks) |
| 494 | |
| 495 | #define SET_BOOLEAN_OPTION(Option) Opt.Option = Option; |
| 496 | |
| 497 | SET_BOOLEAN_OPTION(EarlyLiveIntervals) |
| 498 | SET_BOOLEAN_OPTION(EnableBlockPlacementStats) |
| 499 | SET_BOOLEAN_OPTION(EnableGlobalMergeFunc) |
| 500 | SET_BOOLEAN_OPTION(EnableImplicitNullChecks) |
| 501 | SET_BOOLEAN_OPTION(EnableMachineOutliner) |
| 502 | SET_BOOLEAN_OPTION(MISchedPostRA) |
| 503 | SET_BOOLEAN_OPTION(DisableMergeICmps) |
| 504 | SET_BOOLEAN_OPTION(DisableLSR) |
| 505 | SET_BOOLEAN_OPTION(DisableConstantHoisting) |
| 506 | SET_BOOLEAN_OPTION(DisableCGP) |
| 507 | SET_BOOLEAN_OPTION(DisablePartialLibcallInlining) |
| 508 | SET_BOOLEAN_OPTION(DisableSelectOptimize) |
| 509 | SET_BOOLEAN_OPTION(PrintISelInput) |
| 510 | SET_BOOLEAN_OPTION(DebugifyAndStripAll) |
| 511 | SET_BOOLEAN_OPTION(DebugifyCheckAndStripAll) |
| 512 | SET_BOOLEAN_OPTION(DisableRAFSProfileLoader) |
| 513 | SET_BOOLEAN_OPTION(DisableCFIFixup) |
| 514 | SET_BOOLEAN_OPTION(EnableMachineFunctionSplitter) |
| 515 | |
| 516 | return Opt; |
| 517 | } |
| 518 | |
| 519 | void llvm::registerCodeGenCallback(PassInstrumentationCallbacks &PIC, |
| 520 | TargetMachine &TM) { |
| 521 | |
| 522 | // Register a callback for disabling passes. |
| 523 | PIC.registerShouldRunOptionalPassCallback(C: [](StringRef P, Any) { |
| 524 | |
| 525 | #define DISABLE_PASS(Option, Name) \ |
| 526 | if (Option && P.contains(#Name)) \ |
| 527 | return false; |
| 528 | DISABLE_PASS(DisableBlockPlacement, MachineBlockPlacementPass) |
| 529 | DISABLE_PASS(DisableBranchFold, BranchFolderPass) |
| 530 | DISABLE_PASS(DisableCopyProp, MachineCopyPropagationPass) |
| 531 | DISABLE_PASS(DisableEarlyIfConversion, EarlyIfConverterLegacyPass) |
| 532 | DISABLE_PASS(DisableEarlyTailDup, EarlyTailDuplicatePass) |
| 533 | DISABLE_PASS(DisableMachineCSE, MachineCSELegacyPass) |
| 534 | DISABLE_PASS(DisableMachineDCE, DeadMachineInstructionElimPass) |
| 535 | DISABLE_PASS(DisableMachineLICM, EarlyMachineLICMPass) |
| 536 | DISABLE_PASS(DisableMachineSink, MachineSinkingPass) |
| 537 | DISABLE_PASS(DisablePostRAMachineLICM, MachineLICMPass) |
| 538 | DISABLE_PASS(DisablePostRAMachineSink, PostRAMachineSinkingPass) |
| 539 | DISABLE_PASS(DisablePostRASched, PostRASchedulerPass) |
| 540 | DISABLE_PASS(DisableSSC, StackSlotColoringPass) |
| 541 | DISABLE_PASS(DisableTailDuplicate, TailDuplicatePass) |
| 542 | |
| 543 | return true; |
| 544 | }); |
| 545 | } |
| 546 | |
| 547 | Expected<TargetPassConfig::StartStopInfo> |
| 548 | TargetPassConfig::getStartStopInfo(PassInstrumentationCallbacks &PIC) { |
| 549 | auto [StartBefore, StartBeforeInstanceNum] = |
| 550 | getPassNameAndInstanceNum(PassName: StartBeforeOpt); |
| 551 | auto [StartAfter, StartAfterInstanceNum] = |
| 552 | getPassNameAndInstanceNum(PassName: StartAfterOpt); |
| 553 | auto [StopBefore, StopBeforeInstanceNum] = |
| 554 | getPassNameAndInstanceNum(PassName: StopBeforeOpt); |
| 555 | auto [StopAfter, StopAfterInstanceNum] = |
| 556 | getPassNameAndInstanceNum(PassName: StopAfterOpt); |
| 557 | |
| 558 | if (!StartBefore.empty() && !StartAfter.empty()) |
| 559 | return make_error<StringError>( |
| 560 | Args: Twine(StartBeforeOptName) + " and " + StartAfterOptName + " specified!" , |
| 561 | Args: std::make_error_code(e: std::errc::invalid_argument)); |
| 562 | if (!StopBefore.empty() && !StopAfter.empty()) |
| 563 | return make_error<StringError>( |
| 564 | Args: Twine(StopBeforeOptName) + " and " + StopAfterOptName + " specified!" , |
| 565 | Args: std::make_error_code(e: std::errc::invalid_argument)); |
| 566 | |
| 567 | StartStopInfo Result; |
| 568 | Result.StartPass = StartBefore.empty() ? StartAfter : StartBefore; |
| 569 | Result.StopPass = StopBefore.empty() ? StopAfter : StopBefore; |
| 570 | Result.StartInstanceNum = |
| 571 | StartBefore.empty() ? StartAfterInstanceNum : StartBeforeInstanceNum; |
| 572 | Result.StopInstanceNum = |
| 573 | StopBefore.empty() ? StopAfterInstanceNum : StopBeforeInstanceNum; |
| 574 | Result.StartAfter = !StartAfter.empty(); |
| 575 | Result.StopAfter = !StopAfter.empty(); |
| 576 | Result.StartInstanceNum += Result.StartInstanceNum == 0; |
| 577 | Result.StopInstanceNum += Result.StopInstanceNum == 0; |
| 578 | return Result; |
| 579 | } |
| 580 | |
| 581 | // Out of line constructor provides default values for pass options and |
| 582 | // registers all common codegen passes. |
| 583 | TargetPassConfig::TargetPassConfig(TargetMachine &TM, PassManagerBase &PM) |
| 584 | : ImmutablePass(ID), PM(&PM), TM(&TM) { |
| 585 | Impl = new PassConfigImpl(); |
| 586 | |
| 587 | PassRegistry &PR = *PassRegistry::getPassRegistry(); |
| 588 | // Register all target independent codegen passes to activate their PassIDs, |
| 589 | // including this pass itself. |
| 590 | initializeCodeGen(PR); |
| 591 | |
| 592 | // Also register alias analysis passes required by codegen passes. |
| 593 | initializeBasicAAWrapperPassPass(PR); |
| 594 | initializeAAResultsWrapperPassPass(PR); |
| 595 | |
| 596 | if (EnableIPRA.getNumOccurrences()) { |
| 597 | TM.Options.EnableIPRA = EnableIPRA; |
| 598 | } else { |
| 599 | // If not explicitly specified, use target default. |
| 600 | TM.Options.EnableIPRA |= TM.useIPRA(); |
| 601 | } |
| 602 | |
| 603 | if (TM.Options.EnableIPRA) |
| 604 | setRequiresCodeGenSCCOrder(); |
| 605 | |
| 606 | if (EnableGlobalISelAbort.getNumOccurrences()) |
| 607 | TM.Options.GlobalISelAbort = EnableGlobalISelAbort; |
| 608 | |
| 609 | setStartStopPasses(); |
| 610 | } |
| 611 | |
| 612 | CodeGenOptLevel TargetPassConfig::getOptLevel() const { |
| 613 | return TM->getOptLevel(); |
| 614 | } |
| 615 | |
| 616 | /// Insert InsertedPassID pass after TargetPassID. |
| 617 | void TargetPassConfig::insertPass(AnalysisID TargetPassID, |
| 618 | IdentifyingPassPtr InsertedPassID) { |
| 619 | assert(((!InsertedPassID.isInstance() && |
| 620 | TargetPassID != InsertedPassID.getID()) || |
| 621 | (InsertedPassID.isInstance() && |
| 622 | TargetPassID != InsertedPassID.getInstance()->getPassID())) && |
| 623 | "Insert a pass after itself!" ); |
| 624 | Impl->InsertedPasses.emplace_back(Args&: TargetPassID, Args&: InsertedPassID); |
| 625 | } |
| 626 | |
| 627 | /// createPassConfig - Create a pass configuration object to be used by |
| 628 | /// addPassToEmitX methods for generating a pipeline of CodeGen passes. |
| 629 | /// |
| 630 | /// Targets may override this to extend TargetPassConfig. |
| 631 | TargetPassConfig * |
| 632 | CodeGenTargetMachineImpl::createPassConfig(PassManagerBase &PM) { |
| 633 | return new TargetPassConfig(*this, PM); |
| 634 | } |
| 635 | |
| 636 | TargetPassConfig::TargetPassConfig() |
| 637 | : ImmutablePass(ID) { |
| 638 | reportFatalUsageError(reason: "trying to construct TargetPassConfig without a target " |
| 639 | "machine. Scheduling a CodeGen pass without a target " |
| 640 | "triple set?" ); |
| 641 | } |
| 642 | |
| 643 | bool TargetPassConfig::willCompleteCodeGenPipeline() { |
| 644 | return StopBeforeOpt.empty() && StopAfterOpt.empty(); |
| 645 | } |
| 646 | |
| 647 | bool TargetPassConfig::hasLimitedCodeGenPipeline() { |
| 648 | return !StartBeforeOpt.empty() || !StartAfterOpt.empty() || |
| 649 | !willCompleteCodeGenPipeline(); |
| 650 | } |
| 651 | |
| 652 | std::string TargetPassConfig::getLimitedCodeGenPipelineReason() { |
| 653 | if (!hasLimitedCodeGenPipeline()) |
| 654 | return std::string(); |
| 655 | std::string Res; |
| 656 | static cl::opt<std::string> *PassNames[] = {&StartAfterOpt, &StartBeforeOpt, |
| 657 | &StopAfterOpt, &StopBeforeOpt}; |
| 658 | static const char *OptNames[] = {StartAfterOptName, StartBeforeOptName, |
| 659 | StopAfterOptName, StopBeforeOptName}; |
| 660 | bool IsFirst = true; |
| 661 | for (int Idx = 0; Idx < 4; ++Idx) |
| 662 | if (!PassNames[Idx]->empty()) { |
| 663 | if (!IsFirst) |
| 664 | Res += " and " ; |
| 665 | IsFirst = false; |
| 666 | Res += OptNames[Idx]; |
| 667 | } |
| 668 | return Res; |
| 669 | } |
| 670 | |
| 671 | // Helper to verify the analysis is really immutable. |
| 672 | void TargetPassConfig::setOpt(bool &Opt, bool Val) { |
| 673 | assert(!Initialized && "PassConfig is immutable" ); |
| 674 | Opt = Val; |
| 675 | } |
| 676 | |
| 677 | void TargetPassConfig::substitutePass(AnalysisID StandardID, |
| 678 | IdentifyingPassPtr TargetID) { |
| 679 | Impl->TargetPasses[StandardID] = TargetID; |
| 680 | } |
| 681 | |
| 682 | IdentifyingPassPtr TargetPassConfig::getPassSubstitution(AnalysisID ID) const { |
| 683 | DenseMap<AnalysisID, IdentifyingPassPtr>::const_iterator |
| 684 | I = Impl->TargetPasses.find(Val: ID); |
| 685 | if (I == Impl->TargetPasses.end()) |
| 686 | return ID; |
| 687 | return I->second; |
| 688 | } |
| 689 | |
| 690 | bool TargetPassConfig::isPassSubstitutedOrOverridden(AnalysisID ID) const { |
| 691 | IdentifyingPassPtr TargetID = getPassSubstitution(ID); |
| 692 | IdentifyingPassPtr FinalPtr = overridePass(StandardID: ID, TargetID); |
| 693 | return !FinalPtr.isValid() || FinalPtr.isInstance() || |
| 694 | FinalPtr.getID() != ID; |
| 695 | } |
| 696 | |
| 697 | /// Add a pass to the PassManager if that pass is supposed to be run. If the |
| 698 | /// Started/Stopped flags indicate either that the compilation should start at |
| 699 | /// a later pass or that it should stop after an earlier pass, then do not add |
| 700 | /// the pass. Finally, compare the current pass against the StartAfter |
| 701 | /// and StopAfter options and change the Started/Stopped flags accordingly. |
| 702 | void TargetPassConfig::addPass(Pass *P) { |
| 703 | assert(!Initialized && "PassConfig is immutable" ); |
| 704 | |
| 705 | // Cache the Pass ID here in case the pass manager finds this pass is |
| 706 | // redundant with ones already scheduled / available, and deletes it. |
| 707 | // Fundamentally, once we add the pass to the manager, we no longer own it |
| 708 | // and shouldn't reference it. |
| 709 | AnalysisID PassID = P->getPassID(); |
| 710 | |
| 711 | if (StartBefore == PassID && StartBeforeCount++ == StartBeforeInstanceNum) |
| 712 | Started = true; |
| 713 | if (StopBefore == PassID && StopBeforeCount++ == StopBeforeInstanceNum) |
| 714 | Stopped = true; |
| 715 | if (Started && !Stopped) { |
| 716 | if (AddingMachinePasses) { |
| 717 | // Construct banner message before PM->add() as that may delete the pass. |
| 718 | std::string Banner = |
| 719 | std::string("After " ) + std::string(P->getPassName()); |
| 720 | addMachinePrePasses(); |
| 721 | PM->add(P); |
| 722 | addMachinePostPasses(Banner); |
| 723 | } else { |
| 724 | PM->add(P); |
| 725 | } |
| 726 | |
| 727 | // Add the passes after the pass P if there is any. |
| 728 | for (const auto &IP : Impl->InsertedPasses) |
| 729 | if (IP.TargetPassID == PassID) |
| 730 | addPass(P: IP.getInsertedPass()); |
| 731 | } else { |
| 732 | delete P; |
| 733 | } |
| 734 | |
| 735 | if (StopAfter == PassID && StopAfterCount++ == StopAfterInstanceNum) |
| 736 | Stopped = true; |
| 737 | |
| 738 | if (StartAfter == PassID && StartAfterCount++ == StartAfterInstanceNum) |
| 739 | Started = true; |
| 740 | if (Stopped && !Started) |
| 741 | reportFatalUsageError(reason: "Cannot stop compilation after pass that is not run" ); |
| 742 | } |
| 743 | |
| 744 | /// Add a CodeGen pass at this point in the pipeline after checking for target |
| 745 | /// and command line overrides. |
| 746 | /// |
| 747 | /// addPass cannot return a pointer to the pass instance because is internal the |
| 748 | /// PassManager and the instance we create here may already be freed. |
| 749 | AnalysisID TargetPassConfig::addPass(AnalysisID PassID) { |
| 750 | IdentifyingPassPtr TargetID = getPassSubstitution(ID: PassID); |
| 751 | IdentifyingPassPtr FinalPtr = overridePass(StandardID: PassID, TargetID); |
| 752 | if (!FinalPtr.isValid()) |
| 753 | return nullptr; |
| 754 | |
| 755 | Pass *P; |
| 756 | if (FinalPtr.isInstance()) |
| 757 | P = FinalPtr.getInstance(); |
| 758 | else { |
| 759 | P = Pass::createPass(ID: FinalPtr.getID()); |
| 760 | if (!P) |
| 761 | llvm_unreachable("Pass ID not registered" ); |
| 762 | } |
| 763 | AnalysisID FinalID = P->getPassID(); |
| 764 | addPass(P); // Ends the lifetime of P. |
| 765 | |
| 766 | return FinalID; |
| 767 | } |
| 768 | |
| 769 | void TargetPassConfig::printAndVerify(const std::string &Banner) { |
| 770 | addPrintPass(Banner); |
| 771 | addVerifyPass(Banner); |
| 772 | } |
| 773 | |
| 774 | void TargetPassConfig::addPrintPass(const std::string &Banner) { |
| 775 | if (PrintAfterISel) |
| 776 | PM->add(P: createMachineFunctionPrinterPass(OS&: dbgs(), Banner)); |
| 777 | } |
| 778 | |
| 779 | void TargetPassConfig::addVerifyPass(const std::string &Banner) { |
| 780 | bool Verify = VerifyMachineCode == cl::BOU_TRUE; |
| 781 | #ifdef EXPENSIVE_CHECKS |
| 782 | if (VerifyMachineCode == cl::BOU_UNSET) |
| 783 | Verify = TM->isMachineVerifierClean(); |
| 784 | #endif |
| 785 | if (Verify) |
| 786 | PM->add(P: createMachineVerifierPass(Banner)); |
| 787 | } |
| 788 | |
| 789 | void TargetPassConfig::addDebugifyPass() { |
| 790 | PM->add(P: createDebugifyMachineModulePass()); |
| 791 | } |
| 792 | |
| 793 | void TargetPassConfig::addStripDebugPass() { |
| 794 | PM->add(P: createStripDebugMachineModulePass(/*OnlyDebugified=*/true)); |
| 795 | } |
| 796 | |
| 797 | void TargetPassConfig::addCheckDebugPass() { |
| 798 | PM->add(P: createCheckDebugMachineModulePass()); |
| 799 | } |
| 800 | |
| 801 | void TargetPassConfig::addMachinePrePasses(bool AllowDebugify) { |
| 802 | if (AllowDebugify && DebugifyIsSafe && |
| 803 | (DebugifyAndStripAll == cl::BOU_TRUE || |
| 804 | DebugifyCheckAndStripAll == cl::BOU_TRUE)) |
| 805 | addDebugifyPass(); |
| 806 | } |
| 807 | |
| 808 | void TargetPassConfig::addMachinePostPasses(const std::string &Banner) { |
| 809 | if (DebugifyIsSafe) { |
| 810 | if (DebugifyCheckAndStripAll == cl::BOU_TRUE) { |
| 811 | addCheckDebugPass(); |
| 812 | addStripDebugPass(); |
| 813 | } else if (DebugifyAndStripAll == cl::BOU_TRUE) |
| 814 | addStripDebugPass(); |
| 815 | } |
| 816 | addVerifyPass(Banner); |
| 817 | } |
| 818 | |
| 819 | /// Add common target configurable passes that perform LLVM IR to IR transforms |
| 820 | /// following machine independent optimization. |
| 821 | void TargetPassConfig::addIRPasses() { |
| 822 | // Before running any passes, run the verifier to determine if the input |
| 823 | // coming from the front-end and/or optimizer is valid. |
| 824 | if (!DisableVerify) |
| 825 | addPass(P: createVerifierPass()); |
| 826 | |
| 827 | if (getOptLevel() != CodeGenOptLevel::None) { |
| 828 | // Basic AliasAnalysis support. |
| 829 | // Add TypeBasedAliasAnalysis before BasicAliasAnalysis so that |
| 830 | // BasicAliasAnalysis wins if they disagree. This is intended to help |
| 831 | // support "obvious" type-punning idioms. |
| 832 | addPass(P: createTypeBasedAAWrapperPass()); |
| 833 | addPass(P: createScopedNoAliasAAWrapperPass()); |
| 834 | addPass(P: createBasicAAWrapperPass()); |
| 835 | |
| 836 | // Run loop strength reduction before anything else. |
| 837 | if (!DisableLSR) { |
| 838 | addPass(P: createCanonicalizeFreezeInLoopsPass()); |
| 839 | addPass(P: createLoopStrengthReducePass()); |
| 840 | if (EnableLoopTermFold) |
| 841 | addPass(P: createLoopTermFoldPass()); |
| 842 | } |
| 843 | |
| 844 | // The MergeICmpsPass tries to create memcmp calls by grouping sequences of |
| 845 | // loads and compares. ExpandMemCmpPass then tries to expand those calls |
| 846 | // into optimally-sized loads and compares. The transforms are enabled by a |
| 847 | // target lowering hook. |
| 848 | if (!DisableMergeICmps) |
| 849 | addPass(P: createMergeICmpsLegacyPass()); |
| 850 | addPass(P: createExpandMemCmpLegacyPass()); |
| 851 | } |
| 852 | |
| 853 | // Run GC lowering passes for builtin collectors |
| 854 | // TODO: add a pass insertion point here |
| 855 | addPass(PassID: &GCLoweringID); |
| 856 | addPass(PassID: &ShadowStackGCLoweringID); |
| 857 | |
| 858 | // For MachO, lower @llvm.global_dtors into @llvm.global_ctors with |
| 859 | // __cxa_atexit() calls to avoid emitting the deprecated __mod_term_func. |
| 860 | if (TM->getTargetTriple().isOSBinFormatMachO() && |
| 861 | !DisableAtExitBasedGlobalDtorLowering) |
| 862 | addPass(P: createLowerGlobalDtorsLegacyPass()); |
| 863 | |
| 864 | // Make sure that no unreachable blocks are instruction selected. |
| 865 | addPass(P: createUnreachableBlockEliminationPass()); |
| 866 | |
| 867 | // Prepare expensive constants for SelectionDAG. |
| 868 | if (getOptLevel() != CodeGenOptLevel::None && !DisableConstantHoisting) |
| 869 | addPass(P: createConstantHoistingPass()); |
| 870 | |
| 871 | if (getOptLevel() != CodeGenOptLevel::None && !DisableReplaceWithVecLib) |
| 872 | addPass(P: createReplaceWithVeclibLegacyPass()); |
| 873 | |
| 874 | if (getOptLevel() != CodeGenOptLevel::None && !DisablePartialLibcallInlining) |
| 875 | addPass(P: createPartiallyInlineLibCallsPass()); |
| 876 | |
| 877 | // Instrument function entry after all inlining. |
| 878 | addPass(P: createPostInlineEntryExitInstrumenterPass()); |
| 879 | |
| 880 | // Add scalarization of target's unsupported masked memory intrinsics pass. |
| 881 | // the unsupported intrinsic will be replaced with a chain of basic blocks, |
| 882 | // that stores/loads element one-by-one if the appropriate mask bit is set. |
| 883 | addPass(P: createScalarizeMaskedMemIntrinLegacyPass()); |
| 884 | |
| 885 | // Expand reduction intrinsics into shuffle sequences if the target wants to. |
| 886 | // Allow disabling it for testing purposes. |
| 887 | if (!DisableExpandReductions) |
| 888 | addPass(P: createExpandReductionsPass()); |
| 889 | |
| 890 | // Convert conditional moves to conditional jumps when profitable. |
| 891 | if (getOptLevel() != CodeGenOptLevel::None && !DisableSelectOptimize) |
| 892 | addPass(P: createSelectOptimizePass()); |
| 893 | |
| 894 | if (EnableGlobalMergeFunc) |
| 895 | addPass(P: createGlobalMergeFuncPass()); |
| 896 | |
| 897 | if (TM->getTargetTriple().isOSWindows()) |
| 898 | addPass(P: createWindowsSecureHotPatchingPass()); |
| 899 | } |
| 900 | |
| 901 | /// Turn exception handling constructs into something the code generators can |
| 902 | /// handle. |
| 903 | void TargetPassConfig::addPassesToHandleExceptions() { |
| 904 | const MCAsmInfo *MCAI = TM->getMCAsmInfo(); |
| 905 | assert(MCAI && "No MCAsmInfo" ); |
| 906 | switch (MCAI->getExceptionHandlingType()) { |
| 907 | case ExceptionHandling::SjLj: |
| 908 | // SjLj piggy-backs on dwarf for this bit. The cleanups done apply to both |
| 909 | // Dwarf EH prepare needs to be run after SjLj prepare. Otherwise, |
| 910 | // catch info can get misplaced when a selector ends up more than one block |
| 911 | // removed from the parent invoke(s). This could happen when a landing |
| 912 | // pad is shared by multiple invokes and is also a target of a normal |
| 913 | // edge from elsewhere. |
| 914 | addPass(P: createSjLjEHPreparePass(TM)); |
| 915 | [[fallthrough]]; |
| 916 | case ExceptionHandling::DwarfCFI: |
| 917 | case ExceptionHandling::ARM: |
| 918 | case ExceptionHandling::AIX: |
| 919 | case ExceptionHandling::ZOS: |
| 920 | addPass(P: createDwarfEHPass(OptLevel: getOptLevel())); |
| 921 | break; |
| 922 | case ExceptionHandling::WinEH: |
| 923 | // We support using both GCC-style and MSVC-style exceptions on Windows, so |
| 924 | // add both preparation passes. Each pass will only actually run if it |
| 925 | // recognizes the personality function. |
| 926 | addPass(P: createWinEHPass()); |
| 927 | addPass(P: createDwarfEHPass(OptLevel: getOptLevel())); |
| 928 | break; |
| 929 | case ExceptionHandling::Wasm: |
| 930 | // Wasm EH uses Windows EH instructions, but it does not need to demote PHIs |
| 931 | // on catchpads and cleanuppads because it does not outline them into |
| 932 | // funclets. Catchswitch blocks are not lowered in SelectionDAG, so we |
| 933 | // should remove PHIs there. |
| 934 | addPass(P: createWinEHPass(/*DemoteCatchSwitchPHIOnly=*/true)); |
| 935 | addPass(P: createWasmEHPass()); |
| 936 | break; |
| 937 | case ExceptionHandling::None: |
| 938 | addPass(P: createLowerInvokePass()); |
| 939 | |
| 940 | // The lower invoke pass may create unreachable code. Remove it. |
| 941 | addPass(P: createUnreachableBlockEliminationPass()); |
| 942 | break; |
| 943 | } |
| 944 | } |
| 945 | |
| 946 | /// Add pass to prepare the LLVM IR for code generation. This should be done |
| 947 | /// before exception handling preparation passes. |
| 948 | void TargetPassConfig::addCodeGenPrepare() { |
| 949 | if (getOptLevel() != CodeGenOptLevel::None && !DisableCGP) |
| 950 | addPass(P: createCodeGenPrepareLegacyPass()); |
| 951 | } |
| 952 | |
| 953 | /// Add common passes that perform LLVM IR to IR transforms in preparation for |
| 954 | /// instruction selection. |
| 955 | void TargetPassConfig::addISelPrepare() { |
| 956 | addPreISel(); |
| 957 | |
| 958 | // Force codegen to run according to the callgraph. |
| 959 | if (requiresCodeGenSCCOrder()) |
| 960 | addPass(P: new DummyCGSCCPass); |
| 961 | |
| 962 | if (getOptLevel() != CodeGenOptLevel::None) |
| 963 | addPass(P: createObjCARCContractPass()); |
| 964 | |
| 965 | addPass(P: createCallBrPass()); |
| 966 | |
| 967 | // Add both the safe stack and the stack protection passes: each of them will |
| 968 | // only protect functions that have corresponding attributes. |
| 969 | addPass(P: createSafeStackPass()); |
| 970 | addPass(P: createStackProtectorPass()); |
| 971 | |
| 972 | if (PrintISelInput) |
| 973 | addPass(P: createPrintFunctionPass( |
| 974 | OS&: dbgs(), Banner: "\n\n*** Final LLVM Code input to ISel ***\n" )); |
| 975 | |
| 976 | // All passes which modify the LLVM IR are now complete; run the verifier |
| 977 | // to ensure that the IR is valid. |
| 978 | if (!DisableVerify) |
| 979 | addPass(P: createVerifierPass()); |
| 980 | } |
| 981 | |
| 982 | bool TargetPassConfig::addCoreISelPasses() { |
| 983 | // Enable FastISel with -fast-isel, but allow that to be overridden. |
| 984 | TM->setO0WantsFastISel(EnableFastISelOption != cl::BOU_FALSE); |
| 985 | |
| 986 | // Determine an instruction selector. |
| 987 | enum class SelectorType { SelectionDAG, FastISel, GlobalISel }; |
| 988 | SelectorType Selector; |
| 989 | |
| 990 | if (EnableFastISelOption == cl::BOU_TRUE) |
| 991 | Selector = SelectorType::FastISel; |
| 992 | else if (EnableGlobalISelOption == cl::BOU_TRUE || |
| 993 | (TM->Options.EnableGlobalISel && |
| 994 | EnableGlobalISelOption != cl::BOU_FALSE)) |
| 995 | Selector = SelectorType::GlobalISel; |
| 996 | else if (TM->getOptLevel() == CodeGenOptLevel::None && |
| 997 | TM->getO0WantsFastISel()) |
| 998 | Selector = SelectorType::FastISel; |
| 999 | else |
| 1000 | Selector = SelectorType::SelectionDAG; |
| 1001 | |
| 1002 | // Set consistently TM->Options.EnableFastISel and EnableGlobalISel. |
| 1003 | if (Selector == SelectorType::FastISel) { |
| 1004 | TM->setFastISel(true); |
| 1005 | TM->setGlobalISel(false); |
| 1006 | } else if (Selector == SelectorType::GlobalISel) { |
| 1007 | TM->setFastISel(false); |
| 1008 | TM->setGlobalISel(true); |
| 1009 | } |
| 1010 | |
| 1011 | // FIXME: Injecting into the DAGISel pipeline seems to cause issues with |
| 1012 | // analyses needing to be re-run. This can result in being unable to |
| 1013 | // schedule passes (particularly with 'Function Alias Analysis |
| 1014 | // Results'). It's not entirely clear why but AFAICT this seems to be |
| 1015 | // due to one FunctionPassManager not being able to use analyses from a |
| 1016 | // previous one. As we're injecting a ModulePass we break the usual |
| 1017 | // pass manager into two. GlobalISel with the fallback path disabled |
| 1018 | // and -run-pass seem to be unaffected. The majority of GlobalISel |
| 1019 | // testing uses -run-pass so this probably isn't too bad. |
| 1020 | SaveAndRestore SavedDebugifyIsSafe(DebugifyIsSafe); |
| 1021 | if (Selector != SelectorType::GlobalISel || !isGlobalISelAbortEnabled()) |
| 1022 | DebugifyIsSafe = false; |
| 1023 | |
| 1024 | // Add instruction selector passes for global isel if enabled. |
| 1025 | if (Selector == SelectorType::GlobalISel) { |
| 1026 | SaveAndRestore SavedAddingMachinePasses(AddingMachinePasses, true); |
| 1027 | if (addIRTranslator()) |
| 1028 | return true; |
| 1029 | |
| 1030 | addPreLegalizeMachineIR(); |
| 1031 | |
| 1032 | if (addLegalizeMachineIR()) |
| 1033 | return true; |
| 1034 | |
| 1035 | // Before running the register bank selector, ask the target if it |
| 1036 | // wants to run some passes. |
| 1037 | addPreRegBankSelect(); |
| 1038 | |
| 1039 | if (addRegBankSelect()) |
| 1040 | return true; |
| 1041 | |
| 1042 | addPreGlobalInstructionSelect(); |
| 1043 | |
| 1044 | if (addGlobalInstructionSelect()) |
| 1045 | return true; |
| 1046 | } |
| 1047 | |
| 1048 | // Pass to reset the MachineFunction if the ISel failed. Outside of the above |
| 1049 | // if so that the verifier is not added to it. |
| 1050 | if (Selector == SelectorType::GlobalISel) |
| 1051 | addPass(P: createResetMachineFunctionPass( |
| 1052 | EmitFallbackDiag: reportDiagnosticWhenGlobalISelFallback(), AbortOnFailedISel: isGlobalISelAbortEnabled())); |
| 1053 | |
| 1054 | // Run the SDAG InstSelector, providing a fallback path when we do not want to |
| 1055 | // abort on not-yet-supported input. |
| 1056 | if (Selector != SelectorType::GlobalISel || !isGlobalISelAbortEnabled()) |
| 1057 | if (addInstSelector()) |
| 1058 | return true; |
| 1059 | |
| 1060 | // Expand pseudo-instructions emitted by ISel. Don't run the verifier before |
| 1061 | // FinalizeISel. |
| 1062 | addPass(PassID: &FinalizeISelID); |
| 1063 | |
| 1064 | // Print the instruction selected machine code... |
| 1065 | printAndVerify(Banner: "After Instruction Selection" ); |
| 1066 | |
| 1067 | return false; |
| 1068 | } |
| 1069 | |
| 1070 | bool TargetPassConfig::addISelPasses() { |
| 1071 | if (TM->useEmulatedTLS()) |
| 1072 | addPass(P: createLowerEmuTLSPass()); |
| 1073 | |
| 1074 | PM->add(P: createTargetTransformInfoWrapperPass(TIRA: TM->getTargetIRAnalysis())); |
| 1075 | addPass(P: createPreISelIntrinsicLoweringPass()); |
| 1076 | addPass(P: createExpandLargeDivRemPass()); |
| 1077 | addPass(P: createExpandFpPass()); |
| 1078 | addIRPasses(); |
| 1079 | addCodeGenPrepare(); |
| 1080 | addPassesToHandleExceptions(); |
| 1081 | addISelPrepare(); |
| 1082 | |
| 1083 | return addCoreISelPasses(); |
| 1084 | } |
| 1085 | |
| 1086 | /// -regalloc=... command line option. |
| 1087 | static FunctionPass *useDefaultRegisterAllocator() { return nullptr; } |
| 1088 | static cl::opt<RegisterRegAlloc::FunctionPassCtor, false, |
| 1089 | RegisterPassParser<RegisterRegAlloc>> |
| 1090 | RegAlloc("regalloc" , cl::Hidden, cl::init(Val: &useDefaultRegisterAllocator), |
| 1091 | cl::desc("Register allocator to use" )); |
| 1092 | |
| 1093 | /// Add the complete set of target-independent postISel code generator passes. |
| 1094 | /// |
| 1095 | /// This can be read as the standard order of major LLVM CodeGen stages. Stages |
| 1096 | /// with nontrivial configuration or multiple passes are broken out below in |
| 1097 | /// add%Stage routines. |
| 1098 | /// |
| 1099 | /// Any TargetPassConfig::addXX routine may be overriden by the Target. The |
| 1100 | /// addPre/Post methods with empty header implementations allow injecting |
| 1101 | /// target-specific fixups just before or after major stages. Additionally, |
| 1102 | /// targets have the flexibility to change pass order within a stage by |
| 1103 | /// overriding default implementation of add%Stage routines below. Each |
| 1104 | /// technique has maintainability tradeoffs because alternate pass orders are |
| 1105 | /// not well supported. addPre/Post works better if the target pass is easily |
| 1106 | /// tied to a common pass. But if it has subtle dependencies on multiple passes, |
| 1107 | /// the target should override the stage instead. |
| 1108 | /// |
| 1109 | /// TODO: We could use a single addPre/Post(ID) hook to allow pass injection |
| 1110 | /// before/after any target-independent pass. But it's currently overkill. |
| 1111 | void TargetPassConfig::addMachinePasses() { |
| 1112 | AddingMachinePasses = true; |
| 1113 | |
| 1114 | // Add passes that optimize machine instructions in SSA form. |
| 1115 | if (getOptLevel() != CodeGenOptLevel::None) { |
| 1116 | addMachineSSAOptimization(); |
| 1117 | } else { |
| 1118 | // If the target requests it, assign local variables to stack slots relative |
| 1119 | // to one another and simplify frame index references where possible. |
| 1120 | addPass(PassID: &LocalStackSlotAllocationID); |
| 1121 | } |
| 1122 | |
| 1123 | if (TM->Options.EnableIPRA) |
| 1124 | addPass(P: createRegUsageInfoPropPass()); |
| 1125 | |
| 1126 | // Run pre-ra passes. |
| 1127 | addPreRegAlloc(); |
| 1128 | |
| 1129 | // Debugifying the register allocator passes seems to provoke some |
| 1130 | // non-determinism that affects CodeGen and there doesn't seem to be a point |
| 1131 | // where it becomes safe again so stop debugifying here. |
| 1132 | DebugifyIsSafe = false; |
| 1133 | |
| 1134 | // Add a FSDiscriminator pass right before RA, so that we could get |
| 1135 | // more precise SampleFDO profile for RA. |
| 1136 | if (EnableFSDiscriminator) { |
| 1137 | addPass(P: createMIRAddFSDiscriminatorsPass( |
| 1138 | P: sampleprof::FSDiscriminatorPass::Pass1)); |
| 1139 | const std::string ProfileFile = getFSProfileFile(TM); |
| 1140 | if (!ProfileFile.empty() && !DisableRAFSProfileLoader) |
| 1141 | addPass(P: createMIRProfileLoaderPass(File: ProfileFile, RemappingFile: getFSRemappingFile(TM), |
| 1142 | P: sampleprof::FSDiscriminatorPass::Pass1, |
| 1143 | FS: nullptr)); |
| 1144 | } |
| 1145 | |
| 1146 | // Run register allocation and passes that are tightly coupled with it, |
| 1147 | // including phi elimination and scheduling. |
| 1148 | if (getOptimizeRegAlloc()) |
| 1149 | addOptimizedRegAlloc(); |
| 1150 | else |
| 1151 | addFastRegAlloc(); |
| 1152 | |
| 1153 | // Run post-ra passes. |
| 1154 | addPostRegAlloc(); |
| 1155 | |
| 1156 | addPass(PassID: &RemoveRedundantDebugValuesID); |
| 1157 | |
| 1158 | addPass(PassID: &FixupStatepointCallerSavedID); |
| 1159 | |
| 1160 | // Insert prolog/epilog code. Eliminate abstract frame index references... |
| 1161 | if (getOptLevel() != CodeGenOptLevel::None) { |
| 1162 | addPass(PassID: &PostRAMachineSinkingID); |
| 1163 | addPass(PassID: &ShrinkWrapID); |
| 1164 | } |
| 1165 | |
| 1166 | // Prolog/Epilog inserter needs a TargetMachine to instantiate. But only |
| 1167 | // do so if it hasn't been disabled, substituted, or overridden. |
| 1168 | if (!isPassSubstitutedOrOverridden(ID: &PrologEpilogCodeInserterID)) |
| 1169 | addPass(P: createPrologEpilogInserterPass()); |
| 1170 | |
| 1171 | /// Add passes that optimize machine instructions after register allocation. |
| 1172 | if (getOptLevel() != CodeGenOptLevel::None) |
| 1173 | addMachineLateOptimization(); |
| 1174 | |
| 1175 | // Expand pseudo instructions before second scheduling pass. |
| 1176 | addPass(PassID: &ExpandPostRAPseudosID); |
| 1177 | |
| 1178 | // Run pre-sched2 passes. |
| 1179 | addPreSched2(); |
| 1180 | |
| 1181 | if (EnableImplicitNullChecks) |
| 1182 | addPass(PassID: &ImplicitNullChecksID); |
| 1183 | |
| 1184 | // Second pass scheduler. |
| 1185 | // Let Target optionally insert this pass by itself at some other |
| 1186 | // point. |
| 1187 | if (getOptLevel() != CodeGenOptLevel::None && |
| 1188 | !TM->targetSchedulesPostRAScheduling()) { |
| 1189 | if (MISchedPostRA) |
| 1190 | addPass(PassID: &PostMachineSchedulerID); |
| 1191 | else |
| 1192 | addPass(PassID: &PostRASchedulerID); |
| 1193 | } |
| 1194 | |
| 1195 | // GC |
| 1196 | addGCPasses(); |
| 1197 | |
| 1198 | // Basic block placement. |
| 1199 | if (getOptLevel() != CodeGenOptLevel::None) |
| 1200 | addBlockPlacement(); |
| 1201 | |
| 1202 | // Insert before XRay Instrumentation. |
| 1203 | addPass(PassID: &FEntryInserterID); |
| 1204 | |
| 1205 | addPass(PassID: &XRayInstrumentationID); |
| 1206 | addPass(PassID: &PatchableFunctionID); |
| 1207 | |
| 1208 | addPreEmitPass(); |
| 1209 | |
| 1210 | if (TM->Options.EnableIPRA) |
| 1211 | // Collect register usage information and produce a register mask of |
| 1212 | // clobbered registers, to be used to optimize call sites. |
| 1213 | addPass(P: createRegUsageInfoCollector()); |
| 1214 | |
| 1215 | // FIXME: Some backends are incompatible with running the verifier after |
| 1216 | // addPreEmitPass. Maybe only pass "false" here for those targets? |
| 1217 | addPass(PassID: &FuncletLayoutID); |
| 1218 | |
| 1219 | addPass(PassID: &RemoveLoadsIntoFakeUsesID); |
| 1220 | addPass(PassID: &StackMapLivenessID); |
| 1221 | addPass(PassID: &LiveDebugValuesID); |
| 1222 | addPass(PassID: &MachineSanitizerBinaryMetadataID); |
| 1223 | |
| 1224 | if (TM->Options.EnableMachineOutliner && |
| 1225 | getOptLevel() != CodeGenOptLevel::None && |
| 1226 | EnableMachineOutliner != RunOutliner::NeverOutline) { |
| 1227 | bool RunOnAllFunctions = |
| 1228 | (EnableMachineOutliner == RunOutliner::AlwaysOutline); |
| 1229 | bool AddOutliner = |
| 1230 | RunOnAllFunctions || TM->Options.SupportsDefaultOutlining; |
| 1231 | if (AddOutliner) |
| 1232 | addPass(P: createMachineOutlinerPass(RunOnAllFunctions)); |
| 1233 | } |
| 1234 | |
| 1235 | if (GCEmptyBlocks) |
| 1236 | addPass(P: llvm::createGCEmptyBasicBlocksPass()); |
| 1237 | |
| 1238 | if (EnableFSDiscriminator) |
| 1239 | addPass(P: createMIRAddFSDiscriminatorsPass( |
| 1240 | P: sampleprof::FSDiscriminatorPass::PassLast)); |
| 1241 | |
| 1242 | if (TM->Options.EnableMachineFunctionSplitter || |
| 1243 | EnableMachineFunctionSplitter || SplitStaticData || |
| 1244 | TM->Options.EnableStaticDataPartitioning) { |
| 1245 | const std::string ProfileFile = getFSProfileFile(TM); |
| 1246 | if (!ProfileFile.empty()) { |
| 1247 | if (EnableFSDiscriminator) { |
| 1248 | addPass(P: createMIRProfileLoaderPass( |
| 1249 | File: ProfileFile, RemappingFile: getFSRemappingFile(TM), |
| 1250 | P: sampleprof::FSDiscriminatorPass::PassLast, FS: nullptr)); |
| 1251 | } else { |
| 1252 | // Sample profile is given, but FSDiscriminator is not |
| 1253 | // enabled, this may result in performance regression. |
| 1254 | WithColor::warning() |
| 1255 | << "Using AutoFDO without FSDiscriminator for MFS may regress " |
| 1256 | "performance.\n" ; |
| 1257 | } |
| 1258 | } |
| 1259 | } |
| 1260 | |
| 1261 | // Machine function splitter uses the basic block sections feature. |
| 1262 | // When used along with `-basic-block-sections=`, the basic-block-sections |
| 1263 | // feature takes precedence. This means functions eligible for |
| 1264 | // basic-block-sections optimizations (`=all`, or `=list=` with function |
| 1265 | // included in the list profile) will get that optimization instead. |
| 1266 | if (TM->Options.EnableMachineFunctionSplitter || |
| 1267 | EnableMachineFunctionSplitter) |
| 1268 | addPass(P: createMachineFunctionSplitterPass()); |
| 1269 | |
| 1270 | if (SplitStaticData || TM->Options.EnableStaticDataPartitioning) { |
| 1271 | // The static data splitter pass is a machine function pass. and |
| 1272 | // static data annotator pass is a module-wide pass. See the file comment |
| 1273 | // in StaticDataAnnotator.cpp for the motivation. |
| 1274 | addPass(P: createStaticDataSplitterPass()); |
| 1275 | addPass(P: createStaticDataAnnotatorPass()); |
| 1276 | } |
| 1277 | // We run the BasicBlockSections pass if either we need BB sections or BB |
| 1278 | // address map (or both). |
| 1279 | if (TM->getBBSectionsType() != llvm::BasicBlockSection::None || |
| 1280 | TM->Options.BBAddrMap) { |
| 1281 | if (TM->getBBSectionsType() == llvm::BasicBlockSection::List) { |
| 1282 | addPass(P: llvm::createBasicBlockSectionsProfileReaderWrapperPass( |
| 1283 | Buf: TM->getBBSectionsFuncListBuf())); |
| 1284 | addPass(P: llvm::createBasicBlockPathCloningPass()); |
| 1285 | } |
| 1286 | addPass(P: llvm::createBasicBlockSectionsPass()); |
| 1287 | } |
| 1288 | |
| 1289 | addPostBBSections(); |
| 1290 | |
| 1291 | if (!DisableCFIFixup && TM->Options.EnableCFIFixup) |
| 1292 | addPass(P: createCFIFixup()); |
| 1293 | |
| 1294 | PM->add(P: createStackFrameLayoutAnalysisPass()); |
| 1295 | |
| 1296 | // Add passes that directly emit MI after all other MI passes. |
| 1297 | addPreEmitPass2(); |
| 1298 | |
| 1299 | AddingMachinePasses = false; |
| 1300 | } |
| 1301 | |
| 1302 | /// Add passes that optimize machine instructions in SSA form. |
| 1303 | void TargetPassConfig::addMachineSSAOptimization() { |
| 1304 | // Pre-ra tail duplication. |
| 1305 | addPass(PassID: &EarlyTailDuplicateLegacyID); |
| 1306 | |
| 1307 | // Optimize PHIs before DCE: removing dead PHI cycles may make more |
| 1308 | // instructions dead. |
| 1309 | addPass(PassID: &OptimizePHIsLegacyID); |
| 1310 | |
| 1311 | // This pass merges large allocas. StackSlotColoring is a different pass |
| 1312 | // which merges spill slots. |
| 1313 | addPass(PassID: &StackColoringLegacyID); |
| 1314 | |
| 1315 | // If the target requests it, assign local variables to stack slots relative |
| 1316 | // to one another and simplify frame index references where possible. |
| 1317 | addPass(PassID: &LocalStackSlotAllocationID); |
| 1318 | |
| 1319 | // With optimization, dead code should already be eliminated. However |
| 1320 | // there is one known exception: lowered code for arguments that are only |
| 1321 | // used by tail calls, where the tail calls reuse the incoming stack |
| 1322 | // arguments directly (see t11 in test/CodeGen/X86/sibcall.ll). |
| 1323 | addPass(PassID: &DeadMachineInstructionElimID); |
| 1324 | |
| 1325 | // Allow targets to insert passes that improve instruction level parallelism, |
| 1326 | // like if-conversion. Such passes will typically need dominator trees and |
| 1327 | // loop info, just like LICM and CSE below. |
| 1328 | addILPOpts(); |
| 1329 | |
| 1330 | addPass(PassID: &EarlyMachineLICMID); |
| 1331 | addPass(PassID: &MachineCSELegacyID); |
| 1332 | |
| 1333 | addPass(PassID: &MachineSinkingLegacyID); |
| 1334 | |
| 1335 | addPass(PassID: &PeepholeOptimizerLegacyID); |
| 1336 | // Clean-up the dead code that may have been generated by peephole |
| 1337 | // rewriting. |
| 1338 | addPass(PassID: &DeadMachineInstructionElimID); |
| 1339 | } |
| 1340 | |
| 1341 | //===---------------------------------------------------------------------===// |
| 1342 | /// Register Allocation Pass Configuration |
| 1343 | //===---------------------------------------------------------------------===// |
| 1344 | |
| 1345 | bool TargetPassConfig::getOptimizeRegAlloc() const { |
| 1346 | switch (OptimizeRegAlloc) { |
| 1347 | case cl::BOU_UNSET: |
| 1348 | return getOptLevel() != CodeGenOptLevel::None; |
| 1349 | case cl::BOU_TRUE: return true; |
| 1350 | case cl::BOU_FALSE: return false; |
| 1351 | } |
| 1352 | llvm_unreachable("Invalid optimize-regalloc state" ); |
| 1353 | } |
| 1354 | |
| 1355 | /// A dummy default pass factory indicates whether the register allocator is |
| 1356 | /// overridden on the command line. |
| 1357 | static llvm::once_flag InitializeDefaultRegisterAllocatorFlag; |
| 1358 | |
| 1359 | static RegisterRegAlloc |
| 1360 | defaultRegAlloc("default" , |
| 1361 | "pick register allocator based on -O option" , |
| 1362 | useDefaultRegisterAllocator); |
| 1363 | |
| 1364 | static void initializeDefaultRegisterAllocatorOnce() { |
| 1365 | if (!RegisterRegAlloc::getDefault()) |
| 1366 | RegisterRegAlloc::setDefault(RegAlloc); |
| 1367 | } |
| 1368 | |
| 1369 | /// Instantiate the default register allocator pass for this target for either |
| 1370 | /// the optimized or unoptimized allocation path. This will be added to the pass |
| 1371 | /// manager by addFastRegAlloc in the unoptimized case or addOptimizedRegAlloc |
| 1372 | /// in the optimized case. |
| 1373 | /// |
| 1374 | /// A target that uses the standard regalloc pass order for fast or optimized |
| 1375 | /// allocation may still override this for per-target regalloc |
| 1376 | /// selection. But -regalloc=... always takes precedence. |
| 1377 | FunctionPass *TargetPassConfig::createTargetRegisterAllocator(bool Optimized) { |
| 1378 | if (Optimized) |
| 1379 | return createGreedyRegisterAllocator(); |
| 1380 | else |
| 1381 | return createFastRegisterAllocator(); |
| 1382 | } |
| 1383 | |
| 1384 | /// Find and instantiate the register allocation pass requested by this target |
| 1385 | /// at the current optimization level. Different register allocators are |
| 1386 | /// defined as separate passes because they may require different analysis. |
| 1387 | /// |
| 1388 | /// This helper ensures that the regalloc= option is always available, |
| 1389 | /// even for targets that override the default allocator. |
| 1390 | /// |
| 1391 | /// FIXME: When MachinePassRegistry register pass IDs instead of function ptrs, |
| 1392 | /// this can be folded into addPass. |
| 1393 | FunctionPass *TargetPassConfig::createRegAllocPass(bool Optimized) { |
| 1394 | // Initialize the global default. |
| 1395 | llvm::call_once(flag&: InitializeDefaultRegisterAllocatorFlag, |
| 1396 | F&: initializeDefaultRegisterAllocatorOnce); |
| 1397 | |
| 1398 | RegisterRegAlloc::FunctionPassCtor Ctor = RegisterRegAlloc::getDefault(); |
| 1399 | if (Ctor != useDefaultRegisterAllocator) |
| 1400 | return Ctor(); |
| 1401 | |
| 1402 | // With no -regalloc= override, ask the target for a regalloc pass. |
| 1403 | return createTargetRegisterAllocator(Optimized); |
| 1404 | } |
| 1405 | |
| 1406 | bool TargetPassConfig::isCustomizedRegAlloc() { |
| 1407 | return RegAlloc != |
| 1408 | (RegisterRegAlloc::FunctionPassCtor)&useDefaultRegisterAllocator; |
| 1409 | } |
| 1410 | |
| 1411 | bool TargetPassConfig::addRegAssignAndRewriteFast() { |
| 1412 | if (RegAlloc != (RegisterRegAlloc::FunctionPassCtor)&useDefaultRegisterAllocator && |
| 1413 | RegAlloc != (RegisterRegAlloc::FunctionPassCtor)&createFastRegisterAllocator) |
| 1414 | reportFatalUsageError( |
| 1415 | reason: "Must use fast (default) register allocator for unoptimized regalloc." ); |
| 1416 | |
| 1417 | addPass(P: createRegAllocPass(Optimized: false)); |
| 1418 | |
| 1419 | // Allow targets to change the register assignments after |
| 1420 | // fast register allocation. |
| 1421 | addPostFastRegAllocRewrite(); |
| 1422 | return true; |
| 1423 | } |
| 1424 | |
| 1425 | bool TargetPassConfig::addRegAssignAndRewriteOptimized() { |
| 1426 | // Add the selected register allocation pass. |
| 1427 | addPass(P: createRegAllocPass(Optimized: true)); |
| 1428 | |
| 1429 | // Allow targets to change the register assignments before rewriting. |
| 1430 | addPreRewrite(); |
| 1431 | |
| 1432 | // Finally rewrite virtual registers. |
| 1433 | addPass(PassID: &VirtRegRewriterID); |
| 1434 | |
| 1435 | // Regalloc scoring for ML-driven eviction - noop except when learning a new |
| 1436 | // eviction policy. |
| 1437 | addPass(P: createRegAllocScoringPass()); |
| 1438 | return true; |
| 1439 | } |
| 1440 | |
| 1441 | /// Return true if the default global register allocator is in use and |
| 1442 | /// has not be overriden on the command line with '-regalloc=...' |
| 1443 | bool TargetPassConfig::usingDefaultRegAlloc() const { |
| 1444 | return RegAlloc.getNumOccurrences() == 0; |
| 1445 | } |
| 1446 | |
| 1447 | /// Add the minimum set of target-independent passes that are required for |
| 1448 | /// register allocation. No coalescing or scheduling. |
| 1449 | void TargetPassConfig::addFastRegAlloc() { |
| 1450 | addPass(PassID: &PHIEliminationID); |
| 1451 | addPass(PassID: &TwoAddressInstructionPassID); |
| 1452 | |
| 1453 | addRegAssignAndRewriteFast(); |
| 1454 | } |
| 1455 | |
| 1456 | /// Add standard target-independent passes that are tightly coupled with |
| 1457 | /// optimized register allocation, including coalescing, machine instruction |
| 1458 | /// scheduling, and register allocation itself. |
| 1459 | void TargetPassConfig::addOptimizedRegAlloc() { |
| 1460 | addPass(PassID: &DetectDeadLanesID); |
| 1461 | |
| 1462 | addPass(PassID: &InitUndefID); |
| 1463 | |
| 1464 | addPass(PassID: &ProcessImplicitDefsID); |
| 1465 | |
| 1466 | // LiveVariables currently requires pure SSA form. |
| 1467 | // |
| 1468 | // FIXME: Once TwoAddressInstruction pass no longer uses kill flags, |
| 1469 | // LiveVariables can be removed completely, and LiveIntervals can be directly |
| 1470 | // computed. (We still either need to regenerate kill flags after regalloc, or |
| 1471 | // preferably fix the scavenger to not depend on them). |
| 1472 | // FIXME: UnreachableMachineBlockElim is a dependant pass of LiveVariables. |
| 1473 | // When LiveVariables is removed this has to be removed/moved either. |
| 1474 | // Explicit addition of UnreachableMachineBlockElim allows stopping before or |
| 1475 | // after it with -stop-before/-stop-after. |
| 1476 | addPass(PassID: &UnreachableMachineBlockElimID); |
| 1477 | addPass(PassID: &LiveVariablesID); |
| 1478 | |
| 1479 | // Edge splitting is smarter with machine loop info. |
| 1480 | addPass(PassID: &MachineLoopInfoID); |
| 1481 | addPass(PassID: &PHIEliminationID); |
| 1482 | |
| 1483 | // Eventually, we want to run LiveIntervals before PHI elimination. |
| 1484 | if (EarlyLiveIntervals) |
| 1485 | addPass(PassID: &LiveIntervalsID); |
| 1486 | |
| 1487 | addPass(PassID: &TwoAddressInstructionPassID); |
| 1488 | addPass(PassID: &RegisterCoalescerID); |
| 1489 | |
| 1490 | // The machine scheduler may accidentally create disconnected components |
| 1491 | // when moving subregister definitions around, avoid this by splitting them to |
| 1492 | // separate vregs before. Splitting can also improve reg. allocation quality. |
| 1493 | addPass(PassID: &RenameIndependentSubregsID); |
| 1494 | |
| 1495 | // PreRA instruction scheduling. |
| 1496 | addPass(PassID: &MachineSchedulerID); |
| 1497 | |
| 1498 | if (addRegAssignAndRewriteOptimized()) { |
| 1499 | // Perform stack slot coloring and post-ra machine LICM. |
| 1500 | addPass(PassID: &StackSlotColoringID); |
| 1501 | |
| 1502 | // Allow targets to expand pseudo instructions depending on the choice of |
| 1503 | // registers before MachineCopyPropagation. |
| 1504 | addPostRewrite(); |
| 1505 | |
| 1506 | // Copy propagate to forward register uses and try to eliminate COPYs that |
| 1507 | // were not coalesced. |
| 1508 | addPass(PassID: &MachineCopyPropagationID); |
| 1509 | |
| 1510 | // Run post-ra machine LICM to hoist reloads / remats. |
| 1511 | // |
| 1512 | // FIXME: can this move into MachineLateOptimization? |
| 1513 | addPass(PassID: &MachineLICMID); |
| 1514 | } |
| 1515 | } |
| 1516 | |
| 1517 | //===---------------------------------------------------------------------===// |
| 1518 | /// Post RegAlloc Pass Configuration |
| 1519 | //===---------------------------------------------------------------------===// |
| 1520 | |
| 1521 | /// Add passes that optimize machine instructions after register allocation. |
| 1522 | void TargetPassConfig::addMachineLateOptimization() { |
| 1523 | // Cleanup of redundant immediate/address loads. |
| 1524 | addPass(PassID: &MachineLateInstrsCleanupID); |
| 1525 | |
| 1526 | // Branch folding must be run after regalloc and prolog/epilog insertion. |
| 1527 | addPass(PassID: &BranchFolderPassID); |
| 1528 | |
| 1529 | // Tail duplication. |
| 1530 | // Note that duplicating tail just increases code size and degrades |
| 1531 | // performance for targets that require Structured Control Flow. |
| 1532 | // In addition it can also make CFG irreducible. Thus we disable it. |
| 1533 | if (!TM->requiresStructuredCFG()) |
| 1534 | addPass(PassID: &TailDuplicateLegacyID); |
| 1535 | |
| 1536 | // Copy propagation. |
| 1537 | addPass(PassID: &MachineCopyPropagationID); |
| 1538 | } |
| 1539 | |
| 1540 | /// Add standard GC passes. |
| 1541 | bool TargetPassConfig::addGCPasses() { |
| 1542 | addPass(PassID: &GCMachineCodeAnalysisID); |
| 1543 | return true; |
| 1544 | } |
| 1545 | |
| 1546 | /// Add standard basic block placement passes. |
| 1547 | void TargetPassConfig::addBlockPlacement() { |
| 1548 | if (EnableFSDiscriminator) { |
| 1549 | addPass(P: createMIRAddFSDiscriminatorsPass( |
| 1550 | P: sampleprof::FSDiscriminatorPass::Pass2)); |
| 1551 | const std::string ProfileFile = getFSProfileFile(TM); |
| 1552 | if (!ProfileFile.empty() && !DisableLayoutFSProfileLoader) |
| 1553 | addPass(P: createMIRProfileLoaderPass(File: ProfileFile, RemappingFile: getFSRemappingFile(TM), |
| 1554 | P: sampleprof::FSDiscriminatorPass::Pass2, |
| 1555 | FS: nullptr)); |
| 1556 | } |
| 1557 | if (addPass(PassID: &MachineBlockPlacementID)) { |
| 1558 | // Run a separate pass to collect block placement statistics. |
| 1559 | if (EnableBlockPlacementStats) |
| 1560 | addPass(PassID: &MachineBlockPlacementStatsID); |
| 1561 | } |
| 1562 | } |
| 1563 | |
| 1564 | //===---------------------------------------------------------------------===// |
| 1565 | /// GlobalISel Configuration |
| 1566 | //===---------------------------------------------------------------------===// |
| 1567 | bool TargetPassConfig::isGlobalISelAbortEnabled() const { |
| 1568 | return TM->Options.GlobalISelAbort == GlobalISelAbortMode::Enable; |
| 1569 | } |
| 1570 | |
| 1571 | bool TargetPassConfig::reportDiagnosticWhenGlobalISelFallback() const { |
| 1572 | return TM->Options.GlobalISelAbort == GlobalISelAbortMode::DisableWithDiag; |
| 1573 | } |
| 1574 | |
| 1575 | bool TargetPassConfig::isGISelCSEEnabled() const { |
| 1576 | return true; |
| 1577 | } |
| 1578 | |
| 1579 | std::unique_ptr<CSEConfigBase> TargetPassConfig::getCSEConfig() const { |
| 1580 | return std::make_unique<CSEConfigBase>(); |
| 1581 | } |
| 1582 | |