| 1 | //===- Transforms/IPO/SampleProfileProbe.h ----------*- C++ -*-===// | 
|---|
| 2 | // | 
|---|
| 3 | // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. | 
|---|
| 4 | // See https://llvm.org/LICENSE.txt for license information. | 
|---|
| 5 | // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception | 
|---|
| 6 | // | 
|---|
| 7 | //===----------------------------------------------------------------------===// | 
|---|
| 8 | // | 
|---|
| 9 | /// \file | 
|---|
| 10 | /// This file provides the interface for the pseudo probe implementation for | 
|---|
| 11 | /// AutoFDO. | 
|---|
| 12 | // | 
|---|
| 13 | //===----------------------------------------------------------------------===// | 
|---|
| 14 |  | 
|---|
| 15 | #ifndef LLVM_TRANSFORMS_IPO_SAMPLEPROFILEPROBE_H | 
|---|
| 16 | #define LLVM_TRANSFORMS_IPO_SAMPLEPROFILEPROBE_H | 
|---|
| 17 |  | 
|---|
| 18 | #include "llvm/Analysis/LazyCallGraph.h" | 
|---|
| 19 | #include "llvm/IR/PassInstrumentation.h" | 
|---|
| 20 | #include "llvm/IR/PassManager.h" | 
|---|
| 21 | #include "llvm/ProfileData/SampleProf.h" | 
|---|
| 22 | #include "llvm/Support/Compiler.h" | 
|---|
| 23 | #include <unordered_map> | 
|---|
| 24 |  | 
|---|
| 25 | namespace llvm { | 
|---|
// Forward declarations of types this header only names through pointers or
// references.
class BasicBlock;
class Function;
class Instruction;
class Loop;
class Module;
class PassInstrumentationCallbacks;
class TargetMachine;
|---|
| 34 |  | 
|---|
| 35 | using namespace sampleprof; | 
|---|
| 36 | using BlockIdMap = std::unordered_map<BasicBlock *, uint32_t>; | 
|---|
| 37 | using InstructionIdMap = std::unordered_map<Instruction *, uint32_t>; | 
|---|
| 38 | // Map from tuples of Probe id and inline stack hash code to distribution | 
|---|
| 39 | // factors. | 
|---|
| 40 | using ProbeFactorMap = std::unordered_map<std::pair<uint64_t, uint64_t>, float, | 
|---|
| 41 | pair_hash<uint64_t, uint64_t>>; | 
|---|
| 42 | using FuncProbeFactorMap = StringMap<ProbeFactorMap>; | 
|---|
| 43 |  | 
|---|
| 44 |  | 
|---|
| 45 | // A pseudo probe verifier that can be run after each IR passes to detect the | 
|---|
| 46 | // violation of updating probe factors. In principle, the sum of distribution | 
|---|
| 47 | // factor for a probe should be identical before and after a pass. For a | 
|---|
| 48 | // function pass, the factor sum for a probe would be typically 100%. | 
|---|
| 49 | class PseudoProbeVerifier { | 
|---|
| 50 | public: | 
|---|
| 51 | LLVM_ABI void registerCallbacks(PassInstrumentationCallbacks &PIC); | 
|---|
| 52 |  | 
|---|
| 53 | // Implementation of pass instrumentation callbacks for new pass manager. | 
|---|
| 54 | LLVM_ABI void runAfterPass(StringRef PassID, Any IR); | 
|---|
| 55 |  | 
|---|
| 56 | private: | 
|---|
| 57 | // Allow a little bias due the rounding to integral factors. | 
|---|
| 58 | constexpr static float DistributionFactorVariance = 0.02f; | 
|---|
| 59 | // Distribution factors from last pass. | 
|---|
| 60 | FuncProbeFactorMap FunctionProbeFactors; | 
|---|
| 61 |  | 
|---|
| 62 | void collectProbeFactors(const BasicBlock *BB, ProbeFactorMap &ProbeFactors); | 
|---|
| 63 | void runAfterPass(const Module *M); | 
|---|
| 64 | void runAfterPass(const LazyCallGraph::SCC *C); | 
|---|
| 65 | void runAfterPass(const Function *F); | 
|---|
| 66 | void runAfterPass(const Loop *L); | 
|---|
| 67 | bool shouldVerifyFunction(const Function *F); | 
|---|
| 68 | void verifyProbeFactors(const Function *F, | 
|---|
| 69 | const ProbeFactorMap &ProbeFactors); | 
|---|
| 70 | }; | 
|---|
| 71 |  | 
|---|
| 72 | /// Sample profile pseudo prober. | 
|---|
| 73 | /// | 
|---|
| 74 | /// Insert pseudo probes for block sampling and value sampling. | 
|---|
| 75 | class SampleProfileProber { | 
|---|
| 76 | public: | 
|---|
| 77 | // Give an empty module id when the prober is not used for instrumentation. | 
|---|
| 78 | LLVM_ABI SampleProfileProber(Function &F); | 
|---|
| 79 | LLVM_ABI void instrumentOneFunc(Function &F, TargetMachine *TM); | 
|---|
| 80 |  | 
|---|
| 81 | private: | 
|---|
| 82 | Function *getFunction() const { return F; } | 
|---|
| 83 | uint64_t getFunctionHash() const { return FunctionHash; } | 
|---|
| 84 | uint32_t getBlockId(const BasicBlock *BB) const; | 
|---|
| 85 | uint32_t getCallsiteId(const Instruction *Call) const; | 
|---|
| 86 | void findUnreachableBlocks(DenseSet<BasicBlock *> &BlocksToIgnore); | 
|---|
| 87 | void findInvokeNormalDests(DenseSet<BasicBlock *> &InvokeNormalDests); | 
|---|
| 88 | void computeBlocksToIgnore(DenseSet<BasicBlock *> &BlocksToIgnore, | 
|---|
| 89 | DenseSet<BasicBlock *> &BlocksAndCallsToIgnore); | 
|---|
| 90 | const Instruction * | 
|---|
| 91 | getOriginalTerminator(const BasicBlock *Head, | 
|---|
| 92 | const DenseSet<BasicBlock *> &BlocksToIgnore); | 
|---|
| 93 | void computeCFGHash(const DenseSet<BasicBlock *> &BlocksToIgnore); | 
|---|
| 94 | void computeProbeId(const DenseSet<BasicBlock *> &BlocksToIgnore, | 
|---|
| 95 | const DenseSet<BasicBlock *> &BlocksAndCallsToIgnore); | 
|---|
| 96 |  | 
|---|
| 97 | Function *F; | 
|---|
| 98 |  | 
|---|
| 99 | /// The current module ID that is used to name a static object as a comdat | 
|---|
| 100 | /// group. | 
|---|
| 101 | std::string CurModuleUniqueId; | 
|---|
| 102 |  | 
|---|
| 103 | /// A CFG hash code used to identify a function code changes. | 
|---|
| 104 | uint64_t FunctionHash; | 
|---|
| 105 |  | 
|---|
| 106 | /// Map basic blocks to the their pseudo probe ids. | 
|---|
| 107 | BlockIdMap BlockProbeIds; | 
|---|
| 108 |  | 
|---|
| 109 | /// Map indirect calls to the their pseudo probe ids. | 
|---|
| 110 | InstructionIdMap CallProbeIds; | 
|---|
| 111 |  | 
|---|
| 112 | /// The ID of the last probe, Can be used to number a new probe. | 
|---|
| 113 | uint32_t LastProbeId; | 
|---|
| 114 | }; | 
|---|
| 115 |  | 
|---|
| 116 | class SampleProfileProbePass : public PassInfoMixin<SampleProfileProbePass> { | 
|---|
| 117 | TargetMachine *TM; | 
|---|
| 118 |  | 
|---|
| 119 | public: | 
|---|
| 120 | SampleProfileProbePass(TargetMachine *TM) : TM(TM) {} | 
|---|
| 121 | LLVM_ABI PreservedAnalyses run(Module &M, ModuleAnalysisManager &AM); | 
|---|
| 122 | }; | 
|---|
| 123 |  | 
|---|
| 124 | // Pseudo probe distribution factor updater. | 
|---|
| 125 | // Sample profile annotation can happen in both LTO prelink and postlink. The | 
|---|
| 126 | // postlink-time re-annotation can degrade profile quality because of prelink | 
|---|
| 127 | // code duplication transformation, such as loop unrolling, jump threading, | 
|---|
| 128 | // indirect call promotion etc. As such, samples corresponding to a source | 
|---|
| 129 | // location may be aggregated multiple times in postlink. With a concept of | 
|---|
| 130 | // distribution factor for pseudo probes, samples can be distributed among | 
|---|
| 131 | // duplicated probes reasonable based on the assumption that optimizations | 
|---|
| 132 | // duplicating code well-maintain the branch frequency information (BFI). This | 
|---|
| 133 | // pass updates distribution factors for each pseudo probe at the end of the | 
|---|
| 134 | // prelink pipeline, to reflect an estimated portion of the real execution | 
|---|
| 135 | // count. | 
|---|
| 136 | class PseudoProbeUpdatePass : public PassInfoMixin<PseudoProbeUpdatePass> { | 
|---|
| 137 | void runOnFunction(Function &F, FunctionAnalysisManager &FAM); | 
|---|
| 138 |  | 
|---|
| 139 | public: | 
|---|
| 140 | PseudoProbeUpdatePass() = default; | 
|---|
| 141 | LLVM_ABI PreservedAnalyses run(Module &M, ModuleAnalysisManager &AM); | 
|---|
| 142 | }; | 
|---|
| 143 |  | 
|---|
| 144 | } // end namespace llvm | 
|---|
| 145 | #endif // LLVM_TRANSFORMS_IPO_SAMPLEPROFILEPROBE_H | 
|---|
| 146 |  | 
|---|