| 1 | //===- AggressiveInstCombineInternal.h --------------------------*- C++ -*-===// |
| 2 | // |
| 3 | // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. |
| 4 | // See https://llvm.org/LICENSE.txt for license information. |
| 5 | // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception |
| 6 | // |
| 7 | //===----------------------------------------------------------------------===// |
| 8 | // |
| 9 | // This file implements the instruction pattern combiner classes. |
| 10 | // Currently, it handles pattern expressions for: |
| 11 | // * Truncate instruction |
| 12 | // |
| 13 | //===----------------------------------------------------------------------===// |
| 14 | |
| 15 | #ifndef LLVM_LIB_TRANSFORMS_AGGRESSIVEINSTCOMBINE_COMBINEINTERNAL_H |
| 16 | #define LLVM_LIB_TRANSFORMS_AGGRESSIVEINSTCOMBINE_COMBINEINTERNAL_H |
| 17 | |
| 18 | #include "llvm/ADT/MapVector.h" |
| 19 | #include "llvm/ADT/SmallVector.h" |
| 20 | #include "llvm/Analysis/ValueTracking.h" |
| 21 | #include "llvm/Support/KnownBits.h" |
| 22 | |
| 23 | //===----------------------------------------------------------------------===// |
| 24 | // TruncInstCombine - looks for expression graphs dominated by trunc |
| 25 | // instructions and for each eligible graph, it will create a reduced bit-width |
| 26 | // expression and replace the old expression with this new one and remove the |
| 27 | // old one. Eligible expression graph is such that: |
| 28 | // 1. Contains only supported instructions. |
| 29 | // 2. Supported leaves: ZExtInst, SExtInst, TruncInst and Constant value. |
| 30 | // 3. Can be evaluated into type with reduced legal bit-width (or Trunc type). |
| 31 | // 4. All instructions in the graph must not have users outside the graph. |
| 32 | // Only exception is for {ZExt, SExt}Inst with operand type equal to the |
| 33 | // new reduced type chosen in (3). |
| 34 | // |
| 35 | // The motivation for this optimization is that evaluating and expression using |
| 36 | // smaller bit-width is preferable, especially for vectorization where we can |
| 37 | // fit more values in one vectorized instruction. In addition, this optimization |
| 38 | // may decrease the number of cast instructions, but will not increase it. |
| 39 | //===----------------------------------------------------------------------===// |
| 40 | |
| 41 | namespace llvm { |
| 42 | class AssumptionCache; |
| 43 | class DataLayout; |
| 44 | class DominatorTree; |
| 45 | class Function; |
| 46 | class Instruction; |
| 47 | class TargetLibraryInfo; |
| 48 | class TruncInst; |
| 49 | class Type; |
| 50 | class Value; |
| 51 | |
| 52 | class TruncInstCombine { |
| 53 | AssumptionCache ∾ |
| 54 | TargetLibraryInfo &TLI; |
| 55 | const DataLayout &DL; |
| 56 | const DominatorTree &DT; |
| 57 | |
| 58 | /// List of all TruncInst instructions to be processed. |
| 59 | SmallVector<TruncInst *, 4> Worklist; |
| 60 | |
| 61 | /// Current processed TruncInst instruction. |
| 62 | TruncInst *CurrentTruncInst = nullptr; |
| 63 | |
| 64 | /// Information per each instruction in the expression graph. |
| 65 | struct Info { |
| 66 | /// Number of LSBs that are needed to generate a valid expression. |
| 67 | unsigned ValidBitWidth = 0; |
| 68 | /// Minimum number of LSBs needed to generate the ValidBitWidth. |
| 69 | unsigned MinBitWidth = 0; |
| 70 | /// The reduced value generated to replace the old instruction. |
| 71 | Value *NewValue = nullptr; |
| 72 | }; |
| 73 | /// An ordered map representing expression graph post-dominated by current |
| 74 | /// processed TruncInst. It maps each instruction in the graph to its Info |
| 75 | /// structure. The map is ordered such that each instruction appears before |
| 76 | /// all other instructions in the graph that uses it. |
| 77 | MapVector<Instruction *, Info> InstInfoMap; |
| 78 | |
| 79 | public: |
| 80 | TruncInstCombine(AssumptionCache &AC, TargetLibraryInfo &TLI, |
| 81 | const DataLayout &DL, const DominatorTree &DT) |
| 82 | : AC(AC), TLI(TLI), DL(DL), DT(DT) {} |
| 83 | |
| 84 | /// Perform TruncInst pattern optimization on given function. |
| 85 | bool run(Function &F); |
| 86 | |
| 87 | private: |
| 88 | /// Build expression graph dominated by the /p CurrentTruncInst and append it |
| 89 | /// to the InstInfoMap container. |
| 90 | /// |
| 91 | /// \return true only if succeed to generate an eligible sub expression graph. |
| 92 | bool buildTruncExpressionGraph(); |
| 93 | |
| 94 | /// Calculate the minimal allowed bit-width of the chain ending with the |
| 95 | /// currently visited truncate's operand. |
| 96 | /// |
| 97 | /// \return minimum number of bits to which the chain ending with the |
| 98 | /// truncate's operand can be shrunk to. |
| 99 | unsigned getMinBitWidth(); |
| 100 | |
| 101 | /// Build an expression graph dominated by the current processed TruncInst and |
| 102 | /// Check if it is eligible to be reduced to a smaller type. |
| 103 | /// |
| 104 | /// \return the scalar version of the new type to be used for the reduced |
| 105 | /// expression graph, or nullptr if the expression graph is not |
| 106 | /// eligible to be reduced. |
| 107 | Type *getBestTruncatedType(); |
| 108 | |
| 109 | KnownBits computeKnownBits(const Value *V) const { |
| 110 | return llvm::computeKnownBits(V, DL, AC: &AC, |
| 111 | /*CtxI=*/CxtI: cast<Instruction>(Val: CurrentTruncInst), |
| 112 | DT: &DT); |
| 113 | } |
| 114 | |
| 115 | unsigned ComputeNumSignBits(const Value *V) const { |
| 116 | return llvm::ComputeNumSignBits( |
| 117 | Op: V, DL, AC: &AC, /*CtxI=*/CxtI: cast<Instruction>(Val: CurrentTruncInst), DT: &DT); |
| 118 | } |
| 119 | |
| 120 | /// Given a \p V value and a \p SclTy scalar type return the generated reduced |
| 121 | /// value of \p V based on the type \p SclTy. |
| 122 | /// |
| 123 | /// \param V value to be reduced. |
| 124 | /// \param SclTy scalar version of new type to reduce to. |
| 125 | /// \return the new reduced value. |
| 126 | Value *getReducedOperand(Value *V, Type *SclTy); |
| 127 | |
| 128 | /// Create a new expression graph using the reduced /p SclTy type and replace |
| 129 | /// the old expression graph with it. Also erase all instructions in the old |
| 130 | /// graph, except those that are still needed outside the graph. |
| 131 | /// |
| 132 | /// \param SclTy scalar version of new type to reduce expression graph into. |
| 133 | void ReduceExpressionGraph(Type *SclTy); |
| 134 | }; |
| 135 | } // end namespace llvm. |
| 136 | |
| 137 | #endif // LLVM_LIB_TRANSFORMS_AGGRESSIVEINSTCOMBINE_COMBINEINTERNAL_H |
| 138 | |