| 1 | //===-- SIRegisterInfo.h - SI Register Info Interface ----------*- C++ -*--===// |
| 2 | // |
| 3 | // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. |
| 4 | // See https://llvm.org/LICENSE.txt for license information. |
| 5 | // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception |
| 6 | // |
| 7 | //===----------------------------------------------------------------------===// |
| 8 | // |
| 9 | /// \file |
| 10 | /// Interface definition for SIRegisterInfo |
| 11 | // |
| 12 | //===----------------------------------------------------------------------===// |
| 13 | |
| 14 | #ifndef LLVM_LIB_TARGET_AMDGPU_SIREGISTERINFO_H |
| 15 | #define LLVM_LIB_TARGET_AMDGPU_SIREGISTERINFO_H |
| 16 | |
| 17 | #include "llvm/ADT/BitVector.h" |
| 18 | |
| 19 | #define |
| 20 | #include "AMDGPUGenRegisterInfo.inc" |
| 21 | |
| 22 | #include "SIDefines.h" |
| 23 | |
| 24 | namespace llvm { |
| 25 | |
| 26 | class GCNSubtarget; |
| 27 | class LiveIntervals; |
| 28 | class LiveRegUnits; |
| 29 | class MachineInstrBuilder; |
| 30 | class RegisterBank; |
| 31 | struct SGPRSpillBuilder; |
| 32 | |
| 33 | /// Register allocation hint types. Helps eliminate unneeded COPY with True16 |
| 34 | namespace AMDGPURI { |
| 35 | |
| 36 | enum { Size16 = 1, Size32 = 2 }; |
| 37 | |
| 38 | } // end namespace AMDGPURI |
| 39 | |
| 40 | class SIRegisterInfo final : public AMDGPUGenRegisterInfo { |
| 41 | private: |
| 42 | const GCNSubtarget &ST; |
| 43 | bool SpillSGPRToVGPR; |
| 44 | bool isWave32; |
| 45 | BitVector RegPressureIgnoredUnits; |
| 46 | |
| 47 | /// Sub reg indexes for getRegSplitParts. |
| 48 | /// First index represents subreg size from 1 to 32 Half DWORDS. |
| 49 | /// The inner vector is sorted by bit offset. |
| 50 | /// Provided a register can be fully split with given subregs, |
| 51 | /// all elements of the inner vector combined give a full lane mask. |
| 52 | static std::array<std::vector<int16_t>, 32> RegSplitParts; |
| 53 | |
| 54 | // Table representing sub reg of given width and offset. |
| 55 | // First index is subreg size: 32, 64, 96, 128, 160, 192, 224, 256, 512. |
| 56 | // Second index is 32 different dword offsets. |
| 57 | static std::array<std::array<uint16_t, 32>, 9> SubRegFromChannelTable; |
| 58 | |
| 59 | void reserveRegisterTuples(BitVector &, MCRegister Reg) const; |
| 60 | |
| 61 | public: |
| 62 | SIRegisterInfo(const GCNSubtarget &ST); |
| 63 | |
| 64 | struct SpilledReg { |
| 65 | Register VGPR; |
| 66 | int Lane = -1; |
| 67 | |
| 68 | SpilledReg() = default; |
| 69 | SpilledReg(Register R, int L) : VGPR(R), Lane(L) {} |
| 70 | |
| 71 | bool hasLane() { return Lane != -1; } |
| 72 | bool hasReg() { return VGPR != 0; } |
| 73 | }; |
| 74 | |
| 75 | /// \returns the sub reg enum value for the given \p Channel |
| 76 | /// (e.g. getSubRegFromChannel(0) -> AMDGPU::sub0) |
| 77 | static unsigned getSubRegFromChannel(unsigned Channel, unsigned NumRegs = 1); |
| 78 | |
| 79 | bool spillSGPRToVGPR() const { |
| 80 | return SpillSGPRToVGPR; |
| 81 | } |
| 82 | |
| 83 | /// Return the largest available SGPR aligned to \p Align for the register |
| 84 | /// class \p RC. |
| 85 | MCRegister getAlignedHighSGPRForRC(const MachineFunction &MF, |
| 86 | const unsigned Align, |
| 87 | const TargetRegisterClass *RC) const; |
| 88 | |
| 89 | /// Return the end register initially reserved for the scratch buffer in case |
| 90 | /// spilling is needed. |
| 91 | MCRegister reservedPrivateSegmentBufferReg(const MachineFunction &MF) const; |
| 92 | |
| 93 | /// Return a pair of maximum numbers of VGPRs and AGPRs that meet the number |
| 94 | /// of waves per execution unit required for the function \p MF. |
| 95 | std::pair<unsigned, unsigned> |
| 96 | getMaxNumVectorRegs(const MachineFunction &MF) const; |
| 97 | |
| 98 | BitVector getReservedRegs(const MachineFunction &MF) const override; |
| 99 | bool isAsmClobberable(const MachineFunction &MF, |
| 100 | MCRegister PhysReg) const override; |
| 101 | |
| 102 | const MCPhysReg *getCalleeSavedRegs(const MachineFunction *MF) const override; |
| 103 | const MCPhysReg *getCalleeSavedRegsViaCopy(const MachineFunction *MF) const; |
| 104 | const uint32_t *getCallPreservedMask(const MachineFunction &MF, |
| 105 | CallingConv::ID) const override; |
| 106 | const uint32_t *getNoPreservedMask() const override; |
| 107 | |
| 108 | // Functions with the amdgpu_cs_chain or amdgpu_cs_chain_preserve calling |
| 109 | // conventions are free to use certain VGPRs without saving and restoring any |
| 110 | // lanes (not even inactive ones). |
| 111 | static bool isChainScratchRegister(Register VGPR); |
| 112 | |
| 113 | // Stack access is very expensive. CSRs are also the high registers, and we |
| 114 | // want to minimize the number of used registers. |
| 115 | unsigned getCSRFirstUseCost() const override { |
| 116 | return 100; |
| 117 | } |
| 118 | |
| 119 | // When building a block VGPR load, we only really transfer a subset of the |
| 120 | // registers in the block, based on a mask. Liveness analysis is not aware of |
| 121 | // the mask, so it might consider that any register in the block is available |
| 122 | // before the load and may therefore be scavenged. This is not ok for CSRs |
| 123 | // that are not clobbered, since the caller will expect them to be preserved. |
| 124 | // This method will add artificial implicit uses for those registers on the |
| 125 | // load instruction, so liveness analysis knows they're unavailable. |
| 126 | void addImplicitUsesForBlockCSRLoad(MachineInstrBuilder &MIB, |
| 127 | Register BlockReg) const; |
| 128 | |
| 129 | const TargetRegisterClass * |
| 130 | getLargestLegalSuperClass(const TargetRegisterClass *RC, |
| 131 | const MachineFunction &MF) const override; |
| 132 | |
| 133 | Register getFrameRegister(const MachineFunction &MF) const override; |
| 134 | |
| 135 | bool hasBasePointer(const MachineFunction &MF) const; |
| 136 | Register getBaseRegister() const; |
| 137 | |
| 138 | bool shouldRealignStack(const MachineFunction &MF) const override; |
| 139 | bool requiresRegisterScavenging(const MachineFunction &Fn) const override; |
| 140 | |
| 141 | bool requiresFrameIndexScavenging(const MachineFunction &MF) const override; |
| 142 | bool requiresFrameIndexReplacementScavenging( |
| 143 | const MachineFunction &MF) const override; |
| 144 | bool requiresVirtualBaseRegisters(const MachineFunction &Fn) const override; |
| 145 | |
| 146 | int64_t getScratchInstrOffset(const MachineInstr *MI) const; |
| 147 | |
| 148 | int64_t getFrameIndexInstrOffset(const MachineInstr *MI, |
| 149 | int Idx) const override; |
| 150 | |
| 151 | bool needsFrameBaseReg(MachineInstr *MI, int64_t Offset) const override; |
| 152 | |
| 153 | Register materializeFrameBaseRegister(MachineBasicBlock *MBB, int FrameIdx, |
| 154 | int64_t Offset) const override; |
| 155 | |
| 156 | void resolveFrameIndex(MachineInstr &MI, Register BaseReg, |
| 157 | int64_t Offset) const override; |
| 158 | |
| 159 | bool isFrameOffsetLegal(const MachineInstr *MI, Register BaseReg, |
| 160 | int64_t Offset) const override; |
| 161 | |
| 162 | const TargetRegisterClass *getPointerRegClass( |
| 163 | const MachineFunction &MF, unsigned Kind = 0) const override; |
| 164 | |
| 165 | /// Returns a legal register class to copy a register in the specified class |
| 166 | /// to or from. If it is possible to copy the register directly without using |
| 167 | /// a cross register class copy, return the specified RC. Returns NULL if it |
| 168 | /// is not possible to copy between two registers of the specified class. |
| 169 | const TargetRegisterClass * |
| 170 | getCrossCopyRegClass(const TargetRegisterClass *RC) const override; |
| 171 | |
| 172 | const TargetRegisterClass * |
| 173 | getRegClassForBlockOp(const MachineFunction &MF) const { |
| 174 | return &AMDGPU::VReg_1024RegClass; |
| 175 | } |
| 176 | |
| 177 | void buildVGPRSpillLoadStore(SGPRSpillBuilder &SB, int Index, int Offset, |
| 178 | bool IsLoad, bool IsKill = true) const; |
| 179 | |
| 180 | /// If \p OnlyToVGPR is true, this will only succeed if this manages to find a |
| 181 | /// free VGPR lane to spill. |
| 182 | bool spillSGPR(MachineBasicBlock::iterator MI, int FI, RegScavenger *RS, |
| 183 | SlotIndexes *Indexes = nullptr, LiveIntervals *LIS = nullptr, |
| 184 | bool OnlyToVGPR = false, |
| 185 | bool SpillToPhysVGPRLane = false) const; |
| 186 | |
| 187 | bool restoreSGPR(MachineBasicBlock::iterator MI, int FI, RegScavenger *RS, |
| 188 | SlotIndexes *Indexes = nullptr, LiveIntervals *LIS = nullptr, |
| 189 | bool OnlyToVGPR = false, |
| 190 | bool SpillToPhysVGPRLane = false) const; |
| 191 | |
| 192 | bool spillEmergencySGPR(MachineBasicBlock::iterator MI, |
| 193 | MachineBasicBlock &RestoreMBB, Register SGPR, |
| 194 | RegScavenger *RS) const; |
| 195 | |
| 196 | bool eliminateFrameIndex(MachineBasicBlock::iterator MI, int SPAdj, |
| 197 | unsigned FIOperandNum, |
| 198 | RegScavenger *RS) const override; |
| 199 | |
| 200 | bool eliminateSGPRToVGPRSpillFrameIndex( |
| 201 | MachineBasicBlock::iterator MI, int FI, RegScavenger *RS, |
| 202 | SlotIndexes *Indexes = nullptr, LiveIntervals *LIS = nullptr, |
| 203 | bool SpillToPhysVGPRLane = false) const; |
| 204 | |
| 205 | StringRef getRegAsmName(MCRegister Reg) const override; |
| 206 | |
| 207 | // Pseudo regs are not allowed |
| 208 | unsigned getHWRegIndex(MCRegister Reg) const { |
| 209 | return getEncodingValue(Reg) & 0xff; |
| 210 | } |
| 211 | |
| 212 | LLVM_READONLY |
| 213 | const TargetRegisterClass *getVGPRClassForBitWidth(unsigned BitWidth) const; |
| 214 | |
| 215 | LLVM_READONLY |
| 216 | const TargetRegisterClass *getAGPRClassForBitWidth(unsigned BitWidth) const; |
| 217 | |
| 218 | LLVM_READONLY |
| 219 | const TargetRegisterClass * |
| 220 | getVectorSuperClassForBitWidth(unsigned BitWidth) const; |
| 221 | |
| 222 | LLVM_READONLY |
| 223 | static const TargetRegisterClass *getSGPRClassForBitWidth(unsigned BitWidth); |
| 224 | |
| 225 | /// \returns true if this class contains only SGPR registers |
| 226 | static bool isSGPRClass(const TargetRegisterClass *RC) { |
| 227 | return hasSGPRs(RC) && !hasVGPRs(RC) && !hasAGPRs(RC); |
| 228 | } |
| 229 | |
| 230 | /// \returns true if this class ID contains only SGPR registers |
| 231 | bool isSGPRClassID(unsigned RCID) const { |
| 232 | return isSGPRClass(RC: getRegClass(RCID)); |
| 233 | } |
| 234 | |
| 235 | bool isSGPRReg(const MachineRegisterInfo &MRI, Register Reg) const; |
| 236 | bool isSGPRPhysReg(Register Reg) const { |
| 237 | return isSGPRClass(RC: getPhysRegBaseClass(Reg)); |
| 238 | } |
| 239 | |
| 240 | bool isVGPRPhysReg(Register Reg) const { |
| 241 | return isVGPRClass(RC: getPhysRegBaseClass(Reg)); |
| 242 | } |
| 243 | |
| 244 | /// \returns true if this class contains only VGPR registers |
| 245 | static bool isVGPRClass(const TargetRegisterClass *RC) { |
| 246 | return hasVGPRs(RC) && !hasAGPRs(RC) && !hasSGPRs(RC); |
| 247 | } |
| 248 | |
| 249 | /// \returns true if this class contains only AGPR registers |
| 250 | static bool isAGPRClass(const TargetRegisterClass *RC) { |
| 251 | return hasAGPRs(RC) && !hasVGPRs(RC) && !hasSGPRs(RC); |
| 252 | } |
| 253 | |
| 254 | /// \returns true only if this class contains both VGPR and AGPR registers |
| 255 | bool isVectorSuperClass(const TargetRegisterClass *RC) const { |
| 256 | return hasVGPRs(RC) && hasAGPRs(RC) && !hasSGPRs(RC); |
| 257 | } |
| 258 | |
| 259 | /// \returns true only if this class contains both VGPR and SGPR registers |
| 260 | bool isVSSuperClass(const TargetRegisterClass *RC) const { |
| 261 | return hasVGPRs(RC) && hasSGPRs(RC) && !hasAGPRs(RC); |
| 262 | } |
| 263 | |
| 264 | /// \returns true if this class contains VGPR registers. |
| 265 | static bool hasVGPRs(const TargetRegisterClass *RC) { |
| 266 | return RC->TSFlags & SIRCFlags::HasVGPR; |
| 267 | } |
| 268 | |
| 269 | /// \returns true if this class contains AGPR registers. |
| 270 | static bool hasAGPRs(const TargetRegisterClass *RC) { |
| 271 | return RC->TSFlags & SIRCFlags::HasAGPR; |
| 272 | } |
| 273 | |
| 274 | /// \returns true if this class contains SGPR registers. |
| 275 | static bool hasSGPRs(const TargetRegisterClass *RC) { |
| 276 | return RC->TSFlags & SIRCFlags::HasSGPR; |
| 277 | } |
| 278 | |
| 279 | /// \returns true if this class contains any vector registers. |
| 280 | static bool hasVectorRegisters(const TargetRegisterClass *RC) { |
| 281 | return hasVGPRs(RC) || hasAGPRs(RC); |
| 282 | } |
| 283 | |
| 284 | /// \returns A VGPR reg class with the same width as \p SRC |
| 285 | const TargetRegisterClass * |
| 286 | getEquivalentVGPRClass(const TargetRegisterClass *SRC) const; |
| 287 | |
| 288 | /// \returns An AGPR reg class with the same width as \p SRC |
| 289 | const TargetRegisterClass * |
| 290 | getEquivalentAGPRClass(const TargetRegisterClass *SRC) const; |
| 291 | |
| 292 | /// \returns A SGPR reg class with the same width as \p SRC |
| 293 | const TargetRegisterClass * |
| 294 | getEquivalentSGPRClass(const TargetRegisterClass *VRC) const; |
| 295 | |
| 296 | /// Returns a register class which is compatible with \p SuperRC, such that a |
| 297 | /// subregister exists with class \p SubRC with subregister index \p |
| 298 | /// SubIdx. If this is impossible (e.g., an unaligned subregister index within |
| 299 | /// a register tuple), return null. |
| 300 | const TargetRegisterClass * |
| 301 | getCompatibleSubRegClass(const TargetRegisterClass *SuperRC, |
| 302 | const TargetRegisterClass *SubRC, |
| 303 | unsigned SubIdx) const; |
| 304 | |
| 305 | /// \returns True if operands defined with this operand type can accept |
| 306 | /// a literal constant (i.e. any 32-bit immediate). |
| 307 | bool opCanUseLiteralConstant(unsigned OpType) const; |
| 308 | |
| 309 | /// \returns True if operands defined with this operand type can accept |
| 310 | /// an inline constant. i.e. An integer value in the range (-16, 64) or |
| 311 | /// -4.0f, -2.0f, -1.0f, -0.5f, 0.0f, 0.5f, 1.0f, 2.0f, 4.0f. |
| 312 | bool opCanUseInlineConstant(unsigned OpType) const; |
| 313 | |
| 314 | MCRegister findUnusedRegister(const MachineRegisterInfo &MRI, |
| 315 | const TargetRegisterClass *RC, |
| 316 | const MachineFunction &MF, |
| 317 | bool ReserveHighestVGPR = false) const; |
| 318 | |
| 319 | const TargetRegisterClass *getRegClassForReg(const MachineRegisterInfo &MRI, |
| 320 | Register Reg) const; |
| 321 | const TargetRegisterClass * |
| 322 | getRegClassForOperandReg(const MachineRegisterInfo &MRI, |
| 323 | const MachineOperand &MO) const; |
| 324 | |
| 325 | bool isVGPR(const MachineRegisterInfo &MRI, Register Reg) const; |
| 326 | bool isAGPR(const MachineRegisterInfo &MRI, Register Reg) const; |
| 327 | bool isVectorRegister(const MachineRegisterInfo &MRI, Register Reg) const { |
| 328 | return isVGPR(MRI, Reg) || isAGPR(MRI, Reg); |
| 329 | } |
| 330 | |
| 331 | // FIXME: SGPRs are assumed to be uniform, but this is not true for i1 SGPRs |
| 332 | // (such as VCC) which hold a wave-wide vector of boolean values. Examining |
| 333 | // just the register class is not suffcient; it needs to be combined with a |
| 334 | // value type. The next predicate isUniformReg() does this correctly. |
| 335 | bool isDivergentRegClass(const TargetRegisterClass *RC) const override { |
| 336 | return !isSGPRClass(RC); |
| 337 | } |
| 338 | |
| 339 | bool isUniformReg(const MachineRegisterInfo &MRI, const RegisterBankInfo &RBI, |
| 340 | Register Reg) const override; |
| 341 | |
| 342 | ArrayRef<int16_t> getRegSplitParts(const TargetRegisterClass *RC, |
| 343 | unsigned EltSize) const; |
| 344 | |
| 345 | bool shouldCoalesce(MachineInstr *MI, |
| 346 | const TargetRegisterClass *SrcRC, |
| 347 | unsigned SubReg, |
| 348 | const TargetRegisterClass *DstRC, |
| 349 | unsigned DstSubReg, |
| 350 | const TargetRegisterClass *NewRC, |
| 351 | LiveIntervals &LIS) const override; |
| 352 | |
| 353 | unsigned getRegPressureLimit(const TargetRegisterClass *RC, |
| 354 | MachineFunction &MF) const override; |
| 355 | |
| 356 | unsigned getRegPressureSetLimit(const MachineFunction &MF, |
| 357 | unsigned Idx) const override; |
| 358 | |
| 359 | bool getRegAllocationHints(Register VirtReg, ArrayRef<MCPhysReg> Order, |
| 360 | SmallVectorImpl<MCPhysReg> &Hints, |
| 361 | const MachineFunction &MF, const VirtRegMap *VRM, |
| 362 | const LiveRegMatrix *Matrix) const override; |
| 363 | |
| 364 | const int *getRegUnitPressureSets(unsigned RegUnit) const override; |
| 365 | |
| 366 | MCRegister getReturnAddressReg(const MachineFunction &MF) const; |
| 367 | |
| 368 | const TargetRegisterClass * |
| 369 | getRegClassForSizeOnBank(unsigned Size, const RegisterBank &Bank) const; |
| 370 | |
| 371 | const TargetRegisterClass * |
| 372 | getRegClassForTypeOnBank(LLT Ty, const RegisterBank &Bank) const { |
| 373 | return getRegClassForSizeOnBank(Size: Ty.getSizeInBits(), Bank); |
| 374 | } |
| 375 | |
| 376 | const TargetRegisterClass * |
| 377 | getConstrainedRegClassForOperand(const MachineOperand &MO, |
| 378 | const MachineRegisterInfo &MRI) const override; |
| 379 | |
| 380 | const TargetRegisterClass *getBoolRC() const { |
| 381 | return isWave32 ? &AMDGPU::SReg_32RegClass |
| 382 | : &AMDGPU::SReg_64RegClass; |
| 383 | } |
| 384 | |
| 385 | const TargetRegisterClass *getWaveMaskRegClass() const { |
| 386 | return isWave32 ? &AMDGPU::SReg_32_XM0_XEXECRegClass |
| 387 | : &AMDGPU::SReg_64_XEXECRegClass; |
| 388 | } |
| 389 | |
| 390 | // Return the appropriate register class to use for 64-bit VGPRs for the |
| 391 | // subtarget. |
| 392 | const TargetRegisterClass *getVGPR64Class() const; |
| 393 | |
| 394 | MCRegister getVCC() const; |
| 395 | |
| 396 | MCRegister getExec() const; |
| 397 | |
| 398 | const TargetRegisterClass *getRegClass(unsigned RCID) const; |
| 399 | |
| 400 | // Find reaching register definition |
| 401 | MachineInstr *findReachingDef(Register Reg, unsigned SubReg, |
| 402 | MachineInstr &Use, |
| 403 | MachineRegisterInfo &MRI, |
| 404 | LiveIntervals *LIS) const; |
| 405 | |
| 406 | const uint32_t *getAllVGPRRegMask() const; |
| 407 | const uint32_t *getAllAGPRRegMask() const; |
| 408 | const uint32_t *getAllVectorRegMask() const; |
| 409 | const uint32_t *getAllAllocatableSRegMask() const; |
| 410 | |
| 411 | // \returns number of 32 bit registers covered by a \p LM |
| 412 | static unsigned getNumCoveredRegs(LaneBitmask LM) { |
| 413 | // The assumption is that every lo16 subreg is an even bit and every hi16 |
| 414 | // is an adjacent odd bit or vice versa. |
| 415 | uint64_t Mask = LM.getAsInteger(); |
| 416 | uint64_t Even = Mask & 0xAAAAAAAAAAAAAAAAULL; |
| 417 | Mask = (Even >> 1) | Mask; |
| 418 | uint64_t Odd = Mask & 0x5555555555555555ULL; |
| 419 | return llvm::popcount(Value: Odd); |
| 420 | } |
| 421 | |
| 422 | // \returns a DWORD offset of a \p SubReg |
| 423 | unsigned getChannelFromSubReg(unsigned SubReg) const { |
| 424 | return SubReg ? (getSubRegIdxOffset(Idx: SubReg) + 31) / 32 : 0; |
| 425 | } |
| 426 | |
| 427 | // \returns a DWORD size of a \p SubReg |
| 428 | unsigned getNumChannelsFromSubReg(unsigned SubReg) const { |
| 429 | return getNumCoveredRegs(LM: getSubRegIndexLaneMask(SubIdx: SubReg)); |
| 430 | } |
| 431 | |
| 432 | // For a given 16 bit \p Reg \returns a 32 bit register holding it. |
| 433 | // \returns \p Reg otherwise. |
| 434 | MCPhysReg get32BitRegister(MCPhysReg Reg) const; |
| 435 | |
| 436 | // Returns true if a given register class is properly aligned for |
| 437 | // the subtarget. |
| 438 | bool isProperlyAlignedRC(const TargetRegisterClass &RC) const; |
| 439 | |
| 440 | // Given \p RC returns corresponding aligned register class if required |
| 441 | // by the subtarget. |
| 442 | const TargetRegisterClass * |
| 443 | getProperlyAlignedRC(const TargetRegisterClass *RC) const; |
| 444 | |
| 445 | /// Return all SGPR128 which satisfy the waves per execution unit requirement |
| 446 | /// of the subtarget. |
| 447 | ArrayRef<MCPhysReg> getAllSGPR128(const MachineFunction &MF) const; |
| 448 | |
| 449 | /// Return all SGPR64 which satisfy the waves per execution unit requirement |
| 450 | /// of the subtarget. |
| 451 | ArrayRef<MCPhysReg> getAllSGPR64(const MachineFunction &MF) const; |
| 452 | |
| 453 | /// Return all SGPR32 which satisfy the waves per execution unit requirement |
| 454 | /// of the subtarget. |
| 455 | ArrayRef<MCPhysReg> getAllSGPR32(const MachineFunction &MF) const; |
| 456 | |
| 457 | // Insert spill or restore instructions. |
| 458 | // When lowering spill pseudos, the RegScavenger should be set. |
| 459 | // For creating spill instructions during frame lowering, where no scavenger |
| 460 | // is available, LiveUnits can be used. |
| 461 | void buildSpillLoadStore(MachineBasicBlock &MBB, |
| 462 | MachineBasicBlock::iterator MI, const DebugLoc &DL, |
| 463 | unsigned LoadStoreOp, int Index, Register ValueReg, |
| 464 | bool ValueIsKill, MCRegister ScratchOffsetReg, |
| 465 | int64_t InstrOffset, MachineMemOperand *MMO, |
| 466 | RegScavenger *RS, |
| 467 | LiveRegUnits *LiveUnits = nullptr) const; |
| 468 | |
| 469 | // Return alignment in register file of first register in a register tuple. |
| 470 | unsigned getRegClassAlignmentNumBits(const TargetRegisterClass *RC) const { |
| 471 | return (RC->TSFlags & SIRCFlags::RegTupleAlignUnitsMask) * 32; |
| 472 | } |
| 473 | |
| 474 | // Check if register class RC has required alignment. |
| 475 | bool isRegClassAligned(const TargetRegisterClass *RC, |
| 476 | unsigned AlignNumBits) const { |
| 477 | assert(AlignNumBits != 0); |
| 478 | unsigned RCAlign = getRegClassAlignmentNumBits(RC); |
| 479 | return RCAlign == AlignNumBits || |
| 480 | (RCAlign > AlignNumBits && (RCAlign % AlignNumBits) == 0); |
| 481 | } |
| 482 | |
| 483 | // Return alignment of a SubReg relative to start of a register in RC class. |
| 484 | // No check if the subreg is supported by the current RC is made. |
| 485 | unsigned getSubRegAlignmentNumBits(const TargetRegisterClass *RC, |
| 486 | unsigned SubReg) const; |
| 487 | |
| 488 | // \returns a number of registers of a given \p RC used in a function. |
| 489 | // Does not go inside function calls. |
| 490 | unsigned getNumUsedPhysRegs(const MachineRegisterInfo &MRI, |
| 491 | const TargetRegisterClass &RC) const; |
| 492 | |
| 493 | std::optional<uint8_t> getVRegFlagValue(StringRef Name) const override { |
| 494 | return Name == "WWM_REG" ? AMDGPU::VirtRegFlag::WWM_REG |
| 495 | : std::optional<uint8_t>{}; |
| 496 | } |
| 497 | |
| 498 | SmallVector<StringLiteral> |
| 499 | getVRegFlagsOfReg(Register Reg, const MachineFunction &MF) const override; |
| 500 | }; |
| 501 | |
| 502 | namespace AMDGPU { |
| 503 | /// Get the size in bits of a register from the register class \p RC. |
| 504 | unsigned getRegBitWidth(const TargetRegisterClass &RC); |
| 505 | } // namespace AMDGPU |
| 506 | |
| 507 | } // End namespace llvm |
| 508 | |
| 509 | #endif |
| 510 | |