| 1 | //===- AggressiveAntiDepBreaker.cpp - Anti-dep breaker --------------------===// |
| 2 | // |
| 3 | // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. |
| 4 | // See https://llvm.org/LICENSE.txt for license information. |
| 5 | // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception |
| 6 | // |
| 7 | //===----------------------------------------------------------------------===// |
| 8 | // |
| 9 | // This file implements the AggressiveAntiDepBreaker class, which |
| 10 | // implements register anti-dependence breaking during post-RA |
| 11 | // scheduling. It attempts to break all anti-dependencies within a |
| 12 | // block. |
| 13 | // |
| 14 | //===----------------------------------------------------------------------===// |
| 15 | |
| 16 | #include "AggressiveAntiDepBreaker.h" |
| 17 | #include "llvm/ADT/ArrayRef.h" |
| 18 | #include "llvm/ADT/SmallSet.h" |
| 19 | #include "llvm/ADT/iterator_range.h" |
| 20 | #include "llvm/CodeGen/MachineBasicBlock.h" |
| 21 | #include "llvm/CodeGen/MachineFrameInfo.h" |
| 22 | #include "llvm/CodeGen/MachineFunction.h" |
| 23 | #include "llvm/CodeGen/MachineInstr.h" |
| 24 | #include "llvm/CodeGen/MachineOperand.h" |
| 25 | #include "llvm/CodeGen/MachineRegisterInfo.h" |
| 26 | #include "llvm/CodeGen/RegisterClassInfo.h" |
| 27 | #include "llvm/CodeGen/ScheduleDAG.h" |
| 28 | #include "llvm/CodeGen/TargetInstrInfo.h" |
| 29 | #include "llvm/CodeGen/TargetRegisterInfo.h" |
| 30 | #include "llvm/CodeGenTypes/MachineValueType.h" |
| 31 | #include "llvm/MC/MCInstrDesc.h" |
| 32 | #include "llvm/MC/MCRegisterInfo.h" |
| 33 | #include "llvm/Support/CommandLine.h" |
| 34 | #include "llvm/Support/Debug.h" |
| 35 | #include "llvm/Support/raw_ostream.h" |
| 36 | #include <cassert> |
| 37 | #include <utility> |
| 38 | |
| 39 | using namespace llvm; |
| 40 | |
| 41 | #define DEBUG_TYPE "post-RA-sched" |
| 42 | |
| 43 | // If DebugDiv > 0 then only break antidep with (ID % DebugDiv) == DebugMod |
| 44 | static cl::opt<int> |
| 45 | DebugDiv("agg-antidep-debugdiv" , |
| 46 | cl::desc("Debug control for aggressive anti-dep breaker" ), |
| 47 | cl::init(Val: 0), cl::Hidden); |
| 48 | |
| 49 | static cl::opt<int> |
| 50 | DebugMod("agg-antidep-debugmod" , |
| 51 | cl::desc("Debug control for aggressive anti-dep breaker" ), |
| 52 | cl::init(Val: 0), cl::Hidden); |
| 53 | |
| 54 | AggressiveAntiDepState::AggressiveAntiDepState(const unsigned TargetRegs, |
| 55 | MachineBasicBlock *BB) |
| 56 | : NumTargetRegs(TargetRegs), GroupNodes(TargetRegs, 0), |
| 57 | GroupNodeIndices(TargetRegs, 0), KillIndices(TargetRegs, 0), |
| 58 | DefIndices(TargetRegs, 0) { |
| 59 | const unsigned BBSize = BB->size(); |
| 60 | for (unsigned i = 0; i < NumTargetRegs; ++i) { |
| 61 | // Initialize all registers to be in their own group. Initially we |
| 62 | // assign the register to the same-indexed GroupNode. |
| 63 | GroupNodeIndices[i] = i; |
| 64 | // Initialize the indices to indicate that no registers are live. |
| 65 | KillIndices[i] = ~0u; |
| 66 | DefIndices[i] = BBSize; |
| 67 | } |
| 68 | } |
| 69 | |
| 70 | unsigned AggressiveAntiDepState::GetGroup(MCRegister Reg) { |
| 71 | unsigned Node = GroupNodeIndices[Reg]; |
| 72 | while (GroupNodes[Node] != Node) |
| 73 | Node = GroupNodes[Node]; |
| 74 | |
| 75 | return Node; |
| 76 | } |
| 77 | |
| 78 | void AggressiveAntiDepState::GetGroupRegs( |
| 79 | unsigned Group, std::vector<MCRegister> &Regs, |
| 80 | std::multimap<MCRegister, AggressiveAntiDepState::RegisterReference> |
| 81 | *RegRefs) { |
| 82 | for (unsigned Reg = 0; Reg != NumTargetRegs; ++Reg) { |
| 83 | if ((GetGroup(Reg) == Group) && (RegRefs->count(x: Reg) > 0)) |
| 84 | Regs.push_back(x: Reg); |
| 85 | } |
| 86 | } |
| 87 | |
| 88 | unsigned AggressiveAntiDepState::UnionGroups(MCRegister Reg1, MCRegister Reg2) { |
| 89 | assert(GroupNodes[0] == 0 && "GroupNode 0 not parent!" ); |
| 90 | assert(GroupNodeIndices[0] == 0 && "Reg 0 not in Group 0!" ); |
| 91 | |
| 92 | // find group for each register |
| 93 | unsigned Group1 = GetGroup(Reg: Reg1); |
| 94 | unsigned Group2 = GetGroup(Reg: Reg2); |
| 95 | |
| 96 | // if either group is 0, then that must become the parent |
| 97 | unsigned Parent = (Group1 == 0) ? Group1 : Group2; |
| 98 | unsigned Other = (Parent == Group1) ? Group2 : Group1; |
| 99 | GroupNodes.at(n: Other) = Parent; |
| 100 | return Parent; |
| 101 | } |
| 102 | |
| 103 | unsigned AggressiveAntiDepState::LeaveGroup(MCRegister Reg) { |
| 104 | // Create a new GroupNode for Reg. Reg's existing GroupNode must |
| 105 | // stay as is because there could be other GroupNodes referring to |
| 106 | // it. |
| 107 | unsigned idx = GroupNodes.size(); |
| 108 | GroupNodes.push_back(x: idx); |
| 109 | GroupNodeIndices[Reg] = idx; |
| 110 | return idx; |
| 111 | } |
| 112 | |
| 113 | bool AggressiveAntiDepState::IsLive(MCRegister Reg) { |
| 114 | // KillIndex must be defined and DefIndex not defined for a register |
| 115 | // to be live. |
| 116 | return((KillIndices[Reg] != ~0u) && (DefIndices[Reg] == ~0u)); |
| 117 | } |
| 118 | |
| 119 | AggressiveAntiDepBreaker::AggressiveAntiDepBreaker( |
| 120 | MachineFunction &MFi, const RegisterClassInfo &RCI, |
| 121 | TargetSubtargetInfo::RegClassVector &CriticalPathRCs) |
| 122 | : MF(MFi), MRI(MF.getRegInfo()), TII(MF.getSubtarget().getInstrInfo()), |
| 123 | TRI(MF.getSubtarget().getRegisterInfo()), RegClassInfo(RCI) { |
| 124 | /* Collect a bitset of all registers that are only broken if they |
| 125 | are on the critical path. */ |
| 126 | for (const TargetRegisterClass *RC : CriticalPathRCs) { |
| 127 | BitVector CPSet = TRI->getAllocatableSet(MF, RC); |
| 128 | if (CriticalPathSet.none()) |
| 129 | CriticalPathSet = CPSet; |
| 130 | else |
| 131 | CriticalPathSet |= CPSet; |
| 132 | } |
| 133 | |
| 134 | LLVM_DEBUG(dbgs() << "AntiDep Critical-Path Registers:" ); |
| 135 | LLVM_DEBUG(for (unsigned r |
| 136 | : CriticalPathSet.set_bits()) dbgs() |
| 137 | << " " << printReg(r, TRI)); |
| 138 | LLVM_DEBUG(dbgs() << '\n'); |
| 139 | } |
| 140 | |
| 141 | AggressiveAntiDepBreaker::~AggressiveAntiDepBreaker() { |
| 142 | delete State; |
| 143 | } |
| 144 | |
| 145 | void AggressiveAntiDepBreaker::StartBlock(MachineBasicBlock *BB) { |
| 146 | assert(!State); |
| 147 | State = new AggressiveAntiDepState(TRI->getNumRegs(), BB); |
| 148 | |
| 149 | bool IsReturnBlock = BB->isReturnBlock(); |
| 150 | std::vector<unsigned> &KillIndices = State->GetKillIndices(); |
| 151 | std::vector<unsigned> &DefIndices = State->GetDefIndices(); |
| 152 | |
| 153 | // Examine the live-in regs of all successors. |
| 154 | for (MachineBasicBlock *Succ : BB->successors()) |
| 155 | for (const auto &LI : Succ->liveins()) { |
| 156 | for (MCRegAliasIterator AI(LI.PhysReg, TRI, true); AI.isValid(); ++AI) { |
| 157 | unsigned Reg = *AI; |
| 158 | State->UnionGroups(Reg1: Reg, Reg2: 0); |
| 159 | KillIndices[Reg] = BB->size(); |
| 160 | DefIndices[Reg] = ~0u; |
| 161 | } |
| 162 | } |
| 163 | |
| 164 | // Mark live-out callee-saved registers. In a return block this is |
| 165 | // all callee-saved registers. In non-return this is any |
| 166 | // callee-saved register that is not saved in the prolog. |
| 167 | const MachineFrameInfo &MFI = MF.getFrameInfo(); |
| 168 | BitVector Pristine = MFI.getPristineRegs(MF); |
| 169 | for (const MCPhysReg *I = MF.getRegInfo().getCalleeSavedRegs(); *I; |
| 170 | ++I) { |
| 171 | unsigned Reg = *I; |
| 172 | if (!IsReturnBlock && !Pristine.test(Idx: Reg)) |
| 173 | continue; |
| 174 | for (MCRegAliasIterator AI(Reg, TRI, true); AI.isValid(); ++AI) { |
| 175 | MCRegister AliasReg = *AI; |
| 176 | State->UnionGroups(Reg1: AliasReg, Reg2: 0); |
| 177 | KillIndices[AliasReg] = BB->size(); |
| 178 | DefIndices[AliasReg] = ~0u; |
| 179 | } |
| 180 | } |
| 181 | } |
| 182 | |
| 183 | void AggressiveAntiDepBreaker::FinishBlock() { |
| 184 | delete State; |
| 185 | State = nullptr; |
| 186 | } |
| 187 | |
| 188 | void AggressiveAntiDepBreaker::Observe(MachineInstr &MI, unsigned Count, |
| 189 | unsigned InsertPosIndex) { |
| 190 | assert(Count < InsertPosIndex && "Instruction index out of expected range!" ); |
| 191 | |
| 192 | std::set<MCRegister> PassthruRegs; |
| 193 | GetPassthruRegs(MI, PassthruRegs); |
| 194 | PrescanInstruction(MI, Count, PassthruRegs); |
| 195 | ScanInstruction(MI, Count); |
| 196 | |
| 197 | LLVM_DEBUG(dbgs() << "Observe: " ); |
| 198 | LLVM_DEBUG(MI.dump()); |
| 199 | LLVM_DEBUG(dbgs() << "\tRegs:" ); |
| 200 | |
| 201 | std::vector<unsigned> &DefIndices = State->GetDefIndices(); |
| 202 | for (unsigned Reg = 1; Reg != TRI->getNumRegs(); ++Reg) { |
| 203 | // If Reg is current live, then mark that it can't be renamed as |
| 204 | // we don't know the extent of its live-range anymore (now that it |
| 205 | // has been scheduled). If it is not live but was defined in the |
| 206 | // previous schedule region, then set its def index to the most |
| 207 | // conservative location (i.e. the beginning of the previous |
| 208 | // schedule region). |
| 209 | if (State->IsLive(Reg)) { |
| 210 | LLVM_DEBUG(if (State->GetGroup(Reg) != 0) dbgs() |
| 211 | << " " << printReg(Reg, TRI) << "=g" << State->GetGroup(Reg) |
| 212 | << "->g0(region live-out)" ); |
| 213 | State->UnionGroups(Reg1: Reg, Reg2: 0); |
| 214 | } else if ((DefIndices[Reg] < InsertPosIndex) |
| 215 | && (DefIndices[Reg] >= Count)) { |
| 216 | DefIndices[Reg] = Count; |
| 217 | } |
| 218 | } |
| 219 | LLVM_DEBUG(dbgs() << '\n'); |
| 220 | } |
| 221 | |
| 222 | bool AggressiveAntiDepBreaker::IsImplicitDefUse(MachineInstr &MI, |
| 223 | MachineOperand &MO) { |
| 224 | if (!MO.isReg() || !MO.isImplicit()) |
| 225 | return false; |
| 226 | |
| 227 | Register Reg = MO.getReg(); |
| 228 | if (Reg == 0) |
| 229 | return false; |
| 230 | |
| 231 | MachineOperand *Op = nullptr; |
| 232 | if (MO.isDef()) |
| 233 | Op = MI.findRegisterUseOperand(Reg, /*TRI=*/nullptr, isKill: true); |
| 234 | else |
| 235 | Op = MI.findRegisterDefOperand(Reg, /*TRI=*/nullptr); |
| 236 | |
| 237 | return(Op && Op->isImplicit()); |
| 238 | } |
| 239 | |
| 240 | void AggressiveAntiDepBreaker::GetPassthruRegs( |
| 241 | MachineInstr &MI, std::set<MCRegister> &PassthruRegs) { |
| 242 | for (unsigned i = 0, e = MI.getNumOperands(); i != e; ++i) { |
| 243 | MachineOperand &MO = MI.getOperand(i); |
| 244 | if (!MO.isReg()) continue; |
| 245 | if ((MO.isDef() && MI.isRegTiedToUseOperand(DefOpIdx: i)) || |
| 246 | IsImplicitDefUse(MI, MO)) { |
| 247 | const Register Reg = MO.getReg(); |
| 248 | for (MCPhysReg SubReg : TRI->subregs_inclusive(Reg)) |
| 249 | PassthruRegs.insert(x: SubReg); |
| 250 | } |
| 251 | } |
| 252 | } |
| 253 | |
| 254 | /// AntiDepEdges - Return in Edges the anti- and output- dependencies |
| 255 | /// in SU that we want to consider for breaking. |
| 256 | static void AntiDepEdges(const SUnit *SU, std::vector<const SDep *> &Edges) { |
| 257 | SmallSet<Register, 4> RegSet; |
| 258 | for (const SDep &Pred : SU->Preds) { |
| 259 | if ((Pred.getKind() == SDep::Anti) || (Pred.getKind() == SDep::Output)) { |
| 260 | if (RegSet.insert(V: Pred.getReg()).second) |
| 261 | Edges.push_back(x: &Pred); |
| 262 | } |
| 263 | } |
| 264 | } |
| 265 | |
| 266 | /// CriticalPathStep - Return the next SUnit after SU on the bottom-up |
| 267 | /// critical path. |
| 268 | static const SUnit *CriticalPathStep(const SUnit *SU) { |
| 269 | const SDep *Next = nullptr; |
| 270 | unsigned NextDepth = 0; |
| 271 | // Find the predecessor edge with the greatest depth. |
| 272 | if (SU) { |
| 273 | for (const SDep &Pred : SU->Preds) { |
| 274 | const SUnit *PredSU = Pred.getSUnit(); |
| 275 | unsigned PredLatency = Pred.getLatency(); |
| 276 | unsigned PredTotalLatency = PredSU->getDepth() + PredLatency; |
| 277 | // In the case of a latency tie, prefer an anti-dependency edge over |
| 278 | // other types of edges. |
| 279 | if (NextDepth < PredTotalLatency || |
| 280 | (NextDepth == PredTotalLatency && Pred.getKind() == SDep::Anti)) { |
| 281 | NextDepth = PredTotalLatency; |
| 282 | Next = &Pred; |
| 283 | } |
| 284 | } |
| 285 | } |
| 286 | |
| 287 | return (Next) ? Next->getSUnit() : nullptr; |
| 288 | } |
| 289 | |
| 290 | void AggressiveAntiDepBreaker::HandleLastUse(MCRegister Reg, unsigned KillIdx, |
| 291 | const char *tag, |
| 292 | const char *, |
| 293 | const char *) { |
| 294 | std::vector<unsigned> &KillIndices = State->GetKillIndices(); |
| 295 | std::vector<unsigned> &DefIndices = State->GetDefIndices(); |
| 296 | std::multimap<MCRegister, AggressiveAntiDepState::RegisterReference> |
| 297 | &RegRefs = State->GetRegRefs(); |
| 298 | |
| 299 | // FIXME: We must leave subregisters of live super registers as live, so that |
| 300 | // we don't clear out the register tracking information for subregisters of |
| 301 | // super registers we're still tracking (and with which we're unioning |
| 302 | // subregister definitions). |
| 303 | for (MCRegAliasIterator AI(Reg, TRI, true); AI.isValid(); ++AI) |
| 304 | if (TRI->isSuperRegister(RegA: Reg, RegB: *AI) && State->IsLive(Reg: *AI)) { |
| 305 | LLVM_DEBUG(if (!header && footer) dbgs() << footer); |
| 306 | return; |
| 307 | } |
| 308 | |
| 309 | if (!State->IsLive(Reg)) { |
| 310 | KillIndices[Reg] = KillIdx; |
| 311 | DefIndices[Reg] = ~0u; |
| 312 | RegRefs.erase(x: Reg); |
| 313 | State->LeaveGroup(Reg); |
| 314 | LLVM_DEBUG(if (header) { |
| 315 | dbgs() << header << printReg(Reg, TRI); |
| 316 | header = nullptr; |
| 317 | }); |
| 318 | LLVM_DEBUG(dbgs() << "->g" << State->GetGroup(Reg) << tag); |
| 319 | // Repeat for subregisters. Note that we only do this if the superregister |
| 320 | // was not live because otherwise, regardless whether we have an explicit |
| 321 | // use of the subregister, the subregister's contents are needed for the |
| 322 | // uses of the superregister. |
| 323 | for (MCPhysReg SubregReg : TRI->subregs(Reg)) { |
| 324 | if (!State->IsLive(Reg: SubregReg)) { |
| 325 | KillIndices[SubregReg] = KillIdx; |
| 326 | DefIndices[SubregReg] = ~0u; |
| 327 | RegRefs.erase(x: SubregReg); |
| 328 | State->LeaveGroup(Reg: SubregReg); |
| 329 | LLVM_DEBUG(if (header) { |
| 330 | dbgs() << header << printReg(Reg, TRI); |
| 331 | header = nullptr; |
| 332 | }); |
| 333 | LLVM_DEBUG(dbgs() << " " << printReg(SubregReg, TRI) << "->g" |
| 334 | << State->GetGroup(SubregReg) << tag); |
| 335 | } |
| 336 | } |
| 337 | } |
| 338 | |
| 339 | LLVM_DEBUG(if (!header && footer) dbgs() << footer); |
| 340 | } |
| 341 | |
| 342 | void AggressiveAntiDepBreaker::PrescanInstruction( |
| 343 | MachineInstr &MI, unsigned Count, |
| 344 | const std::set<MCRegister> &PassthruRegs) { |
| 345 | std::vector<unsigned> &DefIndices = State->GetDefIndices(); |
| 346 | std::multimap<MCRegister, AggressiveAntiDepState::RegisterReference> |
| 347 | &RegRefs = State->GetRegRefs(); |
| 348 | |
| 349 | // Handle dead defs by simulating a last-use of the register just |
| 350 | // after the def. A dead def can occur because the def is truly |
| 351 | // dead, or because only a subregister is live at the def. If we |
| 352 | // don't do this the dead def will be incorrectly merged into the |
| 353 | // previous def. |
| 354 | for (const MachineOperand &MO : MI.all_defs()) { |
| 355 | Register Reg = MO.getReg(); |
| 356 | if (!Reg) |
| 357 | continue; |
| 358 | |
| 359 | HandleLastUse(Reg: Reg.asMCReg(), KillIdx: Count + 1, tag: "" , header: "\tDead Def: " , footer: "\n" ); |
| 360 | } |
| 361 | |
| 362 | LLVM_DEBUG(dbgs() << "\tDef Groups:" ); |
| 363 | for (unsigned i = 0, e = MI.getNumOperands(); i != e; ++i) { |
| 364 | MachineOperand &MO = MI.getOperand(i); |
| 365 | if (!MO.isReg() || !MO.isDef()) continue; |
| 366 | Register Reg = MO.getReg(); |
| 367 | if (!Reg) |
| 368 | continue; |
| 369 | |
| 370 | LLVM_DEBUG(dbgs() << " " << printReg(Reg, TRI) << "=g" |
| 371 | << State->GetGroup(Reg)); |
| 372 | |
| 373 | // If MI's defs have a special allocation requirement, don't allow |
| 374 | // any def registers to be changed. Also assume all registers |
| 375 | // defined in a call must not be changed (ABI). Inline assembly may |
| 376 | // reference either system calls or the register directly. Skip it until we |
| 377 | // can tell user specified registers from compiler-specified. |
| 378 | if (MI.isCall() || MI.hasExtraDefRegAllocReq() || TII->isPredicated(MI) || |
| 379 | MI.isInlineAsm()) { |
| 380 | LLVM_DEBUG(if (State->GetGroup(Reg) != 0) dbgs() << "->g0(alloc-req)" ); |
| 381 | State->UnionGroups(Reg1: Reg, Reg2: 0); |
| 382 | } |
| 383 | |
| 384 | // Any aliased that are live at this point are completely or |
| 385 | // partially defined here, so group those aliases with Reg. |
| 386 | for (MCRegAliasIterator AI(Reg, TRI, false); AI.isValid(); ++AI) { |
| 387 | MCRegister AliasReg = *AI; |
| 388 | if (State->IsLive(Reg: AliasReg)) { |
| 389 | State->UnionGroups(Reg1: Reg, Reg2: AliasReg); |
| 390 | LLVM_DEBUG(dbgs() << "->g" << State->GetGroup(Reg) << "(via " |
| 391 | << printReg(AliasReg, TRI) << ")" ); |
| 392 | } |
| 393 | } |
| 394 | |
| 395 | // Note register reference... |
| 396 | const TargetRegisterClass *RC = nullptr; |
| 397 | if (i < MI.getDesc().getNumOperands()) |
| 398 | RC = TII->getRegClass(MCID: MI.getDesc(), OpNum: i, TRI, MF); |
| 399 | AggressiveAntiDepState::RegisterReference RR = { .Operand: &MO, .RC: RC }; |
| 400 | RegRefs.emplace(args: Reg.asMCReg(), args&: RR); |
| 401 | } |
| 402 | |
| 403 | LLVM_DEBUG(dbgs() << '\n'); |
| 404 | |
| 405 | // Scan the register defs for this instruction and update |
| 406 | // live-ranges. |
| 407 | for (const MachineOperand &MO : MI.all_defs()) { |
| 408 | Register Reg = MO.getReg(); |
| 409 | if (!Reg) |
| 410 | continue; |
| 411 | // Ignore KILLs and passthru registers for liveness... |
| 412 | if (MI.isKill() || (PassthruRegs.count(x: Reg) != 0)) |
| 413 | continue; |
| 414 | |
| 415 | // Update def for Reg and aliases. |
| 416 | for (MCRegAliasIterator AI(Reg, TRI, true); AI.isValid(); ++AI) { |
| 417 | // We need to be careful here not to define already-live super registers. |
| 418 | // If the super register is already live, then this definition is not |
| 419 | // a definition of the whole super register (just a partial insertion |
| 420 | // into it). Earlier subregister definitions (which we've not yet visited |
| 421 | // because we're iterating bottom-up) need to be linked to the same group |
| 422 | // as this definition. |
| 423 | if (TRI->isSuperRegister(RegA: Reg, RegB: *AI) && State->IsLive(Reg: *AI)) |
| 424 | continue; |
| 425 | |
| 426 | DefIndices[(*AI).id()] = Count; |
| 427 | } |
| 428 | } |
| 429 | } |
| 430 | |
| 431 | void AggressiveAntiDepBreaker::ScanInstruction(MachineInstr &MI, |
| 432 | unsigned Count) { |
| 433 | LLVM_DEBUG(dbgs() << "\tUse Groups:" ); |
| 434 | std::multimap<MCRegister, AggressiveAntiDepState::RegisterReference> |
| 435 | &RegRefs = State->GetRegRefs(); |
| 436 | |
| 437 | // If MI's uses have special allocation requirement, don't allow |
| 438 | // any use registers to be changed. Also assume all registers |
| 439 | // used in a call must not be changed (ABI). |
| 440 | // Inline Assembly register uses also cannot be safely changed. |
| 441 | // FIXME: The issue with predicated instruction is more complex. We are being |
| 442 | // conservatively here because the kill markers cannot be trusted after |
| 443 | // if-conversion: |
| 444 | // %r6 = LDR %sp, %reg0, 92, 14, %reg0; mem:LD4[FixedStack14] |
| 445 | // ... |
| 446 | // STR %r0, killed %r6, %reg0, 0, 0, %cpsr; mem:ST4[%395] |
| 447 | // %r6 = LDR %sp, %reg0, 100, 0, %cpsr; mem:LD4[FixedStack12] |
| 448 | // STR %r0, killed %r6, %reg0, 0, 14, %reg0; mem:ST4[%396](align=8) |
| 449 | // |
| 450 | // The first R6 kill is not really a kill since it's killed by a predicated |
| 451 | // instruction which may not be executed. The second R6 def may or may not |
| 452 | // re-define R6 so it's not safe to change it since the last R6 use cannot be |
| 453 | // changed. |
| 454 | bool Special = MI.isCall() || MI.hasExtraSrcRegAllocReq() || |
| 455 | TII->isPredicated(MI) || MI.isInlineAsm(); |
| 456 | |
| 457 | // Scan the register uses for this instruction and update |
| 458 | // live-ranges, groups and RegRefs. |
| 459 | for (unsigned i = 0, e = MI.getNumOperands(); i != e; ++i) { |
| 460 | MachineOperand &MO = MI.getOperand(i); |
| 461 | if (!MO.isReg() || !MO.isUse()) continue; |
| 462 | Register Reg = MO.getReg(); |
| 463 | if (!Reg) |
| 464 | continue; |
| 465 | |
| 466 | LLVM_DEBUG(dbgs() << " " << printReg(Reg, TRI) << "=g" |
| 467 | << State->GetGroup(Reg)); |
| 468 | |
| 469 | // It wasn't previously live but now it is, this is a kill. Forget |
| 470 | // the previous live-range information and start a new live-range |
| 471 | // for the register. |
| 472 | HandleLastUse(Reg: Reg.asMCReg(), KillIdx: Count, tag: "(last-use)" ); |
| 473 | |
| 474 | if (Special) { |
| 475 | LLVM_DEBUG(if (State->GetGroup(Reg) != 0) dbgs() << "->g0(alloc-req)" ); |
| 476 | State->UnionGroups(Reg1: Reg, Reg2: 0); |
| 477 | } |
| 478 | |
| 479 | // Note register reference... |
| 480 | const TargetRegisterClass *RC = nullptr; |
| 481 | if (i < MI.getDesc().getNumOperands()) |
| 482 | RC = TII->getRegClass(MCID: MI.getDesc(), OpNum: i, TRI, MF); |
| 483 | AggressiveAntiDepState::RegisterReference RR = { .Operand: &MO, .RC: RC }; |
| 484 | RegRefs.emplace(args: Reg.asMCReg(), args&: RR); |
| 485 | } |
| 486 | |
| 487 | LLVM_DEBUG(dbgs() << '\n'); |
| 488 | |
| 489 | // Form a group of all defs and uses of a KILL instruction to ensure |
| 490 | // that all registers are renamed as a group. |
| 491 | if (MI.isKill()) { |
| 492 | LLVM_DEBUG(dbgs() << "\tKill Group:" ); |
| 493 | |
| 494 | Register FirstReg; |
| 495 | for (const MachineOperand &MO : MI.operands()) { |
| 496 | if (!MO.isReg()) continue; |
| 497 | Register Reg = MO.getReg(); |
| 498 | if (!Reg) |
| 499 | continue; |
| 500 | |
| 501 | if (FirstReg) { |
| 502 | LLVM_DEBUG(dbgs() << "=" << printReg(Reg, TRI)); |
| 503 | State->UnionGroups(Reg1: FirstReg, Reg2: Reg); |
| 504 | } else { |
| 505 | LLVM_DEBUG(dbgs() << " " << printReg(Reg, TRI)); |
| 506 | FirstReg = Reg; |
| 507 | } |
| 508 | } |
| 509 | |
| 510 | LLVM_DEBUG(dbgs() << "->g" << State->GetGroup(FirstReg) << '\n'); |
| 511 | } |
| 512 | } |
| 513 | |
| 514 | BitVector AggressiveAntiDepBreaker::GetRenameRegisters(MCRegister Reg) { |
| 515 | BitVector BV(TRI->getNumRegs(), false); |
| 516 | bool first = true; |
| 517 | |
| 518 | // Check all references that need rewriting for Reg. For each, use |
| 519 | // the corresponding register class to narrow the set of registers |
| 520 | // that are appropriate for renaming. |
| 521 | for (const auto &Q : make_range(p: State->GetRegRefs().equal_range(x: Reg))) { |
| 522 | const TargetRegisterClass *RC = Q.second.RC; |
| 523 | if (!RC) continue; |
| 524 | |
| 525 | BitVector RCBV = TRI->getAllocatableSet(MF, RC); |
| 526 | if (first) { |
| 527 | BV |= RCBV; |
| 528 | first = false; |
| 529 | } else { |
| 530 | BV &= RCBV; |
| 531 | } |
| 532 | |
| 533 | LLVM_DEBUG(dbgs() << " " << TRI->getRegClassName(RC)); |
| 534 | } |
| 535 | |
| 536 | return BV; |
| 537 | } |
| 538 | |
| 539 | bool AggressiveAntiDepBreaker::FindSuitableFreeRegisters( |
| 540 | MCRegister SuperReg, unsigned AntiDepGroupIndex, |
| 541 | RenameOrderType &RenameOrder, std::map<MCRegister, MCRegister> &RenameMap) { |
| 542 | std::vector<unsigned> &KillIndices = State->GetKillIndices(); |
| 543 | std::vector<unsigned> &DefIndices = State->GetDefIndices(); |
| 544 | std::multimap<MCRegister, AggressiveAntiDepState::RegisterReference> |
| 545 | &RegRefs = State->GetRegRefs(); |
| 546 | |
| 547 | // Collect all referenced registers in the same group as |
| 548 | // AntiDepReg. These all need to be renamed together if we are to |
| 549 | // break the anti-dependence. |
| 550 | std::vector<MCRegister> Regs; |
| 551 | State->GetGroupRegs(Group: AntiDepGroupIndex, Regs, RegRefs: &RegRefs); |
| 552 | assert(!Regs.empty() && "Empty register group!" ); |
| 553 | if (Regs.empty()) |
| 554 | return false; |
| 555 | |
| 556 | // Collect the BitVector of registers that can be used to rename |
| 557 | // each register. |
| 558 | LLVM_DEBUG(dbgs() << "\tRename Candidates for Group g" << AntiDepGroupIndex |
| 559 | << ":\n" ); |
| 560 | std::map<MCRegister, BitVector> RenameRegisterMap; |
| 561 | for (MCRegister Reg : Regs) { |
| 562 | // If Reg has any references, then collect possible rename regs |
| 563 | if (RegRefs.count(x: Reg) > 0) { |
| 564 | LLVM_DEBUG(dbgs() << "\t\t" << printReg(Reg, TRI) << ":" ); |
| 565 | |
| 566 | BitVector &BV = RenameRegisterMap[Reg]; |
| 567 | assert(BV.empty()); |
| 568 | BV = GetRenameRegisters(Reg); |
| 569 | |
| 570 | LLVM_DEBUG({ |
| 571 | dbgs() << " ::" ; |
| 572 | for (unsigned r : BV.set_bits()) |
| 573 | dbgs() << " " << printReg(r, TRI); |
| 574 | dbgs() << "\n" ; |
| 575 | }); |
| 576 | } |
| 577 | } |
| 578 | |
| 579 | // All group registers should be a subreg of SuperReg. |
| 580 | for (MCRegister Reg : Regs) { |
| 581 | if (Reg == SuperReg) continue; |
| 582 | bool IsSub = TRI->isSubRegister(RegA: SuperReg, RegB: Reg); |
| 583 | // FIXME: remove this once PR18663 has been properly fixed. For now, |
| 584 | // return a conservative answer: |
| 585 | // assert(IsSub && "Expecting group subregister"); |
| 586 | if (!IsSub) |
| 587 | return false; |
| 588 | } |
| 589 | |
| 590 | #ifndef NDEBUG |
| 591 | // If DebugDiv > 0 then only rename (renamecnt % DebugDiv) == DebugMod |
| 592 | if (DebugDiv > 0) { |
| 593 | static int renamecnt = 0; |
| 594 | if (renamecnt++ % DebugDiv != DebugMod) |
| 595 | return false; |
| 596 | |
| 597 | dbgs() << "*** Performing rename " << printReg(SuperReg, TRI) |
| 598 | << " for debug ***\n" ; |
| 599 | } |
| 600 | #endif |
| 601 | |
| 602 | // Check each possible rename register for SuperReg in round-robin |
| 603 | // order. If that register is available, and the corresponding |
| 604 | // registers are available for the other group subregisters, then we |
| 605 | // can use those registers to rename. |
| 606 | |
| 607 | // FIXME: Using getMinimalPhysRegClass is very conservative. We should |
| 608 | // check every use of the register and find the largest register class |
| 609 | // that can be used in all of them. |
| 610 | const TargetRegisterClass *SuperRC = |
| 611 | TRI->getMinimalPhysRegClass(Reg: SuperReg, VT: MVT::Other); |
| 612 | |
| 613 | ArrayRef<MCPhysReg> Order = RegClassInfo.getOrder(RC: SuperRC); |
| 614 | if (Order.empty()) { |
| 615 | LLVM_DEBUG(dbgs() << "\tEmpty Super Regclass!!\n" ); |
| 616 | return false; |
| 617 | } |
| 618 | |
| 619 | LLVM_DEBUG(dbgs() << "\tFind Registers:" ); |
| 620 | |
| 621 | RenameOrder.insert(x: RenameOrderType::value_type(SuperRC, Order.size())); |
| 622 | |
| 623 | unsigned OrigR = RenameOrder[SuperRC]; |
| 624 | unsigned EndR = ((OrigR == Order.size()) ? 0 : OrigR); |
| 625 | unsigned R = OrigR; |
| 626 | do { |
| 627 | if (R == 0) R = Order.size(); |
| 628 | --R; |
| 629 | const MCRegister NewSuperReg = Order[R]; |
| 630 | // Don't consider non-allocatable registers |
| 631 | if (!MRI.isAllocatable(PhysReg: NewSuperReg)) continue; |
| 632 | // Don't replace a register with itself. |
| 633 | if (NewSuperReg == SuperReg) continue; |
| 634 | |
| 635 | LLVM_DEBUG(dbgs() << " [" << printReg(NewSuperReg, TRI) << ':'); |
| 636 | RenameMap.clear(); |
| 637 | |
| 638 | // For each referenced group register (which must be a SuperReg or |
| 639 | // a subregister of SuperReg), find the corresponding subregister |
| 640 | // of NewSuperReg and make sure it is free to be renamed. |
| 641 | for (MCRegister Reg : Regs) { |
| 642 | MCRegister NewReg; |
| 643 | if (Reg == SuperReg) { |
| 644 | NewReg = NewSuperReg; |
| 645 | } else { |
| 646 | unsigned NewSubRegIdx = TRI->getSubRegIndex(RegNo: SuperReg, SubRegNo: Reg); |
| 647 | if (NewSubRegIdx != 0) |
| 648 | NewReg = TRI->getSubReg(Reg: NewSuperReg, Idx: NewSubRegIdx); |
| 649 | } |
| 650 | |
| 651 | LLVM_DEBUG(dbgs() << " " << printReg(NewReg, TRI)); |
| 652 | |
| 653 | // Check if Reg can be renamed to NewReg. |
| 654 | if (!RenameRegisterMap[Reg].test(Idx: NewReg)) { |
| 655 | LLVM_DEBUG(dbgs() << "(no rename)" ); |
| 656 | goto next_super_reg; |
| 657 | } |
| 658 | |
| 659 | // If NewReg is dead and NewReg's most recent def is not before |
| 660 | // Regs's kill, it's safe to replace Reg with NewReg. We |
| 661 | // must also check all aliases of NewReg, because we can't define a |
| 662 | // register when any sub or super is already live. |
| 663 | if (State->IsLive(Reg: NewReg) || (KillIndices[Reg] > DefIndices[NewReg])) { |
| 664 | LLVM_DEBUG(dbgs() << "(live)" ); |
| 665 | goto next_super_reg; |
| 666 | } else { |
| 667 | bool found = false; |
| 668 | for (MCRegAliasIterator AI(NewReg, TRI, false); AI.isValid(); ++AI) { |
| 669 | MCRegister AliasReg = *AI; |
| 670 | if (State->IsLive(Reg: AliasReg) || |
| 671 | (KillIndices[Reg] > DefIndices[AliasReg])) { |
| 672 | LLVM_DEBUG(dbgs() |
| 673 | << "(alias " << printReg(AliasReg, TRI) << " live)" ); |
| 674 | found = true; |
| 675 | break; |
| 676 | } |
| 677 | } |
| 678 | if (found) |
| 679 | goto next_super_reg; |
| 680 | } |
| 681 | |
| 682 | // We cannot rename 'Reg' to 'NewReg' if one of the uses of 'Reg' also |
| 683 | // defines 'NewReg' via an early-clobber operand. |
| 684 | for (const auto &Q : make_range(p: RegRefs.equal_range(x: Reg))) { |
| 685 | MachineInstr *UseMI = Q.second.Operand->getParent(); |
| 686 | int Idx = UseMI->findRegisterDefOperandIdx(Reg: NewReg, TRI, isDead: false, Overlap: true); |
| 687 | if (Idx == -1) |
| 688 | continue; |
| 689 | |
| 690 | if (UseMI->getOperand(i: Idx).isEarlyClobber()) { |
| 691 | LLVM_DEBUG(dbgs() << "(ec)" ); |
| 692 | goto next_super_reg; |
| 693 | } |
| 694 | } |
| 695 | |
| 696 | // Also, we cannot rename 'Reg' to 'NewReg' if the instruction defining |
| 697 | // 'Reg' is an early-clobber define and that instruction also uses |
| 698 | // 'NewReg'. |
| 699 | for (const auto &Q : make_range(p: RegRefs.equal_range(x: Reg))) { |
| 700 | if (!Q.second.Operand->isDef() || !Q.second.Operand->isEarlyClobber()) |
| 701 | continue; |
| 702 | |
| 703 | MachineInstr *DefMI = Q.second.Operand->getParent(); |
| 704 | if (DefMI->readsRegister(Reg: NewReg, TRI)) { |
| 705 | LLVM_DEBUG(dbgs() << "(ec)" ); |
| 706 | goto next_super_reg; |
| 707 | } |
| 708 | } |
| 709 | |
| 710 | // Record that 'Reg' can be renamed to 'NewReg'. |
| 711 | RenameMap.insert(x: std::make_pair(x&: Reg, y&: NewReg)); |
| 712 | } |
| 713 | |
| 714 | // If we fall-out here, then every register in the group can be |
| 715 | // renamed, as recorded in RenameMap. |
| 716 | RenameOrder.erase(x: SuperRC); |
| 717 | RenameOrder.insert(x: RenameOrderType::value_type(SuperRC, R)); |
| 718 | LLVM_DEBUG(dbgs() << "]\n" ); |
| 719 | return true; |
| 720 | |
| 721 | next_super_reg: |
| 722 | LLVM_DEBUG(dbgs() << ']'); |
| 723 | } while (R != EndR); |
| 724 | |
| 725 | LLVM_DEBUG(dbgs() << '\n'); |
| 726 | |
| 727 | // No registers are free and available! |
| 728 | return false; |
| 729 | } |
| 730 | |
| 731 | /// BreakAntiDependencies - Identifiy anti-dependencies within the |
| 732 | /// ScheduleDAG and break them by renaming registers. |
| 733 | unsigned AggressiveAntiDepBreaker::BreakAntiDependencies( |
| 734 | const std::vector<SUnit> &SUnits, |
| 735 | MachineBasicBlock::iterator Begin, |
| 736 | MachineBasicBlock::iterator End, |
| 737 | unsigned InsertPosIndex, |
| 738 | DbgValueVector &DbgValues) { |
| 739 | std::vector<unsigned> &KillIndices = State->GetKillIndices(); |
| 740 | std::vector<unsigned> &DefIndices = State->GetDefIndices(); |
| 741 | std::multimap<MCRegister, AggressiveAntiDepState::RegisterReference> |
| 742 | &RegRefs = State->GetRegRefs(); |
| 743 | |
| 744 | // The code below assumes that there is at least one instruction, |
| 745 | // so just duck out immediately if the block is empty. |
| 746 | if (SUnits.empty()) return 0; |
| 747 | |
| 748 | // For each regclass the next register to use for renaming. |
| 749 | RenameOrderType RenameOrder; |
| 750 | |
| 751 | // ...need a map from MI to SUnit. |
| 752 | std::map<MachineInstr *, const SUnit *> MISUnitMap; |
| 753 | for (const SUnit &SU : SUnits) |
| 754 | MISUnitMap.insert(x: std::make_pair(x: SU.getInstr(), y: &SU)); |
| 755 | |
| 756 | // Track progress along the critical path through the SUnit graph as |
| 757 | // we walk the instructions. This is needed for regclasses that only |
| 758 | // break critical-path anti-dependencies. |
| 759 | const SUnit *CriticalPathSU = nullptr; |
| 760 | MachineInstr *CriticalPathMI = nullptr; |
| 761 | if (CriticalPathSet.any()) { |
| 762 | for (const SUnit &SU : SUnits) { |
| 763 | if (!CriticalPathSU || |
| 764 | ((SU.getDepth() + SU.Latency) > |
| 765 | (CriticalPathSU->getDepth() + CriticalPathSU->Latency))) { |
| 766 | CriticalPathSU = &SU; |
| 767 | } |
| 768 | } |
| 769 | assert(CriticalPathSU && "Failed to find SUnit critical path" ); |
| 770 | CriticalPathMI = CriticalPathSU->getInstr(); |
| 771 | } |
| 772 | |
| 773 | #ifndef NDEBUG |
| 774 | LLVM_DEBUG(dbgs() << "\n===== Aggressive anti-dependency breaking\n" ); |
| 775 | LLVM_DEBUG(dbgs() << "Available regs:" ); |
| 776 | for (unsigned Reg = 1; Reg < TRI->getNumRegs(); ++Reg) { |
| 777 | if (!State->IsLive(Reg)) |
| 778 | LLVM_DEBUG(dbgs() << " " << printReg(Reg, TRI)); |
| 779 | } |
| 780 | LLVM_DEBUG(dbgs() << '\n'); |
| 781 | #endif |
| 782 | |
| 783 | BitVector RegAliases(TRI->getNumRegs()); |
| 784 | |
| 785 | // Attempt to break anti-dependence edges. Walk the instructions |
| 786 | // from the bottom up, tracking information about liveness as we go |
| 787 | // to help determine which registers are available. |
| 788 | unsigned Broken = 0; |
| 789 | unsigned Count = InsertPosIndex - 1; |
| 790 | for (MachineBasicBlock::iterator I = End, E = Begin; |
| 791 | I != E; --Count) { |
| 792 | MachineInstr &MI = *--I; |
| 793 | |
| 794 | if (MI.isDebugInstr()) |
| 795 | continue; |
| 796 | |
| 797 | LLVM_DEBUG(dbgs() << "Anti: " ); |
| 798 | LLVM_DEBUG(MI.dump()); |
| 799 | |
| 800 | std::set<MCRegister> PassthruRegs; |
| 801 | GetPassthruRegs(MI, PassthruRegs); |
| 802 | |
| 803 | // Process the defs in MI... |
| 804 | PrescanInstruction(MI, Count, PassthruRegs); |
| 805 | |
| 806 | // The dependence edges that represent anti- and output- |
| 807 | // dependencies that are candidates for breaking. |
| 808 | std::vector<const SDep *> Edges; |
| 809 | const SUnit *PathSU = MISUnitMap[&MI]; |
| 810 | AntiDepEdges(SU: PathSU, Edges); |
| 811 | |
| 812 | // If MI is not on the critical path, then we don't rename |
| 813 | // registers in the CriticalPathSet. |
| 814 | BitVector *ExcludeRegs = nullptr; |
| 815 | if (&MI == CriticalPathMI) { |
| 816 | CriticalPathSU = CriticalPathStep(SU: CriticalPathSU); |
| 817 | CriticalPathMI = (CriticalPathSU) ? CriticalPathSU->getInstr() : nullptr; |
| 818 | } else if (CriticalPathSet.any()) { |
| 819 | ExcludeRegs = &CriticalPathSet; |
| 820 | } |
| 821 | |
| 822 | // Ignore KILL instructions (they form a group in ScanInstruction |
| 823 | // but don't cause any anti-dependence breaking themselves) |
| 824 | if (!MI.isKill()) { |
| 825 | // Attempt to break each anti-dependency... |
| 826 | for (const SDep *Edge : Edges) { |
| 827 | SUnit *NextSU = Edge->getSUnit(); |
| 828 | |
| 829 | if ((Edge->getKind() != SDep::Anti) && |
| 830 | (Edge->getKind() != SDep::Output)) continue; |
| 831 | |
| 832 | MCRegister AntiDepReg = Edge->getReg().asMCReg(); |
| 833 | LLVM_DEBUG(dbgs() << "\tAntidep reg: " << printReg(AntiDepReg, TRI)); |
| 834 | assert(AntiDepReg && "Anti-dependence on reg0?" ); |
| 835 | |
| 836 | if (!MRI.isAllocatable(PhysReg: AntiDepReg)) { |
| 837 | // Don't break anti-dependencies on non-allocatable registers. |
| 838 | LLVM_DEBUG(dbgs() << " (non-allocatable)\n" ); |
| 839 | continue; |
| 840 | } else if (ExcludeRegs && ExcludeRegs->test(Idx: AntiDepReg.id())) { |
| 841 | // Don't break anti-dependencies for critical path registers |
| 842 | // if not on the critical path |
| 843 | LLVM_DEBUG(dbgs() << " (not critical-path)\n" ); |
| 844 | continue; |
| 845 | } else if (PassthruRegs.count(x: AntiDepReg) != 0) { |
| 846 | // If the anti-dep register liveness "passes-thru", then |
| 847 | // don't try to change it. It will be changed along with |
| 848 | // the use if required to break an earlier antidep. |
| 849 | LLVM_DEBUG(dbgs() << " (passthru)\n" ); |
| 850 | continue; |
| 851 | } else { |
| 852 | // No anti-dep breaking for implicit deps |
| 853 | MachineOperand *AntiDepOp = |
| 854 | MI.findRegisterDefOperand(Reg: AntiDepReg, /*TRI=*/nullptr); |
| 855 | assert(AntiDepOp && "Can't find index for defined register operand" ); |
| 856 | if (!AntiDepOp || AntiDepOp->isImplicit()) { |
| 857 | LLVM_DEBUG(dbgs() << " (implicit)\n" ); |
| 858 | continue; |
| 859 | } |
| 860 | |
| 861 | // If the SUnit has other dependencies on the SUnit that |
| 862 | // it anti-depends on, don't bother breaking the |
| 863 | // anti-dependency since those edges would prevent such |
| 864 | // units from being scheduled past each other |
| 865 | // regardless. |
| 866 | // |
| 867 | // Also, if there are dependencies on other SUnits with the |
| 868 | // same register as the anti-dependency, don't attempt to |
| 869 | // break it. |
| 870 | for (const SDep &Pred : PathSU->Preds) { |
| 871 | if (Pred.getSUnit() == NextSU ? (Pred.getKind() != SDep::Anti || |
| 872 | Pred.getReg() != AntiDepReg) |
| 873 | : (Pred.getKind() == SDep::Data && |
| 874 | Pred.getReg() == AntiDepReg)) { |
| 875 | AntiDepReg = MCRegister(); |
| 876 | break; |
| 877 | } |
| 878 | } |
| 879 | for (const SDep &Pred : PathSU->Preds) { |
| 880 | if ((Pred.getSUnit() == NextSU) && (Pred.getKind() != SDep::Anti) && |
| 881 | (Pred.getKind() != SDep::Output)) { |
| 882 | LLVM_DEBUG(dbgs() << " (real dependency)\n" ); |
| 883 | AntiDepReg = MCRegister(); |
| 884 | break; |
| 885 | } else if ((Pred.getSUnit() != NextSU) && |
| 886 | (Pred.getKind() == SDep::Data) && |
| 887 | (Pred.getReg() == AntiDepReg)) { |
| 888 | LLVM_DEBUG(dbgs() << " (other dependency)\n" ); |
| 889 | AntiDepReg = MCRegister(); |
| 890 | break; |
| 891 | } |
| 892 | } |
| 893 | |
| 894 | if (!AntiDepReg) |
| 895 | continue; |
| 896 | } |
| 897 | |
| 898 | assert(AntiDepReg); |
| 899 | |
| 900 | // Determine AntiDepReg's register group. |
| 901 | const unsigned GroupIndex = State->GetGroup(Reg: AntiDepReg); |
| 902 | if (GroupIndex == 0) { |
| 903 | LLVM_DEBUG(dbgs() << " (zero group)\n" ); |
| 904 | continue; |
| 905 | } |
| 906 | |
| 907 | LLVM_DEBUG(dbgs() << '\n'); |
| 908 | |
| 909 | // Look for a suitable register to use to break the anti-dependence. |
| 910 | std::map<MCRegister, MCRegister> RenameMap; |
| 911 | if (FindSuitableFreeRegisters(SuperReg: AntiDepReg, AntiDepGroupIndex: GroupIndex, RenameOrder, |
| 912 | RenameMap)) { |
| 913 | LLVM_DEBUG(dbgs() << "\tBreaking anti-dependence edge on " |
| 914 | << printReg(AntiDepReg, TRI) << ":" ); |
| 915 | |
| 916 | // Handle each group register... |
| 917 | for (const auto &P : RenameMap) { |
| 918 | MCRegister CurrReg = P.first; |
| 919 | MCRegister NewReg = P.second; |
| 920 | |
| 921 | LLVM_DEBUG(dbgs() << " " << printReg(CurrReg, TRI) << "->" |
| 922 | << printReg(NewReg, TRI) << "(" |
| 923 | << RegRefs.count(CurrReg) << " refs)" ); |
| 924 | |
| 925 | // Update the references to the old register CurrReg to |
| 926 | // refer to the new register NewReg. |
| 927 | for (const auto &Q : make_range(p: RegRefs.equal_range(x: CurrReg))) { |
| 928 | Q.second.Operand->setReg(NewReg); |
| 929 | // If the SU for the instruction being updated has debug |
| 930 | // information related to the anti-dependency register, make |
| 931 | // sure to update that as well. |
| 932 | const SUnit *SU = MISUnitMap[Q.second.Operand->getParent()]; |
| 933 | if (!SU) continue; |
| 934 | UpdateDbgValues(DbgValues, ParentMI: Q.second.Operand->getParent(), |
| 935 | OldReg: AntiDepReg, NewReg); |
| 936 | } |
| 937 | |
| 938 | // We just went back in time and modified history; the |
| 939 | // liveness information for CurrReg is now inconsistent. Set |
| 940 | // the state as if it were dead. |
| 941 | State->UnionGroups(Reg1: NewReg, Reg2: 0); |
| 942 | RegRefs.erase(x: NewReg); |
| 943 | DefIndices[NewReg] = DefIndices[CurrReg]; |
| 944 | KillIndices[NewReg] = KillIndices[CurrReg]; |
| 945 | |
| 946 | State->UnionGroups(Reg1: CurrReg, Reg2: 0); |
| 947 | RegRefs.erase(x: CurrReg); |
| 948 | DefIndices[CurrReg] = KillIndices[CurrReg]; |
| 949 | KillIndices[CurrReg] = ~0u; |
| 950 | assert(((KillIndices[CurrReg] == ~0u) != |
| 951 | (DefIndices[CurrReg] == ~0u)) && |
| 952 | "Kill and Def maps aren't consistent for AntiDepReg!" ); |
| 953 | } |
| 954 | |
| 955 | ++Broken; |
| 956 | LLVM_DEBUG(dbgs() << '\n'); |
| 957 | } |
| 958 | } |
| 959 | } |
| 960 | |
| 961 | ScanInstruction(MI, Count); |
| 962 | } |
| 963 | |
| 964 | return Broken; |
| 965 | } |
| 966 | |
| 967 | AntiDepBreaker *llvm::createAggressiveAntiDepBreaker( |
| 968 | MachineFunction &MFi, const RegisterClassInfo &RCI, |
| 969 | TargetSubtargetInfo::RegClassVector &CriticalPathRCs) { |
| 970 | return new AggressiveAntiDepBreaker(MFi, RCI, CriticalPathRCs); |
| 971 | } |
| 972 | |