| 1 | //===----- x86_64.cpp - Generic JITLink x86-64 edge kinds, utilities ------===// |
| 2 | // |
| 3 | // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. |
| 4 | // See https://llvm.org/LICENSE.txt for license information. |
| 5 | // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception |
| 6 | // |
| 7 | //===----------------------------------------------------------------------===// |
| 8 | // |
| 9 | // Generic utilities for graphs representing x86-64 objects. |
| 10 | // |
| 11 | //===----------------------------------------------------------------------===// |
| 12 | |
| 13 | #include "llvm/ExecutionEngine/JITLink/x86_64.h" |
| 14 | |
| 15 | #define DEBUG_TYPE "jitlink" |
| 16 | |
| 17 | namespace llvm { |
| 18 | namespace jitlink { |
| 19 | namespace x86_64 { |
| 20 | |
| 21 | const char *getEdgeKindName(Edge::Kind K) { |
| 22 | switch (K) { |
| 23 | case Pointer64: |
| 24 | return "Pointer64" ; |
| 25 | case Pointer32: |
| 26 | return "Pointer32" ; |
| 27 | case Pointer32Signed: |
| 28 | return "Pointer32Signed" ; |
| 29 | case Pointer16: |
| 30 | return "Pointer16" ; |
| 31 | case Pointer8: |
| 32 | return "Pointer8" ; |
| 33 | case Delta64: |
| 34 | return "Delta64" ; |
| 35 | case Delta32: |
| 36 | return "Delta32" ; |
| 37 | case Delta16: |
| 38 | return "Delta16" ; |
| 39 | case Delta8: |
| 40 | return "Delta8" ; |
| 41 | case NegDelta64: |
| 42 | return "NegDelta64" ; |
| 43 | case NegDelta32: |
| 44 | return "NegDelta32" ; |
| 45 | case Size64: |
| 46 | return "Size64" ; |
| 47 | case Size32: |
| 48 | return "Size32" ; |
| 49 | case Delta64FromGOT: |
| 50 | return "Delta64FromGOT" ; |
| 51 | case PCRel32: |
| 52 | return "PCRel32" ; |
| 53 | case BranchPCRel32: |
| 54 | return "BranchPCRel32" ; |
| 55 | case BranchPCRel32ToPtrJumpStub: |
| 56 | return "BranchPCRel32ToPtrJumpStub" ; |
| 57 | case BranchPCRel32ToPtrJumpStubBypassable: |
| 58 | return "BranchPCRel32ToPtrJumpStubBypassable" ; |
| 59 | case RequestGOTAndTransformToDelta32: |
| 60 | return "RequestGOTAndTransformToDelta32" ; |
| 61 | case RequestGOTAndTransformToDelta64: |
| 62 | return "RequestGOTAndTransformToDelta64" ; |
| 63 | case RequestGOTAndTransformToDelta64FromGOT: |
| 64 | return "RequestGOTAndTransformToDelta64FromGOT" ; |
| 65 | case PCRel32GOTLoadREXRelaxable: |
| 66 | return "PCRel32GOTLoadREXRelaxable" ; |
| 67 | case RequestGOTAndTransformToPCRel32GOTLoadREXRelaxable: |
| 68 | return "RequestGOTAndTransformToPCRel32GOTLoadREXRelaxable" ; |
| 69 | case PCRel32GOTLoadRelaxable: |
| 70 | return "PCRel32GOTLoadRelaxable" ; |
| 71 | case RequestGOTAndTransformToPCRel32GOTLoadRelaxable: |
| 72 | return "RequestGOTAndTransformToPCRel32GOTLoadRelaxable" ; |
| 73 | case PCRel32TLVPLoadREXRelaxable: |
| 74 | return "PCRel32TLVPLoadREXRelaxable" ; |
| 75 | case RequestTLVPAndTransformToPCRel32TLVPLoadREXRelaxable: |
| 76 | return "RequestTLVPAndTransformToPCRel32TLVPLoadREXRelaxable" ; |
| 77 | default: |
| 78 | return getGenericEdgeKindName(K); |
| 79 | } |
| 80 | } |
| 81 | |
| 82 | const char NullPointerContent[PointerSize] = {0x00, 0x00, 0x00, 0x00, |
| 83 | 0x00, 0x00, 0x00, 0x00}; |
| 84 | |
| 85 | const char PointerJumpStubContent[6] = { |
| 86 | static_cast<char>(0xFFu), 0x25, 0x00, 0x00, 0x00, 0x00}; |
| 87 | |
| 88 | const char ReentryTrampolineContent[5] = { |
| 89 | static_cast<char>(0xe8), 0x00, 0x00, 0x00, 0x00 |
| 90 | }; |
| 91 | |
| 92 | void GOTTableManager::registerExistingEntries() { |
| 93 | for (auto *EntrySym : GOTSection->symbols()) { |
| 94 | assert(EntrySym->getBlock().edges_size() == 1 && |
| 95 | "GOT block edge count != 1" ); |
| 96 | registerPreExistingEntry(Target&: EntrySym->getBlock().edges().begin()->getTarget(), |
| 97 | Entry&: *EntrySym); |
| 98 | } |
| 99 | } |
| 100 | |
| 101 | void PLTTableManager::registerExistingEntries() { |
| 102 | for (auto *EntrySym : StubsSection->symbols()) { |
| 103 | assert(EntrySym->getBlock().edges_size() == 1 && |
| 104 | "PLT block edge count != 1" ); |
| 105 | auto &GOTSym = EntrySym->getBlock().edges().begin()->getTarget(); |
| 106 | assert(GOTSym.getBlock().edges_size() == 1 && "GOT block edge count != 1" ); |
| 107 | registerPreExistingEntry(Target&: GOTSym.getBlock().edges().begin()->getTarget(), |
| 108 | Entry&: *EntrySym); |
| 109 | } |
| 110 | } |
| 111 | |
| 112 | Error optimizeGOTAndStubAccesses(LinkGraph &G) { |
| 113 | LLVM_DEBUG(dbgs() << "Optimizing GOT entries and stubs:\n" ); |
| 114 | |
| 115 | for (auto *B : G.blocks()) |
| 116 | for (auto &E : B->edges()) { |
| 117 | if (E.getKind() == x86_64::PCRel32GOTLoadRelaxable || |
| 118 | E.getKind() == x86_64::PCRel32GOTLoadREXRelaxable) { |
| 119 | #ifndef NDEBUG |
| 120 | bool REXPrefix = E.getKind() == x86_64::PCRel32GOTLoadREXRelaxable; |
| 121 | assert(E.getOffset() >= (REXPrefix ? 3u : 2u) && |
| 122 | "GOT edge occurs too early in block" ); |
| 123 | #endif |
| 124 | auto *FixupData = reinterpret_cast<uint8_t *>( |
| 125 | const_cast<char *>(B->getContent().data())) + |
| 126 | E.getOffset(); |
| 127 | const uint8_t Op = FixupData[-2]; |
| 128 | const uint8_t ModRM = FixupData[-1]; |
| 129 | |
| 130 | auto &GOTEntryBlock = E.getTarget().getBlock(); |
| 131 | assert(GOTEntryBlock.getSize() == G.getPointerSize() && |
| 132 | "GOT entry block should be pointer sized" ); |
| 133 | assert(GOTEntryBlock.edges_size() == 1 && |
| 134 | "GOT entry should only have one outgoing edge" ); |
| 135 | auto &GOTTarget = GOTEntryBlock.edges().begin()->getTarget(); |
| 136 | orc::ExecutorAddr TargetAddr = GOTTarget.getAddress(); |
| 137 | orc::ExecutorAddr EdgeAddr = B->getFixupAddress(E); |
| 138 | int64_t Displacement = TargetAddr - EdgeAddr + 4; |
| 139 | bool TargetInRangeForImmU32 = isUInt<32>(x: TargetAddr.getValue()); |
| 140 | bool DisplacementInRangeForImmS32 = isInt<32>(x: Displacement); |
| 141 | |
| 142 | // If both of the Target and displacement is out of range, then |
| 143 | // there isn't optimization chance. |
| 144 | if (!(TargetInRangeForImmU32 || DisplacementInRangeForImmS32)) |
| 145 | continue; |
| 146 | |
| 147 | // Transform "mov foo@GOTPCREL(%rip),%reg" to "lea foo(%rip),%reg". |
| 148 | if (Op == 0x8b && DisplacementInRangeForImmS32) { |
| 149 | FixupData[-2] = 0x8d; |
| 150 | E.setKind(x86_64::Delta32); |
| 151 | E.setTarget(GOTTarget); |
| 152 | E.setAddend(E.getAddend() - 4); |
| 153 | LLVM_DEBUG({ |
| 154 | dbgs() << " Replaced GOT load wih LEA:\n " ; |
| 155 | printEdge(dbgs(), *B, E, getEdgeKindName(E.getKind())); |
| 156 | dbgs() << "\n" ; |
| 157 | }); |
| 158 | continue; |
| 159 | } |
| 160 | |
| 161 | // Transform call/jmp instructions |
| 162 | if (Op == 0xff && TargetInRangeForImmU32) { |
| 163 | if (ModRM == 0x15) { |
| 164 | // ABI says we can convert "call *foo@GOTPCREL(%rip)" to "nop; call |
| 165 | // foo" But lld convert it to "addr32 call foo, because that makes |
| 166 | // result expression to be a single instruction. |
| 167 | FixupData[-2] = 0x67; |
| 168 | FixupData[-1] = 0xe8; |
| 169 | LLVM_DEBUG({ |
| 170 | dbgs() << " replaced call instruction's memory operand wih imm " |
| 171 | "operand:\n " ; |
| 172 | printEdge(dbgs(), *B, E, getEdgeKindName(E.getKind())); |
| 173 | dbgs() << "\n" ; |
| 174 | }); |
| 175 | } else { |
| 176 | // Transform "jmp *foo@GOTPCREL(%rip)" to "jmp foo; nop" |
| 177 | assert(ModRM == 0x25 && "Invalid ModRm for call/jmp instructions" ); |
| 178 | FixupData[-2] = 0xe9; |
| 179 | FixupData[3] = 0x90; |
| 180 | E.setOffset(E.getOffset() - 1); |
| 181 | LLVM_DEBUG({ |
| 182 | dbgs() << " replaced jmp instruction's memory operand wih imm " |
| 183 | "operand:\n " ; |
| 184 | printEdge(dbgs(), *B, E, getEdgeKindName(E.getKind())); |
| 185 | dbgs() << "\n" ; |
| 186 | }); |
| 187 | } |
| 188 | E.setKind(x86_64::Pointer32); |
| 189 | E.setTarget(GOTTarget); |
| 190 | continue; |
| 191 | } |
| 192 | } else if (E.getKind() == x86_64::BranchPCRel32ToPtrJumpStubBypassable) { |
| 193 | auto &StubBlock = E.getTarget().getBlock(); |
| 194 | assert(StubBlock.getSize() == sizeof(PointerJumpStubContent) && |
| 195 | "Stub block should be stub sized" ); |
| 196 | assert(StubBlock.edges_size() == 1 && |
| 197 | "Stub block should only have one outgoing edge" ); |
| 198 | |
| 199 | auto &GOTBlock = StubBlock.edges().begin()->getTarget().getBlock(); |
| 200 | assert(GOTBlock.getSize() == G.getPointerSize() && |
| 201 | "GOT block should be pointer sized" ); |
| 202 | assert(GOTBlock.edges_size() == 1 && |
| 203 | "GOT block should only have one outgoing edge" ); |
| 204 | |
| 205 | auto &GOTTarget = GOTBlock.edges().begin()->getTarget(); |
| 206 | orc::ExecutorAddr EdgeAddr = B->getAddress() + E.getOffset(); |
| 207 | orc::ExecutorAddr TargetAddr = GOTTarget.getAddress(); |
| 208 | |
| 209 | int64_t Displacement = TargetAddr - EdgeAddr + 4; |
| 210 | if (isInt<32>(x: Displacement)) { |
| 211 | E.setKind(x86_64::BranchPCRel32); |
| 212 | E.setTarget(GOTTarget); |
| 213 | LLVM_DEBUG({ |
| 214 | dbgs() << " Replaced stub branch with direct branch:\n " ; |
| 215 | printEdge(dbgs(), *B, E, getEdgeKindName(E.getKind())); |
| 216 | dbgs() << "\n" ; |
| 217 | }); |
| 218 | } |
| 219 | } |
| 220 | } |
| 221 | |
| 222 | return Error::success(); |
| 223 | } |
| 224 | |
| 225 | } // end namespace x86_64 |
| 226 | } // end namespace jitlink |
| 227 | } // end namespace llvm |
| 228 | |