1 | //===-- ARMMachObjectWriter.cpp - ARM Mach Object Writer ------------------===// |
2 | // |
3 | // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. |
4 | // See https://llvm.org/LICENSE.txt for license information. |
5 | // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception |
6 | // |
7 | //===----------------------------------------------------------------------===// |
8 | |
9 | #include "MCTargetDesc/ARMBaseInfo.h" |
10 | #include "MCTargetDesc/ARMFixupKinds.h" |
11 | #include "MCTargetDesc/ARMMCTargetDesc.h" |
12 | #include "llvm/ADT/StringExtras.h" |
13 | #include "llvm/ADT/Twine.h" |
14 | #include "llvm/BinaryFormat/MachO.h" |
15 | #include "llvm/MC/MCAssembler.h" |
16 | #include "llvm/MC/MCContext.h" |
17 | #include "llvm/MC/MCExpr.h" |
18 | #include "llvm/MC/MCFixup.h" |
19 | #include "llvm/MC/MCFixupKindInfo.h" |
20 | #include "llvm/MC/MCMachObjectWriter.h" |
21 | #include "llvm/MC/MCSection.h" |
22 | #include "llvm/MC/MCValue.h" |
23 | #include "llvm/Support/ErrorHandling.h" |
24 | |
25 | using namespace llvm; |
26 | |
27 | namespace { |
28 | class ARMMachObjectWriter : public MCMachObjectTargetWriter { |
29 | void recordARMScatteredRelocation(MachObjectWriter *Writer, |
30 | const MCAssembler &Asm, |
31 | const MCFragment *Fragment, |
32 | const MCFixup &Fixup, MCValue Target, |
33 | unsigned Type, unsigned Log2Size, |
34 | uint64_t &FixedValue); |
35 | void recordARMScatteredHalfRelocation(MachObjectWriter *Writer, |
36 | const MCAssembler &Asm, |
37 | const MCFragment *Fragment, |
38 | const MCFixup &Fixup, MCValue Target, |
39 | uint64_t &FixedValue); |
40 | |
41 | bool requiresExternRelocation(MachObjectWriter *Writer, |
42 | const MCAssembler &Asm, |
43 | const MCFragment &Fragment, unsigned RelocType, |
44 | const MCSymbol &S, uint64_t FixedValue); |
45 | |
46 | public: |
47 | ARMMachObjectWriter(bool Is64Bit, uint32_t CPUType, uint32_t CPUSubtype) |
48 | : MCMachObjectTargetWriter(Is64Bit, CPUType, CPUSubtype) {} |
49 | |
50 | void recordRelocation(MachObjectWriter *Writer, MCAssembler &Asm, |
51 | const MCFragment *Fragment, const MCFixup &Fixup, |
52 | MCValue Target, uint64_t &FixedValue) override; |
53 | }; |
54 | } |
55 | |
56 | static bool getARMFixupKindMachOInfo(unsigned Kind, unsigned &RelocType, |
57 | unsigned &Log2Size) { |
58 | RelocType = unsigned(MachO::ARM_RELOC_VANILLA); |
59 | Log2Size = ~0U; |
60 | |
61 | switch (Kind) { |
62 | default: |
63 | return false; |
64 | |
65 | case FK_Data_1: |
66 | Log2Size = llvm::Log2_32(Value: 1); |
67 | return true; |
68 | case FK_Data_2: |
69 | Log2Size = llvm::Log2_32(Value: 2); |
70 | return true; |
71 | case FK_Data_4: |
72 | Log2Size = llvm::Log2_32(Value: 4); |
73 | return true; |
74 | case FK_Data_8: |
75 | Log2Size = llvm::Log2_32(Value: 8); |
76 | return false; |
77 | |
78 | // These fixups are expected to always be resolvable at assembly time and |
79 | // have no relocations supported. |
80 | case ARM::fixup_arm_ldst_pcrel_12: |
81 | case ARM::fixup_arm_pcrel_10: |
82 | case ARM::fixup_arm_adr_pcrel_12: |
83 | case ARM::fixup_arm_thumb_br: |
84 | return false; |
85 | |
86 | // Handle 24-bit branch kinds. |
87 | case ARM::fixup_arm_condbranch: |
88 | case ARM::fixup_arm_uncondbranch: |
89 | case ARM::fixup_arm_uncondbl: |
90 | case ARM::fixup_arm_condbl: |
91 | case ARM::fixup_arm_blx: |
92 | RelocType = unsigned(MachO::ARM_RELOC_BR24); |
93 | // Report as 'long', even though that is not quite accurate. |
94 | Log2Size = llvm::Log2_32(Value: 4); |
95 | return true; |
96 | |
97 | case ARM::fixup_t2_uncondbranch: |
98 | case ARM::fixup_arm_thumb_bl: |
99 | case ARM::fixup_arm_thumb_blx: |
100 | RelocType = unsigned(MachO::ARM_THUMB_RELOC_BR22); |
101 | Log2Size = llvm::Log2_32(Value: 4); |
102 | return true; |
103 | |
104 | // For movw/movt r_type relocations they always have a pair following them and |
105 | // the r_length bits are used differently. The encoding of the r_length is as |
106 | // follows: |
107 | // low bit of r_length: |
108 | // 0 - :lower16: for movw instructions |
109 | // 1 - :upper16: for movt instructions |
110 | // high bit of r_length: |
111 | // 0 - arm instructions |
112 | // 1 - thumb instructions |
113 | case ARM::fixup_arm_movt_hi16: |
114 | RelocType = unsigned(MachO::ARM_RELOC_HALF); |
115 | Log2Size = 1; |
116 | return true; |
117 | case ARM::fixup_t2_movt_hi16: |
118 | RelocType = unsigned(MachO::ARM_RELOC_HALF); |
119 | Log2Size = 3; |
120 | return true; |
121 | |
122 | case ARM::fixup_arm_movw_lo16: |
123 | RelocType = unsigned(MachO::ARM_RELOC_HALF); |
124 | Log2Size = 0; |
125 | return true; |
126 | case ARM::fixup_t2_movw_lo16: |
127 | RelocType = unsigned(MachO::ARM_RELOC_HALF); |
128 | Log2Size = 2; |
129 | return true; |
130 | } |
131 | } |
132 | |
133 | void ARMMachObjectWriter::recordARMScatteredHalfRelocation( |
134 | MachObjectWriter *Writer, const MCAssembler &Asm, |
135 | const MCFragment *Fragment, const MCFixup &Fixup, MCValue Target, |
136 | uint64_t &FixedValue) { |
137 | uint32_t FixupOffset = Asm.getFragmentOffset(F: *Fragment) + Fixup.getOffset(); |
138 | |
139 | if (FixupOffset & 0xff000000) { |
140 | Asm.getContext().reportError(L: Fixup.getLoc(), |
141 | Msg: "can not encode offset '0x" + |
142 | utohexstr(X: FixupOffset) + |
143 | "' in resulting scattered relocation." ); |
144 | return; |
145 | } |
146 | |
147 | unsigned IsPCRel = Writer->isFixupKindPCRel(Asm, Kind: Fixup.getKind()); |
148 | unsigned Type = MachO::ARM_RELOC_HALF; |
149 | |
150 | // See <reloc.h>. |
151 | const MCSymbol *A = &Target.getSymA()->getSymbol(); |
152 | |
153 | if (!A->getFragment()) { |
154 | Asm.getContext().reportError(L: Fixup.getLoc(), |
155 | Msg: "symbol '" + A->getName() + |
156 | "' can not be undefined in a subtraction expression" ); |
157 | return; |
158 | } |
159 | |
160 | uint32_t Value = Writer->getSymbolAddress(S: *A, Asm); |
161 | uint32_t Value2 = 0; |
162 | uint64_t SecAddr = Writer->getSectionAddress(Sec: A->getFragment()->getParent()); |
163 | FixedValue += SecAddr; |
164 | |
165 | if (const MCSymbolRefExpr *B = Target.getSymB()) { |
166 | const MCSymbol *SB = &B->getSymbol(); |
167 | |
168 | if (!SB->getFragment()) { |
169 | Asm.getContext().reportError(L: Fixup.getLoc(), |
170 | Msg: "symbol '" + B->getSymbol().getName() + |
171 | "' can not be undefined in a subtraction expression" ); |
172 | return; |
173 | } |
174 | |
175 | // Select the appropriate difference relocation type. |
176 | Type = MachO::ARM_RELOC_HALF_SECTDIFF; |
177 | Value2 = Writer->getSymbolAddress(S: B->getSymbol(), Asm); |
178 | FixedValue -= Writer->getSectionAddress(Sec: SB->getFragment()->getParent()); |
179 | } |
180 | |
181 | // Relocations are written out in reverse order, so the PAIR comes first. |
182 | // ARM_RELOC_HALF and ARM_RELOC_HALF_SECTDIFF abuse the r_length field: |
183 | // |
184 | // For these two r_type relocations they always have a pair following them and |
185 | // the r_length bits are used differently. The encoding of the r_length is as |
186 | // follows: |
187 | // low bit of r_length: |
188 | // 0 - :lower16: for movw instructions |
189 | // 1 - :upper16: for movt instructions |
190 | // high bit of r_length: |
191 | // 0 - arm instructions |
192 | // 1 - thumb instructions |
193 | // the other half of the relocated expression is in the following pair |
194 | // relocation entry in the low 16 bits of r_address field. |
195 | unsigned ThumbBit = 0; |
196 | unsigned MovtBit = 0; |
197 | switch (Fixup.getTargetKind()) { |
198 | default: break; |
199 | case ARM::fixup_arm_movt_hi16: |
200 | MovtBit = 1; |
201 | // The thumb bit shouldn't be set in the 'other-half' bit of the |
202 | // relocation, but it will be set in FixedValue if the base symbol |
203 | // is a thumb function. Clear it out here. |
204 | if (Asm.isThumbFunc(Func: A)) |
205 | FixedValue &= 0xfffffffe; |
206 | break; |
207 | case ARM::fixup_t2_movt_hi16: |
208 | if (Asm.isThumbFunc(Func: A)) |
209 | FixedValue &= 0xfffffffe; |
210 | MovtBit = 1; |
211 | [[fallthrough]]; |
212 | case ARM::fixup_t2_movw_lo16: |
213 | ThumbBit = 1; |
214 | break; |
215 | } |
216 | |
217 | if (Type == MachO::ARM_RELOC_HALF_SECTDIFF) { |
218 | uint32_t OtherHalf = MovtBit |
219 | ? (FixedValue & 0xffff) : ((FixedValue & 0xffff0000) >> 16); |
220 | |
221 | MachO::any_relocation_info MRE; |
222 | MRE.r_word0 = ((OtherHalf << 0) | |
223 | (MachO::ARM_RELOC_PAIR << 24) | |
224 | (MovtBit << 28) | |
225 | (ThumbBit << 29) | |
226 | (IsPCRel << 30) | |
227 | MachO::R_SCATTERED); |
228 | MRE.r_word1 = Value2; |
229 | Writer->addRelocation(RelSymbol: nullptr, Sec: Fragment->getParent(), MRE); |
230 | } |
231 | |
232 | MachO::any_relocation_info MRE; |
233 | MRE.r_word0 = ((FixupOffset << 0) | |
234 | (Type << 24) | |
235 | (MovtBit << 28) | |
236 | (ThumbBit << 29) | |
237 | (IsPCRel << 30) | |
238 | MachO::R_SCATTERED); |
239 | MRE.r_word1 = Value; |
240 | Writer->addRelocation(RelSymbol: nullptr, Sec: Fragment->getParent(), MRE); |
241 | } |
242 | |
243 | void ARMMachObjectWriter::recordARMScatteredRelocation( |
244 | MachObjectWriter *Writer, const MCAssembler &Asm, |
245 | const MCFragment *Fragment, const MCFixup &Fixup, MCValue Target, |
246 | unsigned Type, unsigned Log2Size, uint64_t &FixedValue) { |
247 | uint32_t FixupOffset = Asm.getFragmentOffset(F: *Fragment) + Fixup.getOffset(); |
248 | |
249 | if (FixupOffset & 0xff000000) { |
250 | Asm.getContext().reportError(L: Fixup.getLoc(), |
251 | Msg: "can not encode offset '0x" + |
252 | utohexstr(X: FixupOffset) + |
253 | "' in resulting scattered relocation." ); |
254 | return; |
255 | } |
256 | |
257 | unsigned IsPCRel = Writer->isFixupKindPCRel(Asm, Kind: Fixup.getKind()); |
258 | |
259 | // See <reloc.h>. |
260 | const MCSymbol *A = &Target.getSymA()->getSymbol(); |
261 | |
262 | if (!A->getFragment()) { |
263 | Asm.getContext().reportError(L: Fixup.getLoc(), |
264 | Msg: "symbol '" + A->getName() + |
265 | "' can not be undefined in a subtraction expression" ); |
266 | return; |
267 | } |
268 | |
269 | uint32_t Value = Writer->getSymbolAddress(S: *A, Asm); |
270 | uint64_t SecAddr = Writer->getSectionAddress(Sec: A->getFragment()->getParent()); |
271 | FixedValue += SecAddr; |
272 | uint32_t Value2 = 0; |
273 | |
274 | if (const MCSymbolRefExpr *B = Target.getSymB()) { |
275 | assert(Type == MachO::ARM_RELOC_VANILLA && "invalid reloc for 2 symbols" ); |
276 | const MCSymbol *SB = &B->getSymbol(); |
277 | |
278 | if (!SB->getFragment()) { |
279 | Asm.getContext().reportError(L: Fixup.getLoc(), |
280 | Msg: "symbol '" + B->getSymbol().getName() + |
281 | "' can not be undefined in a subtraction expression" ); |
282 | return; |
283 | } |
284 | |
285 | // Select the appropriate difference relocation type. |
286 | Type = MachO::ARM_RELOC_SECTDIFF; |
287 | Value2 = Writer->getSymbolAddress(S: B->getSymbol(), Asm); |
288 | FixedValue -= Writer->getSectionAddress(Sec: SB->getFragment()->getParent()); |
289 | } |
290 | |
291 | // Relocations are written out in reverse order, so the PAIR comes first. |
292 | if (Type == MachO::ARM_RELOC_SECTDIFF || |
293 | Type == MachO::ARM_RELOC_LOCAL_SECTDIFF) { |
294 | MachO::any_relocation_info MRE; |
295 | MRE.r_word0 = ((0 << 0) | |
296 | (MachO::ARM_RELOC_PAIR << 24) | |
297 | (Log2Size << 28) | |
298 | (IsPCRel << 30) | |
299 | MachO::R_SCATTERED); |
300 | MRE.r_word1 = Value2; |
301 | Writer->addRelocation(RelSymbol: nullptr, Sec: Fragment->getParent(), MRE); |
302 | } |
303 | |
304 | MachO::any_relocation_info MRE; |
305 | MRE.r_word0 = ((FixupOffset << 0) | |
306 | (Type << 24) | |
307 | (Log2Size << 28) | |
308 | (IsPCRel << 30) | |
309 | MachO::R_SCATTERED); |
310 | MRE.r_word1 = Value; |
311 | Writer->addRelocation(RelSymbol: nullptr, Sec: Fragment->getParent(), MRE); |
312 | } |
313 | |
314 | bool ARMMachObjectWriter::requiresExternRelocation(MachObjectWriter *Writer, |
315 | const MCAssembler &Asm, |
316 | const MCFragment &Fragment, |
317 | unsigned RelocType, |
318 | const MCSymbol &S, |
319 | uint64_t FixedValue) { |
320 | // Most cases can be identified purely from the symbol. |
321 | if (Writer->doesSymbolRequireExternRelocation(S)) |
322 | return true; |
323 | int64_t Value = (int64_t)FixedValue; // The displacement is signed. |
324 | int64_t Range; |
325 | switch (RelocType) { |
326 | default: |
327 | return false; |
328 | case MachO::ARM_RELOC_BR24: |
329 | // An ARM call might be to a Thumb function, in which case the offset may |
330 | // not be encodable in the instruction and we must use an external |
331 | // relocation that explicitly mentions the function. Not a problem if it's |
332 | // to a temporary "Lwhatever" symbol though, and in fact trying to use an |
333 | // external relocation there causes more issues. |
334 | if (!S.isTemporary()) |
335 | return true; |
336 | |
337 | // PC pre-adjustment of 8 for these instructions. |
338 | Value -= 8; |
339 | // ARM BL/BLX has a 25-bit offset. |
340 | Range = 0x1ffffff; |
341 | break; |
342 | case MachO::ARM_THUMB_RELOC_BR22: |
343 | // PC pre-adjustment of 4 for these instructions. |
344 | Value -= 4; |
345 | // Thumb BL/BLX has a 24-bit offset. |
346 | Range = 0xffffff; |
347 | } |
348 | // BL/BLX also use external relocations when an internal relocation |
349 | // would result in the target being out of range. This gives the linker |
350 | // enough information to generate a branch island. |
351 | Value += Writer->getSectionAddress(Sec: &S.getSection()); |
352 | Value -= Writer->getSectionAddress(Sec: Fragment.getParent()); |
353 | // If the resultant value would be out of range for an internal relocation, |
354 | // use an external instead. |
355 | if (Value > Range || Value < -(Range + 1)) |
356 | return true; |
357 | return false; |
358 | } |
359 | |
360 | void ARMMachObjectWriter::recordRelocation(MachObjectWriter *Writer, |
361 | MCAssembler &Asm, |
362 | const MCFragment *Fragment, |
363 | const MCFixup &Fixup, MCValue Target, |
364 | uint64_t &FixedValue) { |
365 | unsigned IsPCRel = Writer->isFixupKindPCRel(Asm, Kind: Fixup.getKind()); |
366 | unsigned Log2Size; |
367 | unsigned RelocType = MachO::ARM_RELOC_VANILLA; |
368 | if (!getARMFixupKindMachOInfo(Kind: Fixup.getKind(), RelocType, Log2Size)) { |
369 | // If we failed to get fixup kind info, it's because there's no legal |
370 | // relocation type for the fixup kind. This happens when it's a fixup that's |
371 | // expected to always be resolvable at assembly time and not have any |
372 | // relocations needed. |
373 | Asm.getContext().reportError(L: Fixup.getLoc(), Msg: "unsupported relocation type" ); |
374 | return; |
375 | } |
376 | |
377 | // If this is a difference or a defined symbol plus an offset, then we need a |
378 | // scattered relocation entry. Differences always require scattered |
379 | // relocations. |
380 | if (Target.getSymB()) { |
381 | if (RelocType == MachO::ARM_RELOC_HALF) |
382 | return recordARMScatteredHalfRelocation(Writer, Asm, Fragment, Fixup, |
383 | Target, FixedValue); |
384 | return recordARMScatteredRelocation(Writer, Asm, Fragment, Fixup, Target, |
385 | Type: RelocType, Log2Size, FixedValue); |
386 | } |
387 | |
388 | // Get the symbol data, if any. |
389 | const MCSymbol *A = nullptr; |
390 | if (Target.getSymA()) |
391 | A = &Target.getSymA()->getSymbol(); |
392 | |
393 | // FIXME: For other platforms, we need to use scattered relocations for |
394 | // internal relocations with offsets. If this is an internal relocation with |
395 | // an offset, it also needs a scattered relocation entry. |
396 | // |
397 | // Is this right for ARM? |
398 | uint32_t Offset = Target.getConstant(); |
399 | if (IsPCRel && RelocType == MachO::ARM_RELOC_VANILLA) |
400 | Offset += 1 << Log2Size; |
401 | if (Offset && A && !Writer->doesSymbolRequireExternRelocation(S: *A) && |
402 | RelocType != MachO::ARM_RELOC_HALF) |
403 | return recordARMScatteredRelocation(Writer, Asm, Fragment, Fixup, Target, |
404 | Type: RelocType, Log2Size, FixedValue); |
405 | |
406 | // See <reloc.h>. |
407 | uint32_t FixupOffset = Asm.getFragmentOffset(F: *Fragment) + Fixup.getOffset(); |
408 | unsigned Index = 0; |
409 | unsigned Type = 0; |
410 | const MCSymbol *RelSymbol = nullptr; |
411 | |
412 | if (!A) { // constant |
413 | // FIXME! This is Target.isAbsolute() case as we check SymB above. We check |
414 | // !A to ensure that null pointer isn't dereferenced and suppress static |
415 | // analyzer warnings. |
416 | report_fatal_error(reason: "FIXME: relocations to absolute targets " |
417 | "not yet implemented" ); |
418 | } else { |
419 | // Resolve constant variables. |
420 | if (A->isVariable()) { |
421 | int64_t Res; |
422 | if (A->getVariableValue()->evaluateAsAbsolute( |
423 | Res, Asm, Addrs: Writer->getSectionAddressMap())) { |
424 | FixedValue = Res; |
425 | return; |
426 | } |
427 | } |
428 | |
429 | // Check whether we need an external or internal relocation. |
430 | if (requiresExternRelocation(Writer, Asm, Fragment: *Fragment, RelocType, S: *A, |
431 | FixedValue)) { |
432 | RelSymbol = A; |
433 | |
434 | // For external relocations, make sure to offset the fixup value to |
435 | // compensate for the addend of the symbol address, if it was |
436 | // undefined. This occurs with weak definitions, for example. |
437 | if (!A->isUndefined()) |
438 | FixedValue -= Asm.getSymbolOffset(S: *A); |
439 | } else { |
440 | // The index is the section ordinal (1-based). |
441 | const MCSection &Sec = A->getSection(); |
442 | Index = Sec.getOrdinal() + 1; |
443 | FixedValue += Writer->getSectionAddress(Sec: &Sec); |
444 | } |
445 | if (IsPCRel) |
446 | FixedValue -= Writer->getSectionAddress(Sec: Fragment->getParent()); |
447 | |
448 | // The type is determined by the fixup kind. |
449 | Type = RelocType; |
450 | } |
451 | |
452 | // struct relocation_info (8 bytes) |
453 | MachO::any_relocation_info MRE; |
454 | MRE.r_word0 = FixupOffset; |
455 | MRE.r_word1 = |
456 | (Index << 0) | (IsPCRel << 24) | (Log2Size << 25) | (Type << 28); |
457 | |
458 | // Even when it's not a scattered relocation, movw/movt always uses |
459 | // a PAIR relocation. |
460 | if (Type == MachO::ARM_RELOC_HALF) { |
461 | // The entire addend is needed to correctly apply a relocation. One half is |
462 | // extracted from the instruction itself, the other comes from this |
463 | // PAIR. I.e. it's correct that we insert the high bits of the addend in the |
464 | // MOVW case here. relocation entries. |
465 | uint32_t Value = 0; |
466 | switch (Fixup.getTargetKind()) { |
467 | default: break; |
468 | case ARM::fixup_arm_movw_lo16: |
469 | case ARM::fixup_t2_movw_lo16: |
470 | Value = (FixedValue >> 16) & 0xffff; |
471 | break; |
472 | case ARM::fixup_arm_movt_hi16: |
473 | case ARM::fixup_t2_movt_hi16: |
474 | Value = FixedValue & 0xffff; |
475 | break; |
476 | } |
477 | MachO::any_relocation_info MREPair; |
478 | MREPair.r_word0 = Value; |
479 | MREPair.r_word1 = ((0xffffff << 0) | |
480 | (Log2Size << 25) | |
481 | (MachO::ARM_RELOC_PAIR << 28)); |
482 | |
483 | Writer->addRelocation(RelSymbol: nullptr, Sec: Fragment->getParent(), MRE&: MREPair); |
484 | } |
485 | |
486 | Writer->addRelocation(RelSymbol, Sec: Fragment->getParent(), MRE); |
487 | } |
488 | |
489 | std::unique_ptr<MCObjectTargetWriter> |
490 | llvm::createARMMachObjectWriter(bool Is64Bit, uint32_t CPUType, |
491 | uint32_t CPUSubtype) { |
492 | return std::make_unique<ARMMachObjectWriter>(args&: Is64Bit, args&: CPUType, args&: CPUSubtype); |
493 | } |
494 | |