| 1 | //===- OutputSegment.cpp --------------------------------------------------===// |
| 2 | // |
| 3 | // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. |
| 4 | // See https://llvm.org/LICENSE.txt for license information. |
| 5 | // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception |
| 6 | // |
| 7 | //===----------------------------------------------------------------------===// |
| 8 | |
| 9 | #include "OutputSegment.h" |
| 10 | #include "ConcatOutputSection.h" |
| 11 | #include "InputSection.h" |
| 12 | #include "Sections.h" |
| 13 | #include "Symbols.h" |
| 14 | #include "SyntheticSections.h" |
| 15 | |
| 16 | #include "lld/Common/Memory.h" |
| 17 | #include "llvm/ADT/StringSwitch.h" |
| 18 | #include "llvm/BinaryFormat/MachO.h" |
| 19 | |
| 20 | using namespace llvm; |
| 21 | using namespace llvm::MachO; |
| 22 | using namespace lld; |
| 23 | using namespace lld::macho; |
| 24 | |
| 25 | static uint32_t initProt(StringRef name) { |
| 26 | auto it = find_if( |
| 27 | Range&: config->segmentProtections, |
| 28 | P: [&](const SegmentProtection &segprot) { return segprot.name == name; }); |
| 29 | if (it != config->segmentProtections.end()) |
| 30 | return it->initProt; |
| 31 | |
| 32 | if (name == segment_names::text) |
| 33 | return VM_PROT_READ | VM_PROT_EXECUTE; |
| 34 | if (name == segment_names::pageZero) |
| 35 | return 0; |
| 36 | if (name == segment_names::linkEdit) |
| 37 | return VM_PROT_READ; |
| 38 | return VM_PROT_READ | VM_PROT_WRITE; |
| 39 | } |
| 40 | |
| 41 | static uint32_t maxProt(StringRef name) { |
| 42 | assert(config->arch() != AK_i386 && |
| 43 | "TODO: i386 has different maxProt requirements" ); |
| 44 | auto it = find_if( |
| 45 | Range&: config->segmentProtections, |
| 46 | P: [&](const SegmentProtection &segprot) { return segprot.name == name; }); |
| 47 | if (it != config->segmentProtections.end()) |
| 48 | return it->maxProt; |
| 49 | |
| 50 | return initProt(name); |
| 51 | } |
| 52 | |
| 53 | static uint32_t flags(StringRef name) { |
| 54 | // If we ever implement shared cache output support, SG_READ_ONLY should not |
| 55 | // be used for dylibs that can be placed in it. |
| 56 | return name == segment_names::dataConst ? (uint32_t)SG_READ_ONLY : 0; |
| 57 | } |
| 58 | |
| 59 | size_t OutputSegment::numNonHiddenSections() const { |
| 60 | size_t count = 0; |
| 61 | for (const OutputSection *osec : sections) |
| 62 | count += (!osec->isHidden() ? 1 : 0); |
| 63 | return count; |
| 64 | } |
| 65 | |
| 66 | void OutputSegment::addOutputSection(OutputSection *osec) { |
| 67 | inputOrder = std::min(a: inputOrder, b: osec->inputOrder); |
| 68 | |
| 69 | osec->parent = this; |
| 70 | sections.push_back(x: osec); |
| 71 | |
| 72 | for (const SectionAlign §Align : config->sectionAlignments) |
| 73 | if (sectAlign.segName == name && sectAlign.sectName == osec->name) |
| 74 | osec->align = sectAlign.align; |
| 75 | } |
| 76 | |
/// Builds a "less than" comparator over values of type `T` that compares the
/// keys produced by `ord` instead of the values themselves.
///
/// `ord` is copied into the returned closure, so the comparator may outlive
/// the argument passed here.
template <typename T, typename F> static auto compareByOrder(F ord) {
  return [ord](T lhs, T rhs) { return ord(lhs) < ord(rhs); };
}
| 80 | |
| 81 | static int segmentOrder(OutputSegment *seg) { |
| 82 | return StringSwitch<int>(seg->name) |
| 83 | .Case(S: segment_names::pageZero, Value: -4) |
| 84 | .Case(S: segment_names::text, Value: -3) |
| 85 | .Case(S: segment_names::dataConst, Value: -2) |
| 86 | .Case(S: segment_names::data, Value: -1) |
| 87 | .Case(S: segment_names::llvm, Value: std::numeric_limits<int>::max() - 1) |
| 88 | // Make sure __LINKEDIT is the last segment (i.e. all its hidden |
| 89 | // sections must be ordered after other sections). |
| 90 | .Case(S: segment_names::linkEdit, Value: std::numeric_limits<int>::max()) |
| 91 | .Default(Value: seg->inputOrder); |
| 92 | } |
| 93 | |
| 94 | static int sectionOrder(OutputSection *osec) { |
| 95 | StringRef segname = osec->parent->name; |
| 96 | // Sections are uniquely identified by their segment + section name. |
| 97 | if (segname == segment_names::text) { |
| 98 | if (osec->name == section_names::header) |
| 99 | return -7; |
| 100 | // `__text` needs to precede the other code sections since its |
| 101 | // expected to be the largest. This means in effect that it will |
| 102 | // be the section that determines whether we need thunks or not. |
| 103 | if (osec->name == section_names::text) |
| 104 | return -6; |
| 105 | |
| 106 | // Prioritize specific section ordering based on our knowledge. This ensures |
| 107 | // that certain sections are placed in a particular order, even if they |
| 108 | // are also categorized as code sections. This explicit ordering takes |
| 109 | // precedence over the general code section ordering. |
| 110 | int knownPriority = |
| 111 | StringSwitch<int>(osec->name) |
| 112 | .Case(S: section_names::stubs, Value: -4) |
| 113 | .Case(S: section_names::stubHelper, Value: -3) |
| 114 | .Case(S: section_names::objcStubs, Value: -2) |
| 115 | .Case(S: section_names::initOffsets, Value: -1) |
| 116 | .Case(S: section_names::unwindInfo, |
| 117 | Value: std::numeric_limits<int>::max() - 1) |
| 118 | .Case(S: section_names::ehFrame, Value: std::numeric_limits<int>::max()) |
| 119 | .Default(Value: 0); |
| 120 | |
| 121 | if (knownPriority != 0) |
| 122 | return knownPriority; |
| 123 | |
| 124 | // Ensure all code sections are contiguous with `__text` for thunk |
| 125 | // calculations. |
| 126 | if (sections::isCodeSection(name: osec->name, segName: segment_names::text, flags: osec->flags)) { |
| 127 | return -5; |
| 128 | } |
| 129 | |
| 130 | return osec->inputOrder; |
| 131 | } else if (segname == segment_names::data || |
| 132 | segname == segment_names::dataConst) { |
| 133 | // For each thread spawned, dyld will initialize its TLVs by copying the |
| 134 | // address range from the start of the first thread-local data section to |
| 135 | // the end of the last one. We therefore arrange these sections contiguously |
| 136 | // to minimize the amount of memory used. Additionally, since zerofill |
| 137 | // sections must be at the end of their segments, and since TLV data |
| 138 | // sections can be zerofills, we end up putting all TLV data sections at the |
| 139 | // end of the segment. |
| 140 | switch (sectionType(flags: osec->flags)) { |
| 141 | case S_THREAD_LOCAL_VARIABLE_POINTERS: |
| 142 | return std::numeric_limits<int>::max() - 3; |
| 143 | case S_THREAD_LOCAL_REGULAR: |
| 144 | return std::numeric_limits<int>::max() - 2; |
| 145 | case S_THREAD_LOCAL_ZEROFILL: |
| 146 | return std::numeric_limits<int>::max() - 1; |
| 147 | case S_ZEROFILL: |
| 148 | return std::numeric_limits<int>::max(); |
| 149 | default: |
| 150 | return StringSwitch<int>(osec->name) |
| 151 | .Case(S: section_names::got, Value: -3) |
| 152 | .Case(S: section_names::lazySymbolPtr, Value: -2) |
| 153 | .Case(S: section_names::const_, Value: -1) |
| 154 | .Default(Value: osec->inputOrder); |
| 155 | } |
| 156 | } else if (segname == segment_names::linkEdit) { |
| 157 | return StringSwitch<int>(osec->name) |
| 158 | .Case(S: section_names::chainFixups, Value: -11) |
| 159 | .Case(S: section_names::rebase, Value: -10) |
| 160 | .Case(S: section_names::binding, Value: -9) |
| 161 | .Case(S: section_names::weakBinding, Value: -8) |
| 162 | .Case(S: section_names::lazyBinding, Value: -7) |
| 163 | .Case(S: section_names::export_, Value: -6) |
| 164 | .Case(S: section_names::functionStarts, Value: -5) |
| 165 | .Case(S: section_names::dataInCode, Value: -4) |
| 166 | .Case(S: section_names::symbolTable, Value: -3) |
| 167 | .Case(S: section_names::indirectSymbolTable, Value: -2) |
| 168 | .Case(S: section_names::stringTable, Value: -1) |
| 169 | .Case(S: section_names::codeSignature, Value: std::numeric_limits<int>::max()) |
| 170 | .Default(Value: osec->inputOrder); |
| 171 | } |
| 172 | // ZeroFill sections must always be the at the end of their segments: |
| 173 | // dyld checks if a segment's file size is smaller than its in-memory |
| 174 | // size to detect if a segment has zerofill sections, and if so it maps |
| 175 | // the missing tail as zerofill. |
| 176 | if (sectionType(flags: osec->flags) == S_ZEROFILL) |
| 177 | return std::numeric_limits<int>::max(); |
| 178 | return osec->inputOrder; |
| 179 | } |
| 180 | |
| 181 | void OutputSegment::sortOutputSections() { |
| 182 | // Must be stable_sort() to keep special sections such as |
| 183 | // S_THREAD_LOCAL_REGULAR in input order. |
| 184 | llvm::stable_sort(Range&: sections, C: compareByOrder<OutputSection *>(ord: sectionOrder)); |
| 185 | } |
| 186 | |
| 187 | void OutputSegment::assignAddressesToStartEndSymbols() { |
| 188 | for (Defined *d : segmentStartSymbols) |
| 189 | d->value = addr; |
| 190 | for (Defined *d : segmentEndSymbols) |
| 191 | d->value = addr + vmSize; |
| 192 | } |
| 193 | |
| 194 | void macho::sortOutputSegments() { |
| 195 | llvm::stable_sort(Range&: outputSegments, |
| 196 | C: compareByOrder<OutputSegment *>(ord: segmentOrder)); |
| 197 | } |
| 198 | |
| 199 | static DenseMap<StringRef, OutputSegment *> nameToOutputSegment; |
| 200 | std::vector<OutputSegment *> macho::outputSegments; |
| 201 | |
| 202 | void macho::resetOutputSegments() { |
| 203 | outputSegments.clear(); |
| 204 | nameToOutputSegment.clear(); |
| 205 | } |
| 206 | |
| 207 | static StringRef maybeRenameSegment(StringRef name) { |
| 208 | auto newName = config->segmentRenameMap.find(Val: name); |
| 209 | if (newName != config->segmentRenameMap.end()) |
| 210 | return newName->second; |
| 211 | return name; |
| 212 | } |
| 213 | |
| 214 | OutputSegment *macho::getOrCreateOutputSegment(StringRef name) { |
| 215 | name = maybeRenameSegment(name); |
| 216 | |
| 217 | OutputSegment *&segRef = nameToOutputSegment[name]; |
| 218 | if (segRef) |
| 219 | return segRef; |
| 220 | |
| 221 | segRef = make<OutputSegment>(); |
| 222 | segRef->name = name; |
| 223 | segRef->maxProt = maxProt(name); |
| 224 | segRef->initProt = initProt(name); |
| 225 | segRef->flags = flags(name); |
| 226 | |
| 227 | outputSegments.push_back(x: segRef); |
| 228 | return segRef; |
| 229 | } |
| 230 | |