| 1 | //===- Symbols.cpp --------------------------------------------------------===// |
| 2 | // |
| 3 | // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. |
| 4 | // See https://llvm.org/LICENSE.txt for license information. |
| 5 | // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception |
| 6 | // |
| 7 | //===----------------------------------------------------------------------===// |
| 8 | |
| 9 | #include "Symbols.h" |
| 10 | #include "Driver.h" |
| 11 | #include "InputFiles.h" |
| 12 | #include "InputSection.h" |
| 13 | #include "OutputSections.h" |
| 14 | #include "SymbolTable.h" |
| 15 | #include "SyntheticSections.h" |
| 16 | #include "Target.h" |
| 17 | #include "Writer.h" |
| 18 | #include "llvm/Demangle/Demangle.h" |
| 19 | #include "llvm/Support/Compiler.h" |
| 20 | #include <cstring> |
| 21 | |
| 22 | using namespace llvm; |
| 23 | using namespace llvm::object; |
| 24 | using namespace llvm::ELF; |
| 25 | using namespace lld; |
| 26 | using namespace lld::elf; |
| 27 | |
| 28 | static_assert(sizeof(SymbolUnion) <= 64, "SymbolUnion too large" ); |
| 29 | |
| 30 | template <typename T> struct AssertSymbol { |
| 31 | static_assert(std::is_trivially_destructible<T>(), |
| 32 | "Symbol types must be trivially destructible" ); |
| 33 | static_assert(sizeof(T) <= sizeof(SymbolUnion), "SymbolUnion too small" ); |
| 34 | static_assert(alignof(T) <= alignof(SymbolUnion), |
| 35 | "SymbolUnion not aligned enough" ); |
| 36 | }; |
| 37 | |
| 38 | LLVM_ATTRIBUTE_UNUSED static inline void assertSymbols() { |
| 39 | AssertSymbol<Defined>(); |
| 40 | AssertSymbol<CommonSymbol>(); |
| 41 | AssertSymbol<Undefined>(); |
| 42 | AssertSymbol<SharedSymbol>(); |
| 43 | AssertSymbol<LazySymbol>(); |
| 44 | } |
| 45 | |
| 46 | // Returns a symbol for an error message. |
| 47 | static std::string maybeDemangleSymbol(Ctx &ctx, StringRef symName) { |
| 48 | return ctx.arg.demangle ? demangle(MangledName: symName.str()) : symName.str(); |
| 49 | } |
| 50 | |
| 51 | std::string elf::toStr(Ctx &ctx, const elf::Symbol &sym) { |
| 52 | StringRef name = sym.getName(); |
| 53 | std::string ret = maybeDemangleSymbol(ctx, symName: name); |
| 54 | |
| 55 | const char *suffix = sym.getVersionSuffix(); |
| 56 | if (*suffix == '@') |
| 57 | ret += suffix; |
| 58 | return ret; |
| 59 | } |
| 60 | |
| 61 | const ELFSyncStream &elf::operator<<(const ELFSyncStream &s, |
| 62 | const Symbol *sym) { |
| 63 | return s << toStr(ctx&: s.ctx, sym: *sym); |
| 64 | } |
| 65 | |
| 66 | static uint64_t getSymVA(Ctx &ctx, const Symbol &sym, int64_t addend) { |
| 67 | switch (sym.kind()) { |
| 68 | case Symbol::DefinedKind: { |
| 69 | auto &d = cast<Defined>(Val: sym); |
| 70 | SectionBase *isec = d.section; |
| 71 | |
| 72 | // This is an absolute symbol. |
| 73 | if (!isec) |
| 74 | return d.value; |
| 75 | |
| 76 | assert(isec != &InputSection::discarded); |
| 77 | |
| 78 | uint64_t offset = d.value; |
| 79 | |
| 80 | // An object in an SHF_MERGE section might be referenced via a |
| 81 | // section symbol (as a hack for reducing the number of local |
| 82 | // symbols). |
| 83 | // Depending on the addend, the reference via a section symbol |
| 84 | // refers to a different object in the merge section. |
| 85 | // Since the objects in the merge section are not necessarily |
| 86 | // contiguous in the output, the addend can thus affect the final |
| 87 | // VA in a non-linear way. |
| 88 | // To make this work, we incorporate the addend into the section |
| 89 | // offset (and zero out the addend for later processing) so that |
| 90 | // we find the right object in the section. |
| 91 | if (d.isSection()) |
| 92 | offset += addend; |
| 93 | |
| 94 | // In the typical case, this is actually very simple and boils |
| 95 | // down to adding together 3 numbers: |
| 96 | // 1. The address of the output section. |
| 97 | // 2. The offset of the input section within the output section. |
| 98 | // 3. The offset within the input section (this addition happens |
| 99 | // inside InputSection::getOffset). |
| 100 | // |
| 101 | // If you understand the data structures involved with this next |
| 102 | // line (and how they get built), then you have a pretty good |
| 103 | // understanding of the linker. |
| 104 | uint64_t va = isec->getVA(offset); |
| 105 | if (d.isSection()) |
| 106 | va -= addend; |
| 107 | |
| 108 | // MIPS relocatable files can mix regular and microMIPS code. |
| 109 | // Linker needs to distinguish such code. To do so microMIPS |
| 110 | // symbols has the `STO_MIPS_MICROMIPS` flag in the `st_other` |
| 111 | // field. Unfortunately, the `MIPS::relocate()` method has |
| 112 | // a symbol value only. To pass type of the symbol (regular/microMIPS) |
| 113 | // to that routine as well as other places where we write |
| 114 | // a symbol value as-is (.dynamic section, `Elf_Ehdr::e_entry` |
| 115 | // field etc) do the same trick as compiler uses to mark microMIPS |
| 116 | // for CPU - set the less-significant bit. |
| 117 | if (ctx.arg.emachine == EM_MIPS && isMicroMips(ctx) && |
| 118 | ((sym.stOther & STO_MIPS_MICROMIPS) || sym.hasFlag(bit: NEEDS_COPY))) |
| 119 | va |= 1; |
| 120 | |
| 121 | if (d.isTls() && !ctx.arg.relocatable) { |
| 122 | // Use the address of the TLS segment's first section rather than the |
| 123 | // segment's address, because segment addresses aren't initialized until |
| 124 | // after sections are finalized. (e.g. Measuring the size of .rela.dyn |
| 125 | // for Android relocation packing requires knowing TLS symbol addresses |
| 126 | // during section finalization.) |
| 127 | if (!ctx.tlsPhdr || !ctx.tlsPhdr->firstSec) { |
| 128 | Err(ctx) << d.file |
| 129 | << " has an STT_TLS symbol but doesn't have a PT_TLS segment" ; |
| 130 | return 0; |
| 131 | } |
| 132 | return va - ctx.tlsPhdr->firstSec->addr; |
| 133 | } |
| 134 | return va; |
| 135 | } |
| 136 | case Symbol::SharedKind: |
| 137 | case Symbol::UndefinedKind: |
| 138 | return 0; |
| 139 | case Symbol::LazyKind: |
| 140 | llvm_unreachable("lazy symbol reached writer" ); |
| 141 | case Symbol::CommonKind: |
| 142 | llvm_unreachable("common symbol reached writer" ); |
| 143 | case Symbol::PlaceholderKind: |
| 144 | llvm_unreachable("placeholder symbol reached writer" ); |
| 145 | } |
| 146 | llvm_unreachable("invalid symbol kind" ); |
| 147 | } |
| 148 | |
| 149 | uint64_t Symbol::getVA(Ctx &ctx, int64_t addend) const { |
| 150 | return getSymVA(ctx, sym: *this, addend) + addend; |
| 151 | } |
| 152 | |
| 153 | uint64_t Symbol::getGotVA(Ctx &ctx) const { |
| 154 | if (gotInIgot) |
| 155 | return ctx.in.igotPlt->getVA() + getGotPltOffset(ctx); |
| 156 | return ctx.in.got->getVA() + getGotOffset(ctx); |
| 157 | } |
| 158 | |
| 159 | uint64_t Symbol::getGotOffset(Ctx &ctx) const { |
| 160 | return getGotIdx(ctx) * ctx.target->gotEntrySize; |
| 161 | } |
| 162 | |
| 163 | uint64_t Symbol::getGotPltVA(Ctx &ctx) const { |
| 164 | if (isInIplt) |
| 165 | return ctx.in.igotPlt->getVA() + getGotPltOffset(ctx); |
| 166 | return ctx.in.gotPlt->getVA() + getGotPltOffset(ctx); |
| 167 | } |
| 168 | |
| 169 | uint64_t Symbol::getGotPltOffset(Ctx &ctx) const { |
| 170 | if (isInIplt) |
| 171 | return getPltIdx(ctx) * ctx.target->gotEntrySize; |
| 172 | return (getPltIdx(ctx) + ctx.target->gotPltHeaderEntriesNum) * |
| 173 | ctx.target->gotEntrySize; |
| 174 | } |
| 175 | |
| 176 | uint64_t Symbol::getPltVA(Ctx &ctx) const { |
| 177 | uint64_t outVA = isInIplt ? ctx.in.iplt->getVA() + |
| 178 | getPltIdx(ctx) * ctx.target->ipltEntrySize |
| 179 | : ctx.in.plt->getVA() + ctx.in.plt->headerSize + |
| 180 | getPltIdx(ctx) * ctx.target->pltEntrySize; |
| 181 | |
| 182 | // While linking microMIPS code PLT code are always microMIPS |
| 183 | // code. Set the less-significant bit to track that fact. |
| 184 | // See detailed comment in the `getSymVA` function. |
| 185 | if (ctx.arg.emachine == EM_MIPS && isMicroMips(ctx)) |
| 186 | outVA |= 1; |
| 187 | return outVA; |
| 188 | } |
| 189 | |
| 190 | uint64_t Symbol::getSize() const { |
| 191 | if (const auto *dr = dyn_cast<Defined>(Val: this)) |
| 192 | return dr->size; |
| 193 | return cast<SharedSymbol>(Val: this)->size; |
| 194 | } |
| 195 | |
| 196 | OutputSection *Symbol::getOutputSection() const { |
| 197 | if (auto *s = dyn_cast<Defined>(Val: this)) { |
| 198 | if (auto *sec = s->section) |
| 199 | return sec->getOutputSection(); |
| 200 | return nullptr; |
| 201 | } |
| 202 | return nullptr; |
| 203 | } |
| 204 | |
| 205 | // If a symbol name contains '@', the characters after that is |
| 206 | // a symbol version name. This function parses that. |
| 207 | void Symbol::parseSymbolVersion(Ctx &ctx) { |
| 208 | // Return if localized by a local: pattern in a version script. |
| 209 | if (versionId == VER_NDX_LOCAL) |
| 210 | return; |
| 211 | StringRef s = getName(); |
| 212 | size_t pos = s.find(C: '@'); |
| 213 | if (pos == StringRef::npos) |
| 214 | return; |
| 215 | StringRef verstr = s.substr(Start: pos + 1); |
| 216 | |
| 217 | // Truncate the symbol name so that it doesn't include the version string. |
| 218 | nameSize = pos; |
| 219 | |
| 220 | if (verstr.empty()) |
| 221 | return; |
| 222 | |
| 223 | // If this is not in this DSO, it is not a definition. |
| 224 | if (!isDefined()) |
| 225 | return; |
| 226 | |
| 227 | // '@@' in a symbol name means the default version. |
| 228 | // It is usually the most recent one. |
| 229 | bool isDefault = (verstr[0] == '@'); |
| 230 | if (isDefault) |
| 231 | verstr = verstr.substr(Start: 1); |
| 232 | |
| 233 | for (const VersionDefinition &ver : namedVersionDefs(ctx)) { |
| 234 | if (ver.name != verstr) |
| 235 | continue; |
| 236 | |
| 237 | if (isDefault) |
| 238 | versionId = ver.id; |
| 239 | else |
| 240 | versionId = ver.id | VERSYM_HIDDEN; |
| 241 | return; |
| 242 | } |
| 243 | |
| 244 | // It is an error if the specified version is not defined. |
| 245 | // Usually version script is not provided when linking executable, |
| 246 | // but we may still want to override a versioned symbol from DSO, |
| 247 | // so we do not report error in this case. We also do not error |
| 248 | // if the symbol has a local version as it won't be in the dynamic |
| 249 | // symbol table. |
| 250 | if (ctx.arg.shared && versionId != VER_NDX_LOCAL) |
| 251 | ErrAlways(ctx) << file << ": symbol " << s << " has undefined version " |
| 252 | << verstr; |
| 253 | } |
| 254 | |
| 255 | void Symbol::(Ctx &ctx) const { |
| 256 | assert(file->lazy); |
| 257 | file->lazy = false; |
| 258 | parseFile(ctx, file); |
| 259 | } |
| 260 | |
| 261 | uint8_t Symbol::computeBinding(Ctx &ctx) const { |
| 262 | auto v = visibility(); |
| 263 | if ((v != STV_DEFAULT && v != STV_PROTECTED) || versionId == VER_NDX_LOCAL) |
| 264 | return STB_LOCAL; |
| 265 | if (binding == STB_GNU_UNIQUE && !ctx.arg.gnuUnique) |
| 266 | return STB_GLOBAL; |
| 267 | return binding; |
| 268 | } |
| 269 | |
| 270 | // Print out a log message for --trace-symbol. |
| 271 | void elf::printTraceSymbol(const Symbol &sym, StringRef name) { |
| 272 | std::string s; |
| 273 | if (sym.isUndefined()) |
| 274 | s = ": reference to " ; |
| 275 | else if (sym.isLazy()) |
| 276 | s = ": lazy definition of " ; |
| 277 | else if (sym.isShared()) |
| 278 | s = ": shared definition of " ; |
| 279 | else if (sym.isCommon()) |
| 280 | s = ": common definition of " ; |
| 281 | else |
| 282 | s = ": definition of " ; |
| 283 | |
| 284 | Msg(ctx&: sym.file->ctx) << sym.file << s << name; |
| 285 | } |
| 286 | |
| 287 | static void (Ctx &ctx, const InputFile *reference, |
| 288 | const InputFile &, const Symbol &sym) { |
| 289 | ctx.whyExtractRecords.emplace_back(Args: toStr(ctx, f: reference), Args: &extracted, Args: sym); |
| 290 | } |
| 291 | |
| 292 | void elf::maybeWarnUnorderableSymbol(Ctx &ctx, const Symbol *sym) { |
| 293 | if (!ctx.arg.warnSymbolOrdering) |
| 294 | return; |
| 295 | |
| 296 | // If UnresolvedPolicy::Ignore is used, no "undefined symbol" error/warning is |
| 297 | // emitted. It makes sense to not warn on undefined symbols (excluding those |
| 298 | // demoted by demoteSymbols). |
| 299 | // |
| 300 | // Note, ld.bfd --symbol-ordering-file= does not warn on undefined symbols, |
| 301 | // but we don't have to be compatible here. |
| 302 | if (sym->isUndefined() && !cast<Undefined>(Val: sym)->discardedSecIdx && |
| 303 | ctx.arg.unresolvedSymbols == UnresolvedPolicy::Ignore) |
| 304 | return; |
| 305 | |
| 306 | const InputFile *file = sym->file; |
| 307 | auto *d = dyn_cast<Defined>(Val: sym); |
| 308 | |
| 309 | auto report = [&](StringRef s) { Warn(ctx) << file << s << sym->getName(); }; |
| 310 | |
| 311 | if (sym->isUndefined()) { |
| 312 | if (cast<Undefined>(Val: sym)->discardedSecIdx) |
| 313 | report(": unable to order discarded symbol: " ); |
| 314 | else |
| 315 | report(": unable to order undefined symbol: " ); |
| 316 | } else if (sym->isShared()) |
| 317 | report(": unable to order shared symbol: " ); |
| 318 | else if (d && !d->section) |
| 319 | report(": unable to order absolute symbol: " ); |
| 320 | else if (d && isa<OutputSection>(Val: d->section)) |
| 321 | report(": unable to order synthetic symbol: " ); |
| 322 | else if (d && !d->section->isLive()) |
| 323 | report(": unable to order discarded symbol: " ); |
| 324 | } |
| 325 | |
| 326 | // Returns true if a symbol can be replaced at load-time by a symbol |
| 327 | // with the same name defined in other ELF executable or DSO. |
| 328 | bool elf::computeIsPreemptible(Ctx &ctx, const Symbol &sym) { |
| 329 | assert(!sym.isLocal() || sym.isPlaceholder()); |
| 330 | |
| 331 | // Only symbols with default visibility that appear in dynsym can be |
| 332 | // preempted. Symbols with protected visibility cannot be preempted. |
| 333 | if (sym.visibility() != STV_DEFAULT) |
| 334 | return false; |
| 335 | |
| 336 | // At this point copy relocations have not been created yet. |
| 337 | // Shared symbols are preemptible. Undefined symbols are preemptible |
| 338 | // when zDynamicUndefined (default in dynamic linking). Weakness is not |
| 339 | // checked, though undefined non-weak would typically trigger relocation |
| 340 | // errors unless options like -z undefs are used. |
| 341 | if (!sym.isDefined()) |
| 342 | return !sym.isUndefined() || ctx.arg.zDynamicUndefined; |
| 343 | |
| 344 | if (!ctx.arg.shared) |
| 345 | return false; |
| 346 | |
| 347 | // If -Bsymbolic or --dynamic-list is specified, or -Bsymbolic-functions is |
| 348 | // specified and the symbol is STT_FUNC, the symbol is preemptible iff it is |
| 349 | // in the dynamic list. -Bsymbolic-non-weak-functions is a non-weak subset of |
| 350 | // -Bsymbolic-functions. |
| 351 | if (ctx.arg.symbolic || |
| 352 | (ctx.arg.bsymbolic == BsymbolicKind::NonWeak && |
| 353 | sym.binding != STB_WEAK) || |
| 354 | (ctx.arg.bsymbolic == BsymbolicKind::Functions && sym.isFunc()) || |
| 355 | (ctx.arg.bsymbolic == BsymbolicKind::NonWeakFunctions && sym.isFunc() && |
| 356 | sym.binding != STB_WEAK)) |
| 357 | return sym.inDynamicList; |
| 358 | return true; |
| 359 | } |
| 360 | |
| 361 | void elf::parseVersionAndComputeIsPreemptible(Ctx &ctx) { |
| 362 | // Symbol themselves might know their versions because symbols |
| 363 | // can contain versions in the form of <name>@<version>. |
| 364 | // Let them parse and update their names to exclude version suffix. |
| 365 | // In addition, compute isExported and isPreemptible. |
| 366 | for (Symbol *sym : ctx.symtab->getSymbols()) { |
| 367 | if (sym->hasVersionSuffix) |
| 368 | sym->parseSymbolVersion(ctx); |
| 369 | if (sym->computeBinding(ctx) == STB_LOCAL) { |
| 370 | sym->isExported = false; |
| 371 | continue; |
| 372 | } |
| 373 | if (!sym->isDefined() && !sym->isCommon()) { |
| 374 | sym->isPreemptible = computeIsPreemptible(ctx, sym: *sym); |
| 375 | } else if (ctx.arg.exportDynamic && |
| 376 | (sym->isUsedInRegularObj || !sym->ltoCanOmit)) { |
| 377 | sym->isExported = true; |
| 378 | sym->isPreemptible = computeIsPreemptible(ctx, sym: *sym); |
| 379 | } |
| 380 | } |
| 381 | } |
| 382 | |
| 383 | // Merge symbol properties. |
| 384 | // |
| 385 | // When we have many symbols of the same name, we choose one of them, |
| 386 | // and that's the result of symbol resolution. However, symbols that |
| 387 | // were not chosen still affect some symbol properties. |
| 388 | void Symbol::mergeProperties(const Symbol &other) { |
| 389 | // DSO symbols do not affect visibility in the output. |
| 390 | if (!other.isShared() && other.visibility() != STV_DEFAULT) { |
| 391 | uint8_t v = visibility(), ov = other.visibility(); |
| 392 | setVisibility(v == STV_DEFAULT ? ov : std::min(a: v, b: ov)); |
| 393 | } |
| 394 | } |
| 395 | |
| 396 | void Symbol::resolve(Ctx &ctx, const Undefined &other) { |
| 397 | if (other.visibility() != STV_DEFAULT) { |
| 398 | uint8_t v = visibility(), ov = other.visibility(); |
| 399 | setVisibility(v == STV_DEFAULT ? ov : std::min(a: v, b: ov)); |
| 400 | } |
| 401 | // An undefined symbol with non default visibility must be satisfied |
| 402 | // in the same DSO. |
| 403 | // |
| 404 | // If this is a non-weak defined symbol in a discarded section, override the |
| 405 | // existing undefined symbol for better error message later. |
| 406 | if (isPlaceholder() || (isShared() && other.visibility() != STV_DEFAULT) || |
| 407 | (isUndefined() && other.binding != STB_WEAK && other.discardedSecIdx)) { |
| 408 | other.overwrite(sym&: *this); |
| 409 | return; |
| 410 | } |
| 411 | |
| 412 | if (traced) |
| 413 | printTraceSymbol(sym: other, name: getName()); |
| 414 | |
| 415 | if (isLazy()) { |
| 416 | // An undefined weak will not extract archive members. See comment on Lazy |
| 417 | // in Symbols.h for the details. |
| 418 | if (other.binding == STB_WEAK) { |
| 419 | binding = STB_WEAK; |
| 420 | type = other.type; |
| 421 | return; |
| 422 | } |
| 423 | |
| 424 | // Do extra check for --warn-backrefs. |
| 425 | // |
| 426 | // --warn-backrefs is an option to prevent an undefined reference from |
| 427 | // extracting an archive member written earlier in the command line. It can |
| 428 | // be used to keep compatibility with GNU linkers to some degree. I'll |
| 429 | // explain the feature and why you may find it useful in this comment. |
| 430 | // |
| 431 | // lld's symbol resolution semantics is more relaxed than traditional Unix |
| 432 | // linkers. For example, |
| 433 | // |
| 434 | // ld.lld foo.a bar.o |
| 435 | // |
| 436 | // succeeds even if bar.o contains an undefined symbol that has to be |
| 437 | // resolved by some object file in foo.a. Traditional Unix linkers don't |
| 438 | // allow this kind of backward reference, as they visit each file only once |
| 439 | // from left to right in the command line while resolving all undefined |
| 440 | // symbols at the moment of visiting. |
| 441 | // |
| 442 | // In the above case, since there's no undefined symbol when a linker visits |
| 443 | // foo.a, no files are pulled out from foo.a, and because the linker forgets |
| 444 | // about foo.a after visiting, it can't resolve undefined symbols in bar.o |
| 445 | // that could have been resolved otherwise. |
| 446 | // |
| 447 | // That lld accepts more relaxed form means that (besides it'd make more |
| 448 | // sense) you can accidentally write a command line or a build file that |
| 449 | // works only with lld, even if you have a plan to distribute it to wider |
| 450 | // users who may be using GNU linkers. With --warn-backrefs, you can detect |
| 451 | // a library order that doesn't work with other Unix linkers. |
| 452 | // |
| 453 | // The option is also useful to detect cyclic dependencies between static |
| 454 | // archives. Again, lld accepts |
| 455 | // |
| 456 | // ld.lld foo.a bar.a |
| 457 | // |
| 458 | // even if foo.a and bar.a depend on each other. With --warn-backrefs, it is |
| 459 | // handled as an error. |
| 460 | // |
| 461 | // Here is how the option works. We assign a group ID to each file. A file |
| 462 | // with a smaller group ID can pull out object files from an archive file |
| 463 | // with an equal or greater group ID. Otherwise, it is a reverse dependency |
| 464 | // and an error. |
| 465 | // |
| 466 | // A file outside --{start,end}-group gets a fresh ID when instantiated. All |
| 467 | // files within the same --{start,end}-group get the same group ID. E.g. |
| 468 | // |
| 469 | // ld.lld A B --start-group C D --end-group E |
| 470 | // |
| 471 | // A forms group 0. B form group 1. C and D (including their member object |
| 472 | // files) form group 2. E forms group 3. I think that you can see how this |
| 473 | // group assignment rule simulates the traditional linker's semantics. |
| 474 | bool backref = ctx.arg.warnBackrefs && file->groupId < other.file->groupId; |
| 475 | extract(ctx); |
| 476 | |
| 477 | if (!ctx.arg.whyExtract.empty()) |
| 478 | recordWhyExtract(ctx, reference: other.file, extracted: *file, sym: *this); |
| 479 | |
| 480 | // We don't report backward references to weak symbols as they can be |
| 481 | // overridden later. |
| 482 | // |
| 483 | // A traditional linker does not error for -ldef1 -lref -ldef2 (linking |
| 484 | // sandwich), where def2 may or may not be the same as def1. We don't want |
| 485 | // to warn for this case, so dismiss the warning if we see a subsequent lazy |
| 486 | // definition. this->file needs to be saved because in the case of LTO it |
| 487 | // may be reset to internalFile or be replaced with a file named lto.tmp. |
| 488 | if (backref && !isWeak()) |
| 489 | ctx.backwardReferences.try_emplace(Key: this, |
| 490 | Args: std::make_pair(x: other.file, y&: file)); |
| 491 | return; |
| 492 | } |
| 493 | |
| 494 | // Undefined symbols in a SharedFile do not change the binding. |
| 495 | if (isa<SharedFile>(Val: other.file)) |
| 496 | return; |
| 497 | |
| 498 | if (isUndefined() || isShared()) { |
| 499 | // The binding will be weak if there is at least one reference and all are |
| 500 | // weak. The binding has one opportunity to change to weak: if the first |
| 501 | // reference is weak. |
| 502 | if (other.binding != STB_WEAK || !referenced) |
| 503 | binding = other.binding; |
| 504 | } |
| 505 | } |
| 506 | |
| 507 | // Compare two symbols. Return true if the new symbol should win. |
| 508 | bool Symbol::shouldReplace(Ctx &ctx, const Defined &other) const { |
| 509 | if (LLVM_UNLIKELY(isCommon())) { |
| 510 | if (ctx.arg.warnCommon) |
| 511 | Warn(ctx) << "common " << getName() << " is overridden" ; |
| 512 | return !other.isWeak(); |
| 513 | } |
| 514 | if (!isDefined()) |
| 515 | return true; |
| 516 | |
| 517 | // Incoming STB_GLOBAL overrides STB_WEAK/STB_GNU_UNIQUE. -fgnu-unique changes |
| 518 | // some vague linkage data in COMDAT from STB_WEAK to STB_GNU_UNIQUE. Treat |
| 519 | // STB_GNU_UNIQUE like STB_WEAK so that we prefer the first among all |
| 520 | // STB_WEAK/STB_GNU_UNIQUE copies. If we prefer an incoming STB_GNU_UNIQUE to |
| 521 | // an existing STB_WEAK, there may be discarded section errors because the |
| 522 | // selected copy may be in a non-prevailing COMDAT. |
| 523 | return !isGlobal() && other.isGlobal(); |
| 524 | } |
| 525 | |
| 526 | void elf::reportDuplicate(Ctx &ctx, const Symbol &sym, const InputFile *newFile, |
| 527 | InputSectionBase *errSec, uint64_t errOffset) { |
| 528 | if (ctx.arg.allowMultipleDefinition) |
| 529 | return; |
| 530 | // In glibc<2.32, crti.o has .gnu.linkonce.t.__x86.get_pc_thunk.bx, which |
| 531 | // is sort of proto-comdat. There is actually no duplicate if we have |
| 532 | // full support for .gnu.linkonce. |
| 533 | const Defined *d = dyn_cast<Defined>(Val: &sym); |
| 534 | if (!d || d->getName() == "__x86.get_pc_thunk.bx" ) |
| 535 | return; |
| 536 | // Allow absolute symbols with the same value for GNU ld compatibility. |
| 537 | if (!d->section && !errSec && errOffset && d->value == errOffset) |
| 538 | return; |
| 539 | if (!d->section || !errSec) { |
| 540 | Err(ctx) << "duplicate symbol: " << &sym << "\n>>> defined in " << sym.file |
| 541 | << "\n>>> defined in " << newFile; |
| 542 | return; |
| 543 | } |
| 544 | |
| 545 | // Construct and print an error message in the form of: |
| 546 | // |
| 547 | // ld.lld: error: duplicate symbol: foo |
| 548 | // >>> defined at bar.c:30 |
| 549 | // >>> bar.o (/home/alice/src/bar.o) |
| 550 | // >>> defined at baz.c:563 |
| 551 | // >>> baz.o in archive libbaz.a |
| 552 | auto *sec1 = cast<InputSectionBase>(Val: d->section); |
| 553 | auto diag = Err(ctx); |
| 554 | diag << "duplicate symbol: " << &sym << "\n>>> defined at " ; |
| 555 | auto tell = diag.tell(); |
| 556 | diag << sec1->getSrcMsg(sym, offset: d->value); |
| 557 | if (tell != diag.tell()) |
| 558 | diag << "\n>>> " ; |
| 559 | diag << sec1->getObjMsg(offset: d->value) << "\n>>> defined at " ; |
| 560 | tell = diag.tell(); |
| 561 | diag << errSec->getSrcMsg(sym, offset: errOffset); |
| 562 | if (tell != diag.tell()) |
| 563 | diag << "\n>>> " ; |
| 564 | diag << errSec->getObjMsg(offset: errOffset); |
| 565 | } |
| 566 | |
| 567 | void Symbol::checkDuplicate(Ctx &ctx, const Defined &other) const { |
| 568 | if (isDefined() && !isWeak() && !other.isWeak()) |
| 569 | reportDuplicate(ctx, sym: *this, newFile: other.file, |
| 570 | errSec: dyn_cast_or_null<InputSectionBase>(Val: other.section), |
| 571 | errOffset: other.value); |
| 572 | } |
| 573 | |
| 574 | void Symbol::resolve(Ctx &ctx, const CommonSymbol &other) { |
| 575 | if (other.visibility() != STV_DEFAULT) { |
| 576 | uint8_t v = visibility(), ov = other.visibility(); |
| 577 | setVisibility(v == STV_DEFAULT ? ov : std::min(a: v, b: ov)); |
| 578 | } |
| 579 | if (isDefined() && !isWeak()) { |
| 580 | if (ctx.arg.warnCommon) |
| 581 | Warn(ctx) << "common " << getName() << " is overridden" ; |
| 582 | return; |
| 583 | } |
| 584 | |
| 585 | if (CommonSymbol *oldSym = dyn_cast<CommonSymbol>(Val: this)) { |
| 586 | if (ctx.arg.warnCommon) |
| 587 | Warn(ctx) << "multiple common of " << getName(); |
| 588 | oldSym->alignment = std::max(a: oldSym->alignment, b: other.alignment); |
| 589 | if (oldSym->size < other.size) { |
| 590 | oldSym->file = other.file; |
| 591 | oldSym->size = other.size; |
| 592 | } |
| 593 | return; |
| 594 | } |
| 595 | |
| 596 | if (auto *s = dyn_cast<SharedSymbol>(Val: this)) { |
| 597 | // Increase st_size if the shared symbol has a larger st_size. The shared |
| 598 | // symbol may be created from common symbols. The fact that some object |
| 599 | // files were linked into a shared object first should not change the |
| 600 | // regular rule that picks the largest st_size. |
| 601 | uint64_t size = s->size; |
| 602 | other.overwrite(sym&: *this); |
| 603 | if (size > cast<CommonSymbol>(Val: this)->size) |
| 604 | cast<CommonSymbol>(Val: this)->size = size; |
| 605 | } else { |
| 606 | other.overwrite(sym&: *this); |
| 607 | } |
| 608 | } |
| 609 | |
| 610 | void Symbol::resolve(Ctx &ctx, const Defined &other) { |
| 611 | if (other.visibility() != STV_DEFAULT) { |
| 612 | uint8_t v = visibility(), ov = other.visibility(); |
| 613 | setVisibility(v == STV_DEFAULT ? ov : std::min(a: v, b: ov)); |
| 614 | } |
| 615 | if (shouldReplace(ctx, other)) |
| 616 | other.overwrite(sym&: *this); |
| 617 | } |
| 618 | |
| 619 | void Symbol::resolve(Ctx &ctx, const LazySymbol &other) { |
| 620 | if (isPlaceholder()) { |
| 621 | other.overwrite(sym&: *this); |
| 622 | return; |
| 623 | } |
| 624 | |
| 625 | if (LLVM_UNLIKELY(!isUndefined())) { |
| 626 | // See the comment in resolve(Ctx &, const Undefined &). |
| 627 | if (isDefined()) { |
| 628 | ctx.backwardReferences.erase(Val: this); |
| 629 | } else if (isCommon() && ctx.arg.fortranCommon && |
| 630 | other.file->shouldExtractForCommon(name: getName())) { |
| 631 | // For common objects, we want to look for global or weak definitions that |
| 632 | // should be extracted as the canonical definition instead. |
| 633 | ctx.backwardReferences.erase(Val: this); |
| 634 | other.overwrite(sym&: *this); |
| 635 | other.extract(ctx); |
| 636 | } |
| 637 | return; |
| 638 | } |
| 639 | |
| 640 | // An undefined weak will not extract archive members. See comment on Lazy in |
| 641 | // Symbols.h for the details. |
| 642 | if (isWeak()) { |
| 643 | uint8_t ty = type; |
| 644 | other.overwrite(sym&: *this); |
| 645 | type = ty; |
| 646 | binding = STB_WEAK; |
| 647 | return; |
| 648 | } |
| 649 | |
| 650 | const InputFile *oldFile = file; |
| 651 | other.extract(ctx); |
| 652 | if (!ctx.arg.whyExtract.empty()) |
| 653 | recordWhyExtract(ctx, reference: oldFile, extracted: *file, sym: *this); |
| 654 | } |
| 655 | |
| 656 | void Symbol::resolve(Ctx &ctx, const SharedSymbol &other) { |
| 657 | isExported = true; |
| 658 | if (isPlaceholder()) { |
| 659 | other.overwrite(sym&: *this); |
| 660 | return; |
| 661 | } |
| 662 | if (isCommon()) { |
| 663 | // See the comment in resolveCommon() above. |
| 664 | if (other.size > cast<CommonSymbol>(Val: this)->size) |
| 665 | cast<CommonSymbol>(Val: this)->size = other.size; |
| 666 | return; |
| 667 | } |
| 668 | if (visibility() == STV_DEFAULT && (isUndefined() || isLazy())) { |
| 669 | // An undefined symbol with non default visibility must be satisfied |
| 670 | // in the same DSO. |
| 671 | uint8_t bind = binding; |
| 672 | other.overwrite(sym&: *this); |
| 673 | binding = bind; |
| 674 | } else if (traced) |
| 675 | printTraceSymbol(sym: other, name: getName()); |
| 676 | } |
| 677 | |
| 678 | void Defined::overwrite(Symbol &sym) const { |
| 679 | if (isa_and_nonnull<SharedFile>(Val: sym.file)) |
| 680 | sym.versionId = VER_NDX_GLOBAL; |
| 681 | Symbol::overwrite(sym, k: DefinedKind); |
| 682 | auto &s = static_cast<Defined &>(sym); |
| 683 | s.value = value; |
| 684 | s.size = size; |
| 685 | s.section = section; |
| 686 | } |
| 687 | |