1 | //===- SymbolTable.cpp ----------------------------------------------------===// |
2 | // |
3 | // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. |
4 | // See https://llvm.org/LICENSE.txt for license information. |
5 | // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception |
6 | // |
7 | //===----------------------------------------------------------------------===// |
8 | |
9 | #include "SymbolTable.h" |
10 | #include "COFFLinkerContext.h" |
11 | #include "Config.h" |
12 | #include "Driver.h" |
13 | #include "LTO.h" |
14 | #include "PDB.h" |
15 | #include "Symbols.h" |
16 | #include "lld/Common/ErrorHandler.h" |
17 | #include "lld/Common/Memory.h" |
18 | #include "lld/Common/Timer.h" |
19 | #include "llvm/DebugInfo/DIContext.h" |
20 | #include "llvm/IR/LLVMContext.h" |
21 | #include "llvm/LTO/LTO.h" |
22 | #include "llvm/Support/Debug.h" |
23 | #include "llvm/Support/TimeProfiler.h" |
24 | #include "llvm/Support/raw_ostream.h" |
25 | #include <utility> |
26 | |
27 | using namespace llvm; |
28 | |
29 | namespace lld::coff { |
30 | |
31 | StringRef ltrim1(StringRef s, const char *chars) { |
32 | if (!s.empty() && strchr(s: chars, c: s[0])) |
33 | return s.substr(Start: 1); |
34 | return s; |
35 | } |
36 | |
37 | static bool compatibleMachineType(COFFLinkerContext &ctx, MachineTypes mt) { |
38 | if (mt == IMAGE_FILE_MACHINE_UNKNOWN) |
39 | return true; |
40 | switch (ctx.config.machine) { |
41 | case ARM64: |
42 | return mt == ARM64 || mt == ARM64X; |
43 | case ARM64EC: |
44 | return COFF::isArm64EC(Machine: mt) || mt == AMD64; |
45 | case ARM64X: |
46 | return COFF::isAnyArm64(Machine: mt) || mt == AMD64; |
47 | default: |
48 | return ctx.config.machine == mt; |
49 | } |
50 | } |
51 | |
52 | void SymbolTable::addFile(InputFile *file) { |
53 | log(msg: "Reading " + toString(file)); |
54 | if (file->lazy) { |
55 | if (auto *f = dyn_cast<BitcodeFile>(Val: file)) |
56 | f->parseLazy(); |
57 | else |
58 | cast<ObjFile>(Val: file)->parseLazy(); |
59 | } else { |
60 | file->parse(); |
61 | if (auto *f = dyn_cast<ObjFile>(Val: file)) { |
62 | ctx.objFileInstances.push_back(x: f); |
63 | } else if (auto *f = dyn_cast<BitcodeFile>(Val: file)) { |
64 | if (ltoCompilationDone) { |
65 | error(msg: "LTO object file " + toString(file) + " linked in after " |
66 | "doing LTO compilation." ); |
67 | } |
68 | ctx.bitcodeFileInstances.push_back(x: f); |
69 | } else if (auto *f = dyn_cast<ImportFile>(Val: file)) { |
70 | ctx.importFileInstances.push_back(x: f); |
71 | } |
72 | } |
73 | |
74 | MachineTypes mt = file->getMachineType(); |
75 | if (ctx.config.machine == IMAGE_FILE_MACHINE_UNKNOWN) { |
76 | ctx.config.machine = mt; |
77 | ctx.driver.addWinSysRootLibSearchPaths(); |
78 | } else if (!compatibleMachineType(ctx, mt)) { |
79 | error(msg: toString(file) + ": machine type " + machineToStr(MT: mt) + |
80 | " conflicts with " + machineToStr(MT: ctx.config.machine)); |
81 | return; |
82 | } |
83 | |
84 | ctx.driver.parseDirectives(file); |
85 | } |
86 | |
87 | static void errorOrWarn(const Twine &s, bool forceUnresolved) { |
88 | if (forceUnresolved) |
89 | warn(msg: s); |
90 | else |
91 | error(msg: s); |
92 | } |
93 | |
94 | // Causes the file associated with a lazy symbol to be linked in. |
95 | static void forceLazy(Symbol *s) { |
96 | s->pendingArchiveLoad = true; |
97 | switch (s->kind()) { |
98 | case Symbol::Kind::LazyArchiveKind: { |
99 | auto *l = cast<LazyArchive>(Val: s); |
100 | l->file->addMember(sym: l->sym); |
101 | break; |
102 | } |
103 | case Symbol::Kind::LazyObjectKind: { |
104 | InputFile *file = cast<LazyObject>(Val: s)->file; |
105 | file->ctx.symtab.addFile(file); |
106 | break; |
107 | } |
108 | case Symbol::Kind::LazyDLLSymbolKind: { |
109 | auto *l = cast<LazyDLLSymbol>(Val: s); |
110 | l->file->makeImport(s: l->sym); |
111 | break; |
112 | } |
113 | default: |
114 | llvm_unreachable( |
115 | "symbol passed to forceLazy is not a LazyArchive or LazyObject" ); |
116 | } |
117 | } |
118 | |
119 | // Returns the symbol in SC whose value is <= Addr that is closest to Addr. |
120 | // This is generally the global variable or function whose definition contains |
121 | // Addr. |
122 | static Symbol *getSymbol(SectionChunk *sc, uint32_t addr) { |
123 | DefinedRegular *candidate = nullptr; |
124 | |
125 | for (Symbol *s : sc->file->getSymbols()) { |
126 | auto *d = dyn_cast_or_null<DefinedRegular>(Val: s); |
127 | if (!d || !d->data || d->file != sc->file || d->getChunk() != sc || |
128 | d->getValue() > addr || |
129 | (candidate && d->getValue() < candidate->getValue())) |
130 | continue; |
131 | |
132 | candidate = d; |
133 | } |
134 | |
135 | return candidate; |
136 | } |
137 | |
138 | static std::vector<std::string> getSymbolLocations(BitcodeFile *file) { |
139 | std::string res("\n>>> referenced by " ); |
140 | StringRef source = file->obj->getSourceFileName(); |
141 | if (!source.empty()) |
142 | res += source.str() + "\n>>> " ; |
143 | res += toString(file); |
144 | return {res}; |
145 | } |
146 | |
147 | static std::optional<std::pair<StringRef, uint32_t>> |
148 | getFileLineDwarf(const SectionChunk *c, uint32_t addr) { |
149 | std::optional<DILineInfo> optionalLineInfo = |
150 | c->file->getDILineInfo(offset: addr, sectionIndex: c->getSectionNumber() - 1); |
151 | if (!optionalLineInfo) |
152 | return std::nullopt; |
153 | const DILineInfo &lineInfo = *optionalLineInfo; |
154 | if (lineInfo.FileName == DILineInfo::BadString) |
155 | return std::nullopt; |
156 | return std::make_pair(x: saver().save(S: lineInfo.FileName), y: lineInfo.Line); |
157 | } |
158 | |
159 | static std::optional<std::pair<StringRef, uint32_t>> |
160 | getFileLine(const SectionChunk *c, uint32_t addr) { |
161 | // MinGW can optionally use codeview, even if the default is dwarf. |
162 | std::optional<std::pair<StringRef, uint32_t>> fileLine = |
163 | getFileLineCodeView(c, addr); |
164 | // If codeview didn't yield any result, check dwarf in MinGW mode. |
165 | if (!fileLine && c->file->ctx.config.mingw) |
166 | fileLine = getFileLineDwarf(c, addr); |
167 | return fileLine; |
168 | } |
169 | |
170 | // Given a file and the index of a symbol in that file, returns a description |
171 | // of all references to that symbol from that file. If no debug information is |
172 | // available, returns just the name of the file, else one string per actual |
173 | // reference as described in the debug info. |
174 | // Returns up to maxStrings string descriptions, along with the total number of |
175 | // locations found. |
176 | static std::pair<std::vector<std::string>, size_t> |
177 | getSymbolLocations(ObjFile *file, uint32_t symIndex, size_t maxStrings) { |
178 | struct Location { |
179 | Symbol *sym; |
180 | std::pair<StringRef, uint32_t> fileLine; |
181 | }; |
182 | std::vector<Location> locations; |
183 | size_t numLocations = 0; |
184 | |
185 | for (Chunk *c : file->getChunks()) { |
186 | auto *sc = dyn_cast<SectionChunk>(Val: c); |
187 | if (!sc) |
188 | continue; |
189 | for (const coff_relocation &r : sc->getRelocs()) { |
190 | if (r.SymbolTableIndex != symIndex) |
191 | continue; |
192 | numLocations++; |
193 | if (locations.size() >= maxStrings) |
194 | continue; |
195 | |
196 | std::optional<std::pair<StringRef, uint32_t>> fileLine = |
197 | getFileLine(c: sc, addr: r.VirtualAddress); |
198 | Symbol *sym = getSymbol(sc, addr: r.VirtualAddress); |
199 | if (fileLine) |
200 | locations.push_back(x: {.sym: sym, .fileLine: *fileLine}); |
201 | else if (sym) |
202 | locations.push_back(x: {.sym: sym, .fileLine: {"" , 0}}); |
203 | } |
204 | } |
205 | |
206 | if (maxStrings == 0) |
207 | return std::make_pair(x: std::vector<std::string>(), y&: numLocations); |
208 | |
209 | if (numLocations == 0) |
210 | return std::make_pair( |
211 | x: std::vector<std::string>{"\n>>> referenced by " + toString(file)}, y: 1); |
212 | |
213 | std::vector<std::string> symbolLocations(locations.size()); |
214 | size_t i = 0; |
215 | for (Location loc : locations) { |
216 | llvm::raw_string_ostream os(symbolLocations[i++]); |
217 | os << "\n>>> referenced by " ; |
218 | if (!loc.fileLine.first.empty()) |
219 | os << loc.fileLine.first << ":" << loc.fileLine.second |
220 | << "\n>>> " ; |
221 | os << toString(file); |
222 | if (loc.sym) |
223 | os << ":(" << toString(ctx: file->ctx, b&: *loc.sym) << ')'; |
224 | } |
225 | return std::make_pair(x&: symbolLocations, y&: numLocations); |
226 | } |
227 | |
228 | std::vector<std::string> getSymbolLocations(ObjFile *file, uint32_t symIndex) { |
229 | return getSymbolLocations(file, symIndex, SIZE_MAX).first; |
230 | } |
231 | |
232 | static std::pair<std::vector<std::string>, size_t> |
233 | getSymbolLocations(InputFile *file, uint32_t symIndex, size_t maxStrings) { |
234 | if (auto *o = dyn_cast<ObjFile>(Val: file)) |
235 | return getSymbolLocations(file: o, symIndex, maxStrings); |
236 | if (auto *b = dyn_cast<BitcodeFile>(Val: file)) { |
237 | std::vector<std::string> symbolLocations = getSymbolLocations(file: b); |
238 | size_t numLocations = symbolLocations.size(); |
239 | if (symbolLocations.size() > maxStrings) |
240 | symbolLocations.resize(new_size: maxStrings); |
241 | return std::make_pair(x&: symbolLocations, y&: numLocations); |
242 | } |
243 | llvm_unreachable("unsupported file type passed to getSymbolLocations" ); |
244 | return std::make_pair(x: std::vector<std::string>(), y: (size_t)0); |
245 | } |
246 | |
247 | // For an undefined symbol, stores all files referencing it and the index of |
248 | // the undefined symbol in each file. |
249 | struct UndefinedDiag { |
250 | Symbol *sym; |
251 | struct File { |
252 | InputFile *file; |
253 | uint32_t symIndex; |
254 | }; |
255 | std::vector<File> files; |
256 | }; |
257 | |
258 | static void reportUndefinedSymbol(const COFFLinkerContext &ctx, |
259 | const UndefinedDiag &undefDiag) { |
260 | std::string out; |
261 | llvm::raw_string_ostream os(out); |
262 | os << "undefined symbol: " << toString(ctx, b&: *undefDiag.sym); |
263 | |
264 | const size_t maxUndefReferences = 3; |
265 | size_t numDisplayedRefs = 0, numRefs = 0; |
266 | for (const UndefinedDiag::File &ref : undefDiag.files) { |
267 | auto [symbolLocations, totalLocations] = getSymbolLocations( |
268 | file: ref.file, symIndex: ref.symIndex, maxStrings: maxUndefReferences - numDisplayedRefs); |
269 | |
270 | numRefs += totalLocations; |
271 | numDisplayedRefs += symbolLocations.size(); |
272 | for (const std::string &s : symbolLocations) { |
273 | os << s; |
274 | } |
275 | } |
276 | if (numDisplayedRefs < numRefs) |
277 | os << "\n>>> referenced " << numRefs - numDisplayedRefs << " more times" ; |
278 | errorOrWarn(s: os.str(), forceUnresolved: ctx.config.forceUnresolved); |
279 | } |
280 | |
281 | void SymbolTable::loadMinGWSymbols() { |
282 | for (auto &i : symMap) { |
283 | Symbol *sym = i.second; |
284 | auto *undef = dyn_cast<Undefined>(Val: sym); |
285 | if (!undef) |
286 | continue; |
287 | if (undef->getWeakAlias()) |
288 | continue; |
289 | |
290 | StringRef name = undef->getName(); |
291 | |
292 | if (ctx.config.machine == I386 && ctx.config.stdcallFixup) { |
293 | // Check if we can resolve an undefined decorated symbol by finding |
294 | // the intended target as an undecorated symbol (only with a leading |
295 | // underscore). |
296 | StringRef origName = name; |
297 | StringRef baseName = name; |
298 | // Trim down stdcall/fastcall/vectorcall symbols to the base name. |
299 | baseName = ltrim1(s: baseName, chars: "_@" ); |
300 | baseName = baseName.substr(Start: 0, N: baseName.find(C: '@')); |
301 | // Add a leading underscore, as it would be in cdecl form. |
302 | std::string newName = ("_" + baseName).str(); |
303 | Symbol *l; |
304 | if (newName != origName && (l = find(name: newName)) != nullptr) { |
305 | // If we found a symbol and it is lazy; load it. |
306 | if (l->isLazy() && !l->pendingArchiveLoad) { |
307 | log(msg: "Loading lazy " + l->getName() + " from " + |
308 | l->getFile()->getName() + " for stdcall fixup" ); |
309 | forceLazy(s: l); |
310 | } |
311 | // If it's lazy or already defined, hook it up as weak alias. |
312 | if (l->isLazy() || isa<Defined>(Val: l)) { |
313 | if (ctx.config.warnStdcallFixup) |
314 | warn(msg: "Resolving " + origName + " by linking to " + newName); |
315 | else |
316 | log(msg: "Resolving " + origName + " by linking to " + newName); |
317 | undef->weakAlias = l; |
318 | continue; |
319 | } |
320 | } |
321 | } |
322 | |
323 | if (ctx.config.autoImport) { |
324 | if (name.starts_with(Prefix: "__imp_" )) |
325 | continue; |
326 | // If we have an undefined symbol, but we have a lazy symbol we could |
327 | // load, load it. |
328 | Symbol *l = find(name: ("__imp_" + name).str()); |
329 | if (!l || l->pendingArchiveLoad || !l->isLazy()) |
330 | continue; |
331 | |
332 | log(msg: "Loading lazy " + l->getName() + " from " + l->getFile()->getName() + |
333 | " for automatic import" ); |
334 | forceLazy(s: l); |
335 | } |
336 | } |
337 | } |
338 | |
339 | Defined *SymbolTable::impSymbol(StringRef name) { |
340 | if (name.starts_with(Prefix: "__imp_" )) |
341 | return nullptr; |
342 | return dyn_cast_or_null<Defined>(Val: find(name: ("__imp_" + name).str())); |
343 | } |
344 | |
345 | bool SymbolTable::handleMinGWAutomaticImport(Symbol *sym, StringRef name) { |
346 | Defined *imp = impSymbol(name); |
347 | if (!imp) |
348 | return false; |
349 | |
350 | // Replace the reference directly to a variable with a reference |
351 | // to the import address table instead. This obviously isn't right, |
352 | // but we mark the symbol as isRuntimePseudoReloc, and a later pass |
353 | // will add runtime pseudo relocations for every relocation against |
354 | // this Symbol. The runtime pseudo relocation framework expects the |
355 | // reference itself to point at the IAT entry. |
356 | size_t impSize = 0; |
357 | if (isa<DefinedImportData>(Val: imp)) { |
358 | log(msg: "Automatically importing " + name + " from " + |
359 | cast<DefinedImportData>(Val: imp)->getDLLName()); |
360 | impSize = sizeof(DefinedImportData); |
361 | } else if (isa<DefinedRegular>(Val: imp)) { |
362 | log(msg: "Automatically importing " + name + " from " + |
363 | toString(file: cast<DefinedRegular>(Val: imp)->file)); |
364 | impSize = sizeof(DefinedRegular); |
365 | } else { |
366 | warn(msg: "unable to automatically import " + name + " from " + imp->getName() + |
367 | " from " + toString(file: cast<DefinedRegular>(Val: imp)->file) + |
368 | "; unexpected symbol type" ); |
369 | return false; |
370 | } |
371 | sym->replaceKeepingName(other: imp, size: impSize); |
372 | sym->isRuntimePseudoReloc = true; |
373 | |
374 | // There may exist symbols named .refptr.<name> which only consist |
375 | // of a single pointer to <name>. If it turns out <name> is |
376 | // automatically imported, we don't need to keep the .refptr.<name> |
377 | // pointer at all, but redirect all accesses to it to the IAT entry |
378 | // for __imp_<name> instead, and drop the whole .refptr.<name> chunk. |
379 | DefinedRegular *refptr = |
380 | dyn_cast_or_null<DefinedRegular>(Val: find(name: (".refptr." + name).str())); |
381 | if (refptr && refptr->getChunk()->getSize() == ctx.config.wordsize) { |
382 | SectionChunk *sc = dyn_cast_or_null<SectionChunk>(Val: refptr->getChunk()); |
383 | if (sc && sc->getRelocs().size() == 1 && *sc->symbols().begin() == sym) { |
384 | log(msg: "Replacing .refptr." + name + " with " + imp->getName()); |
385 | refptr->getChunk()->live = false; |
386 | refptr->replaceKeepingName(other: imp, size: impSize); |
387 | } |
388 | } |
389 | return true; |
390 | } |
391 | |
392 | /// Helper function for reportUnresolvable and resolveRemainingUndefines. |
393 | /// This function emits an "undefined symbol" diagnostic for each symbol in |
394 | /// undefs. If localImports is not nullptr, it also emits a "locally |
395 | /// defined symbol imported" diagnostic for symbols in localImports. |
396 | /// objFiles and bitcodeFiles (if not nullptr) are used to report where |
397 | /// undefined symbols are referenced. |
398 | static void reportProblemSymbols( |
399 | const COFFLinkerContext &ctx, const SmallPtrSetImpl<Symbol *> &undefs, |
400 | const DenseMap<Symbol *, Symbol *> *localImports, bool needBitcodeFiles) { |
401 | // Return early if there is nothing to report (which should be |
402 | // the common case). |
403 | if (undefs.empty() && (!localImports || localImports->empty())) |
404 | return; |
405 | |
406 | for (Symbol *b : ctx.config.gcroot) { |
407 | if (undefs.count(Ptr: b)) |
408 | errorOrWarn(s: "<root>: undefined symbol: " + toString(ctx, b&: *b), |
409 | forceUnresolved: ctx.config.forceUnresolved); |
410 | if (localImports) |
411 | if (Symbol *imp = localImports->lookup(Val: b)) |
412 | warn(msg: "<root>: locally defined symbol imported: " + toString(ctx, b&: *imp) + |
413 | " (defined in " + toString(file: imp->getFile()) + ") [LNK4217]" ); |
414 | } |
415 | |
416 | std::vector<UndefinedDiag> undefDiags; |
417 | DenseMap<Symbol *, int> firstDiag; |
418 | |
419 | auto processFile = [&](InputFile *file, ArrayRef<Symbol *> symbols) { |
420 | uint32_t symIndex = (uint32_t)-1; |
421 | for (Symbol *sym : symbols) { |
422 | ++symIndex; |
423 | if (!sym) |
424 | continue; |
425 | if (undefs.count(Ptr: sym)) { |
426 | auto it = firstDiag.find(Val: sym); |
427 | if (it == firstDiag.end()) { |
428 | firstDiag[sym] = undefDiags.size(); |
429 | undefDiags.push_back(x: {.sym: sym, .files: {{.file: file, .symIndex: symIndex}}}); |
430 | } else { |
431 | undefDiags[it->second].files.push_back(x: {.file: file, .symIndex: symIndex}); |
432 | } |
433 | } |
434 | if (localImports) |
435 | if (Symbol *imp = localImports->lookup(Val: sym)) |
436 | warn(msg: toString(file) + |
437 | ": locally defined symbol imported: " + toString(ctx, b&: *imp) + |
438 | " (defined in " + toString(file: imp->getFile()) + ") [LNK4217]" ); |
439 | } |
440 | }; |
441 | |
442 | for (ObjFile *file : ctx.objFileInstances) |
443 | processFile(file, file->getSymbols()); |
444 | |
445 | if (needBitcodeFiles) |
446 | for (BitcodeFile *file : ctx.bitcodeFileInstances) |
447 | processFile(file, file->getSymbols()); |
448 | |
449 | for (const UndefinedDiag &undefDiag : undefDiags) |
450 | reportUndefinedSymbol(ctx, undefDiag); |
451 | } |
452 | |
453 | void SymbolTable::reportUnresolvable() { |
454 | SmallPtrSet<Symbol *, 8> undefs; |
455 | for (auto &i : symMap) { |
456 | Symbol *sym = i.second; |
457 | auto *undef = dyn_cast<Undefined>(Val: sym); |
458 | if (!undef || sym->deferUndefined) |
459 | continue; |
460 | if (undef->getWeakAlias()) |
461 | continue; |
462 | StringRef name = undef->getName(); |
463 | if (name.starts_with(Prefix: "__imp_" )) { |
464 | Symbol *imp = find(name: name.substr(Start: strlen(s: "__imp_" ))); |
465 | if (Defined *def = dyn_cast_or_null<Defined>(Val: imp)) { |
466 | def->isUsedInRegularObj = true; |
467 | continue; |
468 | } |
469 | } |
470 | if (name.contains(Other: "_PchSym_" )) |
471 | continue; |
472 | if (ctx.config.autoImport && impSymbol(name)) |
473 | continue; |
474 | undefs.insert(Ptr: sym); |
475 | } |
476 | |
477 | reportProblemSymbols(ctx, undefs, |
478 | /* localImports */ nullptr, needBitcodeFiles: true); |
479 | } |
480 | |
481 | void SymbolTable::resolveRemainingUndefines() { |
482 | llvm::TimeTraceScope timeScope("Resolve remaining undefined symbols" ); |
483 | SmallPtrSet<Symbol *, 8> undefs; |
484 | DenseMap<Symbol *, Symbol *> localImports; |
485 | |
486 | for (auto &i : symMap) { |
487 | Symbol *sym = i.second; |
488 | auto *undef = dyn_cast<Undefined>(Val: sym); |
489 | if (!undef) |
490 | continue; |
491 | if (!sym->isUsedInRegularObj) |
492 | continue; |
493 | |
494 | StringRef name = undef->getName(); |
495 | |
496 | // A weak alias may have been resolved, so check for that. |
497 | if (Defined *d = undef->getWeakAlias()) { |
498 | // We want to replace Sym with D. However, we can't just blindly |
499 | // copy sizeof(SymbolUnion) bytes from D to Sym because D may be an |
500 | // internal symbol, and internal symbols are stored as "unparented" |
501 | // Symbols. For that reason we need to check which type of symbol we |
502 | // are dealing with and copy the correct number of bytes. |
503 | if (isa<DefinedRegular>(Val: d)) |
504 | memcpy(dest: sym, src: d, n: sizeof(DefinedRegular)); |
505 | else if (isa<DefinedAbsolute>(Val: d)) |
506 | memcpy(dest: sym, src: d, n: sizeof(DefinedAbsolute)); |
507 | else |
508 | memcpy(dest: sym, src: d, n: sizeof(SymbolUnion)); |
509 | continue; |
510 | } |
511 | |
512 | // If we can resolve a symbol by removing __imp_ prefix, do that. |
513 | // This odd rule is for compatibility with MSVC linker. |
514 | if (name.starts_with(Prefix: "__imp_" )) { |
515 | Symbol *imp = find(name: name.substr(Start: strlen(s: "__imp_" ))); |
516 | if (imp && isa<Defined>(Val: imp)) { |
517 | auto *d = cast<Defined>(Val: imp); |
518 | replaceSymbol<DefinedLocalImport>(s: sym, arg&: ctx, arg&: name, arg&: d); |
519 | localImportChunks.push_back(x: cast<DefinedLocalImport>(Val: sym)->getChunk()); |
520 | localImports[sym] = d; |
521 | continue; |
522 | } |
523 | } |
524 | |
525 | // We don't want to report missing Microsoft precompiled headers symbols. |
526 | // A proper message will be emitted instead in PDBLinker::aquirePrecompObj |
527 | if (name.contains(Other: "_PchSym_" )) |
528 | continue; |
529 | |
530 | if (ctx.config.autoImport && handleMinGWAutomaticImport(sym, name)) |
531 | continue; |
532 | |
533 | // Remaining undefined symbols are not fatal if /force is specified. |
534 | // They are replaced with dummy defined symbols. |
535 | if (ctx.config.forceUnresolved) |
536 | replaceSymbol<DefinedAbsolute>(s: sym, arg&: ctx, arg&: name, arg: 0); |
537 | undefs.insert(Ptr: sym); |
538 | } |
539 | |
540 | reportProblemSymbols( |
541 | ctx, undefs, |
542 | localImports: ctx.config.warnLocallyDefinedImported ? &localImports : nullptr, needBitcodeFiles: false); |
543 | } |
544 | |
545 | std::pair<Symbol *, bool> SymbolTable::insert(StringRef name) { |
546 | bool inserted = false; |
547 | Symbol *&sym = symMap[CachedHashStringRef(name)]; |
548 | if (!sym) { |
549 | sym = reinterpret_cast<Symbol *>(make<SymbolUnion>()); |
550 | sym->isUsedInRegularObj = false; |
551 | sym->pendingArchiveLoad = false; |
552 | sym->canInline = true; |
553 | inserted = true; |
554 | } |
555 | return {sym, inserted}; |
556 | } |
557 | |
558 | std::pair<Symbol *, bool> SymbolTable::insert(StringRef name, InputFile *file) { |
559 | std::pair<Symbol *, bool> result = insert(name); |
560 | if (!file || !isa<BitcodeFile>(Val: file)) |
561 | result.first->isUsedInRegularObj = true; |
562 | return result; |
563 | } |
564 | |
565 | void SymbolTable::addEntryThunk(Symbol *from, Symbol *to) { |
566 | entryThunks.push_back(x: {from, to}); |
567 | } |
568 | |
569 | void SymbolTable::initializeEntryThunks() { |
570 | for (auto it : entryThunks) { |
571 | auto *to = dyn_cast<Defined>(Val: it.second); |
572 | if (!to) |
573 | continue; |
574 | auto *from = dyn_cast<DefinedRegular>(Val: it.first); |
575 | // We need to be able to add padding to the function and fill it with an |
576 | // offset to its entry thunks. To ensure that padding the function is |
577 | // feasible, functions are required to be COMDAT symbols with no offset. |
578 | if (!from || !from->getChunk()->isCOMDAT() || |
579 | cast<DefinedRegular>(Val: from)->getValue()) { |
580 | error(msg: "non COMDAT symbol '" + from->getName() + "' in hybrid map" ); |
581 | continue; |
582 | } |
583 | from->getChunk()->setEntryThunk(to); |
584 | } |
585 | } |
586 | |
587 | Symbol *SymbolTable::addUndefined(StringRef name, InputFile *f, |
588 | bool isWeakAlias) { |
589 | auto [s, wasInserted] = insert(name, file: f); |
590 | if (wasInserted || (s->isLazy() && isWeakAlias)) { |
591 | replaceSymbol<Undefined>(s, arg&: name); |
592 | return s; |
593 | } |
594 | if (s->isLazy()) |
595 | forceLazy(s); |
596 | return s; |
597 | } |
598 | |
599 | void SymbolTable::addLazyArchive(ArchiveFile *f, const Archive::Symbol &sym) { |
600 | StringRef name = sym.getName(); |
601 | auto [s, wasInserted] = insert(name); |
602 | if (wasInserted) { |
603 | replaceSymbol<LazyArchive>(s, arg&: f, arg: sym); |
604 | return; |
605 | } |
606 | auto *u = dyn_cast<Undefined>(Val: s); |
607 | if (!u || u->weakAlias || s->pendingArchiveLoad) |
608 | return; |
609 | s->pendingArchiveLoad = true; |
610 | f->addMember(sym); |
611 | } |
612 | |
613 | void SymbolTable::addLazyObject(InputFile *f, StringRef n) { |
614 | assert(f->lazy); |
615 | auto [s, wasInserted] = insert(name: n, file: f); |
616 | if (wasInserted) { |
617 | replaceSymbol<LazyObject>(s, arg&: f, arg&: n); |
618 | return; |
619 | } |
620 | auto *u = dyn_cast<Undefined>(Val: s); |
621 | if (!u || u->weakAlias || s->pendingArchiveLoad) |
622 | return; |
623 | s->pendingArchiveLoad = true; |
624 | f->lazy = false; |
625 | addFile(file: f); |
626 | } |
627 | |
628 | void SymbolTable::addLazyDLLSymbol(DLLFile *f, DLLFile::Symbol *sym, |
629 | StringRef n) { |
630 | auto [s, wasInserted] = insert(name: n); |
631 | if (wasInserted) { |
632 | replaceSymbol<LazyDLLSymbol>(s, arg&: f, arg&: sym, arg&: n); |
633 | return; |
634 | } |
635 | auto *u = dyn_cast<Undefined>(Val: s); |
636 | if (!u || u->weakAlias || s->pendingArchiveLoad) |
637 | return; |
638 | s->pendingArchiveLoad = true; |
639 | f->makeImport(s: sym); |
640 | } |
641 | |
642 | static std::string getSourceLocationBitcode(BitcodeFile *file) { |
643 | std::string res("\n>>> defined at " ); |
644 | StringRef source = file->obj->getSourceFileName(); |
645 | if (!source.empty()) |
646 | res += source.str() + "\n>>> " ; |
647 | res += toString(file); |
648 | return res; |
649 | } |
650 | |
651 | static std::string getSourceLocationObj(ObjFile *file, SectionChunk *sc, |
652 | uint32_t offset, StringRef name) { |
653 | std::optional<std::pair<StringRef, uint32_t>> fileLine; |
654 | if (sc) |
655 | fileLine = getFileLine(c: sc, addr: offset); |
656 | if (!fileLine) |
657 | fileLine = file->getVariableLocation(var: name); |
658 | |
659 | std::string res; |
660 | llvm::raw_string_ostream os(res); |
661 | os << "\n>>> defined at " ; |
662 | if (fileLine) |
663 | os << fileLine->first << ":" << fileLine->second << "\n>>> " ; |
664 | os << toString(file); |
665 | return os.str(); |
666 | } |
667 | |
668 | static std::string getSourceLocation(InputFile *file, SectionChunk *sc, |
669 | uint32_t offset, StringRef name) { |
670 | if (!file) |
671 | return "" ; |
672 | if (auto *o = dyn_cast<ObjFile>(Val: file)) |
673 | return getSourceLocationObj(file: o, sc, offset, name); |
674 | if (auto *b = dyn_cast<BitcodeFile>(Val: file)) |
675 | return getSourceLocationBitcode(file: b); |
676 | return "\n>>> defined at " + toString(file); |
677 | } |
678 | |
679 | // Construct and print an error message in the form of: |
680 | // |
681 | // lld-link: error: duplicate symbol: foo |
682 | // >>> defined at bar.c:30 |
683 | // >>> bar.o |
684 | // >>> defined at baz.c:563 |
685 | // >>> baz.o |
686 | void SymbolTable::reportDuplicate(Symbol *existing, InputFile *newFile, |
687 | SectionChunk *newSc, |
688 | uint32_t newSectionOffset) { |
689 | std::string msg; |
690 | llvm::raw_string_ostream os(msg); |
691 | os << "duplicate symbol: " << toString(ctx, b&: *existing); |
692 | |
693 | DefinedRegular *d = dyn_cast<DefinedRegular>(Val: existing); |
694 | if (d && isa<ObjFile>(Val: d->getFile())) { |
695 | os << getSourceLocation(file: d->getFile(), sc: d->getChunk(), offset: d->getValue(), |
696 | name: existing->getName()); |
697 | } else { |
698 | os << getSourceLocation(file: existing->getFile(), sc: nullptr, offset: 0, name: "" ); |
699 | } |
700 | os << getSourceLocation(file: newFile, sc: newSc, offset: newSectionOffset, |
701 | name: existing->getName()); |
702 | |
703 | if (ctx.config.forceMultiple) |
704 | warn(msg: os.str()); |
705 | else |
706 | error(msg: os.str()); |
707 | } |
708 | |
709 | Symbol *SymbolTable::addAbsolute(StringRef n, COFFSymbolRef sym) { |
710 | auto [s, wasInserted] = insert(name: n, file: nullptr); |
711 | s->isUsedInRegularObj = true; |
712 | if (wasInserted || isa<Undefined>(Val: s) || s->isLazy()) |
713 | replaceSymbol<DefinedAbsolute>(s, arg&: ctx, arg&: n, arg&: sym); |
714 | else if (auto *da = dyn_cast<DefinedAbsolute>(Val: s)) { |
715 | if (da->getVA() != sym.getValue()) |
716 | reportDuplicate(existing: s, newFile: nullptr); |
717 | } else if (!isa<DefinedCOFF>(Val: s)) |
718 | reportDuplicate(existing: s, newFile: nullptr); |
719 | return s; |
720 | } |
721 | |
722 | Symbol *SymbolTable::addAbsolute(StringRef n, uint64_t va) { |
723 | auto [s, wasInserted] = insert(name: n, file: nullptr); |
724 | s->isUsedInRegularObj = true; |
725 | if (wasInserted || isa<Undefined>(Val: s) || s->isLazy()) |
726 | replaceSymbol<DefinedAbsolute>(s, arg&: ctx, arg&: n, arg&: va); |
727 | else if (auto *da = dyn_cast<DefinedAbsolute>(Val: s)) { |
728 | if (da->getVA() != va) |
729 | reportDuplicate(existing: s, newFile: nullptr); |
730 | } else if (!isa<DefinedCOFF>(Val: s)) |
731 | reportDuplicate(existing: s, newFile: nullptr); |
732 | return s; |
733 | } |
734 | |
735 | Symbol *SymbolTable::addSynthetic(StringRef n, Chunk *c) { |
736 | auto [s, wasInserted] = insert(name: n, file: nullptr); |
737 | s->isUsedInRegularObj = true; |
738 | if (wasInserted || isa<Undefined>(Val: s) || s->isLazy()) |
739 | replaceSymbol<DefinedSynthetic>(s, arg&: n, arg&: c); |
740 | else if (!isa<DefinedCOFF>(Val: s)) |
741 | reportDuplicate(existing: s, newFile: nullptr); |
742 | return s; |
743 | } |
744 | |
745 | Symbol *SymbolTable::addRegular(InputFile *f, StringRef n, |
746 | const coff_symbol_generic *sym, SectionChunk *c, |
747 | uint32_t sectionOffset, bool isWeak) { |
748 | auto [s, wasInserted] = insert(name: n, file: f); |
749 | if (wasInserted || !isa<DefinedRegular>(Val: s) || s->isWeak) |
750 | replaceSymbol<DefinedRegular>(s, arg&: f, arg&: n, /*IsCOMDAT*/ arg: false, |
751 | /*IsExternal*/ arg: true, arg&: sym, arg&: c, arg&: isWeak); |
752 | else if (!isWeak) |
753 | reportDuplicate(existing: s, newFile: f, newSc: c, newSectionOffset: sectionOffset); |
754 | return s; |
755 | } |
756 | |
757 | std::pair<DefinedRegular *, bool> |
758 | SymbolTable::addComdat(InputFile *f, StringRef n, |
759 | const coff_symbol_generic *sym) { |
760 | auto [s, wasInserted] = insert(name: n, file: f); |
761 | if (wasInserted || !isa<DefinedRegular>(Val: s)) { |
762 | replaceSymbol<DefinedRegular>(s, arg&: f, arg&: n, /*IsCOMDAT*/ arg: true, |
763 | /*IsExternal*/ arg: true, arg&: sym, arg: nullptr); |
764 | return {cast<DefinedRegular>(Val: s), true}; |
765 | } |
766 | auto *existingSymbol = cast<DefinedRegular>(Val: s); |
767 | if (!existingSymbol->isCOMDAT) |
768 | reportDuplicate(existing: s, newFile: f); |
769 | return {existingSymbol, false}; |
770 | } |
771 | |
772 | Symbol *SymbolTable::addCommon(InputFile *f, StringRef n, uint64_t size, |
773 | const coff_symbol_generic *sym, CommonChunk *c) { |
774 | auto [s, wasInserted] = insert(name: n, file: f); |
775 | if (wasInserted || !isa<DefinedCOFF>(Val: s)) |
776 | replaceSymbol<DefinedCommon>(s, arg&: f, arg&: n, arg&: size, arg&: sym, arg&: c); |
777 | else if (auto *dc = dyn_cast<DefinedCommon>(Val: s)) |
778 | if (size > dc->getSize()) |
779 | replaceSymbol<DefinedCommon>(s, arg&: f, arg&: n, arg&: size, arg&: sym, arg&: c); |
780 | return s; |
781 | } |
782 | |
783 | Symbol *SymbolTable::addImportData(StringRef n, ImportFile *f) { |
784 | auto [s, wasInserted] = insert(name: n, file: nullptr); |
785 | s->isUsedInRegularObj = true; |
786 | if (wasInserted || isa<Undefined>(Val: s) || s->isLazy()) { |
787 | replaceSymbol<DefinedImportData>(s, arg&: n, arg&: f); |
788 | return s; |
789 | } |
790 | |
791 | reportDuplicate(existing: s, newFile: f); |
792 | return nullptr; |
793 | } |
794 | |
795 | Symbol *SymbolTable::addImportThunk(StringRef name, DefinedImportData *id, |
796 | uint16_t machine) { |
797 | auto [s, wasInserted] = insert(name, file: nullptr); |
798 | s->isUsedInRegularObj = true; |
799 | if (wasInserted || isa<Undefined>(Val: s) || s->isLazy()) { |
800 | replaceSymbol<DefinedImportThunk>(s, arg&: ctx, arg&: name, arg&: id, arg&: machine); |
801 | return s; |
802 | } |
803 | |
804 | reportDuplicate(existing: s, newFile: id->file); |
805 | return nullptr; |
806 | } |
807 | |
808 | void SymbolTable::addLibcall(StringRef name) { |
809 | Symbol *sym = findUnderscore(name); |
810 | if (!sym) |
811 | return; |
812 | |
813 | if (auto *l = dyn_cast<LazyArchive>(Val: sym)) { |
814 | MemoryBufferRef mb = l->getMemberBuffer(); |
815 | if (isBitcode(mb)) |
816 | addUndefined(name: sym->getName()); |
817 | } else if (LazyObject *o = dyn_cast<LazyObject>(Val: sym)) { |
818 | if (isBitcode(mb: o->file->mb)) |
819 | addUndefined(name: sym->getName()); |
820 | } |
821 | } |
822 | |
823 | std::vector<Chunk *> SymbolTable::getChunks() const { |
824 | std::vector<Chunk *> res; |
825 | for (ObjFile *file : ctx.objFileInstances) { |
826 | ArrayRef<Chunk *> v = file->getChunks(); |
827 | res.insert(position: res.end(), first: v.begin(), last: v.end()); |
828 | } |
829 | return res; |
830 | } |
831 | |
832 | Symbol *SymbolTable::find(StringRef name) const { |
833 | return symMap.lookup(Val: CachedHashStringRef(name)); |
834 | } |
835 | |
836 | Symbol *SymbolTable::findUnderscore(StringRef name) const { |
837 | if (ctx.config.machine == I386) |
838 | return find(name: ("_" + name).str()); |
839 | return find(name); |
840 | } |
841 | |
842 | // Return all symbols that start with Prefix, possibly ignoring the first |
843 | // character of Prefix or the first character symbol. |
844 | std::vector<Symbol *> SymbolTable::getSymsWithPrefix(StringRef prefix) { |
845 | std::vector<Symbol *> syms; |
846 | for (auto pair : symMap) { |
847 | StringRef name = pair.first.val(); |
848 | if (name.starts_with(Prefix: prefix) || name.starts_with(Prefix: prefix.drop_front()) || |
849 | name.drop_front().starts_with(Prefix: prefix) || |
850 | name.drop_front().starts_with(Prefix: prefix.drop_front())) { |
851 | syms.push_back(x: pair.second); |
852 | } |
853 | } |
854 | return syms; |
855 | } |
856 | |
857 | Symbol *SymbolTable::findMangle(StringRef name) { |
858 | if (Symbol *sym = find(name)) { |
859 | if (auto *u = dyn_cast<Undefined>(Val: sym)) { |
860 | // We're specifically looking for weak aliases that ultimately resolve to |
861 | // defined symbols, hence the call to getWeakAlias() instead of just using |
862 | // the weakAlias member variable. This matches link.exe's behavior. |
863 | if (Symbol *weakAlias = u->getWeakAlias()) |
864 | return weakAlias; |
865 | } else { |
866 | return sym; |
867 | } |
868 | } |
869 | |
870 | // Efficient fuzzy string lookup is impossible with a hash table, so iterate |
871 | // the symbol table once and collect all possibly matching symbols into this |
872 | // vector. Then compare each possibly matching symbol with each possible |
873 | // mangling. |
874 | std::vector<Symbol *> syms = getSymsWithPrefix(prefix: name); |
875 | auto findByPrefix = [&syms](const Twine &t) -> Symbol * { |
876 | std::string prefix = t.str(); |
877 | for (auto *s : syms) |
878 | if (s->getName().starts_with(Prefix: prefix)) |
879 | return s; |
880 | return nullptr; |
881 | }; |
882 | |
883 | // For non-x86, just look for C++ functions. |
884 | if (ctx.config.machine != I386) |
885 | return findByPrefix("?" + name + "@@Y" ); |
886 | |
887 | if (!name.starts_with(Prefix: "_" )) |
888 | return nullptr; |
889 | // Search for x86 stdcall function. |
890 | if (Symbol *s = findByPrefix(name + "@" )) |
891 | return s; |
892 | // Search for x86 fastcall function. |
893 | if (Symbol *s = findByPrefix("@" + name.substr(Start: 1) + "@" )) |
894 | return s; |
895 | // Search for x86 vectorcall function. |
896 | if (Symbol *s = findByPrefix(name.substr(Start: 1) + "@@" )) |
897 | return s; |
898 | // Search for x86 C++ non-member function. |
899 | return findByPrefix("?" + name.substr(Start: 1) + "@@Y" ); |
900 | } |
901 | |
902 | Symbol *SymbolTable::addUndefined(StringRef name) { |
903 | return addUndefined(name, f: nullptr, isWeakAlias: false); |
904 | } |
905 | |
906 | void SymbolTable::compileBitcodeFiles() { |
907 | ltoCompilationDone = true; |
908 | if (ctx.bitcodeFileInstances.empty()) |
909 | return; |
910 | |
911 | llvm::TimeTraceScope timeScope("Compile bitcode" ); |
912 | ScopedTimer t(ctx.ltoTimer); |
913 | lto.reset(p: new BitcodeCompiler(ctx)); |
914 | for (BitcodeFile *f : ctx.bitcodeFileInstances) |
915 | lto->add(f&: *f); |
916 | for (InputFile *newObj : lto->compile()) { |
917 | ObjFile *obj = cast<ObjFile>(Val: newObj); |
918 | obj->parse(); |
919 | ctx.objFileInstances.push_back(x: obj); |
920 | } |
921 | } |
922 | |
923 | } // namespace lld::coff |
924 | |