| 1 | //===- SymbolTable.h --------------------------------------------*- C++ -*-===// |
| 2 | // |
| 3 | // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. |
| 4 | // See https://llvm.org/LICENSE.txt for license information. |
| 5 | // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception |
| 6 | // |
| 7 | //===----------------------------------------------------------------------===// |
| 8 | |
| 9 | #ifndef LLD_COFF_SYMBOL_TABLE_H |
| 10 | #define LLD_COFF_SYMBOL_TABLE_H |
| 11 | |
| 12 | #include "InputFiles.h" |
| 13 | #include "LTO.h" |
| 14 | #include "llvm/ADT/CachedHashString.h" |
| 15 | #include "llvm/ADT/DenseMap.h" |
| 16 | #include "llvm/ADT/DenseMapInfo.h" |
| 17 | #include "llvm/ADT/SmallPtrSet.h" |
| 18 | #include "llvm/Support/raw_ostream.h" |
| 19 | |
| 20 | namespace llvm { |
| 21 | struct LTOCodeGenerator; |
| 22 | } |
| 23 | |
| 24 | namespace lld::coff { |
| 25 | |
| 26 | class Chunk; |
| 27 | class CommonChunk; |
| 28 | class COFFLinkerContext; |
| 29 | class Defined; |
| 30 | class DefinedAbsolute; |
| 31 | class DefinedRegular; |
| 32 | class ImportThunkChunk; |
| 33 | class LazyArchive; |
| 34 | class SectionChunk; |
| 35 | class Symbol; |
| 36 | |
| 37 | // This data structure is instantiated for each -wrap option. |
| 38 | struct WrappedSymbol { |
| 39 | Symbol *sym; |
| 40 | Symbol *real; |
| 41 | Symbol *wrap; |
| 42 | }; |
| 43 | |
| 44 | struct UndefinedDiag; |
| 45 | |
| 46 | // SymbolTable is a bucket of all known symbols, including defined, |
| 47 | // undefined, or lazy symbols (the last one is symbols in archive |
| 48 | // files whose archive members are not yet loaded). |
| 49 | // |
| 50 | // We put all symbols of all files to a SymbolTable, and the |
| 51 | // SymbolTable selects the "best" symbols if there are name |
| 52 | // conflicts. For example, obviously, a defined symbol is better than |
| 53 | // an undefined symbol. Or, if there's a conflict between a lazy and a |
| 54 | // undefined, it'll read an archive member to read a real definition |
| 55 | // to replace the lazy symbol. The logic is implemented in the |
| 56 | // add*() functions, which are called by input files as they are parsed. |
| 57 | // There is one add* function per symbol type. |
| 58 | class SymbolTable { |
| 59 | public: |
| 60 | SymbolTable(COFFLinkerContext &c, |
| 61 | llvm::COFF::MachineTypes machine = IMAGE_FILE_MACHINE_UNKNOWN) |
| 62 | : ctx(c), machine(machine) {} |
| 63 | |
| 64 | // Emit errors for symbols that cannot be resolved. |
| 65 | void reportUnresolvable(); |
| 66 | |
| 67 | // Try to resolve any undefined symbols and update the symbol table |
| 68 | // accordingly, then print an error message for any remaining undefined |
| 69 | // symbols and warn about imported local symbols. |
| 70 | void resolveRemainingUndefines(); |
| 71 | |
| 72 | // Load lazy objects that are needed for MinGW automatic import and for |
| 73 | // doing stdcall fixups. |
| 74 | void loadMinGWSymbols(); |
| 75 | bool handleMinGWAutomaticImport(Symbol *sym, StringRef name); |
| 76 | |
| 77 | // Returns a symbol for a given name. Returns a nullptr if not found. |
| 78 | Symbol *find(StringRef name) const; |
| 79 | Symbol *findUnderscore(StringRef name) const; |
| 80 | |
| 81 | void addUndefinedGlob(StringRef arg); |
| 82 | |
| 83 | // Occasionally we have to resolve an undefined symbol to its |
| 84 | // mangled symbol. This function tries to find a mangled name |
| 85 | // for U from the symbol table, and if found, set the symbol as |
| 86 | // a weak alias for U. |
| 87 | Symbol *findMangle(StringRef name); |
| 88 | StringRef mangleMaybe(Symbol *s); |
| 89 | |
| 90 | // Symbol names are mangled by prepending "_" on x86. |
| 91 | StringRef mangle(StringRef sym); |
| 92 | |
| 93 | // Windows specific -- "main" is not the only main function in Windows. |
| 94 | // You can choose one from these four -- {w,}{WinMain,main}. |
| 95 | // There are four different entry point functions for them, |
| 96 | // {w,}{WinMain,main}CRTStartup, respectively. The linker needs to |
| 97 | // choose the right one depending on which "main" function is defined. |
| 98 | // This function looks up the symbol table and resolve corresponding |
| 99 | // entry point name. |
| 100 | StringRef findDefaultEntry(); |
| 101 | WindowsSubsystem inferSubsystem(); |
| 102 | |
| 103 | // Build a set of COFF objects representing the combined contents of |
| 104 | // BitcodeFiles and add them to the symbol table. Called after all files are |
| 105 | // added and before the writer writes results to a file. |
| 106 | void compileBitcodeFiles(); |
| 107 | |
| 108 | // Creates an Undefined symbol and marks it as live. |
| 109 | Symbol *addGCRoot(StringRef sym, bool aliasEC = false); |
| 110 | |
| 111 | // Creates an Undefined symbol for a given name. |
| 112 | Symbol *addUndefined(StringRef name); |
| 113 | |
| 114 | Symbol *addSynthetic(StringRef n, Chunk *c); |
| 115 | Symbol *addAbsolute(StringRef n, uint64_t va); |
| 116 | |
| 117 | Symbol *addUndefined(StringRef name, InputFile *f, bool overrideLazy); |
| 118 | void addLazyArchive(ArchiveFile *f, const Archive::Symbol &sym); |
| 119 | void addLazyObject(InputFile *f, StringRef n); |
| 120 | void addLazyDLLSymbol(DLLFile *f, DLLFile::Symbol *sym, StringRef n); |
| 121 | Symbol *addAbsolute(StringRef n, COFFSymbolRef s); |
| 122 | Symbol *addRegular(InputFile *f, StringRef n, |
| 123 | const llvm::object::coff_symbol_generic *s = nullptr, |
| 124 | SectionChunk *c = nullptr, uint32_t sectionOffset = 0, |
| 125 | bool isWeak = false); |
| 126 | std::pair<DefinedRegular *, bool> |
| 127 | addComdat(InputFile *f, StringRef n, |
| 128 | const llvm::object::coff_symbol_generic *s = nullptr); |
| 129 | Symbol *addCommon(InputFile *f, StringRef n, uint64_t size, |
| 130 | const llvm::object::coff_symbol_generic *s = nullptr, |
| 131 | CommonChunk *c = nullptr); |
| 132 | DefinedImportData *addImportData(StringRef n, ImportFile *f, |
| 133 | Chunk *&location); |
| 134 | Defined *addImportThunk(StringRef name, DefinedImportData *s, |
| 135 | ImportThunkChunk *chunk); |
| 136 | void addLibcall(StringRef name); |
| 137 | void addEntryThunk(Symbol *from, Symbol *to); |
| 138 | void addExitThunk(Symbol *from, Symbol *to); |
| 139 | void initializeECThunks(); |
| 140 | |
| 141 | void reportDuplicate(Symbol *existing, InputFile *newFile, |
| 142 | SectionChunk *newSc = nullptr, |
| 143 | uint32_t newSectionOffset = 0); |
| 144 | |
| 145 | COFFLinkerContext &ctx; |
| 146 | llvm::COFF::MachineTypes machine; |
| 147 | |
| 148 | bool isEC() const { return machine == ARM64EC; } |
| 149 | |
| 150 | // An entry point symbol. |
| 151 | Symbol *entry = nullptr; |
| 152 | |
| 153 | // A list of chunks which to be added to .rdata. |
| 154 | std::vector<Chunk *> localImportChunks; |
| 155 | |
| 156 | // A list of EC EXP+ symbols. |
| 157 | std::vector<Symbol *> expSymbols; |
| 158 | |
| 159 | // A list of DLL exports. |
| 160 | std::vector<Export> exports; |
| 161 | llvm::DenseSet<StringRef> directivesExports; |
| 162 | bool hadExplicitExports; |
| 163 | |
| 164 | Chunk *edataStart = nullptr; |
| 165 | Chunk *edataEnd = nullptr; |
| 166 | |
| 167 | Symbol *delayLoadHelper = nullptr; |
| 168 | Chunk *tailMergeUnwindInfoChunk = nullptr; |
| 169 | |
| 170 | // A list of wrapped symbols. |
| 171 | std::vector<WrappedSymbol> wrapped; |
| 172 | |
| 173 | // Used for /alternatename. |
| 174 | std::map<StringRef, StringRef> alternateNames; |
| 175 | |
| 176 | // Used for /aligncomm. |
| 177 | std::map<std::string, int> alignComm; |
| 178 | |
| 179 | void fixupExports(); |
| 180 | void assignExportOrdinals(); |
| 181 | void parseModuleDefs(StringRef path); |
| 182 | void parseAlternateName(StringRef); |
| 183 | void parseAligncomm(StringRef); |
| 184 | |
| 185 | // Iterates symbols in non-determinstic hash table order. |
| 186 | template <typename T> void forEachSymbol(T callback) { |
| 187 | for (auto &pair : symMap) |
| 188 | callback(pair.second); |
| 189 | } |
| 190 | |
| 191 | std::vector<BitcodeFile *> bitcodeFileInstances; |
| 192 | |
| 193 | DefinedRegular *loadConfigSym = nullptr; |
| 194 | uint32_t loadConfigSize = 0; |
| 195 | void initializeLoadConfig(); |
| 196 | |
| 197 | std::string printSymbol(Symbol *sym) const; |
| 198 | |
| 199 | private: |
| 200 | /// Given a name without "__imp_" prefix, returns a defined symbol |
| 201 | /// with the "__imp_" prefix, if it exists. |
| 202 | Defined *impSymbol(StringRef name); |
| 203 | /// Inserts symbol if not already present. |
| 204 | std::pair<Symbol *, bool> insert(StringRef name); |
| 205 | /// Same as insert(Name), but also sets isUsedInRegularObj. |
| 206 | std::pair<Symbol *, bool> insert(StringRef name, InputFile *f); |
| 207 | |
| 208 | bool findUnderscoreMangle(StringRef sym); |
| 209 | std::vector<Symbol *> getSymsWithPrefix(StringRef prefix); |
| 210 | |
| 211 | llvm::DenseMap<llvm::CachedHashStringRef, Symbol *> symMap; |
| 212 | std::unique_ptr<BitcodeCompiler> lto; |
| 213 | std::vector<std::pair<Symbol *, Symbol *>> entryThunks; |
| 214 | llvm::DenseMap<Symbol *, Symbol *> exitThunks; |
| 215 | |
| 216 | void |
| 217 | reportProblemSymbols(const llvm::SmallPtrSetImpl<Symbol *> &undefs, |
| 218 | const llvm::DenseMap<Symbol *, Symbol *> *localImports, |
| 219 | bool needBitcodeFiles); |
| 220 | void reportUndefinedSymbol(const UndefinedDiag &undefDiag); |
| 221 | }; |
| 222 | |
| 223 | std::vector<std::string> getSymbolLocations(ObjFile *file, uint32_t symIndex); |
| 224 | |
| 225 | StringRef ltrim1(StringRef s, const char *chars); |
| 226 | |
| 227 | } // namespace lld::coff |
| 228 | |
| 229 | #endif |
| 230 | |