1 | //===-- gsymutil.cpp - GSYM dumping and creation utility for llvm ---------===// |
2 | // |
3 | // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. |
4 | // See https://llvm.org/LICENSE.txt for license information. |
5 | // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception |
6 | // |
7 | //===----------------------------------------------------------------------===// |
8 | |
9 | #include "llvm/ADT/STLExtras.h" |
10 | #include "llvm/DebugInfo/DIContext.h" |
11 | #include "llvm/DebugInfo/DWARF/DWARFContext.h" |
12 | #include "llvm/DebugInfo/GSYM/CallSiteInfo.h" |
13 | #include "llvm/Object/Archive.h" |
14 | #include "llvm/Object/ELFObjectFile.h" |
15 | #include "llvm/Object/MachOUniversal.h" |
16 | #include "llvm/Object/ObjectFile.h" |
17 | #include "llvm/Option/ArgList.h" |
18 | #include "llvm/Option/Option.h" |
19 | #include "llvm/Support/CommandLine.h" |
20 | #include "llvm/Support/Debug.h" |
21 | #include "llvm/Support/Format.h" |
22 | #include "llvm/Support/JSON.h" |
23 | #include "llvm/Support/LLVMDriver.h" |
24 | #include "llvm/Support/ManagedStatic.h" |
25 | #include "llvm/Support/MemoryBuffer.h" |
26 | #include "llvm/Support/PrettyStackTrace.h" |
27 | #include "llvm/Support/Regex.h" |
28 | #include "llvm/Support/Signals.h" |
29 | #include "llvm/Support/TargetSelect.h" |
30 | #include "llvm/Support/raw_ostream.h" |
31 | #include "llvm/TargetParser/Triple.h" |
32 | #include <algorithm> |
33 | #include <cstring> |
34 | #include <inttypes.h> |
35 | #include <iostream> |
36 | #include <optional> |
37 | #include <string> |
38 | #include <system_error> |
39 | #include <vector> |
40 | |
41 | #include "llvm/DebugInfo/GSYM/DwarfTransformer.h" |
42 | #include "llvm/DebugInfo/GSYM/FunctionInfo.h" |
43 | #include "llvm/DebugInfo/GSYM/GsymCreator.h" |
44 | #include "llvm/DebugInfo/GSYM/GsymReader.h" |
45 | #include "llvm/DebugInfo/GSYM/InlineInfo.h" |
46 | #include "llvm/DebugInfo/GSYM/LookupResult.h" |
47 | #include "llvm/DebugInfo/GSYM/ObjectFileTransformer.h" |
48 | #include "llvm/DebugInfo/GSYM/OutputAggregator.h" |
49 | |
50 | using namespace llvm; |
51 | using namespace gsym; |
52 | using namespace object; |
53 | |
54 | /// @} |
55 | /// Command line options. |
56 | /// @{ |
57 | |
58 | using namespace llvm::opt; |
/// Identifiers for the command line options understood by this tool. Apart
/// from OPT_INVALID, the enumerators are produced by expanding the OPTION
/// macro over the entries of the included "Opts.inc".
enum ID {
  OPT_INVALID = 0, // This is not an option ID.
// Each OPTION(...) entry in "Opts.inc" expands to one enumerator.
#define OPTION(...) LLVM_MAKE_OPT_ID(__VA_ARGS__),
#include "Opts.inc"
#undef OPTION
};
65 | |
// Re-include "Opts.inc" with OPTTABLE_STR_TABLE_CODE defined. Presumably this
// emits the OptionStrTable handed to GenericOptTable by GSYMUtilOptTable --
// confirm against the generated file.
#define OPTTABLE_STR_TABLE_CODE
#include "Opts.inc"
#undef OPTTABLE_STR_TABLE_CODE

// Re-include "Opts.inc" with OPTTABLE_PREFIXES_TABLE_CODE defined. Presumably
// this emits the OptionPrefixesTable used by GSYMUtilOptTable -- confirm
// against the generated file.
#define OPTTABLE_PREFIXES_TABLE_CODE
#include "Opts.inc"
#undef OPTTABLE_PREFIXES_TABLE_CODE

/// One OptTable::Info record per OPTION(...) entry in "Opts.inc"; passed to
/// GenericOptTable by GSYMUtilOptTable.
const opt::OptTable::Info InfoTable[] = {
#define OPTION(...) LLVM_CONSTRUCT_OPT_INFO(__VA_ARGS__),
#include "Opts.inc"
#undef OPTION
};
79 | |
80 | class GSYMUtilOptTable : public llvm::opt::GenericOptTable { |
81 | public: |
82 | GSYMUtilOptTable() |
83 | : GenericOptTable(OptionStrTable, OptionPrefixesTable, InfoTable) { |
84 | setGroupedShortOptions(true); |
85 | } |
86 | }; |
87 | |
// Option state filled in by parseArgs() and read by the rest of this file.

// Set when OPT_verbose is present; doLookup() then also dumps the full
// FunctionInfo for a looked-up address.
static bool Verbose;
// Positional inputs (OPT_INPUT): the GSYM files to dump or search.
static std::vector<std::string> InputFilenames;
// Value of OPT_convert_EQ; a non-empty value selects conversion mode in main.
static std::string ConvertFilename;
// Values of OPT_arch_EQ; consulted by filterArch().
static std::vector<std::string> ArchFilters;
// Value of OPT_out_file_EQ; when empty, convertFileToGSYM() falls back to
// ConvertFilename with ".gsym" appended.
static std::string OutputFilename;
// Value of OPT_json_summary_file_EQ; when non-empty, main writes the
// aggregated error counts there as JSON.
static std::string JsonSummaryFile;
// Set when OPT_verify is present; handleObjectFile() then verifies the saved
// GSYM against the DWARF.
static bool Verify;
// Value of --num-threads; zero makes handleObjectFile() use
// std::thread::hardware_concurrency().
static unsigned NumThreads;
// Value of --segment-size; only forwarded to GsymCreator::save() when > 0.
static uint64_t SegmentSize;
// Set when OPT_quiet is present; passed to the GsymCreator constructor.
static bool Quiet;
// Values of --address, parsed as integers.
static std::vector<uint64_t> LookupAddresses;
// Set when --addresses-from-stdin is present; main then reads
// "<address> <gsym path>" lines from standard input.
static bool LookupAddressesFromStdin;
// Set when --merged-functions is present; affects both conversion
// (prepareMergedFunctions) and lookup (lookupAll instead of lookup).
static bool UseMergedFunctions = false;
// Set when OPT_dwarf_callsites is present; passed to DwarfTransformer.
static bool LoadDwarfCallSites = false;
// Value of --callsites-yaml-file; when non-empty, call sites are loaded from
// this YAML file during conversion.
static std::string CallSiteYamlPath;
// Values of --merged-functions-filter; used as regular expressions matched
// against function names in doLookup().
static std::vector<std::string> MergedFunctionsFilters;
104 | |
105 | static void parseArgs(int argc, char **argv) { |
106 | GSYMUtilOptTable Tbl; |
107 | llvm::StringRef ToolName = argv[0]; |
108 | llvm::BumpPtrAllocator A; |
109 | llvm::StringSaver Saver{A}; |
110 | llvm::opt::InputArgList Args = |
111 | Tbl.parseArgs(Argc: argc, Argv: argv, Unknown: OPT_UNKNOWN, Saver, ErrorFn: [&](StringRef Msg) { |
112 | llvm::errs() << Msg << '\n'; |
113 | std::exit(status: 1); |
114 | }); |
115 | if (Args.hasArg(Ids: OPT_help)) { |
116 | const char *Overview = |
117 | "A tool for dumping, searching and creating GSYM files.\n\n" |
118 | "Specify one or more GSYM paths as arguments to dump all of the " |
119 | "information in each GSYM file.\n" |
120 | "Specify a single GSYM file along with one or more --lookup options to " |
121 | "lookup addresses within that GSYM file.\n" |
122 | "Use the --convert option to specify a file with option --out-file " |
123 | "option to convert to GSYM format.\n" ; |
124 | |
125 | Tbl.printHelp(OS&: llvm::outs(), Usage: "llvm-gsymutil [options] <input GSYM files>" , |
126 | Title: Overview); |
127 | std::exit(status: 0); |
128 | } |
129 | if (Args.hasArg(Ids: OPT_version)) { |
130 | llvm::outs() << ToolName << '\n'; |
131 | cl::PrintVersionMessage(); |
132 | std::exit(status: 0); |
133 | } |
134 | |
135 | Verbose = Args.hasArg(Ids: OPT_verbose); |
136 | |
137 | for (const llvm::opt::Arg *A : Args.filtered(Ids: OPT_INPUT)) |
138 | InputFilenames.emplace_back(args: A->getValue()); |
139 | |
140 | if (const llvm::opt::Arg *A = Args.getLastArg(Ids: OPT_convert_EQ)) |
141 | ConvertFilename = A->getValue(); |
142 | |
143 | for (const llvm::opt::Arg *A : Args.filtered(Ids: OPT_arch_EQ)) |
144 | ArchFilters.emplace_back(args: A->getValue()); |
145 | |
146 | if (const llvm::opt::Arg *A = Args.getLastArg(Ids: OPT_out_file_EQ)) |
147 | OutputFilename = A->getValue(); |
148 | |
149 | if (const llvm::opt::Arg *A = Args.getLastArg(Ids: OPT_json_summary_file_EQ)) |
150 | JsonSummaryFile = A->getValue(); |
151 | |
152 | Verify = Args.hasArg(Ids: OPT_verify); |
153 | |
154 | if (const llvm::opt::Arg *A = Args.getLastArg(Ids: OPT_num_threads_EQ)) { |
155 | StringRef S{A->getValue()}; |
156 | if (!llvm::to_integer(S, Num&: NumThreads, Base: 0)) { |
157 | llvm::errs() << ToolName << ": for the --num-threads option: '" << S |
158 | << "' value invalid for uint argument!\n" ; |
159 | std::exit(status: 1); |
160 | } |
161 | } |
162 | |
163 | if (const llvm::opt::Arg *A = Args.getLastArg(Ids: OPT_segment_size_EQ)) { |
164 | StringRef S{A->getValue()}; |
165 | if (!llvm::to_integer(S, Num&: SegmentSize, Base: 0)) { |
166 | llvm::errs() << ToolName << ": for the --segment-size option: '" << S |
167 | << "' value invalid for uint argument!\n" ; |
168 | std::exit(status: 1); |
169 | } |
170 | } |
171 | |
172 | Quiet = Args.hasArg(Ids: OPT_quiet); |
173 | |
174 | for (const llvm::opt::Arg *A : Args.filtered(Ids: OPT_address_EQ)) { |
175 | StringRef S{A->getValue()}; |
176 | if (!llvm::to_integer(S, Num&: LookupAddresses.emplace_back(), Base: 0)) { |
177 | llvm::errs() << ToolName << ": for the --address option: '" << S |
178 | << "' value invalid for uint argument!\n" ; |
179 | std::exit(status: 1); |
180 | } |
181 | } |
182 | |
183 | LookupAddressesFromStdin = Args.hasArg(Ids: OPT_addresses_from_stdin); |
184 | UseMergedFunctions = Args.hasArg(Ids: OPT_merged_functions); |
185 | |
186 | if (Args.hasArg(Ids: OPT_callsites_yaml_file_EQ)) { |
187 | CallSiteYamlPath = Args.getLastArgValue(Id: OPT_callsites_yaml_file_EQ); |
188 | if (CallSiteYamlPath.empty()) { |
189 | llvm::errs() |
190 | << ToolName |
191 | << ": --callsites-yaml-file option requires a non-empty argument.\n" ; |
192 | std::exit(status: 1); |
193 | } |
194 | } |
195 | |
196 | LoadDwarfCallSites = Args.hasArg(Ids: OPT_dwarf_callsites); |
197 | |
198 | for (const llvm::opt::Arg *A : |
199 | Args.filtered(Ids: OPT_merged_functions_filter_EQ)) { |
200 | MergedFunctionsFilters.push_back(x: A->getValue()); |
201 | // Validate the filter is only used with correct flags |
202 | if (LookupAddresses.empty() && !LookupAddressesFromStdin) { |
203 | llvm::errs() << ToolName |
204 | << ": --merged-functions-filter can only be used with " |
205 | "--address/--addresses-from-stdin\n" ; |
206 | std::exit(status: 1); |
207 | } |
208 | if (!UseMergedFunctions) { |
209 | llvm::errs() |
210 | << ToolName |
211 | << ": --merged-functions-filter requires --merged-functions\n" ; |
212 | std::exit(status: 1); |
213 | } |
214 | } |
215 | } |
216 | |
217 | /// @} |
218 | //===----------------------------------------------------------------------===// |
219 | |
220 | static void error(Error Err) { |
221 | if (!Err) |
222 | return; |
223 | WithColor::error() << toString(E: std::move(Err)) << "\n" ; |
224 | exit(status: 1); |
225 | } |
226 | |
227 | static void error(StringRef Prefix, llvm::Error Err) { |
228 | if (!Err) |
229 | return; |
230 | errs() << Prefix << ": " << Err << "\n" ; |
231 | consumeError(Err: std::move(Err)); |
232 | exit(status: 1); |
233 | } |
234 | |
235 | static void error(StringRef Prefix, std::error_code EC) { |
236 | if (!EC) |
237 | return; |
238 | errs() << Prefix << ": " << EC.message() << "\n" ; |
239 | exit(status: 1); |
240 | } |
241 | |
242 | static uint32_t getCPUType(MachOObjectFile &MachO) { |
243 | if (MachO.is64Bit()) |
244 | return MachO.getHeader64().cputype; |
245 | else |
246 | return MachO.getHeader().cputype; |
247 | } |
248 | |
249 | /// Return true if the object file has not been filtered by an --arch option. |
250 | static bool filterArch(MachOObjectFile &Obj) { |
251 | if (ArchFilters.empty()) |
252 | return true; |
253 | |
254 | Triple ObjTriple(Obj.getArchTriple()); |
255 | StringRef ObjArch = ObjTriple.getArchName(); |
256 | |
257 | for (StringRef Arch : ArchFilters) { |
258 | // Match name. |
259 | if (Arch == ObjArch) |
260 | return true; |
261 | |
262 | // Match architecture number. |
263 | unsigned Value; |
264 | if (!Arch.getAsInteger(Radix: 0, Result&: Value)) |
265 | if (Value == getCPUType(MachO&: Obj)) |
266 | return true; |
267 | } |
268 | return false; |
269 | } |
270 | |
271 | /// Determine the virtual address that is considered the base address of an ELF |
272 | /// object file. |
273 | /// |
274 | /// The base address of an ELF file is the "p_vaddr" of the first program |
275 | /// header whose "p_type" is PT_LOAD. |
276 | /// |
277 | /// \param ELFFile An ELF object file we will search. |
278 | /// |
279 | /// \returns A valid image base address if we are able to extract one. |
280 | template <class ELFT> |
281 | static std::optional<uint64_t> |
282 | getImageBaseAddress(const object::ELFFile<ELFT> &ELFFile) { |
283 | auto PhdrRangeOrErr = ELFFile.program_headers(); |
284 | if (!PhdrRangeOrErr) { |
285 | consumeError(PhdrRangeOrErr.takeError()); |
286 | return std::nullopt; |
287 | } |
288 | for (const typename ELFT::Phdr &Phdr : *PhdrRangeOrErr) |
289 | if (Phdr.p_type == ELF::PT_LOAD) |
290 | return (uint64_t)Phdr.p_vaddr; |
291 | return std::nullopt; |
292 | } |
293 | |
294 | /// Determine the virtual address that is considered the base address of mach-o |
295 | /// object file. |
296 | /// |
297 | /// The base address of a mach-o file is the vmaddr of the "__TEXT" segment. |
298 | /// |
299 | /// \param MachO A mach-o object file we will search. |
300 | /// |
301 | /// \returns A valid image base address if we are able to extract one. |
302 | static std::optional<uint64_t> |
303 | getImageBaseAddress(const object::MachOObjectFile *MachO) { |
304 | for (const auto &Command : MachO->load_commands()) { |
305 | if (Command.C.cmd == MachO::LC_SEGMENT) { |
306 | MachO::segment_command SLC = MachO->getSegmentLoadCommand(L: Command); |
307 | StringRef SegName = SLC.segname; |
308 | if (SegName == "__TEXT" ) |
309 | return SLC.vmaddr; |
310 | } else if (Command.C.cmd == MachO::LC_SEGMENT_64) { |
311 | MachO::segment_command_64 SLC = MachO->getSegment64LoadCommand(L: Command); |
312 | StringRef SegName = SLC.segname; |
313 | if (SegName == "__TEXT" ) |
314 | return SLC.vmaddr; |
315 | } |
316 | } |
317 | return std::nullopt; |
318 | } |
319 | |
320 | /// Determine the virtual address that is considered the base address of an |
321 | /// object file. |
322 | /// |
323 | /// Since GSYM files are used for symbolication, many clients will need to |
324 | /// easily adjust addresses they find in stack traces so the lookups happen |
325 | /// on unslid addresses from the original object file. If the base address of |
326 | /// a GSYM file is set to the base address of the image, then this address |
327 | /// adjusting is much easier. |
328 | /// |
329 | /// \param Obj An object file we will search. |
330 | /// |
331 | /// \returns A valid image base address if we are able to extract one. |
332 | static std::optional<uint64_t> getImageBaseAddress(object::ObjectFile &Obj) { |
333 | if (const auto *MachO = dyn_cast<object::MachOObjectFile>(Val: &Obj)) |
334 | return getImageBaseAddress(MachO); |
335 | else if (const auto *ELFObj = dyn_cast<object::ELF32LEObjectFile>(Val: &Obj)) |
336 | return getImageBaseAddress(ELFFile: ELFObj->getELFFile()); |
337 | else if (const auto *ELFObj = dyn_cast<object::ELF32BEObjectFile>(Val: &Obj)) |
338 | return getImageBaseAddress(ELFFile: ELFObj->getELFFile()); |
339 | else if (const auto *ELFObj = dyn_cast<object::ELF64LEObjectFile>(Val: &Obj)) |
340 | return getImageBaseAddress(ELFFile: ELFObj->getELFFile()); |
341 | else if (const auto *ELFObj = dyn_cast<object::ELF64BEObjectFile>(Val: &Obj)) |
342 | return getImageBaseAddress(ELFFile: ELFObj->getELFFile()); |
343 | return std::nullopt; |
344 | } |
345 | |
346 | static llvm::Error handleObjectFile(ObjectFile &Obj, const std::string &OutFile, |
347 | OutputAggregator &Out) { |
348 | auto ThreadCount = |
349 | NumThreads > 0 ? NumThreads : std::thread::hardware_concurrency(); |
350 | |
351 | GsymCreator Gsym(Quiet); |
352 | |
353 | // See if we can figure out the base address for a given object file, and if |
354 | // we can, then set the base address to use to this value. This will ease |
355 | // symbolication since clients can slide the GSYM lookup addresses by using |
356 | // the load bias of the shared library. |
357 | if (auto ImageBaseAddr = getImageBaseAddress(Obj)) |
358 | Gsym.setBaseAddress(*ImageBaseAddr); |
359 | |
360 | // We need to know where the valid sections are that contain instructions. |
361 | // See header documentation for DWARFTransformer::SetValidTextRanges() for |
362 | // defails. |
363 | AddressRanges ; |
364 | for (const object::SectionRef &Sect : Obj.sections()) { |
365 | if (!Sect.isText()) |
366 | continue; |
367 | const uint64_t Size = Sect.getSize(); |
368 | if (Size == 0) |
369 | continue; |
370 | const uint64_t StartAddr = Sect.getAddress(); |
371 | TextRanges.insert(Range: AddressRange(StartAddr, StartAddr + Size)); |
372 | } |
373 | |
374 | // Make sure there is DWARF to convert first. |
375 | std::unique_ptr<DWARFContext> DICtx = DWARFContext::create( |
376 | Obj, |
377 | /*RelocAction=*/DWARFContext::ProcessDebugRelocations::Process, |
378 | L: nullptr, |
379 | /*DWPName=*/"" , |
380 | /*RecoverableErrorHandler=*/WithColor::defaultErrorHandler, |
381 | /*WarningHandler=*/WithColor::defaultWarningHandler, |
382 | /*ThreadSafe*/true); |
383 | if (!DICtx) |
384 | return createStringError(EC: std::errc::invalid_argument, |
385 | Fmt: "unable to create DWARF context" ); |
386 | |
387 | // Make a DWARF transformer object and populate the ranges of the code |
388 | // so we don't end up adding invalid functions to GSYM data. |
389 | DwarfTransformer DT(*DICtx, Gsym, LoadDwarfCallSites); |
390 | if (!TextRanges.empty()) |
391 | Gsym.SetValidTextRanges(TextRanges); |
392 | |
393 | // Convert all DWARF to GSYM. |
394 | if (auto Err = DT.convert(NumThreads: ThreadCount, OS&: Out)) |
395 | return Err; |
396 | |
397 | // If enabled, merge functions with identical address ranges as merged |
398 | // functions in the first FunctionInfo with that address range. Do this right |
399 | // after loading the DWARF data so we don't have to deal with functions from |
400 | // the symbol table. |
401 | if (UseMergedFunctions) |
402 | Gsym.prepareMergedFunctions(Out); |
403 | |
404 | // Get the UUID and convert symbol table to GSYM. |
405 | if (auto Err = ObjectFileTransformer::convert(Obj, Output&: Out, Gsym)) |
406 | return Err; |
407 | |
408 | // If any call site YAML files were specified, load them now. |
409 | if (!CallSiteYamlPath.empty()) |
410 | if (auto Err = Gsym.loadCallSitesFromYAML(YAMLFile: CallSiteYamlPath)) |
411 | return Err; |
412 | |
413 | // Finalize the GSYM to make it ready to save to disk. This will remove |
414 | // duplicate FunctionInfo entries where we might have found an entry from |
415 | // debug info and also a symbol table entry from the object file. |
416 | if (auto Err = Gsym.finalize(OS&: Out)) |
417 | return Err; |
418 | |
419 | // Save the GSYM file to disk. |
420 | llvm::endianness Endian = Obj.makeTriple().isLittleEndian() |
421 | ? llvm::endianness::little |
422 | : llvm::endianness::big; |
423 | |
424 | std::optional<uint64_t> OptSegmentSize; |
425 | if (SegmentSize > 0) |
426 | OptSegmentSize = SegmentSize; |
427 | if (auto Err = Gsym.save(Path: OutFile, ByteOrder: Endian, SegmentSize: OptSegmentSize)) |
428 | return Err; |
429 | |
430 | // Verify the DWARF if requested. This will ensure all the info in the DWARF |
431 | // can be looked up in the GSYM and that all lookups get matching data. |
432 | if (Verify) { |
433 | if (auto Err = DT.verify(GsymPath: OutFile, OS&: Out)) |
434 | return Err; |
435 | } |
436 | |
437 | return Error::success(); |
438 | } |
439 | |
440 | static llvm::Error handleBuffer(StringRef Filename, MemoryBufferRef Buffer, |
441 | const std::string &OutFile, |
442 | OutputAggregator &Out) { |
443 | Expected<std::unique_ptr<Binary>> BinOrErr = object::createBinary(Source: Buffer); |
444 | error(Prefix: Filename, EC: errorToErrorCode(Err: BinOrErr.takeError())); |
445 | |
446 | if (auto *Obj = dyn_cast<ObjectFile>(Val: BinOrErr->get())) { |
447 | Triple ObjTriple(Obj->makeTriple()); |
448 | auto ArchName = ObjTriple.getArchName(); |
449 | outs() << "Output file (" << ArchName << "): " << OutFile << "\n" ; |
450 | if (auto Err = handleObjectFile(Obj&: *Obj, OutFile, Out)) |
451 | return Err; |
452 | } else if (auto *Fat = dyn_cast<MachOUniversalBinary>(Val: BinOrErr->get())) { |
453 | // Iterate over all contained architectures and filter out any that were |
454 | // not specified with the "--arch <arch>" option. If the --arch option was |
455 | // not specified on the command line, we will process all architectures. |
456 | std::vector<std::unique_ptr<MachOObjectFile>> FilterObjs; |
457 | for (auto &ObjForArch : Fat->objects()) { |
458 | if (auto MachOOrErr = ObjForArch.getAsObjectFile()) { |
459 | auto &Obj = **MachOOrErr; |
460 | if (filterArch(Obj)) |
461 | FilterObjs.emplace_back(args: MachOOrErr->release()); |
462 | } else { |
463 | error(Prefix: Filename, Err: MachOOrErr.takeError()); |
464 | } |
465 | } |
466 | if (FilterObjs.empty()) |
467 | error(Prefix: Filename, Err: createStringError(EC: std::errc::invalid_argument, |
468 | Fmt: "no matching architectures found" )); |
469 | |
470 | // Now handle each architecture we need to convert. |
471 | for (auto &Obj : FilterObjs) { |
472 | Triple ObjTriple(Obj->getArchTriple()); |
473 | auto ArchName = ObjTriple.getArchName(); |
474 | std::string ArchOutFile(OutFile); |
475 | // If we are only handling a single architecture, then we will use the |
476 | // normal output file. If we are handling multiple architectures append |
477 | // the architecture name to the end of the out file path so that we |
478 | // don't overwrite the previous architecture's gsym file. |
479 | if (FilterObjs.size() > 1) { |
480 | ArchOutFile.append(n: 1, c: '.'); |
481 | ArchOutFile.append(str: ArchName.str()); |
482 | } |
483 | outs() << "Output file (" << ArchName << "): " << ArchOutFile << "\n" ; |
484 | if (auto Err = handleObjectFile(Obj&: *Obj, OutFile: ArchOutFile, Out)) |
485 | return Err; |
486 | } |
487 | } |
488 | return Error::success(); |
489 | } |
490 | |
491 | static llvm::Error handleFileConversionToGSYM(StringRef Filename, |
492 | const std::string &OutFile, |
493 | OutputAggregator &Out) { |
494 | ErrorOr<std::unique_ptr<MemoryBuffer>> BuffOrErr = |
495 | MemoryBuffer::getFileOrSTDIN(Filename); |
496 | error(Prefix: Filename, EC: BuffOrErr.getError()); |
497 | std::unique_ptr<MemoryBuffer> Buffer = std::move(BuffOrErr.get()); |
498 | return handleBuffer(Filename, Buffer: *Buffer, OutFile, Out); |
499 | } |
500 | |
501 | static llvm::Error convertFileToGSYM(OutputAggregator &Out) { |
502 | // Expand any .dSYM bundles to the individual object files contained therein. |
503 | std::vector<std::string> Objects; |
504 | std::string OutFile = OutputFilename; |
505 | if (OutFile.empty()) { |
506 | OutFile = ConvertFilename; |
507 | OutFile += ".gsym" ; |
508 | } |
509 | |
510 | Out << "Input file: " << ConvertFilename << "\n" ; |
511 | |
512 | if (auto DsymObjectsOrErr = |
513 | MachOObjectFile::findDsymObjectMembers(Path: ConvertFilename)) { |
514 | if (DsymObjectsOrErr->empty()) |
515 | Objects.push_back(x: ConvertFilename); |
516 | else |
517 | llvm::append_range(C&: Objects, R&: *DsymObjectsOrErr); |
518 | } else { |
519 | error(Err: DsymObjectsOrErr.takeError()); |
520 | } |
521 | |
522 | for (StringRef Object : Objects) |
523 | if (Error Err = handleFileConversionToGSYM(Filename: Object, OutFile, Out)) |
524 | return Err; |
525 | return Error::success(); |
526 | } |
527 | |
528 | static void doLookup(GsymReader &Gsym, uint64_t Addr, raw_ostream &OS) { |
529 | if (UseMergedFunctions) { |
530 | if (auto Results = Gsym.lookupAll(Addr)) { |
531 | // If we have filters, count matching results first |
532 | size_t NumMatching = Results->size(); |
533 | if (!MergedFunctionsFilters.empty()) { |
534 | NumMatching = 0; |
535 | for (const auto &Result : *Results) { |
536 | bool Matches = false; |
537 | for (const auto &Filter : MergedFunctionsFilters) { |
538 | Regex Pattern(Filter); |
539 | if (Pattern.match(String: Result.FuncName)) { |
540 | Matches = true; |
541 | break; |
542 | } |
543 | } |
544 | if (Matches) |
545 | NumMatching++; |
546 | } |
547 | } |
548 | |
549 | OS << "Found " << NumMatching << " function" |
550 | << (NumMatching != 1 ? "s" : "" ) << " at address " << HEX64(Addr) |
551 | << ":\n" ; |
552 | |
553 | for (size_t i = 0; i < Results->size(); ++i) { |
554 | // Skip if doesn't match any filter |
555 | if (!MergedFunctionsFilters.empty()) { |
556 | bool Matches = false; |
557 | for (const auto &Filter : MergedFunctionsFilters) { |
558 | Regex Pattern(Filter); |
559 | if (Pattern.match(String: Results->at(n: i).FuncName)) { |
560 | Matches = true; |
561 | break; |
562 | } |
563 | } |
564 | if (!Matches) |
565 | continue; |
566 | } |
567 | |
568 | OS << " " << Results->at(n: i); |
569 | |
570 | if (i != Results->size() - 1) |
571 | OS << "\n" ; |
572 | } |
573 | } |
574 | } else { /* UseMergedFunctions == false */ |
575 | if (auto Result = Gsym.lookup(Addr)) { |
576 | // If verbose is enabled dump the full function info for the address. |
577 | if (Verbose) { |
578 | if (auto FI = Gsym.getFunctionInfo(Addr)) { |
579 | OS << "FunctionInfo for " << HEX64(Addr) << ":\n" ; |
580 | Gsym.dump(OS, FI: *FI); |
581 | OS << "\nLookupResult for " << HEX64(Addr) << ":\n" ; |
582 | } |
583 | } |
584 | // Don't print call site info if --merged-functions is not specified. |
585 | Result->CallSiteFuncRegex.clear(); |
586 | OS << Result.get(); |
587 | } else { |
588 | if (Verbose) |
589 | OS << "\nLookupResult for " << HEX64(Addr) << ":\n" ; |
590 | OS << HEX64(Addr) << ": " ; |
591 | logAllUnhandledErrors(E: Result.takeError(), OS, ErrorBanner: "error: " ); |
592 | } |
593 | if (Verbose) |
594 | OS << "\n" ; |
595 | } |
596 | } |
597 | |
598 | int llvm_gsymutil_main(int argc, char **argv, const llvm::ToolContext &) { |
599 | // Print a stack trace if we signal out. |
600 | sys::PrintStackTraceOnErrorSignal(Argv0: argv[0]); |
601 | PrettyStackTraceProgram X(argc, argv); |
602 | llvm_shutdown_obj Y; // Call llvm_shutdown() on exit. |
603 | |
604 | llvm::InitializeAllTargets(); |
605 | |
606 | parseArgs(argc, argv); |
607 | |
608 | raw_ostream &OS = outs(); |
609 | |
610 | OutputAggregator Aggregation(&OS); |
611 | if (!ConvertFilename.empty()) { |
612 | // Convert DWARF to GSYM |
613 | if (!InputFilenames.empty()) { |
614 | OS << "error: no input files can be specified when using the --convert " |
615 | "option.\n" ; |
616 | return 1; |
617 | } |
618 | // Call error() if we have an error and it will exit with a status of 1 |
619 | if (auto Err = convertFileToGSYM(Out&: Aggregation)) |
620 | error(Prefix: "DWARF conversion failed: " , Err: std::move(Err)); |
621 | |
622 | // Report the errors from aggregator: |
623 | Aggregation.EnumerateResults(handleCounts: [&](StringRef category, unsigned count) { |
624 | OS << category << " occurred " << count << " time(s)\n" ; |
625 | }); |
626 | if (!JsonSummaryFile.empty()) { |
627 | std::error_code EC; |
628 | raw_fd_ostream JsonStream(JsonSummaryFile, EC, sys::fs::OF_Text); |
629 | if (EC) { |
630 | OS << "error opening aggregate error json file '" << JsonSummaryFile |
631 | << "' for writing: " << EC.message() << '\n'; |
632 | return 1; |
633 | } |
634 | |
635 | llvm::json::Object Categories; |
636 | uint64_t ErrorCount = 0; |
637 | Aggregation.EnumerateResults(handleCounts: [&](StringRef Category, unsigned Count) { |
638 | llvm::json::Object Val; |
639 | Val.try_emplace(K: "count" , Args&: Count); |
640 | Categories.try_emplace(K: Category, Args: std::move(Val)); |
641 | ErrorCount += Count; |
642 | }); |
643 | llvm::json::Object RootNode; |
644 | RootNode.try_emplace(K: "error-categories" , Args: std::move(Categories)); |
645 | RootNode.try_emplace(K: "error-count" , Args&: ErrorCount); |
646 | |
647 | JsonStream << llvm::json::Value(std::move(RootNode)); |
648 | } |
649 | return 0; |
650 | } |
651 | |
652 | if (LookupAddressesFromStdin) { |
653 | if (!LookupAddresses.empty() || !InputFilenames.empty()) { |
654 | OS << "error: no input files or addresses can be specified when using " |
655 | "the --addresses-from-stdin " |
656 | "option.\n" ; |
657 | return 1; |
658 | } |
659 | |
660 | std::string InputLine; |
661 | std::string CurrentGSYMPath; |
662 | std::optional<Expected<GsymReader>> CurrentGsym; |
663 | |
664 | while (std::getline(is&: std::cin, str&: InputLine)) { |
665 | // Strip newline characters. |
666 | std::string StrippedInputLine(InputLine); |
667 | llvm::erase_if(C&: StrippedInputLine, |
668 | P: [](char c) { return c == '\r' || c == '\n'; }); |
669 | |
670 | StringRef AddrStr, GSYMPath; |
671 | std::tie(args&: AddrStr, args&: GSYMPath) = |
672 | llvm::StringRef{StrippedInputLine}.split(Separator: ' '); |
673 | |
674 | if (GSYMPath != CurrentGSYMPath) { |
675 | CurrentGsym = GsymReader::openFile(Path: GSYMPath); |
676 | if (!*CurrentGsym) |
677 | error(Prefix: GSYMPath, Err: CurrentGsym->takeError()); |
678 | CurrentGSYMPath = GSYMPath; |
679 | } |
680 | |
681 | uint64_t Addr; |
682 | if (AddrStr.getAsInteger(Radix: 0, Result&: Addr)) { |
683 | OS << "error: invalid address " << AddrStr |
684 | << ", expected: Address GsymFile.\n" ; |
685 | return 1; |
686 | } |
687 | |
688 | doLookup(Gsym&: **CurrentGsym, Addr, OS); |
689 | |
690 | OS << "\n" ; |
691 | OS.flush(); |
692 | } |
693 | |
694 | return EXIT_SUCCESS; |
695 | } |
696 | |
697 | // Dump or access data inside GSYM files |
698 | for (const auto &GSYMPath : InputFilenames) { |
699 | auto Gsym = GsymReader::openFile(Path: GSYMPath); |
700 | if (!Gsym) |
701 | error(Prefix: GSYMPath, Err: Gsym.takeError()); |
702 | |
703 | if (LookupAddresses.empty()) { |
704 | Gsym->dump(OS&: outs()); |
705 | continue; |
706 | } |
707 | |
708 | // Lookup an address in a GSYM file and print any matches. |
709 | OS << "Looking up addresses in \"" << GSYMPath << "\":\n" ; |
710 | for (auto Addr : LookupAddresses) { |
711 | doLookup(Gsym&: *Gsym, Addr, OS); |
712 | } |
713 | } |
714 | return EXIT_SUCCESS; |
715 | } |
716 | |