1 | //===- CoverageMappingReader.cpp - Code coverage mapping reader -----------===// |
2 | // |
3 | // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. |
4 | // See https://llvm.org/LICENSE.txt for license information. |
5 | // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception |
6 | // |
7 | //===----------------------------------------------------------------------===// |
8 | // |
9 | // This file contains support for reading coverage mapping data for |
10 | // instrumentation based coverage. |
11 | // |
12 | //===----------------------------------------------------------------------===// |
13 | |
14 | #include "llvm/ProfileData/Coverage/CoverageMappingReader.h" |
15 | #include "llvm/ADT/ArrayRef.h" |
16 | #include "llvm/ADT/DenseMap.h" |
17 | #include "llvm/ADT/STLExtras.h" |
18 | #include "llvm/ADT/SmallVector.h" |
19 | #include "llvm/ADT/Statistic.h" |
20 | #include "llvm/ADT/StringRef.h" |
21 | #include "llvm/Object/Archive.h" |
22 | #include "llvm/Object/Binary.h" |
23 | #include "llvm/Object/COFF.h" |
24 | #include "llvm/Object/Error.h" |
25 | #include "llvm/Object/MachOUniversal.h" |
26 | #include "llvm/Object/ObjectFile.h" |
27 | #include "llvm/ProfileData/InstrProf.h" |
28 | #include "llvm/Support/Casting.h" |
29 | #include "llvm/Support/Compression.h" |
30 | #include "llvm/Support/Debug.h" |
31 | #include "llvm/Support/Endian.h" |
32 | #include "llvm/Support/Error.h" |
33 | #include "llvm/Support/ErrorHandling.h" |
34 | #include "llvm/Support/LEB128.h" |
35 | #include "llvm/Support/MathExtras.h" |
36 | #include "llvm/Support/Path.h" |
37 | #include "llvm/Support/raw_ostream.h" |
38 | #include "llvm/TargetParser/Triple.h" |
39 | #include <vector> |
40 | |
41 | using namespace llvm; |
42 | using namespace coverage; |
43 | using namespace object; |
44 | |
45 | #define DEBUG_TYPE "coverage-mapping" |
46 | |
47 | STATISTIC(CovMapNumRecords, "The # of coverage function records" ); |
48 | STATISTIC(CovMapNumUsedRecords, "The # of used coverage function records" ); |
49 | |
50 | void CoverageMappingIterator::increment() { |
51 | if (ReadErr != coveragemap_error::success) |
52 | return; |
53 | |
54 | // Check if all the records were read or if an error occurred while reading |
55 | // the next record. |
56 | if (auto E = Reader->readNextRecord(Record)) |
57 | handleAllErrors(E: std::move(E), Handlers: [&](const CoverageMapError &CME) { |
58 | if (CME.get() == coveragemap_error::eof) |
59 | *this = CoverageMappingIterator(); |
60 | else |
61 | ReadErr = CME.get(); |
62 | }); |
63 | } |
64 | |
65 | Error RawCoverageReader::readULEB128(uint64_t &Result) { |
66 | if (Data.empty()) |
67 | return make_error<CoverageMapError>(Args: coveragemap_error::truncated); |
68 | unsigned N = 0; |
69 | Result = decodeULEB128(p: Data.bytes_begin(), n: &N); |
70 | if (N > Data.size()) |
71 | return make_error<CoverageMapError>(Args: coveragemap_error::malformed, |
72 | Args: "the size of ULEB128 is too big" ); |
73 | Data = Data.substr(Start: N); |
74 | return Error::success(); |
75 | } |
76 | |
77 | Error RawCoverageReader::readIntMax(uint64_t &Result, uint64_t MaxPlus1) { |
78 | if (auto Err = readULEB128(Result)) |
79 | return Err; |
80 | if (Result >= MaxPlus1) |
81 | return make_error<CoverageMapError>( |
82 | Args: coveragemap_error::malformed, |
83 | Args: "the value of ULEB128 is greater than or equal to MaxPlus1" ); |
84 | return Error::success(); |
85 | } |
86 | |
87 | Error RawCoverageReader::readSize(uint64_t &Result) { |
88 | if (auto Err = readULEB128(Result)) |
89 | return Err; |
90 | if (Result > Data.size()) |
91 | return make_error<CoverageMapError>(Args: coveragemap_error::malformed, |
92 | Args: "the value of ULEB128 is too big" ); |
93 | return Error::success(); |
94 | } |
95 | |
96 | Error RawCoverageReader::readString(StringRef &Result) { |
97 | uint64_t Length; |
98 | if (auto Err = readSize(Result&: Length)) |
99 | return Err; |
100 | Result = Data.substr(Start: 0, N: Length); |
101 | Data = Data.substr(Start: Length); |
102 | return Error::success(); |
103 | } |
104 | |
105 | Error RawCoverageFilenamesReader::read(CovMapVersion Version) { |
106 | uint64_t NumFilenames; |
107 | if (auto Err = readSize(Result&: NumFilenames)) |
108 | return Err; |
109 | if (!NumFilenames) |
110 | return make_error<CoverageMapError>(Args: coveragemap_error::malformed, |
111 | Args: "number of filenames is zero" ); |
112 | |
113 | if (Version < CovMapVersion::Version4) |
114 | return readUncompressed(Version, NumFilenames); |
115 | |
116 | // The uncompressed length may exceed the size of the encoded filenames. |
117 | // Skip size validation. |
118 | uint64_t UncompressedLen; |
119 | if (auto Err = readULEB128(Result&: UncompressedLen)) |
120 | return Err; |
121 | |
122 | uint64_t CompressedLen; |
123 | if (auto Err = readSize(Result&: CompressedLen)) |
124 | return Err; |
125 | |
126 | if (CompressedLen > 0) { |
127 | if (!compression::zlib::isAvailable()) |
128 | return make_error<CoverageMapError>( |
129 | Args: coveragemap_error::decompression_failed); |
130 | |
131 | // Allocate memory for the decompressed filenames. |
132 | SmallVector<uint8_t, 0> StorageBuf; |
133 | |
134 | // Read compressed filenames. |
135 | StringRef CompressedFilenames = Data.substr(Start: 0, N: CompressedLen); |
136 | Data = Data.substr(Start: CompressedLen); |
137 | auto Err = compression::zlib::decompress( |
138 | Input: arrayRefFromStringRef(Input: CompressedFilenames), Output&: StorageBuf, |
139 | UncompressedSize: UncompressedLen); |
140 | if (Err) { |
141 | consumeError(Err: std::move(Err)); |
142 | return make_error<CoverageMapError>( |
143 | Args: coveragemap_error::decompression_failed); |
144 | } |
145 | |
146 | RawCoverageFilenamesReader Delegate(toStringRef(Input: StorageBuf), Filenames, |
147 | CompilationDir); |
148 | return Delegate.readUncompressed(Version, NumFilenames); |
149 | } |
150 | |
151 | return readUncompressed(Version, NumFilenames); |
152 | } |
153 | |
154 | Error RawCoverageFilenamesReader::readUncompressed(CovMapVersion Version, |
155 | uint64_t NumFilenames) { |
156 | // Read uncompressed filenames. |
157 | if (Version < CovMapVersion::Version6) { |
158 | for (size_t I = 0; I < NumFilenames; ++I) { |
159 | StringRef Filename; |
160 | if (auto Err = readString(Result&: Filename)) |
161 | return Err; |
162 | Filenames.push_back(x: Filename.str()); |
163 | } |
164 | } else { |
165 | StringRef CWD; |
166 | if (auto Err = readString(Result&: CWD)) |
167 | return Err; |
168 | Filenames.push_back(x: CWD.str()); |
169 | |
170 | for (size_t I = 1; I < NumFilenames; ++I) { |
171 | StringRef Filename; |
172 | if (auto Err = readString(Result&: Filename)) |
173 | return Err; |
174 | if (sys::path::is_absolute(path: Filename)) { |
175 | Filenames.push_back(x: Filename.str()); |
176 | } else { |
177 | SmallString<256> P; |
178 | if (!CompilationDir.empty()) |
179 | P.assign(RHS: CompilationDir); |
180 | else |
181 | P.assign(RHS: CWD); |
182 | llvm::sys::path::append(path&: P, a: Filename); |
183 | sys::path::remove_dots(path&: P, /*remove_dot_dot=*/true); |
184 | Filenames.push_back(x: static_cast<std::string>(P.str())); |
185 | } |
186 | } |
187 | } |
188 | return Error::success(); |
189 | } |
190 | |
191 | Error RawCoverageMappingReader::decodeCounter(unsigned Value, Counter &C) { |
192 | auto Tag = Value & Counter::EncodingTagMask; |
193 | switch (Tag) { |
194 | case Counter::Zero: |
195 | C = Counter::getZero(); |
196 | return Error::success(); |
197 | case Counter::CounterValueReference: |
198 | C = Counter::getCounter(CounterId: Value >> Counter::EncodingTagBits); |
199 | return Error::success(); |
200 | default: |
201 | break; |
202 | } |
203 | Tag -= Counter::Expression; |
204 | switch (Tag) { |
205 | case CounterExpression::Subtract: |
206 | case CounterExpression::Add: { |
207 | auto ID = Value >> Counter::EncodingTagBits; |
208 | if (ID >= Expressions.size()) |
209 | return make_error<CoverageMapError>(Args: coveragemap_error::malformed, |
210 | Args: "counter expression is invalid" ); |
211 | Expressions[ID].Kind = CounterExpression::ExprKind(Tag); |
212 | C = Counter::getExpression(ExpressionId: ID); |
213 | break; |
214 | } |
215 | default: |
216 | return make_error<CoverageMapError>(Args: coveragemap_error::malformed, |
217 | Args: "counter expression kind is invalid" ); |
218 | } |
219 | return Error::success(); |
220 | } |
221 | |
222 | Error RawCoverageMappingReader::readCounter(Counter &C) { |
223 | uint64_t EncodedCounter; |
224 | if (auto Err = |
225 | readIntMax(Result&: EncodedCounter, MaxPlus1: std::numeric_limits<unsigned>::max())) |
226 | return Err; |
227 | if (auto Err = decodeCounter(Value: EncodedCounter, C)) |
228 | return Err; |
229 | return Error::success(); |
230 | } |
231 | |
232 | static const unsigned EncodingExpansionRegionBit = 1 |
233 | << Counter::EncodingTagBits; |
234 | |
235 | /// Read the sub-array of regions for the given inferred file id. |
236 | /// \param NumFileIDs the number of file ids that are defined for this |
237 | /// function. |
238 | Error RawCoverageMappingReader::readMappingRegionsSubArray( |
239 | std::vector<CounterMappingRegion> &MappingRegions, unsigned InferredFileID, |
240 | size_t NumFileIDs) { |
241 | uint64_t NumRegions; |
242 | if (auto Err = readSize(Result&: NumRegions)) |
243 | return Err; |
244 | unsigned LineStart = 0; |
245 | for (size_t I = 0; I < NumRegions; ++I) { |
246 | Counter C, C2; |
247 | uint64_t BIDX, NC; |
248 | // They are stored as internal values plus 1 (min is -1) |
249 | uint64_t ID1, TID1, FID1; |
250 | mcdc::Parameters Params; |
251 | CounterMappingRegion::RegionKind Kind = CounterMappingRegion::CodeRegion; |
252 | |
253 | // Read the combined counter + region kind. |
254 | uint64_t EncodedCounterAndRegion; |
255 | if (auto Err = readIntMax(Result&: EncodedCounterAndRegion, |
256 | MaxPlus1: std::numeric_limits<unsigned>::max())) |
257 | return Err; |
258 | unsigned Tag = EncodedCounterAndRegion & Counter::EncodingTagMask; |
259 | uint64_t ExpandedFileID = 0; |
260 | |
261 | // If Tag does not represent a ZeroCounter, then it is understood to refer |
262 | // to a counter or counter expression with region kind assumed to be |
263 | // "CodeRegion". In that case, EncodedCounterAndRegion actually encodes the |
264 | // referenced counter or counter expression (and nothing else). |
265 | // |
266 | // If Tag represents a ZeroCounter and EncodingExpansionRegionBit is set, |
267 | // then EncodedCounterAndRegion is interpreted to represent an |
268 | // ExpansionRegion. In all other cases, EncodedCounterAndRegion is |
269 | // interpreted to refer to a specific region kind, after which additional |
270 | // fields may be read (e.g. BranchRegions have two encoded counters that |
271 | // follow an encoded region kind value). |
272 | if (Tag != Counter::Zero) { |
273 | if (auto Err = decodeCounter(Value: EncodedCounterAndRegion, C)) |
274 | return Err; |
275 | } else { |
276 | // Is it an expansion region? |
277 | if (EncodedCounterAndRegion & EncodingExpansionRegionBit) { |
278 | Kind = CounterMappingRegion::ExpansionRegion; |
279 | ExpandedFileID = EncodedCounterAndRegion >> |
280 | Counter::EncodingCounterTagAndExpansionRegionTagBits; |
281 | if (ExpandedFileID >= NumFileIDs) |
282 | return make_error<CoverageMapError>(Args: coveragemap_error::malformed, |
283 | Args: "ExpandedFileID is invalid" ); |
284 | } else { |
285 | switch (EncodedCounterAndRegion >> |
286 | Counter::EncodingCounterTagAndExpansionRegionTagBits) { |
287 | case CounterMappingRegion::CodeRegion: |
288 | // Don't do anything when we have a code region with a zero counter. |
289 | break; |
290 | case CounterMappingRegion::SkippedRegion: |
291 | Kind = CounterMappingRegion::SkippedRegion; |
292 | break; |
293 | case CounterMappingRegion::BranchRegion: |
294 | // For a Branch Region, read two successive counters. |
295 | Kind = CounterMappingRegion::BranchRegion; |
296 | if (auto Err = readCounter(C)) |
297 | return Err; |
298 | if (auto Err = readCounter(C&: C2)) |
299 | return Err; |
300 | break; |
301 | case CounterMappingRegion::MCDCBranchRegion: |
302 | // For a MCDC Branch Region, read two successive counters and 3 IDs. |
303 | Kind = CounterMappingRegion::MCDCBranchRegion; |
304 | if (auto Err = readCounter(C)) |
305 | return Err; |
306 | if (auto Err = readCounter(C&: C2)) |
307 | return Err; |
308 | if (auto Err = readIntMax(Result&: ID1, MaxPlus1: std::numeric_limits<int16_t>::max())) |
309 | return Err; |
310 | if (auto Err = readIntMax(Result&: TID1, MaxPlus1: std::numeric_limits<int16_t>::max())) |
311 | return Err; |
312 | if (auto Err = readIntMax(Result&: FID1, MaxPlus1: std::numeric_limits<int16_t>::max())) |
313 | return Err; |
314 | if (ID1 == 0) |
315 | return make_error<CoverageMapError>( |
316 | Args: coveragemap_error::malformed, |
317 | Args: "MCDCConditionID shouldn't be zero" ); |
318 | Params = mcdc::BranchParameters{ |
319 | static_cast<int16_t>(static_cast<int16_t>(ID1) - 1), |
320 | {static_cast<int16_t>(static_cast<int16_t>(FID1) - 1), |
321 | static_cast<int16_t>(static_cast<int16_t>(TID1) - 1)}}; |
322 | break; |
323 | case CounterMappingRegion::MCDCDecisionRegion: |
324 | Kind = CounterMappingRegion::MCDCDecisionRegion; |
325 | if (auto Err = readIntMax(Result&: BIDX, MaxPlus1: std::numeric_limits<unsigned>::max())) |
326 | return Err; |
327 | if (auto Err = readIntMax(Result&: NC, MaxPlus1: std::numeric_limits<int16_t>::max())) |
328 | return Err; |
329 | Params = mcdc::DecisionParameters{static_cast<unsigned>(BIDX), |
330 | static_cast<uint16_t>(NC)}; |
331 | break; |
332 | default: |
333 | return make_error<CoverageMapError>(Args: coveragemap_error::malformed, |
334 | Args: "region kind is incorrect" ); |
335 | } |
336 | } |
337 | } |
338 | |
339 | // Read the source range. |
340 | uint64_t LineStartDelta, ColumnStart, NumLines, ColumnEnd; |
341 | if (auto Err = |
342 | readIntMax(Result&: LineStartDelta, MaxPlus1: std::numeric_limits<unsigned>::max())) |
343 | return Err; |
344 | if (auto Err = readULEB128(Result&: ColumnStart)) |
345 | return Err; |
346 | if (ColumnStart > std::numeric_limits<unsigned>::max()) |
347 | return make_error<CoverageMapError>(Args: coveragemap_error::malformed, |
348 | Args: "start column is too big" ); |
349 | if (auto Err = readIntMax(Result&: NumLines, MaxPlus1: std::numeric_limits<unsigned>::max())) |
350 | return Err; |
351 | if (auto Err = readIntMax(Result&: ColumnEnd, MaxPlus1: std::numeric_limits<unsigned>::max())) |
352 | return Err; |
353 | LineStart += LineStartDelta; |
354 | |
355 | // If the high bit of ColumnEnd is set, this is a gap region. |
356 | if (ColumnEnd & (1U << 31)) { |
357 | Kind = CounterMappingRegion::GapRegion; |
358 | ColumnEnd &= ~(1U << 31); |
359 | } |
360 | |
361 | // Adjust the column locations for the empty regions that are supposed to |
362 | // cover whole lines. Those regions should be encoded with the |
363 | // column range (1 -> std::numeric_limits<unsigned>::max()), but because |
364 | // the encoded std::numeric_limits<unsigned>::max() is several bytes long, |
365 | // we set the column range to (0 -> 0) to ensure that the column start and |
366 | // column end take up one byte each. |
367 | // The std::numeric_limits<unsigned>::max() is used to represent a column |
368 | // position at the end of the line without knowing the length of that line. |
369 | if (ColumnStart == 0 && ColumnEnd == 0) { |
370 | ColumnStart = 1; |
371 | ColumnEnd = std::numeric_limits<unsigned>::max(); |
372 | } |
373 | |
374 | LLVM_DEBUG({ |
375 | dbgs() << "Counter in file " << InferredFileID << " " << LineStart << ":" |
376 | << ColumnStart << " -> " << (LineStart + NumLines) << ":" |
377 | << ColumnEnd << ", " ; |
378 | if (Kind == CounterMappingRegion::ExpansionRegion) |
379 | dbgs() << "Expands to file " << ExpandedFileID; |
380 | else |
381 | CounterMappingContext(Expressions).dump(C, dbgs()); |
382 | dbgs() << "\n" ; |
383 | }); |
384 | |
385 | auto CMR = CounterMappingRegion( |
386 | C, C2, InferredFileID, ExpandedFileID, LineStart, ColumnStart, |
387 | LineStart + NumLines, ColumnEnd, Kind, Params); |
388 | if (CMR.startLoc() > CMR.endLoc()) |
389 | return make_error<CoverageMapError>( |
390 | Args: coveragemap_error::malformed, |
391 | Args: "counter mapping region locations are incorrect" ); |
392 | MappingRegions.push_back(x: CMR); |
393 | } |
394 | return Error::success(); |
395 | } |
396 | |
397 | Error RawCoverageMappingReader::read() { |
398 | // Read the virtual file mapping. |
399 | SmallVector<unsigned, 8> VirtualFileMapping; |
400 | uint64_t NumFileMappings; |
401 | if (auto Err = readSize(Result&: NumFileMappings)) |
402 | return Err; |
403 | for (size_t I = 0; I < NumFileMappings; ++I) { |
404 | uint64_t FilenameIndex; |
405 | if (auto Err = readIntMax(Result&: FilenameIndex, MaxPlus1: TranslationUnitFilenames.size())) |
406 | return Err; |
407 | VirtualFileMapping.push_back(Elt: FilenameIndex); |
408 | } |
409 | |
410 | // Construct the files using unique filenames and virtual file mapping. |
411 | for (auto I : VirtualFileMapping) { |
412 | Filenames.push_back(x: TranslationUnitFilenames[I]); |
413 | } |
414 | |
415 | // Read the expressions. |
416 | uint64_t NumExpressions; |
417 | if (auto Err = readSize(Result&: NumExpressions)) |
418 | return Err; |
419 | // Create an array of dummy expressions that get the proper counters |
420 | // when the expressions are read, and the proper kinds when the counters |
421 | // are decoded. |
422 | Expressions.resize( |
423 | new_size: NumExpressions, |
424 | x: CounterExpression(CounterExpression::Subtract, Counter(), Counter())); |
425 | for (size_t I = 0; I < NumExpressions; ++I) { |
426 | if (auto Err = readCounter(C&: Expressions[I].LHS)) |
427 | return Err; |
428 | if (auto Err = readCounter(C&: Expressions[I].RHS)) |
429 | return Err; |
430 | } |
431 | |
432 | // Read the mapping regions sub-arrays. |
433 | for (unsigned InferredFileID = 0, S = VirtualFileMapping.size(); |
434 | InferredFileID < S; ++InferredFileID) { |
435 | if (auto Err = readMappingRegionsSubArray(MappingRegions, InferredFileID, |
436 | NumFileIDs: VirtualFileMapping.size())) |
437 | return Err; |
438 | } |
439 | |
440 | // Set the counters for the expansion regions. |
441 | // i.e. Counter of expansion region = counter of the first region |
442 | // from the expanded file. |
443 | // Perform multiple passes to correctly propagate the counters through |
444 | // all the nested expansion regions. |
445 | SmallVector<CounterMappingRegion *, 8> FileIDExpansionRegionMapping; |
446 | FileIDExpansionRegionMapping.resize(N: VirtualFileMapping.size(), NV: nullptr); |
447 | for (unsigned Pass = 1, S = VirtualFileMapping.size(); Pass < S; ++Pass) { |
448 | for (auto &R : MappingRegions) { |
449 | if (R.Kind != CounterMappingRegion::ExpansionRegion) |
450 | continue; |
451 | assert(!FileIDExpansionRegionMapping[R.ExpandedFileID]); |
452 | FileIDExpansionRegionMapping[R.ExpandedFileID] = &R; |
453 | } |
454 | for (auto &R : MappingRegions) { |
455 | if (FileIDExpansionRegionMapping[R.FileID]) { |
456 | FileIDExpansionRegionMapping[R.FileID]->Count = R.Count; |
457 | FileIDExpansionRegionMapping[R.FileID] = nullptr; |
458 | } |
459 | } |
460 | } |
461 | |
462 | return Error::success(); |
463 | } |
464 | |
465 | Expected<bool> RawCoverageMappingDummyChecker::isDummy() { |
466 | // A dummy coverage mapping data consists of just one region with zero count. |
467 | uint64_t NumFileMappings; |
468 | if (Error Err = readSize(Result&: NumFileMappings)) |
469 | return std::move(Err); |
470 | if (NumFileMappings != 1) |
471 | return false; |
472 | // We don't expect any specific value for the filename index, just skip it. |
473 | uint64_t FilenameIndex; |
474 | if (Error Err = |
475 | readIntMax(Result&: FilenameIndex, MaxPlus1: std::numeric_limits<unsigned>::max())) |
476 | return std::move(Err); |
477 | uint64_t NumExpressions; |
478 | if (Error Err = readSize(Result&: NumExpressions)) |
479 | return std::move(Err); |
480 | if (NumExpressions != 0) |
481 | return false; |
482 | uint64_t NumRegions; |
483 | if (Error Err = readSize(Result&: NumRegions)) |
484 | return std::move(Err); |
485 | if (NumRegions != 1) |
486 | return false; |
487 | uint64_t EncodedCounterAndRegion; |
488 | if (Error Err = readIntMax(Result&: EncodedCounterAndRegion, |
489 | MaxPlus1: std::numeric_limits<unsigned>::max())) |
490 | return std::move(Err); |
491 | unsigned Tag = EncodedCounterAndRegion & Counter::EncodingTagMask; |
492 | return Tag == Counter::Zero; |
493 | } |
494 | |
495 | Error InstrProfSymtab::create(SectionRef &Section) { |
496 | Expected<StringRef> DataOrErr = Section.getContents(); |
497 | if (!DataOrErr) |
498 | return DataOrErr.takeError(); |
499 | Data = *DataOrErr; |
500 | Address = Section.getAddress(); |
501 | |
502 | // If this is a linked PE/COFF file, then we have to skip over the null byte |
503 | // that is allocated in the .lprfn$A section in the LLVM profiling runtime. |
504 | // If the name section is .lprfcovnames, it doesn't have the null byte at the |
505 | // beginning. |
506 | const ObjectFile *Obj = Section.getObject(); |
507 | if (isa<COFFObjectFile>(Val: Obj) && !Obj->isRelocatableObject()) |
508 | if (Expected<StringRef> NameOrErr = Section.getName()) |
509 | if (*NameOrErr != getInstrProfSectionName(IPSK: IPSK_covname, OF: Triple::COFF)) |
510 | Data = Data.drop_front(N: 1); |
511 | |
512 | return Error::success(); |
513 | } |
514 | |
515 | StringRef InstrProfSymtab::getFuncName(uint64_t Pointer, size_t Size) { |
516 | if (Pointer < Address) |
517 | return StringRef(); |
518 | auto Offset = Pointer - Address; |
519 | if (Offset + Size > Data.size()) |
520 | return StringRef(); |
521 | return Data.substr(Start: Pointer - Address, N: Size); |
522 | } |
523 | |
524 | // Check if the mapping data is a dummy, i.e. is emitted for an unused function. |
525 | static Expected<bool> isCoverageMappingDummy(uint64_t Hash, StringRef Mapping) { |
526 | // The hash value of dummy mapping records is always zero. |
527 | if (Hash) |
528 | return false; |
529 | return RawCoverageMappingDummyChecker(Mapping).isDummy(); |
530 | } |
531 | |
532 | /// A range of filename indices. Used to specify the location of a batch of |
533 | /// filenames in a vector-like container. |
534 | struct FilenameRange { |
535 | unsigned StartingIndex; |
536 | unsigned Length; |
537 | |
538 | FilenameRange(unsigned StartingIndex, unsigned Length) |
539 | : StartingIndex(StartingIndex), Length(Length) {} |
540 | |
541 | void markInvalid() { Length = 0; } |
542 | bool isInvalid() const { return Length == 0; } |
543 | }; |
544 | |
545 | namespace { |
546 | |
547 | /// The interface to read coverage mapping function records for a module. |
548 | struct CovMapFuncRecordReader { |
549 | virtual ~CovMapFuncRecordReader() = default; |
550 | |
551 | // Read a coverage header. |
552 | // |
553 | // \p CovBuf points to the buffer containing the \c CovHeader of the coverage |
554 | // mapping data associated with the module. |
555 | // |
556 | // Returns a pointer to the next \c CovHeader if it exists, or to an address |
557 | // greater than \p CovEnd if not. |
558 | virtual Expected<const char *> (const char *CovBuf, |
559 | const char *CovBufEnd) = 0; |
560 | |
561 | // Read function records. |
562 | // |
563 | // \p FuncRecBuf points to the buffer containing a batch of function records. |
564 | // \p FuncRecBufEnd points past the end of the batch of records. |
565 | // |
566 | // Prior to Version4, \p OutOfLineFileRange points to a sequence of filenames |
567 | // associated with the function records. It is unused in Version4. |
568 | // |
569 | // Prior to Version4, \p OutOfLineMappingBuf points to a sequence of coverage |
570 | // mappings associated with the function records. It is unused in Version4. |
571 | virtual Error |
572 | readFunctionRecords(const char *FuncRecBuf, const char *FuncRecBufEnd, |
573 | std::optional<FilenameRange> OutOfLineFileRange, |
574 | const char *OutOfLineMappingBuf, |
575 | const char *OutOfLineMappingBufEnd) = 0; |
576 | |
577 | template <class IntPtrT, llvm::endianness Endian> |
578 | static Expected<std::unique_ptr<CovMapFuncRecordReader>> |
579 | get(CovMapVersion Version, InstrProfSymtab &P, |
580 | std::vector<BinaryCoverageReader::ProfileMappingRecord> &R, StringRef D, |
581 | std::vector<std::string> &F); |
582 | }; |
583 | |
584 | // A class for reading coverage mapping function records for a module. |
585 | template <CovMapVersion Version, class IntPtrT, llvm::endianness Endian> |
586 | class VersionedCovMapFuncRecordReader : public CovMapFuncRecordReader { |
587 | using FuncRecordType = |
588 | typename CovMapTraits<Version, IntPtrT>::CovMapFuncRecordType; |
589 | using NameRefType = typename CovMapTraits<Version, IntPtrT>::NameRefType; |
590 | |
591 | // Maps function's name references to the indexes of their records |
592 | // in \c Records. |
593 | DenseMap<NameRefType, size_t> FunctionRecords; |
594 | InstrProfSymtab &ProfileNames; |
595 | StringRef CompilationDir; |
596 | std::vector<std::string> &Filenames; |
597 | std::vector<BinaryCoverageReader::ProfileMappingRecord> &Records; |
598 | |
599 | // Maps a hash of the filenames in a TU to a \c FileRange. The range |
600 | // specifies the location of the hashed filenames in \c Filenames. |
601 | DenseMap<uint64_t, FilenameRange> FileRangeMap; |
602 | |
603 | // Add the record to the collection if we don't already have a record that |
604 | // points to the same function name. This is useful to ignore the redundant |
605 | // records for the functions with ODR linkage. |
606 | // In addition, prefer records with real coverage mapping data to dummy |
607 | // records, which were emitted for inline functions which were seen but |
608 | // not used in the corresponding translation unit. |
609 | Error insertFunctionRecordIfNeeded(const FuncRecordType *CFR, |
610 | StringRef Mapping, |
611 | FilenameRange FileRange) { |
612 | ++CovMapNumRecords; |
613 | uint64_t FuncHash = CFR->template getFuncHash<Endian>(); |
614 | NameRefType NameRef = CFR->template getFuncNameRef<Endian>(); |
615 | auto InsertResult = |
616 | FunctionRecords.insert(std::make_pair(NameRef, Records.size())); |
617 | if (InsertResult.second) { |
618 | StringRef FuncName; |
619 | if (Error Err = CFR->template getFuncName<Endian>(ProfileNames, FuncName)) |
620 | return Err; |
621 | if (FuncName.empty()) |
622 | return make_error<InstrProfError>(Args: instrprof_error::malformed, |
623 | Args: "function name is empty" ); |
624 | ++CovMapNumUsedRecords; |
625 | Records.emplace_back(args: Version, args&: FuncName, args&: FuncHash, args&: Mapping, |
626 | args&: FileRange.StartingIndex, args&: FileRange.Length); |
627 | return Error::success(); |
628 | } |
629 | // Update the existing record if it's a dummy and the new record is real. |
630 | size_t OldRecordIndex = InsertResult.first->second; |
631 | BinaryCoverageReader::ProfileMappingRecord &OldRecord = |
632 | Records[OldRecordIndex]; |
633 | Expected<bool> OldIsDummyExpected = isCoverageMappingDummy( |
634 | Hash: OldRecord.FunctionHash, Mapping: OldRecord.CoverageMapping); |
635 | if (Error Err = OldIsDummyExpected.takeError()) |
636 | return Err; |
637 | if (!*OldIsDummyExpected) |
638 | return Error::success(); |
639 | Expected<bool> NewIsDummyExpected = |
640 | isCoverageMappingDummy(Hash: FuncHash, Mapping); |
641 | if (Error Err = NewIsDummyExpected.takeError()) |
642 | return Err; |
643 | if (*NewIsDummyExpected) |
644 | return Error::success(); |
645 | ++CovMapNumUsedRecords; |
646 | OldRecord.FunctionHash = FuncHash; |
647 | OldRecord.CoverageMapping = Mapping; |
648 | OldRecord.FilenamesBegin = FileRange.StartingIndex; |
649 | OldRecord.FilenamesSize = FileRange.Length; |
650 | return Error::success(); |
651 | } |
652 | |
653 | public: |
654 | VersionedCovMapFuncRecordReader( |
655 | InstrProfSymtab &P, |
656 | std::vector<BinaryCoverageReader::ProfileMappingRecord> &R, StringRef D, |
657 | std::vector<std::string> &F) |
658 | : ProfileNames(P), CompilationDir(D), Filenames(F), Records(R) {} |
659 | |
660 | ~VersionedCovMapFuncRecordReader() override = default; |
661 | |
662 | Expected<const char *> (const char *CovBuf, |
663 | const char *CovBufEnd) override { |
664 | using namespace support; |
665 | |
666 | if (CovBuf + sizeof(CovMapHeader) > CovBufEnd) |
667 | return make_error<CoverageMapError>( |
668 | Args: coveragemap_error::malformed, |
669 | Args: "coverage mapping header section is larger than buffer size" ); |
670 | auto = reinterpret_cast<const CovMapHeader *>(CovBuf); |
671 | uint32_t NRecords = CovHeader->getNRecords<Endian>(); |
672 | uint32_t FilenamesSize = CovHeader->getFilenamesSize<Endian>(); |
673 | uint32_t CoverageSize = CovHeader->getCoverageSize<Endian>(); |
674 | assert((CovMapVersion)CovHeader->getVersion<Endian>() == Version); |
675 | CovBuf = reinterpret_cast<const char *>(CovHeader + 1); |
676 | |
677 | // Skip past the function records, saving the start and end for later. |
678 | // This is a no-op in Version4 (function records are read after all headers |
679 | // are read). |
680 | const char *FuncRecBuf = nullptr; |
681 | const char *FuncRecBufEnd = nullptr; |
682 | if (Version < CovMapVersion::Version4) |
683 | FuncRecBuf = CovBuf; |
684 | CovBuf += NRecords * sizeof(FuncRecordType); |
685 | if (Version < CovMapVersion::Version4) |
686 | FuncRecBufEnd = CovBuf; |
687 | |
688 | // Get the filenames. |
689 | if (CovBuf + FilenamesSize > CovBufEnd) |
690 | return make_error<CoverageMapError>( |
691 | Args: coveragemap_error::malformed, |
692 | Args: "filenames section is larger than buffer size" ); |
693 | size_t FilenamesBegin = Filenames.size(); |
694 | StringRef FilenameRegion(CovBuf, FilenamesSize); |
695 | RawCoverageFilenamesReader Reader(FilenameRegion, Filenames, |
696 | CompilationDir); |
697 | if (auto Err = Reader.read(Version)) |
698 | return std::move(Err); |
699 | CovBuf += FilenamesSize; |
700 | FilenameRange FileRange(FilenamesBegin, Filenames.size() - FilenamesBegin); |
701 | |
702 | if (Version >= CovMapVersion::Version4) { |
703 | // Map a hash of the filenames region to the filename range associated |
704 | // with this coverage header. |
705 | int64_t FilenamesRef = |
706 | llvm::IndexedInstrProf::ComputeHash(K: FilenameRegion); |
707 | auto Insert = |
708 | FileRangeMap.insert(KV: std::make_pair(x&: FilenamesRef, y&: FileRange)); |
709 | if (!Insert.second) { |
710 | // The same filenames ref was encountered twice. It's possible that |
711 | // the associated filenames are the same. |
712 | auto It = Filenames.begin(); |
713 | FilenameRange &OrigRange = Insert.first->getSecond(); |
714 | if (std::equal(first1: It + OrigRange.StartingIndex, |
715 | last1: It + OrigRange.StartingIndex + OrigRange.Length, |
716 | first2: It + FileRange.StartingIndex, |
717 | last2: It + FileRange.StartingIndex + FileRange.Length)) |
718 | // Map the new range to the original one. |
719 | FileRange = OrigRange; |
720 | else |
721 | // This is a hash collision. Mark the filenames ref invalid. |
722 | OrigRange.markInvalid(); |
723 | } |
724 | } |
725 | |
726 | // We'll read the coverage mapping records in the loop below. |
727 | // This is a no-op in Version4 (coverage mappings are not affixed to the |
728 | // coverage header). |
729 | const char *MappingBuf = CovBuf; |
730 | if (Version >= CovMapVersion::Version4 && CoverageSize != 0) |
731 | return make_error<CoverageMapError>(Args: coveragemap_error::malformed, |
732 | Args: "coverage mapping size is not zero" ); |
733 | CovBuf += CoverageSize; |
734 | const char *MappingEnd = CovBuf; |
735 | |
736 | if (CovBuf > CovBufEnd) |
737 | return make_error<CoverageMapError>( |
738 | Args: coveragemap_error::malformed, |
739 | Args: "function records section is larger than buffer size" ); |
740 | |
741 | if (Version < CovMapVersion::Version4) { |
742 | // Read each function record. |
743 | if (Error E = readFunctionRecords(FuncRecBuf, FuncRecBufEnd, OutOfLineFileRange: FileRange, |
744 | OutOfLineMappingBuf: MappingBuf, OutOfLineMappingBufEnd: MappingEnd)) |
745 | return std::move(E); |
746 | } |
747 | |
748 | // Each coverage map has an alignment of 8, so we need to adjust alignment |
749 | // before reading the next map. |
750 | CovBuf += offsetToAlignedAddr(Addr: CovBuf, Alignment: Align(8)); |
751 | |
752 | return CovBuf; |
753 | } |
754 | |
755 | Error readFunctionRecords(const char *FuncRecBuf, const char *FuncRecBufEnd, |
756 | std::optional<FilenameRange> OutOfLineFileRange, |
757 | const char *OutOfLineMappingBuf, |
758 | const char *OutOfLineMappingBufEnd) override { |
759 | auto CFR = reinterpret_cast<const FuncRecordType *>(FuncRecBuf); |
760 | while ((const char *)CFR < FuncRecBufEnd) { |
761 | // Validate the length of the coverage mapping for this function. |
762 | const char *NextMappingBuf; |
763 | const FuncRecordType *NextCFR; |
764 | std::tie(NextMappingBuf, NextCFR) = |
765 | CFR->template advanceByOne<Endian>(OutOfLineMappingBuf); |
766 | if (Version < CovMapVersion::Version4) |
767 | if (NextMappingBuf > OutOfLineMappingBufEnd) |
768 | return make_error<CoverageMapError>( |
769 | Args: coveragemap_error::malformed, |
770 | Args: "next mapping buffer is larger than buffer size" ); |
771 | |
772 | // Look up the set of filenames associated with this function record. |
773 | std::optional<FilenameRange> FileRange; |
774 | if (Version < CovMapVersion::Version4) { |
775 | FileRange = OutOfLineFileRange; |
776 | } else { |
777 | uint64_t FilenamesRef = CFR->template getFilenamesRef<Endian>(); |
778 | auto It = FileRangeMap.find(Val: FilenamesRef); |
779 | if (It == FileRangeMap.end()) |
780 | return make_error<CoverageMapError>( |
781 | Args: coveragemap_error::malformed, |
782 | Args: "no filename found for function with hash=0x" + |
783 | Twine::utohexstr(Val: FilenamesRef)); |
784 | else |
785 | FileRange = It->getSecond(); |
786 | } |
787 | |
788 | // Now, read the coverage data. |
789 | if (FileRange && !FileRange->isInvalid()) { |
790 | StringRef Mapping = |
791 | CFR->template getCoverageMapping<Endian>(OutOfLineMappingBuf); |
792 | if (Version >= CovMapVersion::Version4 && |
793 | Mapping.data() + Mapping.size() > FuncRecBufEnd) |
794 | return make_error<CoverageMapError>( |
795 | Args: coveragemap_error::malformed, |
796 | Args: "coverage mapping data is larger than buffer size" ); |
797 | if (Error Err = insertFunctionRecordIfNeeded(CFR, Mapping, FileRange: *FileRange)) |
798 | return Err; |
799 | } |
800 | |
801 | std::tie(OutOfLineMappingBuf, CFR) = std::tie(NextMappingBuf, NextCFR); |
802 | } |
803 | return Error::success(); |
804 | } |
805 | }; |
806 | |
807 | } // end anonymous namespace |
808 | |
809 | template <class IntPtrT, llvm::endianness Endian> |
810 | Expected<std::unique_ptr<CovMapFuncRecordReader>> CovMapFuncRecordReader::get( |
811 | CovMapVersion Version, InstrProfSymtab &P, |
812 | std::vector<BinaryCoverageReader::ProfileMappingRecord> &R, StringRef D, |
813 | std::vector<std::string> &F) { |
814 | using namespace coverage; |
815 | |
816 | switch (Version) { |
817 | case CovMapVersion::Version1: |
818 | return std::make_unique<VersionedCovMapFuncRecordReader< |
819 | CovMapVersion::Version1, IntPtrT, Endian>>(P, R, D, F); |
820 | case CovMapVersion::Version2: |
821 | case CovMapVersion::Version3: |
822 | case CovMapVersion::Version4: |
823 | case CovMapVersion::Version5: |
824 | case CovMapVersion::Version6: |
825 | case CovMapVersion::Version7: |
826 | // Decompress the name data. |
827 | if (Error E = P.create(NameStrings: P.getNameData())) |
828 | return std::move(E); |
829 | if (Version == CovMapVersion::Version2) |
830 | return std::make_unique<VersionedCovMapFuncRecordReader< |
831 | CovMapVersion::Version2, IntPtrT, Endian>>(P, R, D, F); |
832 | else if (Version == CovMapVersion::Version3) |
833 | return std::make_unique<VersionedCovMapFuncRecordReader< |
834 | CovMapVersion::Version3, IntPtrT, Endian>>(P, R, D, F); |
835 | else if (Version == CovMapVersion::Version4) |
836 | return std::make_unique<VersionedCovMapFuncRecordReader< |
837 | CovMapVersion::Version4, IntPtrT, Endian>>(P, R, D, F); |
838 | else if (Version == CovMapVersion::Version5) |
839 | return std::make_unique<VersionedCovMapFuncRecordReader< |
840 | CovMapVersion::Version5, IntPtrT, Endian>>(P, R, D, F); |
841 | else if (Version == CovMapVersion::Version6) |
842 | return std::make_unique<VersionedCovMapFuncRecordReader< |
843 | CovMapVersion::Version6, IntPtrT, Endian>>(P, R, D, F); |
844 | else if (Version == CovMapVersion::Version7) |
845 | return std::make_unique<VersionedCovMapFuncRecordReader< |
846 | CovMapVersion::Version7, IntPtrT, Endian>>(P, R, D, F); |
847 | } |
848 | llvm_unreachable("Unsupported version" ); |
849 | } |
850 | |
851 | template <typename T, llvm::endianness Endian> |
852 | static Error readCoverageMappingData( |
853 | InstrProfSymtab &ProfileNames, StringRef CovMap, StringRef FuncRecords, |
854 | std::vector<BinaryCoverageReader::ProfileMappingRecord> &Records, |
855 | StringRef CompilationDir, std::vector<std::string> &Filenames) { |
856 | using namespace coverage; |
857 | |
858 | // Read the records in the coverage data section. |
859 | auto = |
860 | reinterpret_cast<const CovMapHeader *>(CovMap.data()); |
861 | CovMapVersion Version = (CovMapVersion)CovHeader->getVersion<Endian>(); |
862 | if (Version > CovMapVersion::CurrentVersion) |
863 | return make_error<CoverageMapError>(Args: coveragemap_error::unsupported_version); |
864 | Expected<std::unique_ptr<CovMapFuncRecordReader>> ReaderExpected = |
865 | CovMapFuncRecordReader::get<T, Endian>(Version, ProfileNames, Records, |
866 | CompilationDir, Filenames); |
867 | if (Error E = ReaderExpected.takeError()) |
868 | return E; |
869 | auto Reader = std::move(ReaderExpected.get()); |
870 | const char *CovBuf = CovMap.data(); |
871 | const char *CovBufEnd = CovBuf + CovMap.size(); |
872 | const char *FuncRecBuf = FuncRecords.data(); |
873 | const char *FuncRecBufEnd = FuncRecords.data() + FuncRecords.size(); |
874 | while (CovBuf < CovBufEnd) { |
875 | // Read the current coverage header & filename data. |
876 | // |
877 | // Prior to Version4, this also reads all function records affixed to the |
878 | // header. |
879 | // |
880 | // Return a pointer to the next coverage header. |
881 | auto NextOrErr = Reader->readCoverageHeader(CovBuf, CovBufEnd); |
882 | if (auto E = NextOrErr.takeError()) |
883 | return E; |
884 | CovBuf = NextOrErr.get(); |
885 | } |
886 | // In Version4, function records are not affixed to coverage headers. Read |
887 | // the records from their dedicated section. |
888 | if (Version >= CovMapVersion::Version4) |
889 | return Reader->readFunctionRecords(FuncRecBuf, FuncRecBufEnd, OutOfLineFileRange: std::nullopt, |
890 | OutOfLineMappingBuf: nullptr, OutOfLineMappingBufEnd: nullptr); |
891 | return Error::success(); |
892 | } |
893 | |
894 | Expected<std::unique_ptr<BinaryCoverageReader>> |
895 | BinaryCoverageReader::createCoverageReaderFromBuffer( |
896 | StringRef Coverage, FuncRecordsStorage &&FuncRecords, |
897 | std::unique_ptr<InstrProfSymtab> ProfileNamesPtr, uint8_t BytesInAddress, |
898 | llvm::endianness Endian, StringRef CompilationDir) { |
899 | if (ProfileNamesPtr == nullptr) |
900 | return make_error<CoverageMapError>(Args: coveragemap_error::malformed, |
901 | Args: "Caller must provide ProfileNames" ); |
902 | std::unique_ptr<BinaryCoverageReader> Reader(new BinaryCoverageReader( |
903 | std::move(ProfileNamesPtr), std::move(FuncRecords))); |
904 | InstrProfSymtab &ProfileNames = *Reader->ProfileNames; |
905 | StringRef FuncRecordsRef = Reader->FuncRecords->getBuffer(); |
906 | if (BytesInAddress == 4 && Endian == llvm::endianness::little) { |
907 | if (Error E = readCoverageMappingData<uint32_t, llvm::endianness::little>( |
908 | ProfileNames, CovMap: Coverage, FuncRecords: FuncRecordsRef, Records&: Reader->MappingRecords, |
909 | CompilationDir, Filenames&: Reader->Filenames)) |
910 | return std::move(E); |
911 | } else if (BytesInAddress == 4 && Endian == llvm::endianness::big) { |
912 | if (Error E = readCoverageMappingData<uint32_t, llvm::endianness::big>( |
913 | ProfileNames, CovMap: Coverage, FuncRecords: FuncRecordsRef, Records&: Reader->MappingRecords, |
914 | CompilationDir, Filenames&: Reader->Filenames)) |
915 | return std::move(E); |
916 | } else if (BytesInAddress == 8 && Endian == llvm::endianness::little) { |
917 | if (Error E = readCoverageMappingData<uint64_t, llvm::endianness::little>( |
918 | ProfileNames, CovMap: Coverage, FuncRecords: FuncRecordsRef, Records&: Reader->MappingRecords, |
919 | CompilationDir, Filenames&: Reader->Filenames)) |
920 | return std::move(E); |
921 | } else if (BytesInAddress == 8 && Endian == llvm::endianness::big) { |
922 | if (Error E = readCoverageMappingData<uint64_t, llvm::endianness::big>( |
923 | ProfileNames, CovMap: Coverage, FuncRecords: FuncRecordsRef, Records&: Reader->MappingRecords, |
924 | CompilationDir, Filenames&: Reader->Filenames)) |
925 | return std::move(E); |
926 | } else |
927 | return make_error<CoverageMapError>( |
928 | Args: coveragemap_error::malformed, |
929 | Args: "not supported endianness or bytes in address" ); |
930 | return std::move(Reader); |
931 | } |
932 | |
933 | static Expected<std::unique_ptr<BinaryCoverageReader>> |
934 | loadTestingFormat(StringRef Data, StringRef CompilationDir) { |
935 | uint8_t BytesInAddress = 8; |
936 | llvm::endianness Endian = llvm::endianness::little; |
937 | |
938 | // Read the magic and version. |
939 | Data = Data.substr(Start: sizeof(TestingFormatMagic)); |
940 | if (Data.size() < sizeof(uint64_t)) |
941 | return make_error<CoverageMapError>(Args: coveragemap_error::malformed, |
942 | Args: "the size of data is too small" ); |
943 | auto TestingVersion = |
944 | support::endian::byte_swap<uint64_t, llvm::endianness::little>( |
945 | value: *reinterpret_cast<const uint64_t *>(Data.data())); |
946 | Data = Data.substr(Start: sizeof(uint64_t)); |
947 | |
948 | // Read the ProfileNames data. |
949 | if (Data.empty()) |
950 | return make_error<CoverageMapError>(Args: coveragemap_error::truncated); |
951 | unsigned N = 0; |
952 | uint64_t ProfileNamesSize = decodeULEB128(p: Data.bytes_begin(), n: &N); |
953 | if (N > Data.size()) |
954 | return make_error<CoverageMapError>( |
955 | Args: coveragemap_error::malformed, |
956 | Args: "the size of TestingFormatMagic is too big" ); |
957 | Data = Data.substr(Start: N); |
958 | if (Data.empty()) |
959 | return make_error<CoverageMapError>(Args: coveragemap_error::truncated); |
960 | N = 0; |
961 | uint64_t Address = decodeULEB128(p: Data.bytes_begin(), n: &N); |
962 | if (N > Data.size()) |
963 | return make_error<CoverageMapError>(Args: coveragemap_error::malformed, |
964 | Args: "the size of ULEB128 is too big" ); |
965 | Data = Data.substr(Start: N); |
966 | if (Data.size() < ProfileNamesSize) |
967 | return make_error<CoverageMapError>(Args: coveragemap_error::malformed, |
968 | Args: "the size of ProfileNames is too big" ); |
969 | auto ProfileNames = std::make_unique<InstrProfSymtab>(); |
970 | if (Error E = ProfileNames->create(D: Data.substr(Start: 0, N: ProfileNamesSize), BaseAddr: Address)) |
971 | return std::move(E); |
972 | Data = Data.substr(Start: ProfileNamesSize); |
973 | |
974 | // In Version2, the size of CoverageMapping is stored directly. |
975 | uint64_t CoverageMappingSize; |
976 | if (TestingVersion == uint64_t(TestingFormatVersion::Version2)) { |
977 | N = 0; |
978 | CoverageMappingSize = decodeULEB128(p: Data.bytes_begin(), n: &N); |
979 | if (N > Data.size()) |
980 | return make_error<CoverageMapError>(Args: coveragemap_error::malformed, |
981 | Args: "the size of ULEB128 is too big" ); |
982 | Data = Data.substr(Start: N); |
983 | if (CoverageMappingSize < sizeof(CovMapHeader)) |
984 | return make_error<CoverageMapError>( |
985 | Args: coveragemap_error::malformed, |
986 | Args: "the size of CoverageMapping is teoo small" ); |
987 | } else if (TestingVersion != uint64_t(TestingFormatVersion::Version1)) { |
988 | return make_error<CoverageMapError>(Args: coveragemap_error::unsupported_version); |
989 | } |
990 | |
991 | // Skip the padding bytes because coverage map data has an alignment of 8. |
992 | auto Pad = offsetToAlignedAddr(Addr: Data.data(), Alignment: Align(8)); |
993 | if (Data.size() < Pad) |
994 | return make_error<CoverageMapError>(Args: coveragemap_error::malformed, |
995 | Args: "insufficient padding" ); |
996 | Data = Data.substr(Start: Pad); |
997 | if (Data.size() < sizeof(CovMapHeader)) |
998 | return make_error<CoverageMapError>( |
999 | Args: coveragemap_error::malformed, |
1000 | Args: "coverage mapping header section is larger than data size" ); |
1001 | auto const * = reinterpret_cast<const CovMapHeader *>( |
1002 | Data.substr(Start: 0, N: sizeof(CovMapHeader)).data()); |
1003 | auto Version = |
1004 | CovMapVersion(CovHeader->getVersion<llvm::endianness::little>()); |
1005 | |
1006 | // In Version1, the size of CoverageMapping is calculated. |
1007 | if (TestingVersion == uint64_t(TestingFormatVersion::Version1)) { |
1008 | if (Version < CovMapVersion::Version4) { |
1009 | CoverageMappingSize = Data.size(); |
1010 | } else { |
1011 | auto FilenamesSize = |
1012 | CovHeader->getFilenamesSize<llvm::endianness::little>(); |
1013 | CoverageMappingSize = sizeof(CovMapHeader) + FilenamesSize; |
1014 | } |
1015 | } |
1016 | |
1017 | auto CoverageMapping = Data.substr(Start: 0, N: CoverageMappingSize); |
1018 | Data = Data.substr(Start: CoverageMappingSize); |
1019 | |
1020 | // Read the CoverageRecords data. |
1021 | if (Version < CovMapVersion::Version4) { |
1022 | if (!Data.empty()) |
1023 | return make_error<CoverageMapError>(Args: coveragemap_error::malformed, |
1024 | Args: "data is not empty" ); |
1025 | } else { |
1026 | // Skip the padding bytes because coverage records data has an alignment |
1027 | // of 8. |
1028 | Pad = offsetToAlignedAddr(Addr: Data.data(), Alignment: Align(8)); |
1029 | if (Data.size() < Pad) |
1030 | return make_error<CoverageMapError>(Args: coveragemap_error::malformed, |
1031 | Args: "insufficient padding" ); |
1032 | Data = Data.substr(Start: Pad); |
1033 | } |
1034 | BinaryCoverageReader::FuncRecordsStorage CoverageRecords = |
1035 | MemoryBuffer::getMemBuffer(InputData: Data); |
1036 | |
1037 | return BinaryCoverageReader::createCoverageReaderFromBuffer( |
1038 | Coverage: CoverageMapping, FuncRecords: std::move(CoverageRecords), ProfileNamesPtr: std::move(ProfileNames), |
1039 | BytesInAddress, Endian, CompilationDir); |
1040 | } |
1041 | |
1042 | /// Find all sections that match \p IPSK name. There may be more than one if |
1043 | /// comdats are in use, e.g. for the __llvm_covfun section on ELF. |
1044 | static Expected<std::vector<SectionRef>> |
1045 | lookupSections(ObjectFile &OF, InstrProfSectKind IPSK) { |
1046 | auto ObjFormat = OF.getTripleObjectFormat(); |
1047 | auto Name = |
1048 | getInstrProfSectionName(IPSK, OF: ObjFormat, /*AddSegmentInfo=*/false); |
1049 | // On COFF, the object file section name may end in "$M". This tells the |
1050 | // linker to sort these sections between "$A" and "$Z". The linker removes the |
1051 | // dollar and everything after it in the final binary. Do the same to match. |
1052 | bool IsCOFF = isa<COFFObjectFile>(Val: OF); |
1053 | auto stripSuffix = [IsCOFF](StringRef N) { |
1054 | return IsCOFF ? N.split(Separator: '$').first : N; |
1055 | }; |
1056 | Name = stripSuffix(Name); |
1057 | |
1058 | std::vector<SectionRef> Sections; |
1059 | for (const auto &Section : OF.sections()) { |
1060 | Expected<StringRef> NameOrErr = Section.getName(); |
1061 | if (!NameOrErr) |
1062 | return NameOrErr.takeError(); |
1063 | if (stripSuffix(*NameOrErr) == Name) { |
1064 | // COFF profile name section contains two null bytes indicating the |
1065 | // start/end of the section. If its size is 2 bytes, it's empty. |
1066 | if (IsCOFF && IPSK == IPSK_name && Section.getSize() == 2) |
1067 | continue; |
1068 | Sections.push_back(x: Section); |
1069 | } |
1070 | } |
1071 | if (Sections.empty()) |
1072 | return make_error<CoverageMapError>(Args: coveragemap_error::no_data_found); |
1073 | return Sections; |
1074 | } |
1075 | |
1076 | static Expected<std::unique_ptr<BinaryCoverageReader>> |
1077 | loadBinaryFormat(std::unique_ptr<Binary> Bin, StringRef Arch, |
1078 | StringRef CompilationDir = "" , |
1079 | object::BuildIDRef *BinaryID = nullptr) { |
1080 | std::unique_ptr<ObjectFile> OF; |
1081 | if (auto *Universal = dyn_cast<MachOUniversalBinary>(Val: Bin.get())) { |
1082 | // If we have a universal binary, try to look up the object for the |
1083 | // appropriate architecture. |
1084 | auto ObjectFileOrErr = Universal->getMachOObjectForArch(ArchName: Arch); |
1085 | if (!ObjectFileOrErr) |
1086 | return ObjectFileOrErr.takeError(); |
1087 | OF = std::move(ObjectFileOrErr.get()); |
1088 | } else if (isa<ObjectFile>(Val: Bin.get())) { |
1089 | // For any other object file, upcast and take ownership. |
1090 | OF.reset(p: cast<ObjectFile>(Val: Bin.release())); |
1091 | // If we've asked for a particular arch, make sure they match. |
1092 | if (!Arch.empty() && OF->getArch() != Triple(Arch).getArch()) |
1093 | return errorCodeToError(EC: object_error::arch_not_found); |
1094 | } else |
1095 | // We can only handle object files. |
1096 | return make_error<CoverageMapError>(Args: coveragemap_error::malformed, |
1097 | Args: "binary is not an object file" ); |
1098 | |
1099 | // The coverage uses native pointer sizes for the object it's written in. |
1100 | uint8_t BytesInAddress = OF->getBytesInAddress(); |
1101 | llvm::endianness Endian = |
1102 | OF->isLittleEndian() ? llvm::endianness::little : llvm::endianness::big; |
1103 | |
1104 | // Look for the sections that we are interested in. |
1105 | auto ProfileNames = std::make_unique<InstrProfSymtab>(); |
1106 | std::vector<SectionRef> NamesSectionRefs; |
1107 | // If IPSK_name is not found, fallback to search for IPK_covname, which is |
1108 | // used when binary correlation is enabled. |
1109 | auto NamesSection = lookupSections(OF&: *OF, IPSK: IPSK_name); |
1110 | if (auto E = NamesSection.takeError()) { |
1111 | consumeError(Err: std::move(E)); |
1112 | NamesSection = lookupSections(OF&: *OF, IPSK: IPSK_covname); |
1113 | if (auto E = NamesSection.takeError()) |
1114 | return std::move(E); |
1115 | } |
1116 | NamesSectionRefs = *NamesSection; |
1117 | |
1118 | if (NamesSectionRefs.size() != 1) |
1119 | return make_error<CoverageMapError>( |
1120 | Args: coveragemap_error::malformed, |
1121 | Args: "the size of coverage mapping section is not one" ); |
1122 | if (Error E = ProfileNames->create(Section&: NamesSectionRefs.back())) |
1123 | return std::move(E); |
1124 | |
1125 | auto CoverageSection = lookupSections(OF&: *OF, IPSK: IPSK_covmap); |
1126 | if (auto E = CoverageSection.takeError()) |
1127 | return std::move(E); |
1128 | std::vector<SectionRef> CoverageSectionRefs = *CoverageSection; |
1129 | if (CoverageSectionRefs.size() != 1) |
1130 | return make_error<CoverageMapError>(Args: coveragemap_error::malformed, |
1131 | Args: "the size of name section is not one" ); |
1132 | auto CoverageMappingOrErr = CoverageSectionRefs.back().getContents(); |
1133 | if (!CoverageMappingOrErr) |
1134 | return CoverageMappingOrErr.takeError(); |
1135 | StringRef CoverageMapping = CoverageMappingOrErr.get(); |
1136 | |
1137 | // Look for the coverage records section (Version4 only). |
1138 | auto CoverageRecordsSections = lookupSections(OF&: *OF, IPSK: IPSK_covfun); |
1139 | |
1140 | BinaryCoverageReader::FuncRecordsStorage FuncRecords; |
1141 | if (auto E = CoverageRecordsSections.takeError()) { |
1142 | consumeError(Err: std::move(E)); |
1143 | FuncRecords = MemoryBuffer::getMemBuffer(InputData: "" ); |
1144 | } else { |
1145 | // Compute the FuncRecordsBuffer of the buffer, taking into account the |
1146 | // padding between each record, and making sure the first block is aligned |
1147 | // in memory to maintain consistency between buffer address and size |
1148 | // alignment. |
1149 | const Align RecordAlignment(8); |
1150 | uint64_t FuncRecordsSize = 0; |
1151 | for (SectionRef Section : *CoverageRecordsSections) { |
1152 | auto CoverageRecordsOrErr = Section.getContents(); |
1153 | if (!CoverageRecordsOrErr) |
1154 | return CoverageRecordsOrErr.takeError(); |
1155 | FuncRecordsSize += alignTo(Size: CoverageRecordsOrErr->size(), A: RecordAlignment); |
1156 | } |
1157 | auto WritableBuffer = |
1158 | WritableMemoryBuffer::getNewUninitMemBuffer(Size: FuncRecordsSize); |
1159 | char *FuncRecordsBuffer = WritableBuffer->getBufferStart(); |
1160 | assert(isAddrAligned(RecordAlignment, FuncRecordsBuffer) && |
1161 | "Allocated memory is correctly aligned" ); |
1162 | |
1163 | for (SectionRef Section : *CoverageRecordsSections) { |
1164 | auto CoverageRecordsOrErr = Section.getContents(); |
1165 | if (!CoverageRecordsOrErr) |
1166 | return CoverageRecordsOrErr.takeError(); |
1167 | const auto &CoverageRecords = CoverageRecordsOrErr.get(); |
1168 | FuncRecordsBuffer = std::copy(first: CoverageRecords.begin(), |
1169 | last: CoverageRecords.end(), result: FuncRecordsBuffer); |
1170 | FuncRecordsBuffer = |
1171 | std::fill_n(first: FuncRecordsBuffer, |
1172 | n: alignAddr(Addr: FuncRecordsBuffer, Alignment: RecordAlignment) - |
1173 | (uintptr_t)FuncRecordsBuffer, |
1174 | value: '\0'); |
1175 | } |
1176 | assert(FuncRecordsBuffer == WritableBuffer->getBufferEnd() && |
1177 | "consistent init" ); |
1178 | FuncRecords = std::move(WritableBuffer); |
1179 | } |
1180 | |
1181 | if (BinaryID) |
1182 | *BinaryID = getBuildID(Obj: OF.get()); |
1183 | |
1184 | return BinaryCoverageReader::createCoverageReaderFromBuffer( |
1185 | Coverage: CoverageMapping, FuncRecords: std::move(FuncRecords), ProfileNamesPtr: std::move(ProfileNames), |
1186 | BytesInAddress, Endian, CompilationDir); |
1187 | } |
1188 | |
1189 | /// Determine whether \p Arch is invalid or empty, given \p Bin. |
1190 | static bool isArchSpecifierInvalidOrMissing(Binary *Bin, StringRef Arch) { |
1191 | // If we have a universal binary and Arch doesn't identify any of its slices, |
1192 | // it's user error. |
1193 | if (auto *Universal = dyn_cast<MachOUniversalBinary>(Val: Bin)) { |
1194 | for (auto &ObjForArch : Universal->objects()) |
1195 | if (Arch == ObjForArch.getArchFlagName()) |
1196 | return false; |
1197 | return true; |
1198 | } |
1199 | return false; |
1200 | } |
1201 | |
1202 | Expected<std::vector<std::unique_ptr<BinaryCoverageReader>>> |
1203 | BinaryCoverageReader::create( |
1204 | MemoryBufferRef ObjectBuffer, StringRef Arch, |
1205 | SmallVectorImpl<std::unique_ptr<MemoryBuffer>> &ObjectFileBuffers, |
1206 | StringRef CompilationDir, SmallVectorImpl<object::BuildIDRef> *BinaryIDs) { |
1207 | std::vector<std::unique_ptr<BinaryCoverageReader>> Readers; |
1208 | |
1209 | if (ObjectBuffer.getBuffer().size() > sizeof(TestingFormatMagic)) { |
1210 | uint64_t Magic = |
1211 | support::endian::byte_swap<uint64_t, llvm::endianness::little>( |
1212 | value: *reinterpret_cast<const uint64_t *>(ObjectBuffer.getBufferStart())); |
1213 | if (Magic == TestingFormatMagic) { |
1214 | // This is a special format used for testing. |
1215 | auto ReaderOrErr = |
1216 | loadTestingFormat(Data: ObjectBuffer.getBuffer(), CompilationDir); |
1217 | if (!ReaderOrErr) |
1218 | return ReaderOrErr.takeError(); |
1219 | Readers.push_back(x: std::move(ReaderOrErr.get())); |
1220 | return std::move(Readers); |
1221 | } |
1222 | } |
1223 | |
1224 | auto BinOrErr = createBinary(Source: ObjectBuffer); |
1225 | if (!BinOrErr) |
1226 | return BinOrErr.takeError(); |
1227 | std::unique_ptr<Binary> Bin = std::move(BinOrErr.get()); |
1228 | |
1229 | if (isArchSpecifierInvalidOrMissing(Bin: Bin.get(), Arch)) |
1230 | return make_error<CoverageMapError>( |
1231 | Args: coveragemap_error::invalid_or_missing_arch_specifier); |
1232 | |
1233 | // MachO universal binaries which contain archives need to be treated as |
1234 | // archives, not as regular binaries. |
1235 | if (auto *Universal = dyn_cast<MachOUniversalBinary>(Val: Bin.get())) { |
1236 | for (auto &ObjForArch : Universal->objects()) { |
1237 | // Skip slices within the universal binary which target the wrong arch. |
1238 | std::string ObjArch = ObjForArch.getArchFlagName(); |
1239 | if (Arch != ObjArch) |
1240 | continue; |
1241 | |
1242 | auto ArchiveOrErr = ObjForArch.getAsArchive(); |
1243 | if (!ArchiveOrErr) { |
1244 | // If this is not an archive, try treating it as a regular object. |
1245 | consumeError(Err: ArchiveOrErr.takeError()); |
1246 | break; |
1247 | } |
1248 | |
1249 | return BinaryCoverageReader::create( |
1250 | ObjectBuffer: ArchiveOrErr.get()->getMemoryBufferRef(), Arch, ObjectFileBuffers, |
1251 | CompilationDir, BinaryIDs); |
1252 | } |
1253 | } |
1254 | |
1255 | // Load coverage out of archive members. |
1256 | if (auto *Ar = dyn_cast<Archive>(Val: Bin.get())) { |
1257 | Error Err = Error::success(); |
1258 | for (auto &Child : Ar->children(Err)) { |
1259 | Expected<MemoryBufferRef> ChildBufOrErr = Child.getMemoryBufferRef(); |
1260 | if (!ChildBufOrErr) |
1261 | return ChildBufOrErr.takeError(); |
1262 | |
1263 | auto ChildReadersOrErr = BinaryCoverageReader::create( |
1264 | ObjectBuffer: ChildBufOrErr.get(), Arch, ObjectFileBuffers, CompilationDir, |
1265 | BinaryIDs); |
1266 | if (!ChildReadersOrErr) |
1267 | return ChildReadersOrErr.takeError(); |
1268 | for (auto &Reader : ChildReadersOrErr.get()) |
1269 | Readers.push_back(x: std::move(Reader)); |
1270 | } |
1271 | if (Err) |
1272 | return std::move(Err); |
1273 | |
1274 | // Thin archives reference object files outside of the archive file, i.e. |
1275 | // files which reside in memory not owned by the caller. Transfer ownership |
1276 | // to the caller. |
1277 | if (Ar->isThin()) |
1278 | for (auto &Buffer : Ar->takeThinBuffers()) |
1279 | ObjectFileBuffers.push_back(Elt: std::move(Buffer)); |
1280 | |
1281 | return std::move(Readers); |
1282 | } |
1283 | |
1284 | object::BuildIDRef BinaryID; |
1285 | auto ReaderOrErr = loadBinaryFormat(Bin: std::move(Bin), Arch, CompilationDir, |
1286 | BinaryID: BinaryIDs ? &BinaryID : nullptr); |
1287 | if (!ReaderOrErr) |
1288 | return ReaderOrErr.takeError(); |
1289 | Readers.push_back(x: std::move(ReaderOrErr.get())); |
1290 | if (!BinaryID.empty()) |
1291 | BinaryIDs->push_back(Elt: BinaryID); |
1292 | return std::move(Readers); |
1293 | } |
1294 | |
1295 | Error BinaryCoverageReader::readNextRecord(CoverageMappingRecord &Record) { |
1296 | if (CurrentRecord >= MappingRecords.size()) |
1297 | return make_error<CoverageMapError>(Args: coveragemap_error::eof); |
1298 | |
1299 | FunctionsFilenames.clear(); |
1300 | Expressions.clear(); |
1301 | MappingRegions.clear(); |
1302 | auto &R = MappingRecords[CurrentRecord]; |
1303 | auto F = ArrayRef(Filenames).slice(N: R.FilenamesBegin, M: R.FilenamesSize); |
1304 | RawCoverageMappingReader Reader(R.CoverageMapping, F, FunctionsFilenames, |
1305 | Expressions, MappingRegions); |
1306 | if (auto Err = Reader.read()) |
1307 | return Err; |
1308 | |
1309 | Record.FunctionName = R.FunctionName; |
1310 | Record.FunctionHash = R.FunctionHash; |
1311 | Record.Filenames = FunctionsFilenames; |
1312 | Record.Expressions = Expressions; |
1313 | Record.MappingRegions = MappingRegions; |
1314 | |
1315 | ++CurrentRecord; |
1316 | return Error::success(); |
1317 | } |
1318 | |