1 | //===- CoverageMappingWriter.cpp - Code coverage mapping writer -----------===// |
2 | // |
3 | // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. |
4 | // See https://llvm.org/LICENSE.txt for license information. |
5 | // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception |
6 | // |
7 | //===----------------------------------------------------------------------===// |
8 | // |
9 | // This file contains support for writing coverage mapping data for |
10 | // instrumentation based coverage. |
11 | // |
12 | //===----------------------------------------------------------------------===// |
13 | |
14 | #include "llvm/ProfileData/Coverage/CoverageMappingWriter.h" |
15 | #include "llvm/ADT/ArrayRef.h" |
16 | #include "llvm/ADT/SmallVector.h" |
17 | #include "llvm/ADT/StringExtras.h" |
18 | #include "llvm/ProfileData/InstrProf.h" |
19 | #include "llvm/Support/Compression.h" |
20 | #include "llvm/Support/LEB128.h" |
21 | #include "llvm/Support/raw_ostream.h" |
22 | #include <cassert> |
23 | #include <limits> |
24 | #include <vector> |
25 | |
26 | using namespace llvm; |
27 | using namespace coverage; |
28 | |
29 | CoverageFilenamesSectionWriter::CoverageFilenamesSectionWriter( |
30 | ArrayRef<std::string> Filenames) |
31 | : Filenames(Filenames) { |
32 | #ifndef NDEBUG |
33 | StringSet<> NameSet; |
34 | for (StringRef Name : Filenames) |
35 | assert(NameSet.insert(Name).second && "Duplicate filename" ); |
36 | #endif |
37 | } |
38 | |
39 | void CoverageFilenamesSectionWriter::write(raw_ostream &OS, bool Compress) { |
40 | std::string FilenamesStr; |
41 | { |
42 | raw_string_ostream FilenamesOS{FilenamesStr}; |
43 | for (const auto &Filename : Filenames) { |
44 | encodeULEB128(Value: Filename.size(), OS&: FilenamesOS); |
45 | FilenamesOS << Filename; |
46 | } |
47 | } |
48 | |
49 | SmallVector<uint8_t, 128> CompressedStr; |
50 | bool doCompression = Compress && compression::zlib::isAvailable() && |
51 | DoInstrProfNameCompression; |
52 | if (doCompression) |
53 | compression::zlib::compress(Input: arrayRefFromStringRef(Input: FilenamesStr), |
54 | CompressedBuffer&: CompressedStr, |
55 | Level: compression::zlib::BestSizeCompression); |
56 | |
57 | // ::= <num-filenames> |
58 | // <uncompressed-len> |
59 | // <compressed-len-or-zero> |
60 | // (<compressed-filenames> | <uncompressed-filenames>) |
61 | encodeULEB128(Value: Filenames.size(), OS); |
62 | encodeULEB128(Value: FilenamesStr.size(), OS); |
63 | encodeULEB128(Value: doCompression ? CompressedStr.size() : 0U, OS); |
64 | OS << (doCompression ? toStringRef(Input: CompressedStr) : StringRef(FilenamesStr)); |
65 | } |
66 | |
67 | namespace { |
68 | |
69 | /// Gather only the expressions that are used by the mapping |
70 | /// regions in this function. |
71 | class CounterExpressionsMinimizer { |
72 | ArrayRef<CounterExpression> Expressions; |
73 | SmallVector<CounterExpression, 16> UsedExpressions; |
74 | std::vector<unsigned> AdjustedExpressionIDs; |
75 | |
76 | public: |
77 | CounterExpressionsMinimizer(ArrayRef<CounterExpression> Expressions, |
78 | ArrayRef<CounterMappingRegion> MappingRegions) |
79 | : Expressions(Expressions) { |
80 | AdjustedExpressionIDs.resize(new_size: Expressions.size(), x: 0); |
81 | for (const auto &I : MappingRegions) { |
82 | mark(C: I.Count); |
83 | mark(C: I.FalseCount); |
84 | } |
85 | for (const auto &I : MappingRegions) { |
86 | gatherUsed(C: I.Count); |
87 | gatherUsed(C: I.FalseCount); |
88 | } |
89 | } |
90 | |
91 | void mark(Counter C) { |
92 | if (!C.isExpression()) |
93 | return; |
94 | unsigned ID = C.getExpressionID(); |
95 | AdjustedExpressionIDs[ID] = 1; |
96 | mark(C: Expressions[ID].LHS); |
97 | mark(C: Expressions[ID].RHS); |
98 | } |
99 | |
100 | void gatherUsed(Counter C) { |
101 | if (!C.isExpression() || !AdjustedExpressionIDs[C.getExpressionID()]) |
102 | return; |
103 | AdjustedExpressionIDs[C.getExpressionID()] = UsedExpressions.size(); |
104 | const auto &E = Expressions[C.getExpressionID()]; |
105 | UsedExpressions.push_back(Elt: E); |
106 | gatherUsed(C: E.LHS); |
107 | gatherUsed(C: E.RHS); |
108 | } |
109 | |
110 | ArrayRef<CounterExpression> getExpressions() const { return UsedExpressions; } |
111 | |
112 | /// Adjust the given counter to correctly transition from the old |
113 | /// expression ids to the new expression ids. |
114 | Counter adjust(Counter C) const { |
115 | if (C.isExpression()) |
116 | C = Counter::getExpression(ExpressionId: AdjustedExpressionIDs[C.getExpressionID()]); |
117 | return C; |
118 | } |
119 | }; |
120 | |
121 | } // end anonymous namespace |
122 | |
123 | /// Encode the counter. |
124 | /// |
125 | /// The encoding uses the following format: |
126 | /// Low 2 bits - Tag: |
127 | /// Counter::Zero(0) - A Counter with kind Counter::Zero |
128 | /// Counter::CounterValueReference(1) - A counter with kind |
129 | /// Counter::CounterValueReference |
130 | /// Counter::Expression(2) + CounterExpression::Subtract(0) - |
131 | /// A counter with kind Counter::Expression and an expression |
132 | /// with kind CounterExpression::Subtract |
133 | /// Counter::Expression(2) + CounterExpression::Add(1) - |
134 | /// A counter with kind Counter::Expression and an expression |
135 | /// with kind CounterExpression::Add |
136 | /// Remaining bits - Counter/Expression ID. |
137 | static unsigned encodeCounter(ArrayRef<CounterExpression> Expressions, |
138 | Counter C) { |
139 | unsigned Tag = unsigned(C.getKind()); |
140 | if (C.isExpression()) |
141 | Tag += Expressions[C.getExpressionID()].Kind; |
142 | unsigned ID = C.getCounterID(); |
143 | assert(ID <= |
144 | (std::numeric_limits<unsigned>::max() >> Counter::EncodingTagBits)); |
145 | return Tag | (ID << Counter::EncodingTagBits); |
146 | } |
147 | |
148 | static void writeCounter(ArrayRef<CounterExpression> Expressions, Counter C, |
149 | raw_ostream &OS) { |
150 | encodeULEB128(Value: encodeCounter(Expressions, C), OS); |
151 | } |
152 | |
153 | void CoverageMappingWriter::write(raw_ostream &OS) { |
154 | // Check that we don't have any bogus regions. |
155 | assert(all_of(MappingRegions, |
156 | [](const CounterMappingRegion &CMR) { |
157 | return CMR.startLoc() <= CMR.endLoc(); |
158 | }) && |
159 | "Source region does not begin before it ends" ); |
160 | |
161 | // Sort the regions in an ascending order by the file id and the starting |
162 | // location. Sort by region kinds to ensure stable order for tests. |
163 | llvm::stable_sort(Range&: MappingRegions, C: [](const CounterMappingRegion &LHS, |
164 | const CounterMappingRegion &RHS) { |
165 | if (LHS.FileID != RHS.FileID) |
166 | return LHS.FileID < RHS.FileID; |
167 | if (LHS.startLoc() != RHS.startLoc()) |
168 | return LHS.startLoc() < RHS.startLoc(); |
169 | |
170 | // Put `Decision` before `Expansion`. |
171 | auto getKindKey = [](CounterMappingRegion::RegionKind Kind) { |
172 | return (Kind == CounterMappingRegion::MCDCDecisionRegion |
173 | ? 2 * CounterMappingRegion::ExpansionRegion - 1 |
174 | : 2 * Kind); |
175 | }; |
176 | |
177 | return getKindKey(LHS.Kind) < getKindKey(RHS.Kind); |
178 | }); |
179 | |
180 | // Write out the fileid -> filename mapping. |
181 | encodeULEB128(Value: VirtualFileMapping.size(), OS); |
182 | for (const auto &FileID : VirtualFileMapping) |
183 | encodeULEB128(Value: FileID, OS); |
184 | |
185 | // Write out the expressions. |
186 | CounterExpressionsMinimizer Minimizer(Expressions, MappingRegions); |
187 | auto MinExpressions = Minimizer.getExpressions(); |
188 | encodeULEB128(Value: MinExpressions.size(), OS); |
189 | for (const auto &E : MinExpressions) { |
190 | writeCounter(Expressions: MinExpressions, C: Minimizer.adjust(C: E.LHS), OS); |
191 | writeCounter(Expressions: MinExpressions, C: Minimizer.adjust(C: E.RHS), OS); |
192 | } |
193 | |
194 | // Write out the mapping regions. |
195 | // Split the regions into subarrays where each region in a |
196 | // subarray has a fileID which is the index of that subarray. |
197 | unsigned PrevLineStart = 0; |
198 | unsigned CurrentFileID = ~0U; |
199 | for (auto I = MappingRegions.begin(), E = MappingRegions.end(); I != E; ++I) { |
200 | if (I->FileID != CurrentFileID) { |
201 | // Ensure that all file ids have at least one mapping region. |
202 | assert(I->FileID == (CurrentFileID + 1)); |
203 | // Find the number of regions with this file id. |
204 | unsigned RegionCount = 1; |
205 | for (auto J = I + 1; J != E && I->FileID == J->FileID; ++J) |
206 | ++RegionCount; |
207 | // Start a new region sub-array. |
208 | encodeULEB128(Value: RegionCount, OS); |
209 | |
210 | CurrentFileID = I->FileID; |
211 | PrevLineStart = 0; |
212 | } |
213 | Counter Count = Minimizer.adjust(C: I->Count); |
214 | Counter FalseCount = Minimizer.adjust(C: I->FalseCount); |
215 | bool ParamsShouldBeNull = true; |
216 | switch (I->Kind) { |
217 | case CounterMappingRegion::CodeRegion: |
218 | case CounterMappingRegion::GapRegion: |
219 | writeCounter(Expressions: MinExpressions, C: Count, OS); |
220 | break; |
221 | case CounterMappingRegion::ExpansionRegion: { |
222 | assert(Count.isZero()); |
223 | assert(I->ExpandedFileID <= |
224 | (std::numeric_limits<unsigned>::max() >> |
225 | Counter::EncodingCounterTagAndExpansionRegionTagBits)); |
226 | // Mark an expansion region with a set bit that follows the counter tag, |
227 | // and pack the expanded file id into the remaining bits. |
228 | unsigned EncodedTagExpandedFileID = |
229 | (1 << Counter::EncodingTagBits) | |
230 | (I->ExpandedFileID |
231 | << Counter::EncodingCounterTagAndExpansionRegionTagBits); |
232 | encodeULEB128(Value: EncodedTagExpandedFileID, OS); |
233 | break; |
234 | } |
235 | case CounterMappingRegion::SkippedRegion: |
236 | assert(Count.isZero()); |
237 | encodeULEB128(Value: unsigned(I->Kind) |
238 | << Counter::EncodingCounterTagAndExpansionRegionTagBits, |
239 | OS); |
240 | break; |
241 | case CounterMappingRegion::BranchRegion: |
242 | encodeULEB128(Value: unsigned(I->Kind) |
243 | << Counter::EncodingCounterTagAndExpansionRegionTagBits, |
244 | OS); |
245 | writeCounter(Expressions: MinExpressions, C: Count, OS); |
246 | writeCounter(Expressions: MinExpressions, C: FalseCount, OS); |
247 | break; |
248 | case CounterMappingRegion::MCDCBranchRegion: |
249 | encodeULEB128(Value: unsigned(I->Kind) |
250 | << Counter::EncodingCounterTagAndExpansionRegionTagBits, |
251 | OS); |
252 | writeCounter(Expressions: MinExpressions, C: Count, OS); |
253 | writeCounter(Expressions: MinExpressions, C: FalseCount, OS); |
254 | { |
255 | // They are written as internal values plus 1. |
256 | const auto &BranchParams = I->getBranchParams(); |
257 | ParamsShouldBeNull = false; |
258 | unsigned ID1 = BranchParams.ID + 1; |
259 | unsigned TID1 = BranchParams.Conds[true] + 1; |
260 | unsigned FID1 = BranchParams.Conds[false] + 1; |
261 | encodeULEB128(Value: ID1, OS); |
262 | encodeULEB128(Value: TID1, OS); |
263 | encodeULEB128(Value: FID1, OS); |
264 | } |
265 | break; |
266 | case CounterMappingRegion::MCDCDecisionRegion: |
267 | encodeULEB128(Value: unsigned(I->Kind) |
268 | << Counter::EncodingCounterTagAndExpansionRegionTagBits, |
269 | OS); |
270 | { |
271 | const auto &DecisionParams = I->getDecisionParams(); |
272 | ParamsShouldBeNull = false; |
273 | encodeULEB128(Value: static_cast<unsigned>(DecisionParams.BitmapIdx), OS); |
274 | encodeULEB128(Value: static_cast<unsigned>(DecisionParams.NumConditions), OS); |
275 | } |
276 | break; |
277 | } |
278 | assert(I->LineStart >= PrevLineStart); |
279 | encodeULEB128(Value: I->LineStart - PrevLineStart, OS); |
280 | encodeULEB128(Value: I->ColumnStart, OS); |
281 | assert(I->LineEnd >= I->LineStart); |
282 | encodeULEB128(Value: I->LineEnd - I->LineStart, OS); |
283 | encodeULEB128(Value: I->ColumnEnd, OS); |
284 | PrevLineStart = I->LineStart; |
285 | assert((!ParamsShouldBeNull || std::get_if<0>(&I->MCDCParams)) && |
286 | "MCDCParams should be empty" ); |
287 | (void)ParamsShouldBeNull; |
288 | } |
289 | // Ensure that all file ids have at least one mapping region. |
290 | assert(CurrentFileID == (VirtualFileMapping.size() - 1)); |
291 | } |
292 | |
293 | void TestingFormatWriter::write(raw_ostream &OS, TestingFormatVersion Version) { |
294 | auto ByteSwap = [](uint64_t N) { |
295 | return support::endian::byte_swap<uint64_t, llvm::endianness::little>(value: N); |
296 | }; |
297 | |
298 | // Output a 64bit magic number. |
299 | auto Magic = ByteSwap(TestingFormatMagic); |
300 | OS.write(Ptr: reinterpret_cast<char *>(&Magic), Size: sizeof(Magic)); |
301 | |
302 | // Output a 64bit version field. |
303 | auto VersionLittle = ByteSwap(uint64_t(Version)); |
304 | OS.write(Ptr: reinterpret_cast<char *>(&VersionLittle), Size: sizeof(VersionLittle)); |
305 | |
306 | // Output the ProfileNames data. |
307 | encodeULEB128(Value: ProfileNamesData.size(), OS); |
308 | encodeULEB128(Value: ProfileNamesAddr, OS); |
309 | OS << ProfileNamesData; |
310 | |
311 | // Version2 adds an extra field to indicate the size of the |
312 | // CoverageMappingData. |
313 | if (Version == TestingFormatVersion::Version2) |
314 | encodeULEB128(Value: CoverageMappingData.size(), OS); |
315 | |
316 | // Coverage mapping data is expected to have an alignment of 8. |
317 | for (unsigned Pad = offsetToAlignment(Value: OS.tell(), Alignment: Align(8)); Pad; --Pad) |
318 | OS.write(C: uint8_t(0)); |
319 | OS << CoverageMappingData; |
320 | |
321 | // Coverage records data is expected to have an alignment of 8. |
322 | for (unsigned Pad = offsetToAlignment(Value: OS.tell(), Alignment: Align(8)); Pad; --Pad) |
323 | OS.write(C: uint8_t(0)); |
324 | OS << CoverageRecordsData; |
325 | } |
326 | |