LLVM 20.0.0git
CoverageMappingWriter.cpp
Go to the documentation of this file.
1//===- CoverageMappingWriter.cpp - Code coverage mapping writer -----------===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8//
9// This file contains support for writing coverage mapping data for
10// instrumentation based coverage.
11//
12//===----------------------------------------------------------------------===//
13
15#include "llvm/ADT/ArrayRef.h"
20#include "llvm/Support/LEB128.h"
22#include <cassert>
23#include <limits>
24#include <vector>
25
26using namespace llvm;
27using namespace coverage;
28
30 ArrayRef<std::string> Filenames)
31 : Filenames(Filenames) {
32#ifndef NDEBUG
33 StringSet<> NameSet;
34 for (StringRef Name : Filenames)
35 assert(NameSet.insert(Name).second && "Duplicate filename");
36#endif
37}
38
40 std::string FilenamesStr;
41 {
42 raw_string_ostream FilenamesOS{FilenamesStr};
43 for (const auto &Filename : Filenames) {
44 encodeULEB128(Filename.size(), FilenamesOS);
45 FilenamesOS << Filename;
46 }
47 }
48
49 SmallVector<uint8_t, 128> CompressedStr;
50 bool doCompression = Compress && compression::zlib::isAvailable() &&
52 if (doCompression)
53 compression::zlib::compress(arrayRefFromStringRef(FilenamesStr),
54 CompressedStr,
56
57 // ::= <num-filenames>
58 // <uncompressed-len>
59 // <compressed-len-or-zero>
60 // (<compressed-filenames> | <uncompressed-filenames>)
61 encodeULEB128(Filenames.size(), OS);
62 encodeULEB128(FilenamesStr.size(), OS);
63 encodeULEB128(doCompression ? CompressedStr.size() : 0U, OS);
64 OS << (doCompression ? toStringRef(CompressedStr) : StringRef(FilenamesStr));
65}
66
67namespace {
68
69/// Gather only the expressions that are used by the mapping
70/// regions in this function.
71class CounterExpressionsMinimizer {
74 std::vector<unsigned> AdjustedExpressionIDs;
75
76public:
77 CounterExpressionsMinimizer(ArrayRef<CounterExpression> Expressions,
78 ArrayRef<CounterMappingRegion> MappingRegions)
79 : Expressions(Expressions) {
80 AdjustedExpressionIDs.resize(Expressions.size(), 0);
81 for (const auto &I : MappingRegions) {
82 mark(I.Count);
83 mark(I.FalseCount);
84 }
85 for (const auto &I : MappingRegions) {
86 gatherUsed(I.Count);
87 gatherUsed(I.FalseCount);
88 }
89 }
90
91 void mark(Counter C) {
92 if (!C.isExpression())
93 return;
94 unsigned ID = C.getExpressionID();
95 AdjustedExpressionIDs[ID] = 1;
96 mark(Expressions[ID].LHS);
97 mark(Expressions[ID].RHS);
98 }
99
100 void gatherUsed(Counter C) {
101 if (!C.isExpression() || !AdjustedExpressionIDs[C.getExpressionID()])
102 return;
103 AdjustedExpressionIDs[C.getExpressionID()] = UsedExpressions.size();
104 const auto &E = Expressions[C.getExpressionID()];
105 UsedExpressions.push_back(E);
106 gatherUsed(E.LHS);
107 gatherUsed(E.RHS);
108 }
109
110 ArrayRef<CounterExpression> getExpressions() const { return UsedExpressions; }
111
112 /// Adjust the given counter to correctly transition from the old
113 /// expression ids to the new expression ids.
114 Counter adjust(Counter C) const {
115 if (C.isExpression())
116 C = Counter::getExpression(AdjustedExpressionIDs[C.getExpressionID()]);
117 return C;
118 }
119};
120
121} // end anonymous namespace
122
123/// Encode the counter.
124///
125/// The encoding uses the following format:
126/// Low 2 bits - Tag:
127/// Counter::Zero(0) - A Counter with kind Counter::Zero
128/// Counter::CounterValueReference(1) - A counter with kind
129/// Counter::CounterValueReference
130/// Counter::Expression(2) + CounterExpression::Subtract(0) -
131/// A counter with kind Counter::Expression and an expression
132/// with kind CounterExpression::Subtract
133/// Counter::Expression(2) + CounterExpression::Add(1) -
134/// A counter with kind Counter::Expression and an expression
135/// with kind CounterExpression::Add
136/// Remaining bits - Counter/Expression ID.
137static unsigned encodeCounter(ArrayRef<CounterExpression> Expressions,
138 Counter C) {
139 unsigned Tag = unsigned(C.getKind());
140 if (C.isExpression())
141 Tag += Expressions[C.getExpressionID()].Kind;
142 unsigned ID = C.getCounterID();
143 assert(ID <=
144 (std::numeric_limits<unsigned>::max() >> Counter::EncodingTagBits));
145 return Tag | (ID << Counter::EncodingTagBits);
146}
147
149 raw_ostream &OS) {
150 encodeULEB128(encodeCounter(Expressions, C), OS);
151}
152
154 // Check that we don't have any bogus regions.
155 assert(all_of(MappingRegions,
156 [](const CounterMappingRegion &CMR) {
157 return CMR.startLoc() <= CMR.endLoc();
158 }) &&
159 "Source region does not begin before it ends");
160
161 // Sort the regions in an ascending order by the file id and the starting
162 // location. Sort by region kinds to ensure stable order for tests.
163 llvm::stable_sort(MappingRegions, [](const CounterMappingRegion &LHS,
164 const CounterMappingRegion &RHS) {
165 if (LHS.FileID != RHS.FileID)
166 return LHS.FileID < RHS.FileID;
167 if (LHS.startLoc() != RHS.startLoc())
168 return LHS.startLoc() < RHS.startLoc();
169
170 // Put `Decision` before `Expansion`.
171 auto getKindKey = [](CounterMappingRegion::RegionKind Kind) {
172 return (Kind == CounterMappingRegion::MCDCDecisionRegion
173 ? 2 * CounterMappingRegion::ExpansionRegion - 1
174 : 2 * Kind);
175 };
176
177 return getKindKey(LHS.Kind) < getKindKey(RHS.Kind);
178 });
179
180 // Write out the fileid -> filename mapping.
181 encodeULEB128(VirtualFileMapping.size(), OS);
182 for (const auto &FileID : VirtualFileMapping)
183 encodeULEB128(FileID, OS);
184
185 // Write out the expressions.
186 CounterExpressionsMinimizer Minimizer(Expressions, MappingRegions);
187 auto MinExpressions = Minimizer.getExpressions();
188 encodeULEB128(MinExpressions.size(), OS);
189 for (const auto &E : MinExpressions) {
190 writeCounter(MinExpressions, Minimizer.adjust(E.LHS), OS);
191 writeCounter(MinExpressions, Minimizer.adjust(E.RHS), OS);
192 }
193
194 // Write out the mapping regions.
195 // Split the regions into subarrays where each region in a
196 // subarray has a fileID which is the index of that subarray.
197 unsigned PrevLineStart = 0;
198 unsigned CurrentFileID = ~0U;
199 for (auto I = MappingRegions.begin(), E = MappingRegions.end(); I != E; ++I) {
200 if (I->FileID != CurrentFileID) {
201 // Ensure that all file ids have at least one mapping region.
202 assert(I->FileID == (CurrentFileID + 1));
203 // Find the number of regions with this file id.
204 unsigned RegionCount = 1;
205 for (auto J = I + 1; J != E && I->FileID == J->FileID; ++J)
206 ++RegionCount;
207 // Start a new region sub-array.
208 encodeULEB128(RegionCount, OS);
209
210 CurrentFileID = I->FileID;
211 PrevLineStart = 0;
212 }
213 Counter Count = Minimizer.adjust(I->Count);
214 Counter FalseCount = Minimizer.adjust(I->FalseCount);
215 bool ParamsShouldBeNull = true;
216 switch (I->Kind) {
219 writeCounter(MinExpressions, Count, OS);
220 break;
222 assert(Count.isZero());
223 assert(I->ExpandedFileID <=
224 (std::numeric_limits<unsigned>::max() >>
226 // Mark an expansion region with a set bit that follows the counter tag,
227 // and pack the expanded file id into the remaining bits.
228 unsigned EncodedTagExpandedFileID =
230 (I->ExpandedFileID
232 encodeULEB128(EncodedTagExpandedFileID, OS);
233 break;
234 }
236 assert(Count.isZero());
237 encodeULEB128(unsigned(I->Kind)
239 OS);
240 break;
242 encodeULEB128(unsigned(I->Kind)
244 OS);
245 writeCounter(MinExpressions, Count, OS);
246 writeCounter(MinExpressions, FalseCount, OS);
247 break;
249 encodeULEB128(unsigned(I->Kind)
251 OS);
252 writeCounter(MinExpressions, Count, OS);
253 writeCounter(MinExpressions, FalseCount, OS);
254 {
255 // They are written as internal values plus 1.
256 const auto &BranchParams = I->getBranchParams();
257 ParamsShouldBeNull = false;
258 unsigned ID1 = BranchParams.ID + 1;
259 unsigned TID1 = BranchParams.Conds[true] + 1;
260 unsigned FID1 = BranchParams.Conds[false] + 1;
261 encodeULEB128(ID1, OS);
262 encodeULEB128(TID1, OS);
263 encodeULEB128(FID1, OS);
264 }
265 break;
267 encodeULEB128(unsigned(I->Kind)
269 OS);
270 {
271 const auto &DecisionParams = I->getDecisionParams();
272 ParamsShouldBeNull = false;
273 encodeULEB128(static_cast<unsigned>(DecisionParams.BitmapIdx), OS);
274 encodeULEB128(static_cast<unsigned>(DecisionParams.NumConditions), OS);
275 }
276 break;
277 }
278 assert(I->LineStart >= PrevLineStart);
279 encodeULEB128(I->LineStart - PrevLineStart, OS);
280 encodeULEB128(I->ColumnStart, OS);
281 assert(I->LineEnd >= I->LineStart);
282 encodeULEB128(I->LineEnd - I->LineStart, OS);
283 encodeULEB128(I->ColumnEnd, OS);
284 PrevLineStart = I->LineStart;
285 assert((!ParamsShouldBeNull || std::get_if<0>(&I->MCDCParams)) &&
286 "MCDCParams should be empty");
287 (void)ParamsShouldBeNull;
288 }
289 // Ensure that all file ids have at least one mapping region.
290 assert(CurrentFileID == (VirtualFileMapping.size() - 1));
291}
292
294 auto ByteSwap = [](uint64_t N) {
295 return support::endian::byte_swap<uint64_t, llvm::endianness::little>(N);
296 };
297
298 // Output a 64bit magic number.
299 auto Magic = ByteSwap(TestingFormatMagic);
300 OS.write(reinterpret_cast<char *>(&Magic), sizeof(Magic));
301
302 // Output a 64bit version field.
303 auto VersionLittle = ByteSwap(uint64_t(Version));
304 OS.write(reinterpret_cast<char *>(&VersionLittle), sizeof(VersionLittle));
305
306 // Output the ProfileNames data.
307 encodeULEB128(ProfileNamesData.size(), OS);
308 encodeULEB128(ProfileNamesAddr, OS);
309 OS << ProfileNamesData;
310
311 // Version2 adds an extra field to indicate the size of the
312 // CoverageMappingData.
314 encodeULEB128(CoverageMappingData.size(), OS);
315
316 // Coverage mapping data is expected to have an alignment of 8.
317 for (unsigned Pad = offsetToAlignment(OS.tell(), Align(8)); Pad; --Pad)
318 OS.write(uint8_t(0));
319 OS << CoverageMappingData;
320
321 // Coverage records data is expected to have an alignment of 8.
322 for (unsigned Pad = offsetToAlignment(OS.tell(), Align(8)); Pad; --Pad)
323 OS.write(uint8_t(0));
324 OS << CoverageRecordsData;
325}
static GCRegistry::Add< CoreCLRGC > E("coreclr", "CoreCLR-compatible GC")
static void writeCounter(ArrayRef< CounterExpression > Expressions, Counter C, raw_ostream &OS)
static unsigned encodeCounter(ArrayRef< CounterExpression > Expressions, Counter C)
Encode the counter.
std::string Name
#define I(x, y, z)
Definition: MD5.cpp:58
if(PassOpts->AAPipeline)
assert(ImpDefSCC.getReg()==AMDGPU::SCC &&ImpDefSCC.isDef())
raw_pwrite_stream & OS
This file defines the SmallVector class.
This file contains some functions that are useful when dealing with strings.
Value * RHS
Value * LHS
ArrayRef - Represent a constant reference to an array (0 or more elements consecutively in memory),...
Definition: ArrayRef.h:41
size_t size() const
size - Get the array size.
Definition: ArrayRef.h:168
size_t size() const
Definition: SmallVector.h:78
void push_back(const T &Elt)
Definition: SmallVector.h:413
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
Definition: SmallVector.h:1196
StringRef - Represent a constant reference to a string, i.e.
Definition: StringRef.h:51
constexpr size_t size() const
size - Get the string size.
Definition: StringRef.h:150
StringSet - A wrapper for StringMap that provides set-like functionality.
Definition: StringSet.h:23
std::pair< typename Base::iterator, bool > insert(StringRef key)
Definition: StringSet.h:38
void write(raw_ostream &OS, bool Compress=true)
Write encoded filenames to the given output stream.
CoverageFilenamesSectionWriter(ArrayRef< std::string > Filenames)
void write(raw_ostream &OS)
Write encoded coverage mapping data to the given output stream.
void write(raw_ostream &OS, TestingFormatVersion Version=TestingFormatVersion::CurrentVersion)
Encode to the given output stream.
This class implements an extremely fast bulk output stream that can only output to a stream.
Definition: raw_ostream.h:52
uint64_t tell() const
tell - Return the current offset with the file.
Definition: raw_ostream.h:147
raw_ostream & write(unsigned char C)
A raw_ostream that writes to an std::string.
Definition: raw_ostream.h:661
@ C
The default llvm calling convention, compatible with C.
Definition: CallingConv.h:34
unsigned ID
LLVM IR allows to use arbitrary numbers as calling convention identifiers.
Definition: CallingConv.h:24
void compress(ArrayRef< uint8_t > Input, SmallVectorImpl< uint8_t > &CompressedBuffer, int Level=DefaultCompression)
constexpr int BestSizeCompression
Definition: Compression.h:39
constexpr uint64_t TestingFormatMagic
This is an optimization pass for GlobalISel generic memory operations.
Definition: AddressRanges.h:18
void stable_sort(R &&Range)
Definition: STLExtras.h:2037
bool all_of(R &&range, UnaryPredicate P)
Provide wrappers to std::all_of which take ranges instead of having to pass begin/end explicitly.
Definition: STLExtras.h:1739
cl::opt< bool > DoInstrProfNameCompression
uint64_t offsetToAlignment(uint64_t Value, Align Alignment)
Returns the offset to the next integer (mod 2**64) that is greater than or equal to Value and is a mu...
Definition: Alignment.h:197
unsigned encodeULEB128(uint64_t Value, raw_ostream &OS, unsigned PadTo=0)
Utility function to encode a ULEB128 value to an output stream.
Definition: LEB128.h:80
#define N
This struct is a compact representation of a valid (non-zero power of two) alignment.
Definition: Alignment.h:39
A Counter mapping region associates a source range with a specific counter.
@ ExpansionRegion
An ExpansionRegion represents a file expansion region that associates a source range with the expansi...
@ MCDCDecisionRegion
A DecisionRegion represents a top-level boolean expression and is associated with a variable length b...
@ MCDCBranchRegion
A Branch Region can be extended to include IDs to facilitate MC/DC.
@ SkippedRegion
A SkippedRegion represents a source range with code that was skipped by a preprocessor or similar mea...
@ GapRegion
A GapRegion is like a CodeRegion, but its count is only set as the line execution count when its the ...
@ BranchRegion
A BranchRegion represents leaf-level boolean expressions and is associated with two counters,...
@ CodeRegion
A CodeRegion associates some code with a counter.
A Counter is an abstract value that describes how to compute the execution count for a region of code...
static const unsigned EncodingTagBits
static const unsigned EncodingCounterTagAndExpansionRegionTagBits
static Counter getExpression(unsigned ExpressionId)
Return the counter that corresponds to a specific addition counter expression.