1 //===- CoverageMapping.cpp - Code coverage mapping support ----------------===//
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
7 //===----------------------------------------------------------------------===//
9 // This file contains support for clang's and llvm's instrumentation based
12 //===----------------------------------------------------------------------===//
14 #include "llvm/ProfileData/Coverage/CoverageMapping.h"
15 #include "llvm/ADT/ArrayRef.h"
16 #include "llvm/ADT/DenseMap.h"
17 #include "llvm/ADT/SmallBitVector.h"
18 #include "llvm/ADT/SmallString.h"
19 #include "llvm/ADT/SmallVector.h"
20 #include "llvm/ADT/StringExtras.h"
21 #include "llvm/ADT/StringRef.h"
22 #include "llvm/Object/BuildID.h"
23 #include "llvm/ProfileData/Coverage/CoverageMappingReader.h"
24 #include "llvm/ProfileData/InstrProfReader.h"
25 #include "llvm/Support/Debug.h"
26 #include "llvm/Support/Errc.h"
27 #include "llvm/Support/Error.h"
28 #include "llvm/Support/ErrorHandling.h"
29 #include "llvm/Support/MemoryBuffer.h"
30 #include "llvm/Support/VirtualFileSystem.h"
31 #include "llvm/Support/raw_ostream.h"
40 #include <system_error>
45 using namespace coverage
;
47 #define DEBUG_TYPE "coverage-mapping"
49 Counter
CounterExpressionBuilder::get(const CounterExpression
&E
) {
50 auto It
= ExpressionIndices
.find(E
);
51 if (It
!= ExpressionIndices
.end())
52 return Counter::getExpression(It
->second
);
53 unsigned I
= Expressions
.size();
54 Expressions
.push_back(E
);
55 ExpressionIndices
[E
] = I
;
56 return Counter::getExpression(I
);
59 void CounterExpressionBuilder::extractTerms(Counter C
, int Factor
,
60 SmallVectorImpl
<Term
> &Terms
) {
61 switch (C
.getKind()) {
64 case Counter::CounterValueReference
:
65 Terms
.emplace_back(C
.getCounterID(), Factor
);
67 case Counter::Expression
:
68 const auto &E
= Expressions
[C
.getExpressionID()];
69 extractTerms(E
.LHS
, Factor
, Terms
);
71 E
.RHS
, E
.Kind
== CounterExpression::Subtract
? -Factor
: Factor
, Terms
);
76 Counter
CounterExpressionBuilder::simplify(Counter ExpressionTree
) {
77 // Gather constant terms.
78 SmallVector
<Term
, 32> Terms
;
79 extractTerms(ExpressionTree
, +1, Terms
);
81 // If there are no terms, this is just a zero. The algorithm below assumes at
83 if (Terms
.size() == 0)
84 return Counter::getZero();
86 // Group the terms by counter ID.
87 llvm::sort(Terms
, [](const Term
&LHS
, const Term
&RHS
) {
88 return LHS
.CounterID
< RHS
.CounterID
;
91 // Combine terms by counter ID to eliminate counters that sum to zero.
92 auto Prev
= Terms
.begin();
93 for (auto I
= Prev
+ 1, E
= Terms
.end(); I
!= E
; ++I
) {
94 if (I
->CounterID
== Prev
->CounterID
) {
95 Prev
->Factor
+= I
->Factor
;
101 Terms
.erase(++Prev
, Terms
.end());
104 // Create additions. We do this before subtractions to avoid constructs like
105 // ((0 - X) + Y), as opposed to (Y - X).
106 for (auto T
: Terms
) {
109 for (int I
= 0; I
< T
.Factor
; ++I
)
111 C
= Counter::getCounter(T
.CounterID
);
113 C
= get(CounterExpression(CounterExpression::Add
, C
,
114 Counter::getCounter(T
.CounterID
)));
117 // Create subtractions.
118 for (auto T
: Terms
) {
121 for (int I
= 0; I
< -T
.Factor
; ++I
)
122 C
= get(CounterExpression(CounterExpression::Subtract
, C
,
123 Counter::getCounter(T
.CounterID
)));
128 Counter
CounterExpressionBuilder::add(Counter LHS
, Counter RHS
, bool Simplify
) {
129 auto Cnt
= get(CounterExpression(CounterExpression::Add
, LHS
, RHS
));
130 return Simplify
? simplify(Cnt
) : Cnt
;
133 Counter
CounterExpressionBuilder::subtract(Counter LHS
, Counter RHS
,
135 auto Cnt
= get(CounterExpression(CounterExpression::Subtract
, LHS
, RHS
));
136 return Simplify
? simplify(Cnt
) : Cnt
;
139 void CounterMappingContext::dump(const Counter
&C
, raw_ostream
&OS
) const {
140 switch (C
.getKind()) {
144 case Counter::CounterValueReference
:
145 OS
<< '#' << C
.getCounterID();
147 case Counter::Expression
: {
148 if (C
.getExpressionID() >= Expressions
.size())
150 const auto &E
= Expressions
[C
.getExpressionID()];
153 OS
<< (E
.Kind
== CounterExpression::Subtract
? " - " : " + ");
159 if (CounterValues
.empty())
161 Expected
<int64_t> Value
= evaluate(C
);
162 if (auto E
= Value
.takeError()) {
163 consumeError(std::move(E
));
166 OS
<< '[' << *Value
<< ']';
169 Expected
<int64_t> CounterMappingContext::evaluate(const Counter
&C
) const {
177 } VisitCount
= KNeverVisited
;
180 std::stack
<StackElem
> CounterStack
;
181 CounterStack
.push({C
});
183 int64_t LastPoppedValue
;
185 while (!CounterStack
.empty()) {
186 StackElem
&Current
= CounterStack
.top();
188 switch (Current
.ICounter
.getKind()) {
193 case Counter::CounterValueReference
:
194 if (Current
.ICounter
.getCounterID() >= CounterValues
.size())
195 return errorCodeToError(errc::argument_out_of_domain
);
196 LastPoppedValue
= CounterValues
[Current
.ICounter
.getCounterID()];
199 case Counter::Expression
: {
200 if (Current
.ICounter
.getExpressionID() >= Expressions
.size())
201 return errorCodeToError(errc::argument_out_of_domain
);
202 const auto &E
= Expressions
[Current
.ICounter
.getExpressionID()];
203 if (Current
.VisitCount
== StackElem::KNeverVisited
) {
204 CounterStack
.push(StackElem
{E
.LHS
});
205 Current
.VisitCount
= StackElem::KVisitedOnce
;
206 } else if (Current
.VisitCount
== StackElem::KVisitedOnce
) {
207 Current
.LHS
= LastPoppedValue
;
208 CounterStack
.push(StackElem
{E
.RHS
});
209 Current
.VisitCount
= StackElem::KVisitedTwice
;
211 int64_t LHS
= Current
.LHS
;
212 int64_t RHS
= LastPoppedValue
;
214 E
.Kind
== CounterExpression::Subtract
? LHS
- RHS
: LHS
+ RHS
;
222 return LastPoppedValue
;
225 unsigned CounterMappingContext::getMaxCounterID(const Counter
&C
) const {
226 switch (C
.getKind()) {
229 case Counter::CounterValueReference
:
230 return C
.getCounterID();
231 case Counter::Expression
: {
232 if (C
.getExpressionID() >= Expressions
.size())
234 const auto &E
= Expressions
[C
.getExpressionID()];
235 return std::max(getMaxCounterID(E
.LHS
), getMaxCounterID(E
.RHS
));
238 llvm_unreachable("Unhandled CounterKind");
241 void FunctionRecordIterator::skipOtherFiles() {
242 while (Current
!= Records
.end() && !Filename
.empty() &&
243 Filename
!= Current
->Filenames
[0])
245 if (Current
== Records
.end())
246 *this = FunctionRecordIterator();
249 ArrayRef
<unsigned> CoverageMapping::getImpreciseRecordIndicesForFilename(
250 StringRef Filename
) const {
251 size_t FilenameHash
= hash_value(Filename
);
252 auto RecordIt
= FilenameHash2RecordIndices
.find(FilenameHash
);
253 if (RecordIt
== FilenameHash2RecordIndices
.end())
255 return RecordIt
->second
;
258 static unsigned getMaxCounterID(const CounterMappingContext
&Ctx
,
259 const CoverageMappingRecord
&Record
) {
260 unsigned MaxCounterID
= 0;
261 for (const auto &Region
: Record
.MappingRegions
) {
262 MaxCounterID
= std::max(MaxCounterID
, Ctx
.getMaxCounterID(Region
.Count
));
267 Error
CoverageMapping::loadFunctionRecord(
268 const CoverageMappingRecord
&Record
,
269 IndexedInstrProfReader
&ProfileReader
) {
270 StringRef OrigFuncName
= Record
.FunctionName
;
271 if (OrigFuncName
.empty())
272 return make_error
<CoverageMapError
>(coveragemap_error::malformed
,
273 "record function name is empty");
275 if (Record
.Filenames
.empty())
276 OrigFuncName
= getFuncNameWithoutPrefix(OrigFuncName
);
278 OrigFuncName
= getFuncNameWithoutPrefix(OrigFuncName
, Record
.Filenames
[0]);
280 CounterMappingContext
Ctx(Record
.Expressions
);
282 std::vector
<uint64_t> Counts
;
283 if (Error E
= ProfileReader
.getFunctionCounts(Record
.FunctionName
,
284 Record
.FunctionHash
, Counts
)) {
285 instrprof_error IPE
= std::get
<0>(InstrProfError::take(std::move(E
)));
286 if (IPE
== instrprof_error::hash_mismatch
) {
287 FuncHashMismatches
.emplace_back(std::string(Record
.FunctionName
),
288 Record
.FunctionHash
);
289 return Error::success();
290 } else if (IPE
!= instrprof_error::unknown_function
)
291 return make_error
<InstrProfError
>(IPE
);
292 Counts
.assign(getMaxCounterID(Ctx
, Record
) + 1, 0);
294 Ctx
.setCounts(Counts
);
296 assert(!Record
.MappingRegions
.empty() && "Function has no regions");
298 // This coverage record is a zero region for a function that's unused in
299 // some TU, but used in a different TU. Ignore it. The coverage maps from the
300 // the other TU will either be loaded (providing full region counts) or they
301 // won't (in which case we don't unintuitively report functions as uncovered
302 // when they have non-zero counts in the profile).
303 if (Record
.MappingRegions
.size() == 1 &&
304 Record
.MappingRegions
[0].Count
.isZero() && Counts
[0] > 0)
305 return Error::success();
307 FunctionRecord
Function(OrigFuncName
, Record
.Filenames
);
308 for (const auto &Region
: Record
.MappingRegions
) {
309 Expected
<int64_t> ExecutionCount
= Ctx
.evaluate(Region
.Count
);
310 if (auto E
= ExecutionCount
.takeError()) {
311 consumeError(std::move(E
));
312 return Error::success();
314 Expected
<int64_t> AltExecutionCount
= Ctx
.evaluate(Region
.FalseCount
);
315 if (auto E
= AltExecutionCount
.takeError()) {
316 consumeError(std::move(E
));
317 return Error::success();
319 Function
.pushRegion(Region
, *ExecutionCount
, *AltExecutionCount
);
322 // Don't create records for (filenames, function) pairs we've already seen.
323 auto FilenamesHash
= hash_combine_range(Record
.Filenames
.begin(),
324 Record
.Filenames
.end());
325 if (!RecordProvenance
[FilenamesHash
].insert(hash_value(OrigFuncName
)).second
)
326 return Error::success();
328 Functions
.push_back(std::move(Function
));
330 // Performance optimization: keep track of the indices of the function records
331 // which correspond to each filename. This can be used to substantially speed
332 // up queries for coverage info in a file.
333 unsigned RecordIndex
= Functions
.size() - 1;
334 for (StringRef Filename
: Record
.Filenames
) {
335 auto &RecordIndices
= FilenameHash2RecordIndices
[hash_value(Filename
)];
336 // Note that there may be duplicates in the filename set for a function
337 // record, because of e.g. macro expansions in the function in which both
338 // the macro and the function are defined in the same file.
339 if (RecordIndices
.empty() || RecordIndices
.back() != RecordIndex
)
340 RecordIndices
.push_back(RecordIndex
);
343 return Error::success();
346 // This function is for memory optimization by shortening the lifetimes
347 // of CoverageMappingReader instances.
348 Error
CoverageMapping::loadFromReaders(
349 ArrayRef
<std::unique_ptr
<CoverageMappingReader
>> CoverageReaders
,
350 IndexedInstrProfReader
&ProfileReader
, CoverageMapping
&Coverage
) {
351 for (const auto &CoverageReader
: CoverageReaders
) {
352 for (auto RecordOrErr
: *CoverageReader
) {
353 if (Error E
= RecordOrErr
.takeError())
355 const auto &Record
= *RecordOrErr
;
356 if (Error E
= Coverage
.loadFunctionRecord(Record
, ProfileReader
))
360 return Error::success();
363 Expected
<std::unique_ptr
<CoverageMapping
>> CoverageMapping::load(
364 ArrayRef
<std::unique_ptr
<CoverageMappingReader
>> CoverageReaders
,
365 IndexedInstrProfReader
&ProfileReader
) {
366 auto Coverage
= std::unique_ptr
<CoverageMapping
>(new CoverageMapping());
367 if (Error E
= loadFromReaders(CoverageReaders
, ProfileReader
, *Coverage
))
369 return std::move(Coverage
);
372 // If E is a no_data_found error, returns success. Otherwise returns E.
373 static Error
handleMaybeNoDataFoundError(Error E
) {
375 std::move(E
), [](const CoverageMapError
&CME
) {
376 if (CME
.get() == coveragemap_error::no_data_found
)
377 return static_cast<Error
>(Error::success());
378 return make_error
<CoverageMapError
>(CME
.get(), CME
.getMessage());
382 Error
CoverageMapping::loadFromFile(
383 StringRef Filename
, StringRef Arch
, StringRef CompilationDir
,
384 IndexedInstrProfReader
&ProfileReader
, CoverageMapping
&Coverage
,
385 bool &DataFound
, SmallVectorImpl
<object::BuildID
> *FoundBinaryIDs
) {
386 auto CovMappingBufOrErr
= MemoryBuffer::getFileOrSTDIN(
387 Filename
, /*IsText=*/false, /*RequiresNullTerminator=*/false);
388 if (std::error_code EC
= CovMappingBufOrErr
.getError())
389 return createFileError(Filename
, errorCodeToError(EC
));
390 MemoryBufferRef CovMappingBufRef
=
391 CovMappingBufOrErr
.get()->getMemBufferRef();
392 SmallVector
<std::unique_ptr
<MemoryBuffer
>, 4> Buffers
;
394 SmallVector
<object::BuildIDRef
> BinaryIDs
;
395 auto CoverageReadersOrErr
= BinaryCoverageReader::create(
396 CovMappingBufRef
, Arch
, Buffers
, CompilationDir
,
397 FoundBinaryIDs
? &BinaryIDs
: nullptr);
398 if (Error E
= CoverageReadersOrErr
.takeError()) {
399 E
= handleMaybeNoDataFoundError(std::move(E
));
401 return createFileError(Filename
, std::move(E
));
405 SmallVector
<std::unique_ptr
<CoverageMappingReader
>, 4> Readers
;
406 for (auto &Reader
: CoverageReadersOrErr
.get())
407 Readers
.push_back(std::move(Reader
));
408 if (FoundBinaryIDs
&& !Readers
.empty()) {
409 llvm::append_range(*FoundBinaryIDs
,
410 llvm::map_range(BinaryIDs
, [](object::BuildIDRef BID
) {
411 return object::BuildID(BID
);
414 DataFound
|= !Readers
.empty();
415 if (Error E
= loadFromReaders(Readers
, ProfileReader
, Coverage
))
416 return createFileError(Filename
, std::move(E
));
417 return Error::success();
420 Expected
<std::unique_ptr
<CoverageMapping
>> CoverageMapping::load(
421 ArrayRef
<StringRef
> ObjectFilenames
, StringRef ProfileFilename
,
422 vfs::FileSystem
&FS
, ArrayRef
<StringRef
> Arches
, StringRef CompilationDir
,
423 const object::BuildIDFetcher
*BIDFetcher
, bool CheckBinaryIDs
) {
424 auto ProfileReaderOrErr
= IndexedInstrProfReader::create(ProfileFilename
, FS
);
425 if (Error E
= ProfileReaderOrErr
.takeError())
426 return createFileError(ProfileFilename
, std::move(E
));
427 auto ProfileReader
= std::move(ProfileReaderOrErr
.get());
428 auto Coverage
= std::unique_ptr
<CoverageMapping
>(new CoverageMapping());
429 bool DataFound
= false;
431 auto GetArch
= [&](size_t Idx
) {
434 if (Arches
.size() == 1)
435 return Arches
.front();
439 SmallVector
<object::BuildID
> FoundBinaryIDs
;
440 for (const auto &File
: llvm::enumerate(ObjectFilenames
)) {
442 loadFromFile(File
.value(), GetArch(File
.index()), CompilationDir
,
443 *ProfileReader
, *Coverage
, DataFound
, &FoundBinaryIDs
))
448 std::vector
<object::BuildID
> ProfileBinaryIDs
;
449 if (Error E
= ProfileReader
->readBinaryIds(ProfileBinaryIDs
))
450 return createFileError(ProfileFilename
, std::move(E
));
452 SmallVector
<object::BuildIDRef
> BinaryIDsToFetch
;
453 if (!ProfileBinaryIDs
.empty()) {
454 const auto &Compare
= [](object::BuildIDRef A
, object::BuildIDRef B
) {
455 return std::lexicographical_compare(A
.begin(), A
.end(), B
.begin(),
458 llvm::sort(FoundBinaryIDs
, Compare
);
460 ProfileBinaryIDs
.begin(), ProfileBinaryIDs
.end(),
461 FoundBinaryIDs
.begin(), FoundBinaryIDs
.end(),
462 std::inserter(BinaryIDsToFetch
, BinaryIDsToFetch
.end()), Compare
);
465 for (object::BuildIDRef BinaryID
: BinaryIDsToFetch
) {
466 std::optional
<std::string
> PathOpt
= BIDFetcher
->fetch(BinaryID
);
468 std::string Path
= std::move(*PathOpt
);
469 StringRef Arch
= Arches
.size() == 1 ? Arches
.front() : StringRef();
470 if (Error E
= loadFromFile(Path
, Arch
, CompilationDir
, *ProfileReader
,
471 *Coverage
, DataFound
))
473 } else if (CheckBinaryIDs
) {
474 return createFileError(
476 createStringError(errc::no_such_file_or_directory
,
477 "Missing binary ID: " +
478 llvm::toHex(BinaryID
, /*LowerCase=*/true)));
484 return createFileError(
485 join(ObjectFilenames
.begin(), ObjectFilenames
.end(), ", "),
486 make_error
<CoverageMapError
>(coveragemap_error::no_data_found
));
487 return std::move(Coverage
);
492 /// Distributes functions into instantiation sets.
494 /// An instantiation set is a collection of functions that have the same source
495 /// code, ie, template functions specializations.
496 class FunctionInstantiationSetCollector
{
497 using MapT
= std::map
<LineColPair
, std::vector
<const FunctionRecord
*>>;
498 MapT InstantiatedFunctions
;
501 void insert(const FunctionRecord
&Function
, unsigned FileID
) {
502 auto I
= Function
.CountedRegions
.begin(), E
= Function
.CountedRegions
.end();
503 while (I
!= E
&& I
->FileID
!= FileID
)
505 assert(I
!= E
&& "function does not cover the given file");
506 auto &Functions
= InstantiatedFunctions
[I
->startLoc()];
507 Functions
.push_back(&Function
);
510 MapT::iterator
begin() { return InstantiatedFunctions
.begin(); }
511 MapT::iterator
end() { return InstantiatedFunctions
.end(); }
514 class SegmentBuilder
{
515 std::vector
<CoverageSegment
> &Segments
;
516 SmallVector
<const CountedRegion
*, 8> ActiveRegions
;
518 SegmentBuilder(std::vector
<CoverageSegment
> &Segments
) : Segments(Segments
) {}
520 /// Emit a segment with the count from \p Region starting at \p StartLoc.
522 /// \p IsRegionEntry: The segment is at the start of a new non-gap region.
523 /// \p EmitSkippedRegion: The segment must be emitted as a skipped region.
524 void startSegment(const CountedRegion
&Region
, LineColPair StartLoc
,
525 bool IsRegionEntry
, bool EmitSkippedRegion
= false) {
526 bool HasCount
= !EmitSkippedRegion
&&
527 (Region
.Kind
!= CounterMappingRegion::SkippedRegion
);
529 // If the new segment wouldn't affect coverage rendering, skip it.
530 if (!Segments
.empty() && !IsRegionEntry
&& !EmitSkippedRegion
) {
531 const auto &Last
= Segments
.back();
532 if (Last
.HasCount
== HasCount
&& Last
.Count
== Region
.ExecutionCount
&&
538 Segments
.emplace_back(StartLoc
.first
, StartLoc
.second
,
539 Region
.ExecutionCount
, IsRegionEntry
,
540 Region
.Kind
== CounterMappingRegion::GapRegion
);
542 Segments
.emplace_back(StartLoc
.first
, StartLoc
.second
, IsRegionEntry
);
545 const auto &Last
= Segments
.back();
546 dbgs() << "Segment at " << Last
.Line
<< ":" << Last
.Col
547 << " (count = " << Last
.Count
<< ")"
548 << (Last
.IsRegionEntry
? ", RegionEntry" : "")
549 << (!Last
.HasCount
? ", Skipped" : "")
550 << (Last
.IsGapRegion
? ", Gap" : "") << "\n";
554 /// Emit segments for active regions which end before \p Loc.
556 /// \p Loc: The start location of the next region. If std::nullopt, all active
557 /// regions are completed.
558 /// \p FirstCompletedRegion: Index of the first completed region.
559 void completeRegionsUntil(std::optional
<LineColPair
> Loc
,
560 unsigned FirstCompletedRegion
) {
561 // Sort the completed regions by end location. This makes it simple to
562 // emit closing segments in sorted order.
563 auto CompletedRegionsIt
= ActiveRegions
.begin() + FirstCompletedRegion
;
564 std::stable_sort(CompletedRegionsIt
, ActiveRegions
.end(),
565 [](const CountedRegion
*L
, const CountedRegion
*R
) {
566 return L
->endLoc() < R
->endLoc();
569 // Emit segments for all completed regions.
570 for (unsigned I
= FirstCompletedRegion
+ 1, E
= ActiveRegions
.size(); I
< E
;
572 const auto *CompletedRegion
= ActiveRegions
[I
];
573 assert((!Loc
|| CompletedRegion
->endLoc() <= *Loc
) &&
574 "Completed region ends after start of new region");
576 const auto *PrevCompletedRegion
= ActiveRegions
[I
- 1];
577 auto CompletedSegmentLoc
= PrevCompletedRegion
->endLoc();
579 // Don't emit any more segments if they start where the new region begins.
580 if (Loc
&& CompletedSegmentLoc
== *Loc
)
583 // Don't emit a segment if the next completed region ends at the same
584 // location as this one.
585 if (CompletedSegmentLoc
== CompletedRegion
->endLoc())
588 // Use the count from the last completed region which ends at this loc.
589 for (unsigned J
= I
+ 1; J
< E
; ++J
)
590 if (CompletedRegion
->endLoc() == ActiveRegions
[J
]->endLoc())
591 CompletedRegion
= ActiveRegions
[J
];
593 startSegment(*CompletedRegion
, CompletedSegmentLoc
, false);
596 auto Last
= ActiveRegions
.back();
597 if (FirstCompletedRegion
&& Last
->endLoc() != *Loc
) {
598 // If there's a gap after the end of the last completed region and the
599 // start of the new region, use the last active region to fill the gap.
600 startSegment(*ActiveRegions
[FirstCompletedRegion
- 1], Last
->endLoc(),
602 } else if (!FirstCompletedRegion
&& (!Loc
|| *Loc
!= Last
->endLoc())) {
603 // Emit a skipped segment if there are no more active regions. This
604 // ensures that gaps between functions are marked correctly.
605 startSegment(*Last
, Last
->endLoc(), false, true);
608 // Pop the completed regions.
609 ActiveRegions
.erase(CompletedRegionsIt
, ActiveRegions
.end());
612 void buildSegmentsImpl(ArrayRef
<CountedRegion
> Regions
) {
613 for (const auto &CR
: enumerate(Regions
)) {
614 auto CurStartLoc
= CR
.value().startLoc();
616 // Active regions which end before the current region need to be popped.
617 auto CompletedRegions
=
618 std::stable_partition(ActiveRegions
.begin(), ActiveRegions
.end(),
619 [&](const CountedRegion
*Region
) {
620 return !(Region
->endLoc() <= CurStartLoc
);
622 if (CompletedRegions
!= ActiveRegions
.end()) {
623 unsigned FirstCompletedRegion
=
624 std::distance(ActiveRegions
.begin(), CompletedRegions
);
625 completeRegionsUntil(CurStartLoc
, FirstCompletedRegion
);
628 bool GapRegion
= CR
.value().Kind
== CounterMappingRegion::GapRegion
;
630 // Try to emit a segment for the current region.
631 if (CurStartLoc
== CR
.value().endLoc()) {
632 // Avoid making zero-length regions active. If it's the last region,
633 // emit a skipped segment. Otherwise use its predecessor's count.
635 (CR
.index() + 1) == Regions
.size() ||
636 CR
.value().Kind
== CounterMappingRegion::SkippedRegion
;
637 startSegment(ActiveRegions
.empty() ? CR
.value() : *ActiveRegions
.back(),
638 CurStartLoc
, !GapRegion
, Skipped
);
639 // If it is skipped segment, create a segment with last pushed
640 // regions's count at CurStartLoc.
641 if (Skipped
&& !ActiveRegions
.empty())
642 startSegment(*ActiveRegions
.back(), CurStartLoc
, false);
645 if (CR
.index() + 1 == Regions
.size() ||
646 CurStartLoc
!= Regions
[CR
.index() + 1].startLoc()) {
647 // Emit a segment if the next region doesn't start at the same location
649 startSegment(CR
.value(), CurStartLoc
, !GapRegion
);
652 // This region is active (i.e not completed).
653 ActiveRegions
.push_back(&CR
.value());
656 // Complete any remaining active regions.
657 if (!ActiveRegions
.empty())
658 completeRegionsUntil(std::nullopt
, 0);
661 /// Sort a nested sequence of regions from a single file.
662 static void sortNestedRegions(MutableArrayRef
<CountedRegion
> Regions
) {
663 llvm::sort(Regions
, [](const CountedRegion
&LHS
, const CountedRegion
&RHS
) {
664 if (LHS
.startLoc() != RHS
.startLoc())
665 return LHS
.startLoc() < RHS
.startLoc();
666 if (LHS
.endLoc() != RHS
.endLoc())
667 // When LHS completely contains RHS, we sort LHS first.
668 return RHS
.endLoc() < LHS
.endLoc();
669 // If LHS and RHS cover the same area, we need to sort them according
670 // to their kinds so that the most suitable region will become "active"
671 // in combineRegions(). Because we accumulate counter values only from
672 // regions of the same kind as the first region of the area, prefer
673 // CodeRegion to ExpansionRegion and ExpansionRegion to SkippedRegion.
674 static_assert(CounterMappingRegion::CodeRegion
<
675 CounterMappingRegion::ExpansionRegion
&&
676 CounterMappingRegion::ExpansionRegion
<
677 CounterMappingRegion::SkippedRegion
,
678 "Unexpected order of region kind values");
679 return LHS
.Kind
< RHS
.Kind
;
683 /// Combine counts of regions which cover the same area.
684 static ArrayRef
<CountedRegion
>
685 combineRegions(MutableArrayRef
<CountedRegion
> Regions
) {
688 auto Active
= Regions
.begin();
689 auto End
= Regions
.end();
690 for (auto I
= Regions
.begin() + 1; I
!= End
; ++I
) {
691 if (Active
->startLoc() != I
->startLoc() ||
692 Active
->endLoc() != I
->endLoc()) {
693 // Shift to the next region.
699 // Merge duplicate region.
700 // If CodeRegions and ExpansionRegions cover the same area, it's probably
701 // a macro which is fully expanded to another macro. In that case, we need
702 // to accumulate counts only from CodeRegions, or else the area will be
704 // On the other hand, a macro may have a nested macro in its body. If the
705 // outer macro is used several times, the ExpansionRegion for the nested
706 // macro will also be added several times. These ExpansionRegions cover
707 // the same source locations and have to be combined to reach the correct
708 // value for that area.
709 // We add counts of the regions of the same kind as the active region
710 // to handle the both situations.
711 if (I
->Kind
== Active
->Kind
)
712 Active
->ExecutionCount
+= I
->ExecutionCount
;
714 return Regions
.drop_back(std::distance(++Active
, End
));
718 /// Build a sorted list of CoverageSegments from a list of Regions.
719 static std::vector
<CoverageSegment
>
720 buildSegments(MutableArrayRef
<CountedRegion
> Regions
) {
721 std::vector
<CoverageSegment
> Segments
;
722 SegmentBuilder
Builder(Segments
);
724 sortNestedRegions(Regions
);
725 ArrayRef
<CountedRegion
> CombinedRegions
= combineRegions(Regions
);
728 dbgs() << "Combined regions:\n";
729 for (const auto &CR
: CombinedRegions
)
730 dbgs() << " " << CR
.LineStart
<< ":" << CR
.ColumnStart
<< " -> "
731 << CR
.LineEnd
<< ":" << CR
.ColumnEnd
732 << " (count=" << CR
.ExecutionCount
<< ")\n";
735 Builder
.buildSegmentsImpl(CombinedRegions
);
738 for (unsigned I
= 1, E
= Segments
.size(); I
< E
; ++I
) {
739 const auto &L
= Segments
[I
- 1];
740 const auto &R
= Segments
[I
];
741 if (!(L
.Line
< R
.Line
) && !(L
.Line
== R
.Line
&& L
.Col
< R
.Col
)) {
742 if (L
.Line
== R
.Line
&& L
.Col
== R
.Col
&& !L
.HasCount
)
744 LLVM_DEBUG(dbgs() << " ! Segment " << L
.Line
<< ":" << L
.Col
745 << " followed by " << R
.Line
<< ":" << R
.Col
<< "\n");
746 assert(false && "Coverage segments not unique or sorted");
755 } // end anonymous namespace
757 std::vector
<StringRef
> CoverageMapping::getUniqueSourceFiles() const {
758 std::vector
<StringRef
> Filenames
;
759 for (const auto &Function
: getCoveredFunctions())
760 llvm::append_range(Filenames
, Function
.Filenames
);
761 llvm::sort(Filenames
);
762 auto Last
= std::unique(Filenames
.begin(), Filenames
.end());
763 Filenames
.erase(Last
, Filenames
.end());
767 static SmallBitVector
gatherFileIDs(StringRef SourceFile
,
768 const FunctionRecord
&Function
) {
769 SmallBitVector
FilenameEquivalence(Function
.Filenames
.size(), false);
770 for (unsigned I
= 0, E
= Function
.Filenames
.size(); I
< E
; ++I
)
771 if (SourceFile
== Function
.Filenames
[I
])
772 FilenameEquivalence
[I
] = true;
773 return FilenameEquivalence
;
776 /// Return the ID of the file where the definition of the function is located.
777 static std::optional
<unsigned>
778 findMainViewFileID(const FunctionRecord
&Function
) {
779 SmallBitVector
IsNotExpandedFile(Function
.Filenames
.size(), true);
780 for (const auto &CR
: Function
.CountedRegions
)
781 if (CR
.Kind
== CounterMappingRegion::ExpansionRegion
)
782 IsNotExpandedFile
[CR
.ExpandedFileID
] = false;
783 int I
= IsNotExpandedFile
.find_first();
789 /// Check if SourceFile is the file that contains the definition of
790 /// the Function. Return the ID of the file in that case or std::nullopt
792 static std::optional
<unsigned>
793 findMainViewFileID(StringRef SourceFile
, const FunctionRecord
&Function
) {
794 std::optional
<unsigned> I
= findMainViewFileID(Function
);
795 if (I
&& SourceFile
== Function
.Filenames
[*I
])
800 static bool isExpansion(const CountedRegion
&R
, unsigned FileID
) {
801 return R
.Kind
== CounterMappingRegion::ExpansionRegion
&& R
.FileID
== FileID
;
804 CoverageData
CoverageMapping::getCoverageForFile(StringRef Filename
) const {
805 CoverageData
FileCoverage(Filename
);
806 std::vector
<CountedRegion
> Regions
;
808 // Look up the function records in the given file. Due to hash collisions on
809 // the filename, we may get back some records that are not in the file.
810 ArrayRef
<unsigned> RecordIndices
=
811 getImpreciseRecordIndicesForFilename(Filename
);
812 for (unsigned RecordIndex
: RecordIndices
) {
813 const FunctionRecord
&Function
= Functions
[RecordIndex
];
814 auto MainFileID
= findMainViewFileID(Filename
, Function
);
815 auto FileIDs
= gatherFileIDs(Filename
, Function
);
816 for (const auto &CR
: Function
.CountedRegions
)
817 if (FileIDs
.test(CR
.FileID
)) {
818 Regions
.push_back(CR
);
819 if (MainFileID
&& isExpansion(CR
, *MainFileID
))
820 FileCoverage
.Expansions
.emplace_back(CR
, Function
);
822 // Capture branch regions specific to the function (excluding expansions).
823 for (const auto &CR
: Function
.CountedBranchRegions
)
824 if (FileIDs
.test(CR
.FileID
) && (CR
.FileID
== CR
.ExpandedFileID
))
825 FileCoverage
.BranchRegions
.push_back(CR
);
828 LLVM_DEBUG(dbgs() << "Emitting segments for file: " << Filename
<< "\n");
829 FileCoverage
.Segments
= SegmentBuilder::buildSegments(Regions
);
834 std::vector
<InstantiationGroup
>
835 CoverageMapping::getInstantiationGroups(StringRef Filename
) const {
836 FunctionInstantiationSetCollector InstantiationSetCollector
;
837 // Look up the function records in the given file. Due to hash collisions on
838 // the filename, we may get back some records that are not in the file.
839 ArrayRef
<unsigned> RecordIndices
=
840 getImpreciseRecordIndicesForFilename(Filename
);
841 for (unsigned RecordIndex
: RecordIndices
) {
842 const FunctionRecord
&Function
= Functions
[RecordIndex
];
843 auto MainFileID
= findMainViewFileID(Filename
, Function
);
846 InstantiationSetCollector
.insert(Function
, *MainFileID
);
849 std::vector
<InstantiationGroup
> Result
;
850 for (auto &InstantiationSet
: InstantiationSetCollector
) {
851 InstantiationGroup IG
{InstantiationSet
.first
.first
,
852 InstantiationSet
.first
.second
,
853 std::move(InstantiationSet
.second
)};
854 Result
.emplace_back(std::move(IG
));
860 CoverageMapping::getCoverageForFunction(const FunctionRecord
&Function
) const {
861 auto MainFileID
= findMainViewFileID(Function
);
863 return CoverageData();
865 CoverageData
FunctionCoverage(Function
.Filenames
[*MainFileID
]);
866 std::vector
<CountedRegion
> Regions
;
867 for (const auto &CR
: Function
.CountedRegions
)
868 if (CR
.FileID
== *MainFileID
) {
869 Regions
.push_back(CR
);
870 if (isExpansion(CR
, *MainFileID
))
871 FunctionCoverage
.Expansions
.emplace_back(CR
, Function
);
873 // Capture branch regions specific to the function (excluding expansions).
874 for (const auto &CR
: Function
.CountedBranchRegions
)
875 if (CR
.FileID
== *MainFileID
)
876 FunctionCoverage
.BranchRegions
.push_back(CR
);
878 LLVM_DEBUG(dbgs() << "Emitting segments for function: " << Function
.Name
880 FunctionCoverage
.Segments
= SegmentBuilder::buildSegments(Regions
);
882 return FunctionCoverage
;
885 CoverageData
CoverageMapping::getCoverageForExpansion(
886 const ExpansionRecord
&Expansion
) const {
887 CoverageData
ExpansionCoverage(
888 Expansion
.Function
.Filenames
[Expansion
.FileID
]);
889 std::vector
<CountedRegion
> Regions
;
890 for (const auto &CR
: Expansion
.Function
.CountedRegions
)
891 if (CR
.FileID
== Expansion
.FileID
) {
892 Regions
.push_back(CR
);
893 if (isExpansion(CR
, Expansion
.FileID
))
894 ExpansionCoverage
.Expansions
.emplace_back(CR
, Expansion
.Function
);
896 for (const auto &CR
: Expansion
.Function
.CountedBranchRegions
)
897 // Capture branch regions that only pertain to the corresponding expansion.
898 if (CR
.FileID
== Expansion
.FileID
)
899 ExpansionCoverage
.BranchRegions
.push_back(CR
);
901 LLVM_DEBUG(dbgs() << "Emitting segments for expansion of file "
902 << Expansion
.FileID
<< "\n");
903 ExpansionCoverage
.Segments
= SegmentBuilder::buildSegments(Regions
);
905 return ExpansionCoverage
;
908 LineCoverageStats::LineCoverageStats(
909 ArrayRef
<const CoverageSegment
*> LineSegments
,
910 const CoverageSegment
*WrappedSegment
, unsigned Line
)
911 : ExecutionCount(0), HasMultipleRegions(false), Mapped(false), Line(Line
),
912 LineSegments(LineSegments
), WrappedSegment(WrappedSegment
) {
913 // Find the minimum number of regions which start in this line.
914 unsigned MinRegionCount
= 0;
915 auto isStartOfRegion
= [](const CoverageSegment
*S
) {
916 return !S
->IsGapRegion
&& S
->HasCount
&& S
->IsRegionEntry
;
918 for (unsigned I
= 0; I
< LineSegments
.size() && MinRegionCount
< 2; ++I
)
919 if (isStartOfRegion(LineSegments
[I
]))
922 bool StartOfSkippedRegion
= !LineSegments
.empty() &&
923 !LineSegments
.front()->HasCount
&&
924 LineSegments
.front()->IsRegionEntry
;
926 HasMultipleRegions
= MinRegionCount
> 1;
928 !StartOfSkippedRegion
&&
929 ((WrappedSegment
&& WrappedSegment
->HasCount
) || (MinRegionCount
> 0));
934 // Pick the max count from the non-gap, region entry segments and the
937 ExecutionCount
= WrappedSegment
->Count
;
940 for (const auto *LS
: LineSegments
)
941 if (isStartOfRegion(LS
))
942 ExecutionCount
= std::max(ExecutionCount
, LS
->Count
);
945 LineCoverageIterator
&LineCoverageIterator::operator++() {
946 if (Next
== CD
.end()) {
947 Stats
= LineCoverageStats();
952 WrappedSegment
= Segments
.back();
954 while (Next
!= CD
.end() && Next
->Line
== Line
)
955 Segments
.push_back(&*Next
++);
956 Stats
= LineCoverageStats(Segments
, WrappedSegment
, Line
);
961 static std::string
getCoverageMapErrString(coveragemap_error Err
,
962 const std::string
&ErrMsg
= "") {
964 raw_string_ostream
OS(Msg
);
967 case coveragemap_error::success
:
970 case coveragemap_error::eof
:
973 case coveragemap_error::no_data_found
:
974 OS
<< "no coverage data found";
976 case coveragemap_error::unsupported_version
:
977 OS
<< "unsupported coverage format version";
979 case coveragemap_error::truncated
:
980 OS
<< "truncated coverage data";
982 case coveragemap_error::malformed
:
983 OS
<< "malformed coverage data";
985 case coveragemap_error::decompression_failed
:
986 OS
<< "failed to decompress coverage data (zlib)";
988 case coveragemap_error::invalid_or_missing_arch_specifier
:
989 OS
<< "`-arch` specifier is invalid or missing for universal binary";
993 // If optional error message is not empty, append it to the message.
995 OS
<< ": " << ErrMsg
;
1002 // FIXME: This class is only here to support the transition to llvm::Error. It
1003 // will be removed once this transition is complete. Clients should prefer to
1004 // deal with the Error value directly, rather than converting to error_code.
1005 class CoverageMappingErrorCategoryType
: public std::error_category
{
1006 const char *name() const noexcept override
{ return "llvm.coveragemap"; }
1007 std::string
message(int IE
) const override
{
1008 return getCoverageMapErrString(static_cast<coveragemap_error
>(IE
));
1012 } // end anonymous namespace
1014 std::string
CoverageMapError::message() const {
1015 return getCoverageMapErrString(Err
, Msg
);
1018 const std::error_category
&llvm::coverage::coveragemap_category() {
1019 static CoverageMappingErrorCategoryType ErrorCategory
;
1020 return ErrorCategory
;
1023 char CoverageMapError::ID
= 0;