xref: /llvm-project/llvm/lib/ProfileData/Coverage/CoverageMapping.cpp (revision 68216d7bd3863ad25be934e91fbfbba8b35b641e)
1 //=-- CoverageMapping.cpp - Code coverage mapping support ---------*- C++ -*-=//
2 //
3 //                     The LLVM Compiler Infrastructure
4 //
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
7 //
8 //===----------------------------------------------------------------------===//
9 //
10 // This file contains support for clang's and llvm's instrumentation based
11 // code coverage.
12 //
13 //===----------------------------------------------------------------------===//
14 
15 #include "llvm/ProfileData/Coverage/CoverageMapping.h"
16 #include "llvm/ADT/DenseMap.h"
17 #include "llvm/ADT/Optional.h"
18 #include "llvm/ADT/SmallBitVector.h"
19 #include "llvm/ProfileData/Coverage/CoverageMappingReader.h"
20 #include "llvm/ProfileData/InstrProfReader.h"
21 #include "llvm/Support/Debug.h"
22 #include "llvm/Support/Errc.h"
23 #include "llvm/Support/ErrorHandling.h"
24 #include "llvm/Support/ManagedStatic.h"
25 #include "llvm/Support/Path.h"
26 #include "llvm/Support/raw_ostream.h"
27 
28 using namespace llvm;
29 using namespace coverage;
30 
31 #define DEBUG_TYPE "coverage-mapping"
32 
33 Counter CounterExpressionBuilder::get(const CounterExpression &E) {
34   auto It = ExpressionIndices.find(E);
35   if (It != ExpressionIndices.end())
36     return Counter::getExpression(It->second);
37   unsigned I = Expressions.size();
38   Expressions.push_back(E);
39   ExpressionIndices[E] = I;
40   return Counter::getExpression(I);
41 }
42 
43 void CounterExpressionBuilder::extractTerms(
44     Counter C, int Sign, SmallVectorImpl<std::pair<unsigned, int>> &Terms) {
45   switch (C.getKind()) {
46   case Counter::Zero:
47     break;
48   case Counter::CounterValueReference:
49     Terms.push_back(std::make_pair(C.getCounterID(), Sign));
50     break;
51   case Counter::Expression:
52     const auto &E = Expressions[C.getExpressionID()];
53     extractTerms(E.LHS, Sign, Terms);
54     extractTerms(E.RHS, E.Kind == CounterExpression::Subtract ? -Sign : Sign,
55                  Terms);
56     break;
57   }
58 }
59 
60 Counter CounterExpressionBuilder::simplify(Counter ExpressionTree) {
61   // Gather constant terms.
62   llvm::SmallVector<std::pair<unsigned, int>, 32> Terms;
63   extractTerms(ExpressionTree, +1, Terms);
64 
65   // If there are no terms, this is just a zero. The algorithm below assumes at
66   // least one term.
67   if (Terms.size() == 0)
68     return Counter::getZero();
69 
70   // Group the terms by counter ID.
71   std::sort(Terms.begin(), Terms.end(),
72             [](const std::pair<unsigned, int> &LHS,
73                const std::pair<unsigned, int> &RHS) {
74     return LHS.first < RHS.first;
75   });
76 
77   // Combine terms by counter ID to eliminate counters that sum to zero.
78   auto Prev = Terms.begin();
79   for (auto I = Prev + 1, E = Terms.end(); I != E; ++I) {
80     if (I->first == Prev->first) {
81       Prev->second += I->second;
82       continue;
83     }
84     ++Prev;
85     *Prev = *I;
86   }
87   Terms.erase(++Prev, Terms.end());
88 
89   Counter C;
90   // Create additions. We do this before subtractions to avoid constructs like
91   // ((0 - X) + Y), as opposed to (Y - X).
92   for (auto Term : Terms) {
93     if (Term.second <= 0)
94       continue;
95     for (int I = 0; I < Term.second; ++I)
96       if (C.isZero())
97         C = Counter::getCounter(Term.first);
98       else
99         C = get(CounterExpression(CounterExpression::Add, C,
100                                   Counter::getCounter(Term.first)));
101   }
102 
103   // Create subtractions.
104   for (auto Term : Terms) {
105     if (Term.second >= 0)
106       continue;
107     for (int I = 0; I < -Term.second; ++I)
108       C = get(CounterExpression(CounterExpression::Subtract, C,
109                                 Counter::getCounter(Term.first)));
110   }
111   return C;
112 }
113 
114 Counter CounterExpressionBuilder::add(Counter LHS, Counter RHS) {
115   return simplify(get(CounterExpression(CounterExpression::Add, LHS, RHS)));
116 }
117 
118 Counter CounterExpressionBuilder::subtract(Counter LHS, Counter RHS) {
119   return simplify(
120       get(CounterExpression(CounterExpression::Subtract, LHS, RHS)));
121 }
122 
123 void CounterMappingContext::dump(const Counter &C,
124                                  llvm::raw_ostream &OS) const {
125   switch (C.getKind()) {
126   case Counter::Zero:
127     OS << '0';
128     return;
129   case Counter::CounterValueReference:
130     OS << '#' << C.getCounterID();
131     break;
132   case Counter::Expression: {
133     if (C.getExpressionID() >= Expressions.size())
134       return;
135     const auto &E = Expressions[C.getExpressionID()];
136     OS << '(';
137     dump(E.LHS, OS);
138     OS << (E.Kind == CounterExpression::Subtract ? " - " : " + ");
139     dump(E.RHS, OS);
140     OS << ')';
141     break;
142   }
143   }
144   if (CounterValues.empty())
145     return;
146   Expected<int64_t> Value = evaluate(C);
147   if (auto E = Value.takeError()) {
148     llvm::consumeError(std::move(E));
149     return;
150   }
151   OS << '[' << *Value << ']';
152 }
153 
154 Expected<int64_t> CounterMappingContext::evaluate(const Counter &C) const {
155   switch (C.getKind()) {
156   case Counter::Zero:
157     return 0;
158   case Counter::CounterValueReference:
159     if (C.getCounterID() >= CounterValues.size())
160       return errorCodeToError(errc::argument_out_of_domain);
161     return CounterValues[C.getCounterID()];
162   case Counter::Expression: {
163     if (C.getExpressionID() >= Expressions.size())
164       return errorCodeToError(errc::argument_out_of_domain);
165     const auto &E = Expressions[C.getExpressionID()];
166     Expected<int64_t> LHS = evaluate(E.LHS);
167     if (!LHS)
168       return LHS;
169     Expected<int64_t> RHS = evaluate(E.RHS);
170     if (!RHS)
171       return RHS;
172     return E.Kind == CounterExpression::Subtract ? *LHS - *RHS : *LHS + *RHS;
173   }
174   }
175   llvm_unreachable("Unhandled CounterKind");
176 }
177 
178 void FunctionRecordIterator::skipOtherFiles() {
179   while (Current != Records.end() && !Filename.empty() &&
180          Filename != Current->Filenames[0])
181     ++Current;
182   if (Current == Records.end())
183     *this = FunctionRecordIterator();
184 }
185 
186 Error CoverageMapping::loadFunctionRecord(
187     const CoverageMappingRecord &Record,
188     IndexedInstrProfReader &ProfileReader) {
189   CounterMappingContext Ctx(Record.Expressions);
190 
191   std::vector<uint64_t> Counts;
192   if (Error E = ProfileReader.getFunctionCounts(Record.FunctionName,
193                                                 Record.FunctionHash, Counts)) {
194     instrprof_error IPE = InstrProfError::take(std::move(E));
195     if (IPE == instrprof_error::hash_mismatch) {
196       MismatchedFunctionCount++;
197       return Error::success();
198     } else if (IPE != instrprof_error::unknown_function)
199       return make_error<InstrProfError>(IPE);
200     Counts.assign(Record.MappingRegions.size(), 0);
201   }
202   Ctx.setCounts(Counts);
203 
204   assert(!Record.MappingRegions.empty() && "Function has no regions");
205 
206   StringRef OrigFuncName = Record.FunctionName;
207   if (Record.Filenames.empty())
208     OrigFuncName = getFuncNameWithoutPrefix(OrigFuncName);
209   else
210     OrigFuncName = getFuncNameWithoutPrefix(OrigFuncName, Record.Filenames[0]);
211   FunctionRecord Function(OrigFuncName, Record.Filenames);
212   for (const auto &Region : Record.MappingRegions) {
213     Expected<int64_t> ExecutionCount = Ctx.evaluate(Region.Count);
214     if (auto E = ExecutionCount.takeError()) {
215       llvm::consumeError(std::move(E));
216       return Error::success();
217     }
218     Function.pushRegion(Region, *ExecutionCount);
219   }
220   if (Function.CountedRegions.size() != Record.MappingRegions.size()) {
221     MismatchedFunctionCount++;
222     return Error::success();
223   }
224 
225   Functions.push_back(std::move(Function));
226   return Error::success();
227 }
228 
229 Expected<std::unique_ptr<CoverageMapping>>
230 CoverageMapping::load(CoverageMappingReader &CoverageReader,
231                       IndexedInstrProfReader &ProfileReader) {
232   auto Coverage = std::unique_ptr<CoverageMapping>(new CoverageMapping());
233 
234   for (const auto &Record : CoverageReader)
235     if (Error E = Coverage->loadFunctionRecord(Record, ProfileReader))
236       return std::move(E);
237 
238   return std::move(Coverage);
239 }
240 
241 Expected<std::unique_ptr<CoverageMapping>>
242 CoverageMapping::load(StringRef ObjectFilename, StringRef ProfileFilename,
243                       StringRef Arch) {
244   auto CounterMappingBuff = MemoryBuffer::getFileOrSTDIN(ObjectFilename);
245   if (std::error_code EC = CounterMappingBuff.getError())
246     return errorCodeToError(EC);
247   auto CoverageReaderOrErr =
248       BinaryCoverageReader::create(CounterMappingBuff.get(), Arch);
249   if (Error E = CoverageReaderOrErr.takeError())
250     return std::move(E);
251   auto CoverageReader = std::move(CoverageReaderOrErr.get());
252   auto ProfileReaderOrErr = IndexedInstrProfReader::create(ProfileFilename);
253   if (Error E = ProfileReaderOrErr.takeError())
254     return std::move(E);
255   auto ProfileReader = std::move(ProfileReaderOrErr.get());
256   return load(*CoverageReader, *ProfileReader);
257 }
258 
259 namespace {
260 /// \brief Distributes functions into instantiation sets.
261 ///
262 /// An instantiation set is a collection of functions that have the same source
263 /// code, ie, template functions specializations.
264 class FunctionInstantiationSetCollector {
265   typedef DenseMap<std::pair<unsigned, unsigned>,
266                    std::vector<const FunctionRecord *>> MapT;
267   MapT InstantiatedFunctions;
268 
269 public:
270   void insert(const FunctionRecord &Function, unsigned FileID) {
271     auto I = Function.CountedRegions.begin(), E = Function.CountedRegions.end();
272     while (I != E && I->FileID != FileID)
273       ++I;
274     assert(I != E && "function does not cover the given file");
275     auto &Functions = InstantiatedFunctions[I->startLoc()];
276     Functions.push_back(&Function);
277   }
278 
279   MapT::iterator begin() { return InstantiatedFunctions.begin(); }
280 
281   MapT::iterator end() { return InstantiatedFunctions.end(); }
282 };
283 
284 class SegmentBuilder {
285   std::vector<CoverageSegment> &Segments;
286   SmallVector<const CountedRegion *, 8> ActiveRegions;
287 
288   SegmentBuilder(std::vector<CoverageSegment> &Segments) : Segments(Segments) {}
289 
290   /// Start a segment with no count specified.
291   void startSegment(unsigned Line, unsigned Col) {
292     DEBUG(dbgs() << "Top level segment at " << Line << ":" << Col << "\n");
293     Segments.emplace_back(Line, Col, /*IsRegionEntry=*/false);
294   }
295 
296   /// Start a segment with the given Region's count.
297   void startSegment(unsigned Line, unsigned Col, bool IsRegionEntry,
298                     const CountedRegion &Region) {
299     // Avoid creating empty regions.
300     if (!Segments.empty() && Segments.back().Line == Line &&
301         Segments.back().Col == Col)
302       Segments.pop_back();
303     DEBUG(dbgs() << "Segment at " << Line << ":" << Col);
304     // Set this region's count.
305     if (Region.Kind != coverage::CounterMappingRegion::SkippedRegion) {
306       DEBUG(dbgs() << " with count " << Region.ExecutionCount);
307       Segments.emplace_back(Line, Col, Region.ExecutionCount, IsRegionEntry);
308     } else
309       Segments.emplace_back(Line, Col, IsRegionEntry);
310     DEBUG(dbgs() << "\n");
311   }
312 
313   /// Start a segment for the given region.
314   void startSegment(const CountedRegion &Region) {
315     startSegment(Region.LineStart, Region.ColumnStart, true, Region);
316   }
317 
318   /// Pop the top region off of the active stack, starting a new segment with
319   /// the containing Region's count.
320   void popRegion() {
321     const CountedRegion *Active = ActiveRegions.back();
322     unsigned Line = Active->LineEnd, Col = Active->ColumnEnd;
323     ActiveRegions.pop_back();
324     if (ActiveRegions.empty())
325       startSegment(Line, Col);
326     else
327       startSegment(Line, Col, false, *ActiveRegions.back());
328   }
329 
330   void buildSegmentsImpl(ArrayRef<CountedRegion> Regions) {
331     for (const auto &Region : Regions) {
332       // Pop any regions that end before this one starts.
333       while (!ActiveRegions.empty() &&
334              ActiveRegions.back()->endLoc() <= Region.startLoc())
335         popRegion();
336       // Add this region to the stack.
337       ActiveRegions.push_back(&Region);
338       startSegment(Region);
339     }
340     // Pop any regions that are left in the stack.
341     while (!ActiveRegions.empty())
342       popRegion();
343   }
344 
345   /// Sort a nested sequence of regions from a single file.
346   static void sortNestedRegions(MutableArrayRef<CountedRegion> Regions) {
347     std::sort(Regions.begin(), Regions.end(), [](const CountedRegion &LHS,
348                                                  const CountedRegion &RHS) {
349       if (LHS.startLoc() != RHS.startLoc())
350         return LHS.startLoc() < RHS.startLoc();
351       if (LHS.endLoc() != RHS.endLoc())
352         // When LHS completely contains RHS, we sort LHS first.
353         return RHS.endLoc() < LHS.endLoc();
354       // If LHS and RHS cover the same area, we need to sort them according
355       // to their kinds so that the most suitable region will become "active"
356       // in combineRegions(). Because we accumulate counter values only from
357       // regions of the same kind as the first region of the area, prefer
358       // CodeRegion to ExpansionRegion and ExpansionRegion to SkippedRegion.
359       static_assert(coverage::CounterMappingRegion::CodeRegion <
360                             coverage::CounterMappingRegion::ExpansionRegion &&
361                         coverage::CounterMappingRegion::ExpansionRegion <
362                             coverage::CounterMappingRegion::SkippedRegion,
363                     "Unexpected order of region kind values");
364       return LHS.Kind < RHS.Kind;
365     });
366   }
367 
368   /// Combine counts of regions which cover the same area.
369   static ArrayRef<CountedRegion>
370   combineRegions(MutableArrayRef<CountedRegion> Regions) {
371     if (Regions.empty())
372       return Regions;
373     auto Active = Regions.begin();
374     auto End = Regions.end();
375     for (auto I = Regions.begin() + 1; I != End; ++I) {
376       if (Active->startLoc() != I->startLoc() ||
377           Active->endLoc() != I->endLoc()) {
378         // Shift to the next region.
379         ++Active;
380         if (Active != I)
381           *Active = *I;
382         continue;
383       }
384       // Merge duplicate region.
385       // If CodeRegions and ExpansionRegions cover the same area, it's probably
386       // a macro which is fully expanded to another macro. In that case, we need
387       // to accumulate counts only from CodeRegions, or else the area will be
388       // counted twice.
389       // On the other hand, a macro may have a nested macro in its body. If the
390       // outer macro is used several times, the ExpansionRegion for the nested
391       // macro will also be added several times. These ExpansionRegions cover
392       // the same source locations and have to be combined to reach the correct
393       // value for that area.
394       // We add counts of the regions of the same kind as the active region
395       // to handle the both situations.
396       if (I->Kind == Active->Kind)
397         Active->ExecutionCount += I->ExecutionCount;
398     }
399     return Regions.drop_back(std::distance(++Active, End));
400   }
401 
402 public:
403   /// Build a list of CoverageSegments from a list of Regions.
404   static std::vector<CoverageSegment>
405   buildSegments(MutableArrayRef<CountedRegion> Regions) {
406     std::vector<CoverageSegment> Segments;
407     SegmentBuilder Builder(Segments);
408 
409     sortNestedRegions(Regions);
410     ArrayRef<CountedRegion> CombinedRegions = combineRegions(Regions);
411 
412     Builder.buildSegmentsImpl(CombinedRegions);
413     return Segments;
414   }
415 };
416 }
417 
418 std::vector<StringRef> CoverageMapping::getUniqueSourceFiles() const {
419   std::vector<StringRef> Filenames;
420   for (const auto &Function : getCoveredFunctions())
421     Filenames.insert(Filenames.end(), Function.Filenames.begin(),
422                      Function.Filenames.end());
423   std::sort(Filenames.begin(), Filenames.end());
424   auto Last = std::unique(Filenames.begin(), Filenames.end());
425   Filenames.erase(Last, Filenames.end());
426   return Filenames;
427 }
428 
429 static SmallBitVector gatherFileIDs(StringRef SourceFile,
430                                     const FunctionRecord &Function) {
431   SmallBitVector FilenameEquivalence(Function.Filenames.size(), false);
432   for (unsigned I = 0, E = Function.Filenames.size(); I < E; ++I)
433     if (SourceFile == Function.Filenames[I])
434       FilenameEquivalence[I] = true;
435   return FilenameEquivalence;
436 }
437 
438 /// Return the ID of the file where the definition of the function is located.
439 static Optional<unsigned> findMainViewFileID(const FunctionRecord &Function) {
440   SmallBitVector IsNotExpandedFile(Function.Filenames.size(), true);
441   for (const auto &CR : Function.CountedRegions)
442     if (CR.Kind == CounterMappingRegion::ExpansionRegion)
443       IsNotExpandedFile[CR.ExpandedFileID] = false;
444   int I = IsNotExpandedFile.find_first();
445   if (I == -1)
446     return None;
447   return I;
448 }
449 
450 /// Check if SourceFile is the file that contains the definition of
451 /// the Function. Return the ID of the file in that case or None otherwise.
452 static Optional<unsigned> findMainViewFileID(StringRef SourceFile,
453                                              const FunctionRecord &Function) {
454   Optional<unsigned> I = findMainViewFileID(Function);
455   if (I && SourceFile == Function.Filenames[*I])
456     return I;
457   return None;
458 }
459 
460 static bool isExpansion(const CountedRegion &R, unsigned FileID) {
461   return R.Kind == CounterMappingRegion::ExpansionRegion && R.FileID == FileID;
462 }
463 
464 CoverageData CoverageMapping::getCoverageForFile(StringRef Filename) const {
465   CoverageData FileCoverage(Filename);
466   std::vector<coverage::CountedRegion> Regions;
467 
468   for (const auto &Function : Functions) {
469     auto MainFileID = findMainViewFileID(Filename, Function);
470     auto FileIDs = gatherFileIDs(Filename, Function);
471     for (const auto &CR : Function.CountedRegions)
472       if (FileIDs.test(CR.FileID)) {
473         Regions.push_back(CR);
474         if (MainFileID && isExpansion(CR, *MainFileID))
475           FileCoverage.Expansions.emplace_back(CR, Function);
476       }
477   }
478 
479   DEBUG(dbgs() << "Emitting segments for file: " << Filename << "\n");
480   FileCoverage.Segments = SegmentBuilder::buildSegments(Regions);
481 
482   return FileCoverage;
483 }
484 
485 std::vector<const FunctionRecord *>
486 CoverageMapping::getInstantiations(StringRef Filename) const {
487   FunctionInstantiationSetCollector InstantiationSetCollector;
488   for (const auto &Function : Functions) {
489     auto MainFileID = findMainViewFileID(Filename, Function);
490     if (!MainFileID)
491       continue;
492     InstantiationSetCollector.insert(Function, *MainFileID);
493   }
494 
495   std::vector<const FunctionRecord *> Result;
496   for (const auto &InstantiationSet : InstantiationSetCollector) {
497     if (InstantiationSet.second.size() < 2)
498       continue;
499     Result.insert(Result.end(), InstantiationSet.second.begin(),
500                   InstantiationSet.second.end());
501   }
502   return Result;
503 }
504 
505 CoverageData
506 CoverageMapping::getCoverageForFunction(const FunctionRecord &Function) const {
507   auto MainFileID = findMainViewFileID(Function);
508   if (!MainFileID)
509     return CoverageData();
510 
511   CoverageData FunctionCoverage(Function.Filenames[*MainFileID]);
512   std::vector<coverage::CountedRegion> Regions;
513   for (const auto &CR : Function.CountedRegions)
514     if (CR.FileID == *MainFileID) {
515       Regions.push_back(CR);
516       if (isExpansion(CR, *MainFileID))
517         FunctionCoverage.Expansions.emplace_back(CR, Function);
518     }
519 
520   DEBUG(dbgs() << "Emitting segments for function: " << Function.Name << "\n");
521   FunctionCoverage.Segments = SegmentBuilder::buildSegments(Regions);
522 
523   return FunctionCoverage;
524 }
525 
526 CoverageData CoverageMapping::getCoverageForExpansion(
527     const ExpansionRecord &Expansion) const {
528   CoverageData ExpansionCoverage(
529       Expansion.Function.Filenames[Expansion.FileID]);
530   std::vector<coverage::CountedRegion> Regions;
531   for (const auto &CR : Expansion.Function.CountedRegions)
532     if (CR.FileID == Expansion.FileID) {
533       Regions.push_back(CR);
534       if (isExpansion(CR, Expansion.FileID))
535         ExpansionCoverage.Expansions.emplace_back(CR, Expansion.Function);
536     }
537 
538   DEBUG(dbgs() << "Emitting segments for expansion of file " << Expansion.FileID
539                << "\n");
540   ExpansionCoverage.Segments = SegmentBuilder::buildSegments(Regions);
541 
542   return ExpansionCoverage;
543 }
544 
545 namespace {
546 std::string getCoverageMapErrString(coveragemap_error Err) {
547   switch (Err) {
548   case coveragemap_error::success:
549     return "Success";
550   case coveragemap_error::eof:
551     return "End of File";
552   case coveragemap_error::no_data_found:
553     return "No coverage data found";
554   case coveragemap_error::unsupported_version:
555     return "Unsupported coverage format version";
556   case coveragemap_error::truncated:
557     return "Truncated coverage data";
558   case coveragemap_error::malformed:
559     return "Malformed coverage data";
560   }
561   llvm_unreachable("A value of coveragemap_error has no message.");
562 }
563 
564 // FIXME: This class is only here to support the transition to llvm::Error. It
565 // will be removed once this transition is complete. Clients should prefer to
566 // deal with the Error value directly, rather than converting to error_code.
567 class CoverageMappingErrorCategoryType : public std::error_category {
568   const char *name() const LLVM_NOEXCEPT override { return "llvm.coveragemap"; }
569   std::string message(int IE) const override {
570     return getCoverageMapErrString(static_cast<coveragemap_error>(IE));
571   }
572 };
573 } // end anonymous namespace
574 
575 std::string CoverageMapError::message() const {
576   return getCoverageMapErrString(Err);
577 }
578 
579 static ManagedStatic<CoverageMappingErrorCategoryType> ErrorCategory;
580 
581 const std::error_category &llvm::coverage::coveragemap_category() {
582   return *ErrorCategory;
583 }
584 
585 char CoverageMapError::ID = 0;
586