xref: /llvm-project/llvm/lib/ProfileData/Coverage/CoverageMapping.cpp (revision dc7071226b588110392975a07bcaf516e6eb9829)
1 //=-- CoverageMapping.cpp - Code coverage mapping support ---------*- C++ -*-=//
2 //
3 //                     The LLVM Compiler Infrastructure
4 //
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
7 //
8 //===----------------------------------------------------------------------===//
9 //
10 // This file contains support for clang's and llvm's instrumentation based
11 // code coverage.
12 //
13 //===----------------------------------------------------------------------===//
14 
15 #include "llvm/ProfileData/Coverage/CoverageMapping.h"
16 #include "llvm/ADT/DenseMap.h"
17 #include "llvm/ADT/Optional.h"
18 #include "llvm/ADT/SmallBitVector.h"
19 #include "llvm/ProfileData/Coverage/CoverageMappingReader.h"
20 #include "llvm/ProfileData/InstrProfReader.h"
21 #include "llvm/Support/Debug.h"
22 #include "llvm/Support/Errc.h"
23 #include "llvm/Support/ErrorHandling.h"
24 #include "llvm/Support/ManagedStatic.h"
25 #include "llvm/Support/Path.h"
26 #include "llvm/Support/raw_ostream.h"
27 
28 using namespace llvm;
29 using namespace coverage;
30 
31 #define DEBUG_TYPE "coverage-mapping"
32 
33 Counter CounterExpressionBuilder::get(const CounterExpression &E) {
34   auto It = ExpressionIndices.find(E);
35   if (It != ExpressionIndices.end())
36     return Counter::getExpression(It->second);
37   unsigned I = Expressions.size();
38   Expressions.push_back(E);
39   ExpressionIndices[E] = I;
40   return Counter::getExpression(I);
41 }
42 
43 void CounterExpressionBuilder::extractTerms(
44     Counter C, int Sign, SmallVectorImpl<std::pair<unsigned, int>> &Terms) {
45   switch (C.getKind()) {
46   case Counter::Zero:
47     break;
48   case Counter::CounterValueReference:
49     Terms.push_back(std::make_pair(C.getCounterID(), Sign));
50     break;
51   case Counter::Expression:
52     const auto &E = Expressions[C.getExpressionID()];
53     extractTerms(E.LHS, Sign, Terms);
54     extractTerms(E.RHS, E.Kind == CounterExpression::Subtract ? -Sign : Sign,
55                  Terms);
56     break;
57   }
58 }
59 
60 Counter CounterExpressionBuilder::simplify(Counter ExpressionTree) {
61   // Gather constant terms.
62   llvm::SmallVector<std::pair<unsigned, int>, 32> Terms;
63   extractTerms(ExpressionTree, +1, Terms);
64 
65   // If there are no terms, this is just a zero. The algorithm below assumes at
66   // least one term.
67   if (Terms.size() == 0)
68     return Counter::getZero();
69 
70   // Group the terms by counter ID.
71   std::sort(Terms.begin(), Terms.end(),
72             [](const std::pair<unsigned, int> &LHS,
73                const std::pair<unsigned, int> &RHS) {
74     return LHS.first < RHS.first;
75   });
76 
77   // Combine terms by counter ID to eliminate counters that sum to zero.
78   auto Prev = Terms.begin();
79   for (auto I = Prev + 1, E = Terms.end(); I != E; ++I) {
80     if (I->first == Prev->first) {
81       Prev->second += I->second;
82       continue;
83     }
84     ++Prev;
85     *Prev = *I;
86   }
87   Terms.erase(++Prev, Terms.end());
88 
89   Counter C;
90   // Create additions. We do this before subtractions to avoid constructs like
91   // ((0 - X) + Y), as opposed to (Y - X).
92   for (auto Term : Terms) {
93     if (Term.second <= 0)
94       continue;
95     for (int I = 0; I < Term.second; ++I)
96       if (C.isZero())
97         C = Counter::getCounter(Term.first);
98       else
99         C = get(CounterExpression(CounterExpression::Add, C,
100                                   Counter::getCounter(Term.first)));
101   }
102 
103   // Create subtractions.
104   for (auto Term : Terms) {
105     if (Term.second >= 0)
106       continue;
107     for (int I = 0; I < -Term.second; ++I)
108       C = get(CounterExpression(CounterExpression::Subtract, C,
109                                 Counter::getCounter(Term.first)));
110   }
111   return C;
112 }
113 
114 Counter CounterExpressionBuilder::add(Counter LHS, Counter RHS) {
115   return simplify(get(CounterExpression(CounterExpression::Add, LHS, RHS)));
116 }
117 
118 Counter CounterExpressionBuilder::subtract(Counter LHS, Counter RHS) {
119   return simplify(
120       get(CounterExpression(CounterExpression::Subtract, LHS, RHS)));
121 }
122 
123 void CounterMappingContext::dump(const Counter &C,
124                                  llvm::raw_ostream &OS) const {
125   switch (C.getKind()) {
126   case Counter::Zero:
127     OS << '0';
128     return;
129   case Counter::CounterValueReference:
130     OS << '#' << C.getCounterID();
131     break;
132   case Counter::Expression: {
133     if (C.getExpressionID() >= Expressions.size())
134       return;
135     const auto &E = Expressions[C.getExpressionID()];
136     OS << '(';
137     dump(E.LHS, OS);
138     OS << (E.Kind == CounterExpression::Subtract ? " - " : " + ");
139     dump(E.RHS, OS);
140     OS << ')';
141     break;
142   }
143   }
144   if (CounterValues.empty())
145     return;
146   ErrorOr<int64_t> Value = evaluate(C);
147   if (!Value)
148     return;
149   OS << '[' << *Value << ']';
150 }
151 
152 ErrorOr<int64_t> CounterMappingContext::evaluate(const Counter &C) const {
153   switch (C.getKind()) {
154   case Counter::Zero:
155     return 0;
156   case Counter::CounterValueReference:
157     if (C.getCounterID() >= CounterValues.size())
158       return make_error_code(errc::argument_out_of_domain);
159     return CounterValues[C.getCounterID()];
160   case Counter::Expression: {
161     if (C.getExpressionID() >= Expressions.size())
162       return make_error_code(errc::argument_out_of_domain);
163     const auto &E = Expressions[C.getExpressionID()];
164     ErrorOr<int64_t> LHS = evaluate(E.LHS);
165     if (!LHS)
166       return LHS;
167     ErrorOr<int64_t> RHS = evaluate(E.RHS);
168     if (!RHS)
169       return RHS;
170     return E.Kind == CounterExpression::Subtract ? *LHS - *RHS : *LHS + *RHS;
171   }
172   }
173   llvm_unreachable("Unhandled CounterKind");
174 }
175 
176 void FunctionRecordIterator::skipOtherFiles() {
177   while (Current != Records.end() && !Filename.empty() &&
178          Filename != Current->Filenames[0])
179     ++Current;
180   if (Current == Records.end())
181     *this = FunctionRecordIterator();
182 }
183 
184 ErrorOr<std::unique_ptr<CoverageMapping>>
185 CoverageMapping::load(CoverageMappingReader &CoverageReader,
186                       IndexedInstrProfReader &ProfileReader) {
187   auto Coverage = std::unique_ptr<CoverageMapping>(new CoverageMapping());
188 
189   std::vector<uint64_t> Counts;
190   for (const auto &Record : CoverageReader) {
191     CounterMappingContext Ctx(Record.Expressions);
192 
193     Counts.clear();
194     if (std::error_code EC = ProfileReader.getFunctionCounts(
195             Record.FunctionName, Record.FunctionHash, Counts)) {
196       if (EC == instrprof_error::hash_mismatch) {
197         Coverage->MismatchedFunctionCount++;
198         continue;
199       } else if (EC != instrprof_error::unknown_function)
200         return EC;
201       Counts.assign(Record.MappingRegions.size(), 0);
202     }
203     Ctx.setCounts(Counts);
204 
205     assert(!Record.MappingRegions.empty() && "Function has no regions");
206 
207     StringRef OrigFuncName = Record.FunctionName;
208     if (Record.Filenames.empty())
209       OrigFuncName = getFuncNameWithoutPrefix(OrigFuncName);
210     else
211       OrigFuncName =
212           getFuncNameWithoutPrefix(OrigFuncName, Record.Filenames[0]);
213     FunctionRecord Function(OrigFuncName, Record.Filenames);
214     for (const auto &Region : Record.MappingRegions) {
215       ErrorOr<int64_t> ExecutionCount = Ctx.evaluate(Region.Count);
216       if (!ExecutionCount)
217         break;
218       Function.pushRegion(Region, *ExecutionCount);
219     }
220     if (Function.CountedRegions.size() != Record.MappingRegions.size()) {
221       Coverage->MismatchedFunctionCount++;
222       continue;
223     }
224 
225     Coverage->Functions.push_back(std::move(Function));
226   }
227 
228   return std::move(Coverage);
229 }
230 
231 ErrorOr<std::unique_ptr<CoverageMapping>>
232 CoverageMapping::load(StringRef ObjectFilename, StringRef ProfileFilename,
233                       StringRef Arch) {
234   auto CounterMappingBuff = MemoryBuffer::getFileOrSTDIN(ObjectFilename);
235   if (std::error_code EC = CounterMappingBuff.getError())
236     return EC;
237   auto CoverageReaderOrErr =
238       BinaryCoverageReader::create(CounterMappingBuff.get(), Arch);
239   if (std::error_code EC = CoverageReaderOrErr.getError())
240     return EC;
241   auto CoverageReader = std::move(CoverageReaderOrErr.get());
242   auto ProfileReaderOrErr = IndexedInstrProfReader::create(ProfileFilename);
243   if (auto EC = ProfileReaderOrErr.getError())
244     return EC;
245   auto ProfileReader = std::move(ProfileReaderOrErr.get());
246   return load(*CoverageReader, *ProfileReader);
247 }
248 
249 namespace {
250 /// \brief Distributes functions into instantiation sets.
251 ///
252 /// An instantiation set is a collection of functions that have the same source
253 /// code, ie, template functions specializations.
254 class FunctionInstantiationSetCollector {
255   typedef DenseMap<std::pair<unsigned, unsigned>,
256                    std::vector<const FunctionRecord *>> MapT;
257   MapT InstantiatedFunctions;
258 
259 public:
260   void insert(const FunctionRecord &Function, unsigned FileID) {
261     auto I = Function.CountedRegions.begin(), E = Function.CountedRegions.end();
262     while (I != E && I->FileID != FileID)
263       ++I;
264     assert(I != E && "function does not cover the given file");
265     auto &Functions = InstantiatedFunctions[I->startLoc()];
266     Functions.push_back(&Function);
267   }
268 
269   MapT::iterator begin() { return InstantiatedFunctions.begin(); }
270 
271   MapT::iterator end() { return InstantiatedFunctions.end(); }
272 };
273 
274 class SegmentBuilder {
275   std::vector<CoverageSegment> &Segments;
276   SmallVector<const CountedRegion *, 8> ActiveRegions;
277 
278   SegmentBuilder(std::vector<CoverageSegment> &Segments) : Segments(Segments) {}
279 
280   /// Start a segment with no count specified.
281   void startSegment(unsigned Line, unsigned Col) {
282     DEBUG(dbgs() << "Top level segment at " << Line << ":" << Col << "\n");
283     Segments.emplace_back(Line, Col, /*IsRegionEntry=*/false);
284   }
285 
286   /// Start a segment with the given Region's count.
287   void startSegment(unsigned Line, unsigned Col, bool IsRegionEntry,
288                     const CountedRegion &Region) {
289     // Avoid creating empty regions.
290     if (!Segments.empty() && Segments.back().Line == Line &&
291         Segments.back().Col == Col)
292       Segments.pop_back();
293     DEBUG(dbgs() << "Segment at " << Line << ":" << Col);
294     // Set this region's count.
295     if (Region.Kind != coverage::CounterMappingRegion::SkippedRegion) {
296       DEBUG(dbgs() << " with count " << Region.ExecutionCount);
297       Segments.emplace_back(Line, Col, Region.ExecutionCount, IsRegionEntry);
298     } else
299       Segments.emplace_back(Line, Col, IsRegionEntry);
300     DEBUG(dbgs() << "\n");
301   }
302 
303   /// Start a segment for the given region.
304   void startSegment(const CountedRegion &Region) {
305     startSegment(Region.LineStart, Region.ColumnStart, true, Region);
306   }
307 
308   /// Pop the top region off of the active stack, starting a new segment with
309   /// the containing Region's count.
310   void popRegion() {
311     const CountedRegion *Active = ActiveRegions.back();
312     unsigned Line = Active->LineEnd, Col = Active->ColumnEnd;
313     ActiveRegions.pop_back();
314     if (ActiveRegions.empty())
315       startSegment(Line, Col);
316     else
317       startSegment(Line, Col, false, *ActiveRegions.back());
318   }
319 
320   void buildSegmentsImpl(ArrayRef<CountedRegion> Regions) {
321     for (const auto &Region : Regions) {
322       // Pop any regions that end before this one starts.
323       while (!ActiveRegions.empty() &&
324              ActiveRegions.back()->endLoc() <= Region.startLoc())
325         popRegion();
326       // Add this region to the stack.
327       ActiveRegions.push_back(&Region);
328       startSegment(Region);
329     }
330     // Pop any regions that are left in the stack.
331     while (!ActiveRegions.empty())
332       popRegion();
333   }
334 
335   /// Sort a nested sequence of regions from a single file.
336   static void sortNestedRegions(MutableArrayRef<CountedRegion> Regions) {
337     std::sort(Regions.begin(), Regions.end(),
338               [](const CountedRegion &LHS, const CountedRegion &RHS) {
339                 if (LHS.startLoc() == RHS.startLoc())
340                   // When LHS completely contains RHS, we sort LHS first.
341                   return RHS.endLoc() < LHS.endLoc();
342                 return LHS.startLoc() < RHS.startLoc();
343               });
344   }
345 
346   /// Combine counts of regions which cover the same area.
347   static ArrayRef<CountedRegion>
348   combineRegions(MutableArrayRef<CountedRegion> Regions) {
349     if (Regions.empty())
350       return Regions;
351     auto Active = Regions.begin();
352     auto End = Regions.end();
353     for (auto I = Regions.begin() + 1; I != End; ++I) {
354       if (Active->startLoc() != I->startLoc() ||
355           Active->endLoc() != I->endLoc()) {
356         // Shift to the next region.
357         ++Active;
358         if (Active != I)
359           *Active = *I;
360         continue;
361       }
362       // Merge duplicate region.
363       if (I->Kind != coverage::CounterMappingRegion::CodeRegion)
364         // Add counts only from CodeRegions.
365         continue;
366       if (Active->Kind == coverage::CounterMappingRegion::SkippedRegion)
367         // We have to overwrite SkippedRegions because of special handling
368         // of them in startSegment().
369         *Active = *I;
370       else
371         // Otherwise, just append the count.
372         Active->ExecutionCount += I->ExecutionCount;
373     }
374     return Regions.drop_back(std::distance(++Active, End));
375   }
376 
377 public:
378   /// Build a list of CoverageSegments from a list of Regions.
379   static std::vector<CoverageSegment>
380   buildSegments(MutableArrayRef<CountedRegion> Regions) {
381     std::vector<CoverageSegment> Segments;
382     SegmentBuilder Builder(Segments);
383 
384     sortNestedRegions(Regions);
385     ArrayRef<CountedRegion> CombinedRegions = combineRegions(Regions);
386 
387     Builder.buildSegmentsImpl(CombinedRegions);
388     return Segments;
389   }
390 };
391 }
392 
393 std::vector<StringRef> CoverageMapping::getUniqueSourceFiles() const {
394   std::vector<StringRef> Filenames;
395   for (const auto &Function : getCoveredFunctions())
396     Filenames.insert(Filenames.end(), Function.Filenames.begin(),
397                      Function.Filenames.end());
398   std::sort(Filenames.begin(), Filenames.end());
399   auto Last = std::unique(Filenames.begin(), Filenames.end());
400   Filenames.erase(Last, Filenames.end());
401   return Filenames;
402 }
403 
404 static SmallBitVector gatherFileIDs(StringRef SourceFile,
405                                     const FunctionRecord &Function) {
406   SmallBitVector FilenameEquivalence(Function.Filenames.size(), false);
407   for (unsigned I = 0, E = Function.Filenames.size(); I < E; ++I)
408     if (SourceFile == Function.Filenames[I])
409       FilenameEquivalence[I] = true;
410   return FilenameEquivalence;
411 }
412 
413 /// Return the ID of the file where the definition of the function is located.
414 static Optional<unsigned> findMainViewFileID(const FunctionRecord &Function) {
415   SmallBitVector IsNotExpandedFile(Function.Filenames.size(), true);
416   for (const auto &CR : Function.CountedRegions)
417     if (CR.Kind == CounterMappingRegion::ExpansionRegion)
418       IsNotExpandedFile[CR.ExpandedFileID] = false;
419   int I = IsNotExpandedFile.find_first();
420   if (I == -1)
421     return None;
422   return I;
423 }
424 
425 /// Check if SourceFile is the file that contains the definition of
426 /// the Function. Return the ID of the file in that case or None otherwise.
427 static Optional<unsigned> findMainViewFileID(StringRef SourceFile,
428                                              const FunctionRecord &Function) {
429   Optional<unsigned> I = findMainViewFileID(Function);
430   if (I && SourceFile == Function.Filenames[*I])
431     return I;
432   return None;
433 }
434 
435 static bool isExpansion(const CountedRegion &R, unsigned FileID) {
436   return R.Kind == CounterMappingRegion::ExpansionRegion && R.FileID == FileID;
437 }
438 
439 CoverageData CoverageMapping::getCoverageForFile(StringRef Filename) {
440   CoverageData FileCoverage(Filename);
441   std::vector<coverage::CountedRegion> Regions;
442 
443   for (const auto &Function : Functions) {
444     auto MainFileID = findMainViewFileID(Filename, Function);
445     auto FileIDs = gatherFileIDs(Filename, Function);
446     for (const auto &CR : Function.CountedRegions)
447       if (FileIDs.test(CR.FileID)) {
448         Regions.push_back(CR);
449         if (MainFileID && isExpansion(CR, *MainFileID))
450           FileCoverage.Expansions.emplace_back(CR, Function);
451       }
452   }
453 
454   DEBUG(dbgs() << "Emitting segments for file: " << Filename << "\n");
455   FileCoverage.Segments = SegmentBuilder::buildSegments(Regions);
456 
457   return FileCoverage;
458 }
459 
460 std::vector<const FunctionRecord *>
461 CoverageMapping::getInstantiations(StringRef Filename) {
462   FunctionInstantiationSetCollector InstantiationSetCollector;
463   for (const auto &Function : Functions) {
464     auto MainFileID = findMainViewFileID(Filename, Function);
465     if (!MainFileID)
466       continue;
467     InstantiationSetCollector.insert(Function, *MainFileID);
468   }
469 
470   std::vector<const FunctionRecord *> Result;
471   for (const auto &InstantiationSet : InstantiationSetCollector) {
472     if (InstantiationSet.second.size() < 2)
473       continue;
474     Result.insert(Result.end(), InstantiationSet.second.begin(),
475                   InstantiationSet.second.end());
476   }
477   return Result;
478 }
479 
480 CoverageData
481 CoverageMapping::getCoverageForFunction(const FunctionRecord &Function) {
482   auto MainFileID = findMainViewFileID(Function);
483   if (!MainFileID)
484     return CoverageData();
485 
486   CoverageData FunctionCoverage(Function.Filenames[*MainFileID]);
487   std::vector<coverage::CountedRegion> Regions;
488   for (const auto &CR : Function.CountedRegions)
489     if (CR.FileID == *MainFileID) {
490       Regions.push_back(CR);
491       if (isExpansion(CR, *MainFileID))
492         FunctionCoverage.Expansions.emplace_back(CR, Function);
493     }
494 
495   DEBUG(dbgs() << "Emitting segments for function: " << Function.Name << "\n");
496   FunctionCoverage.Segments = SegmentBuilder::buildSegments(Regions);
497 
498   return FunctionCoverage;
499 }
500 
501 CoverageData
502 CoverageMapping::getCoverageForExpansion(const ExpansionRecord &Expansion) {
503   CoverageData ExpansionCoverage(
504       Expansion.Function.Filenames[Expansion.FileID]);
505   std::vector<coverage::CountedRegion> Regions;
506   for (const auto &CR : Expansion.Function.CountedRegions)
507     if (CR.FileID == Expansion.FileID) {
508       Regions.push_back(CR);
509       if (isExpansion(CR, Expansion.FileID))
510         ExpansionCoverage.Expansions.emplace_back(CR, Expansion.Function);
511     }
512 
513   DEBUG(dbgs() << "Emitting segments for expansion of file " << Expansion.FileID
514                << "\n");
515   ExpansionCoverage.Segments = SegmentBuilder::buildSegments(Regions);
516 
517   return ExpansionCoverage;
518 }
519 
520 namespace {
521 class CoverageMappingErrorCategoryType : public std::error_category {
522   const char *name() const LLVM_NOEXCEPT override { return "llvm.coveragemap"; }
523   std::string message(int IE) const override {
524     auto E = static_cast<coveragemap_error>(IE);
525     switch (E) {
526     case coveragemap_error::success:
527       return "Success";
528     case coveragemap_error::eof:
529       return "End of File";
530     case coveragemap_error::no_data_found:
531       return "No coverage data found";
532     case coveragemap_error::unsupported_version:
533       return "Unsupported coverage format version";
534     case coveragemap_error::truncated:
535       return "Truncated coverage data";
536     case coveragemap_error::malformed:
537       return "Malformed coverage data";
538     }
539     llvm_unreachable("A value of coveragemap_error has no message.");
540   }
541 };
542 }
543 
544 static ManagedStatic<CoverageMappingErrorCategoryType> ErrorCategory;
545 
546 const std::error_category &llvm::coverage::coveragemap_category() {
547   return *ErrorCategory;
548 }
549