1 //=-- CoverageMapping.cpp - Code coverage mapping support ---------*- C++ -*-=// 2 // 3 // The LLVM Compiler Infrastructure 4 // 5 // This file is distributed under the University of Illinois Open Source 6 // License. See LICENSE.TXT for details. 7 // 8 //===----------------------------------------------------------------------===// 9 // 10 // This file contains support for clang's and llvm's instrumentation based 11 // code coverage. 12 // 13 //===----------------------------------------------------------------------===// 14 15 #include "llvm/ProfileData/Coverage/CoverageMapping.h" 16 #include "llvm/ADT/DenseMap.h" 17 #include "llvm/ADT/Optional.h" 18 #include "llvm/ADT/SmallBitVector.h" 19 #include "llvm/ProfileData/Coverage/CoverageMappingReader.h" 20 #include "llvm/ProfileData/InstrProfReader.h" 21 #include "llvm/Support/Debug.h" 22 #include "llvm/Support/Errc.h" 23 #include "llvm/Support/ErrorHandling.h" 24 #include "llvm/Support/ManagedStatic.h" 25 #include "llvm/Support/Path.h" 26 #include "llvm/Support/raw_ostream.h" 27 28 using namespace llvm; 29 using namespace coverage; 30 31 #define DEBUG_TYPE "coverage-mapping" 32 33 Counter CounterExpressionBuilder::get(const CounterExpression &E) { 34 auto It = ExpressionIndices.find(E); 35 if (It != ExpressionIndices.end()) 36 return Counter::getExpression(It->second); 37 unsigned I = Expressions.size(); 38 Expressions.push_back(E); 39 ExpressionIndices[E] = I; 40 return Counter::getExpression(I); 41 } 42 43 void CounterExpressionBuilder::extractTerms( 44 Counter C, int Sign, SmallVectorImpl<std::pair<unsigned, int>> &Terms) { 45 switch (C.getKind()) { 46 case Counter::Zero: 47 break; 48 case Counter::CounterValueReference: 49 Terms.push_back(std::make_pair(C.getCounterID(), Sign)); 50 break; 51 case Counter::Expression: 52 const auto &E = Expressions[C.getExpressionID()]; 53 extractTerms(E.LHS, Sign, Terms); 54 extractTerms(E.RHS, E.Kind == CounterExpression::Subtract ? -Sign : Sign, 55 Terms); 56 break; 57 } 58 } 59 60 Counter CounterExpressionBuilder::simplify(Counter ExpressionTree) { 61 // Gather constant terms. 62 llvm::SmallVector<std::pair<unsigned, int>, 32> Terms; 63 extractTerms(ExpressionTree, +1, Terms); 64 65 // If there are no terms, this is just a zero. The algorithm below assumes at 66 // least one term. 67 if (Terms.size() == 0) 68 return Counter::getZero(); 69 70 // Group the terms by counter ID. 71 std::sort(Terms.begin(), Terms.end(), 72 [](const std::pair<unsigned, int> &LHS, 73 const std::pair<unsigned, int> &RHS) { 74 return LHS.first < RHS.first; 75 }); 76 77 // Combine terms by counter ID to eliminate counters that sum to zero. 78 auto Prev = Terms.begin(); 79 for (auto I = Prev + 1, E = Terms.end(); I != E; ++I) { 80 if (I->first == Prev->first) { 81 Prev->second += I->second; 82 continue; 83 } 84 ++Prev; 85 *Prev = *I; 86 } 87 Terms.erase(++Prev, Terms.end()); 88 89 Counter C; 90 // Create additions. We do this before subtractions to avoid constructs like 91 // ((0 - X) + Y), as opposed to (Y - X). 92 for (auto Term : Terms) { 93 if (Term.second <= 0) 94 continue; 95 for (int I = 0; I < Term.second; ++I) 96 if (C.isZero()) 97 C = Counter::getCounter(Term.first); 98 else 99 C = get(CounterExpression(CounterExpression::Add, C, 100 Counter::getCounter(Term.first))); 101 } 102 103 // Create subtractions. 104 for (auto Term : Terms) { 105 if (Term.second >= 0) 106 continue; 107 for (int I = 0; I < -Term.second; ++I) 108 C = get(CounterExpression(CounterExpression::Subtract, C, 109 Counter::getCounter(Term.first))); 110 } 111 return C; 112 } 113 114 Counter CounterExpressionBuilder::add(Counter LHS, Counter RHS) { 115 return simplify(get(CounterExpression(CounterExpression::Add, LHS, RHS))); 116 } 117 118 Counter CounterExpressionBuilder::subtract(Counter LHS, Counter RHS) { 119 return simplify( 120 get(CounterExpression(CounterExpression::Subtract, LHS, RHS))); 121 } 122 123 void CounterMappingContext::dump(const Counter &C, 124 llvm::raw_ostream &OS) const { 125 switch (C.getKind()) { 126 case Counter::Zero: 127 OS << '0'; 128 return; 129 case Counter::CounterValueReference: 130 OS << '#' << C.getCounterID(); 131 break; 132 case Counter::Expression: { 133 if (C.getExpressionID() >= Expressions.size()) 134 return; 135 const auto &E = Expressions[C.getExpressionID()]; 136 OS << '('; 137 dump(E.LHS, OS); 138 OS << (E.Kind == CounterExpression::Subtract ? " - " : " + "); 139 dump(E.RHS, OS); 140 OS << ')'; 141 break; 142 } 143 } 144 if (CounterValues.empty()) 145 return; 146 Expected<int64_t> Value = evaluate(C); 147 if (auto E = Value.takeError()) { 148 llvm::consumeError(std::move(E)); 149 return; 150 } 151 OS << '[' << *Value << ']'; 152 } 153 154 Expected<int64_t> CounterMappingContext::evaluate(const Counter &C) const { 155 switch (C.getKind()) { 156 case Counter::Zero: 157 return 0; 158 case Counter::CounterValueReference: 159 if (C.getCounterID() >= CounterValues.size()) 160 return errorCodeToError(errc::argument_out_of_domain); 161 return CounterValues[C.getCounterID()]; 162 case Counter::Expression: { 163 if (C.getExpressionID() >= Expressions.size()) 164 return errorCodeToError(errc::argument_out_of_domain); 165 const auto &E = Expressions[C.getExpressionID()]; 166 Expected<int64_t> LHS = evaluate(E.LHS); 167 if (!LHS) 168 return LHS; 169 Expected<int64_t> RHS = evaluate(E.RHS); 170 if (!RHS) 171 return RHS; 172 return E.Kind == CounterExpression::Subtract ? *LHS - *RHS : *LHS + *RHS; 173 } 174 } 175 llvm_unreachable("Unhandled CounterKind"); 176 } 177 178 void FunctionRecordIterator::skipOtherFiles() { 179 while (Current != Records.end() && !Filename.empty() && 180 Filename != Current->Filenames[0]) 181 ++Current; 182 if (Current == Records.end()) 183 *this = FunctionRecordIterator(); 184 } 185 186 Error CoverageMapping::loadFunctionRecord( 187 const CoverageMappingRecord &Record, 188 IndexedInstrProfReader &ProfileReader) { 189 CounterMappingContext Ctx(Record.Expressions); 190 191 std::vector<uint64_t> Counts; 192 if (Error E = ProfileReader.getFunctionCounts(Record.FunctionName, 193 Record.FunctionHash, Counts)) { 194 instrprof_error IPE = InstrProfError::take(std::move(E)); 195 if (IPE == instrprof_error::hash_mismatch) { 196 MismatchedFunctionCount++; 197 return Error::success(); 198 } else if (IPE != instrprof_error::unknown_function) 199 return make_error<InstrProfError>(IPE); 200 Counts.assign(Record.MappingRegions.size(), 0); 201 } 202 Ctx.setCounts(Counts); 203 204 assert(!Record.MappingRegions.empty() && "Function has no regions"); 205 206 StringRef OrigFuncName = Record.FunctionName; 207 if (Record.Filenames.empty()) 208 OrigFuncName = getFuncNameWithoutPrefix(OrigFuncName); 209 else 210 OrigFuncName = getFuncNameWithoutPrefix(OrigFuncName, Record.Filenames[0]); 211 FunctionRecord Function(OrigFuncName, Record.Filenames); 212 for (const auto &Region : Record.MappingRegions) { 213 Expected<int64_t> ExecutionCount = Ctx.evaluate(Region.Count); 214 if (auto E = ExecutionCount.takeError()) { 215 llvm::consumeError(std::move(E)); 216 return Error::success(); 217 } 218 Function.pushRegion(Region, *ExecutionCount); 219 } 220 if (Function.CountedRegions.size() != Record.MappingRegions.size()) { 221 MismatchedFunctionCount++; 222 return Error::success(); 223 } 224 225 Functions.push_back(std::move(Function)); 226 return Error::success(); 227 } 228 229 Expected<std::unique_ptr<CoverageMapping>> 230 CoverageMapping::load(CoverageMappingReader &CoverageReader, 231 IndexedInstrProfReader &ProfileReader) { 232 auto Coverage = std::unique_ptr<CoverageMapping>(new CoverageMapping()); 233 234 for (const auto &Record : CoverageReader) 235 if (Error E = Coverage->loadFunctionRecord(Record, ProfileReader)) 236 return std::move(E); 237 238 return std::move(Coverage); 239 } 240 241 Expected<std::unique_ptr<CoverageMapping>> 242 CoverageMapping::load(StringRef ObjectFilename, StringRef ProfileFilename, 243 StringRef Arch) { 244 auto CounterMappingBuff = MemoryBuffer::getFileOrSTDIN(ObjectFilename); 245 if (std::error_code EC = CounterMappingBuff.getError()) 246 return errorCodeToError(EC); 247 auto CoverageReaderOrErr = 248 BinaryCoverageReader::create(CounterMappingBuff.get(), Arch); 249 if (Error E = CoverageReaderOrErr.takeError()) 250 return std::move(E); 251 auto CoverageReader = std::move(CoverageReaderOrErr.get()); 252 auto ProfileReaderOrErr = IndexedInstrProfReader::create(ProfileFilename); 253 if (Error E = ProfileReaderOrErr.takeError()) 254 return std::move(E); 255 auto ProfileReader = std::move(ProfileReaderOrErr.get()); 256 return load(*CoverageReader, *ProfileReader); 257 } 258 259 namespace { 260 /// \brief Distributes functions into instantiation sets. 261 /// 262 /// An instantiation set is a collection of functions that have the same source 263 /// code, ie, template functions specializations. 264 class FunctionInstantiationSetCollector { 265 typedef DenseMap<std::pair<unsigned, unsigned>, 266 std::vector<const FunctionRecord *>> MapT; 267 MapT InstantiatedFunctions; 268 269 public: 270 void insert(const FunctionRecord &Function, unsigned FileID) { 271 auto I = Function.CountedRegions.begin(), E = Function.CountedRegions.end(); 272 while (I != E && I->FileID != FileID) 273 ++I; 274 assert(I != E && "function does not cover the given file"); 275 auto &Functions = InstantiatedFunctions[I->startLoc()]; 276 Functions.push_back(&Function); 277 } 278 279 MapT::iterator begin() { return InstantiatedFunctions.begin(); } 280 281 MapT::iterator end() { return InstantiatedFunctions.end(); } 282 }; 283 284 class SegmentBuilder { 285 std::vector<CoverageSegment> &Segments; 286 SmallVector<const CountedRegion *, 8> ActiveRegions; 287 288 SegmentBuilder(std::vector<CoverageSegment> &Segments) : Segments(Segments) {} 289 290 /// Start a segment with no count specified. 291 void startSegment(unsigned Line, unsigned Col) { 292 DEBUG(dbgs() << "Top level segment at " << Line << ":" << Col << "\n"); 293 Segments.emplace_back(Line, Col, /*IsRegionEntry=*/false); 294 } 295 296 /// Start a segment with the given Region's count. 297 void startSegment(unsigned Line, unsigned Col, bool IsRegionEntry, 298 const CountedRegion &Region) { 299 // Avoid creating empty regions. 300 if (!Segments.empty() && Segments.back().Line == Line && 301 Segments.back().Col == Col) 302 Segments.pop_back(); 303 DEBUG(dbgs() << "Segment at " << Line << ":" << Col); 304 // Set this region's count. 305 if (Region.Kind != coverage::CounterMappingRegion::SkippedRegion) { 306 DEBUG(dbgs() << " with count " << Region.ExecutionCount); 307 Segments.emplace_back(Line, Col, Region.ExecutionCount, IsRegionEntry); 308 } else 309 Segments.emplace_back(Line, Col, IsRegionEntry); 310 DEBUG(dbgs() << "\n"); 311 } 312 313 /// Start a segment for the given region. 314 void startSegment(const CountedRegion &Region) { 315 startSegment(Region.LineStart, Region.ColumnStart, true, Region); 316 } 317 318 /// Pop the top region off of the active stack, starting a new segment with 319 /// the containing Region's count. 320 void popRegion() { 321 const CountedRegion *Active = ActiveRegions.back(); 322 unsigned Line = Active->LineEnd, Col = Active->ColumnEnd; 323 ActiveRegions.pop_back(); 324 if (ActiveRegions.empty()) 325 startSegment(Line, Col); 326 else 327 startSegment(Line, Col, false, *ActiveRegions.back()); 328 } 329 330 void buildSegmentsImpl(ArrayRef<CountedRegion> Regions) { 331 for (const auto &Region : Regions) { 332 // Pop any regions that end before this one starts. 333 while (!ActiveRegions.empty() && 334 ActiveRegions.back()->endLoc() <= Region.startLoc()) 335 popRegion(); 336 // Add this region to the stack. 337 ActiveRegions.push_back(&Region); 338 startSegment(Region); 339 } 340 // Pop any regions that are left in the stack. 341 while (!ActiveRegions.empty()) 342 popRegion(); 343 } 344 345 /// Sort a nested sequence of regions from a single file. 346 static void sortNestedRegions(MutableArrayRef<CountedRegion> Regions) { 347 std::sort(Regions.begin(), Regions.end(), [](const CountedRegion &LHS, 348 const CountedRegion &RHS) { 349 if (LHS.startLoc() != RHS.startLoc()) 350 return LHS.startLoc() < RHS.startLoc(); 351 if (LHS.endLoc() != RHS.endLoc()) 352 // When LHS completely contains RHS, we sort LHS first. 353 return RHS.endLoc() < LHS.endLoc(); 354 // If LHS and RHS cover the same area, we need to sort them according 355 // to their kinds so that the most suitable region will become "active" 356 // in combineRegions(). Because we accumulate counter values only from 357 // regions of the same kind as the first region of the area, prefer 358 // CodeRegion to ExpansionRegion and ExpansionRegion to SkippedRegion. 359 static_assert(coverage::CounterMappingRegion::CodeRegion < 360 coverage::CounterMappingRegion::ExpansionRegion && 361 coverage::CounterMappingRegion::ExpansionRegion < 362 coverage::CounterMappingRegion::SkippedRegion, 363 "Unexpected order of region kind values"); 364 return LHS.Kind < RHS.Kind; 365 }); 366 } 367 368 /// Combine counts of regions which cover the same area. 369 static ArrayRef<CountedRegion> 370 combineRegions(MutableArrayRef<CountedRegion> Regions) { 371 if (Regions.empty()) 372 return Regions; 373 auto Active = Regions.begin(); 374 auto End = Regions.end(); 375 for (auto I = Regions.begin() + 1; I != End; ++I) { 376 if (Active->startLoc() != I->startLoc() || 377 Active->endLoc() != I->endLoc()) { 378 // Shift to the next region. 379 ++Active; 380 if (Active != I) 381 *Active = *I; 382 continue; 383 } 384 // Merge duplicate region. 385 // If CodeRegions and ExpansionRegions cover the same area, it's probably 386 // a macro which is fully expanded to another macro. In that case, we need 387 // to accumulate counts only from CodeRegions, or else the area will be 388 // counted twice. 389 // On the other hand, a macro may have a nested macro in its body. If the 390 // outer macro is used several times, the ExpansionRegion for the nested 391 // macro will also be added several times. These ExpansionRegions cover 392 // the same source locations and have to be combined to reach the correct 393 // value for that area. 394 // We add counts of the regions of the same kind as the active region 395 // to handle the both situations. 396 if (I->Kind == Active->Kind) 397 Active->ExecutionCount += I->ExecutionCount; 398 } 399 return Regions.drop_back(std::distance(++Active, End)); 400 } 401 402 public: 403 /// Build a list of CoverageSegments from a list of Regions. 404 static std::vector<CoverageSegment> 405 buildSegments(MutableArrayRef<CountedRegion> Regions) { 406 std::vector<CoverageSegment> Segments; 407 SegmentBuilder Builder(Segments); 408 409 sortNestedRegions(Regions); 410 ArrayRef<CountedRegion> CombinedRegions = combineRegions(Regions); 411 412 Builder.buildSegmentsImpl(CombinedRegions); 413 return Segments; 414 } 415 }; 416 } 417 418 std::vector<StringRef> CoverageMapping::getUniqueSourceFiles() const { 419 std::vector<StringRef> Filenames; 420 for (const auto &Function : getCoveredFunctions()) 421 Filenames.insert(Filenames.end(), Function.Filenames.begin(), 422 Function.Filenames.end()); 423 std::sort(Filenames.begin(), Filenames.end()); 424 auto Last = std::unique(Filenames.begin(), Filenames.end()); 425 Filenames.erase(Last, Filenames.end()); 426 return Filenames; 427 } 428 429 static SmallBitVector gatherFileIDs(StringRef SourceFile, 430 const FunctionRecord &Function) { 431 SmallBitVector FilenameEquivalence(Function.Filenames.size(), false); 432 for (unsigned I = 0, E = Function.Filenames.size(); I < E; ++I) 433 if (SourceFile == Function.Filenames[I]) 434 FilenameEquivalence[I] = true; 435 return FilenameEquivalence; 436 } 437 438 /// Return the ID of the file where the definition of the function is located. 439 static Optional<unsigned> findMainViewFileID(const FunctionRecord &Function) { 440 SmallBitVector IsNotExpandedFile(Function.Filenames.size(), true); 441 for (const auto &CR : Function.CountedRegions) 442 if (CR.Kind == CounterMappingRegion::ExpansionRegion) 443 IsNotExpandedFile[CR.ExpandedFileID] = false; 444 int I = IsNotExpandedFile.find_first(); 445 if (I == -1) 446 return None; 447 return I; 448 } 449 450 /// Check if SourceFile is the file that contains the definition of 451 /// the Function. Return the ID of the file in that case or None otherwise. 452 static Optional<unsigned> findMainViewFileID(StringRef SourceFile, 453 const FunctionRecord &Function) { 454 Optional<unsigned> I = findMainViewFileID(Function); 455 if (I && SourceFile == Function.Filenames[*I]) 456 return I; 457 return None; 458 } 459 460 static bool isExpansion(const CountedRegion &R, unsigned FileID) { 461 return R.Kind == CounterMappingRegion::ExpansionRegion && R.FileID == FileID; 462 } 463 464 CoverageData CoverageMapping::getCoverageForFile(StringRef Filename) const { 465 CoverageData FileCoverage(Filename); 466 std::vector<coverage::CountedRegion> Regions; 467 468 for (const auto &Function : Functions) { 469 auto MainFileID = findMainViewFileID(Filename, Function); 470 auto FileIDs = gatherFileIDs(Filename, Function); 471 for (const auto &CR : Function.CountedRegions) 472 if (FileIDs.test(CR.FileID)) { 473 Regions.push_back(CR); 474 if (MainFileID && isExpansion(CR, *MainFileID)) 475 FileCoverage.Expansions.emplace_back(CR, Function); 476 } 477 } 478 479 DEBUG(dbgs() << "Emitting segments for file: " << Filename << "\n"); 480 FileCoverage.Segments = SegmentBuilder::buildSegments(Regions); 481 482 return FileCoverage; 483 } 484 485 std::vector<const FunctionRecord *> 486 CoverageMapping::getInstantiations(StringRef Filename) const { 487 FunctionInstantiationSetCollector InstantiationSetCollector; 488 for (const auto &Function : Functions) { 489 auto MainFileID = findMainViewFileID(Filename, Function); 490 if (!MainFileID) 491 continue; 492 InstantiationSetCollector.insert(Function, *MainFileID); 493 } 494 495 std::vector<const FunctionRecord *> Result; 496 for (const auto &InstantiationSet : InstantiationSetCollector) { 497 if (InstantiationSet.second.size() < 2) 498 continue; 499 Result.insert(Result.end(), InstantiationSet.second.begin(), 500 InstantiationSet.second.end()); 501 } 502 return Result; 503 } 504 505 CoverageData 506 CoverageMapping::getCoverageForFunction(const FunctionRecord &Function) const { 507 auto MainFileID = findMainViewFileID(Function); 508 if (!MainFileID) 509 return CoverageData(); 510 511 CoverageData FunctionCoverage(Function.Filenames[*MainFileID]); 512 std::vector<coverage::CountedRegion> Regions; 513 for (const auto &CR : Function.CountedRegions) 514 if (CR.FileID == *MainFileID) { 515 Regions.push_back(CR); 516 if (isExpansion(CR, *MainFileID)) 517 FunctionCoverage.Expansions.emplace_back(CR, Function); 518 } 519 520 DEBUG(dbgs() << "Emitting segments for function: " << Function.Name << "\n"); 521 FunctionCoverage.Segments = SegmentBuilder::buildSegments(Regions); 522 523 return FunctionCoverage; 524 } 525 526 CoverageData CoverageMapping::getCoverageForExpansion( 527 const ExpansionRecord &Expansion) const { 528 CoverageData ExpansionCoverage( 529 Expansion.Function.Filenames[Expansion.FileID]); 530 std::vector<coverage::CountedRegion> Regions; 531 for (const auto &CR : Expansion.Function.CountedRegions) 532 if (CR.FileID == Expansion.FileID) { 533 Regions.push_back(CR); 534 if (isExpansion(CR, Expansion.FileID)) 535 ExpansionCoverage.Expansions.emplace_back(CR, Expansion.Function); 536 } 537 538 DEBUG(dbgs() << "Emitting segments for expansion of file " << Expansion.FileID 539 << "\n"); 540 ExpansionCoverage.Segments = SegmentBuilder::buildSegments(Regions); 541 542 return ExpansionCoverage; 543 } 544 545 namespace { 546 std::string getCoverageMapErrString(coveragemap_error Err) { 547 switch (Err) { 548 case coveragemap_error::success: 549 return "Success"; 550 case coveragemap_error::eof: 551 return "End of File"; 552 case coveragemap_error::no_data_found: 553 return "No coverage data found"; 554 case coveragemap_error::unsupported_version: 555 return "Unsupported coverage format version"; 556 case coveragemap_error::truncated: 557 return "Truncated coverage data"; 558 case coveragemap_error::malformed: 559 return "Malformed coverage data"; 560 } 561 llvm_unreachable("A value of coveragemap_error has no message."); 562 } 563 564 // FIXME: This class is only here to support the transition to llvm::Error. It 565 // will be removed once this transition is complete. Clients should prefer to 566 // deal with the Error value directly, rather than converting to error_code. 567 class CoverageMappingErrorCategoryType : public std::error_category { 568 const char *name() const LLVM_NOEXCEPT override { return "llvm.coveragemap"; } 569 std::string message(int IE) const override { 570 return getCoverageMapErrString(static_cast<coveragemap_error>(IE)); 571 } 572 }; 573 } // end anonymous namespace 574 575 std::string CoverageMapError::message() const { 576 return getCoverageMapErrString(Err); 577 } 578 579 static ManagedStatic<CoverageMappingErrorCategoryType> ErrorCategory; 580 581 const std::error_category &llvm::coverage::coveragemap_category() { 582 return *ErrorCategory; 583 } 584 585 char CoverageMapError::ID = 0; 586