15ffd83dbSDimitry Andric //===- DwarfTransformer.cpp -----------------------------------------------===// 25ffd83dbSDimitry Andric // 35ffd83dbSDimitry Andric // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 45ffd83dbSDimitry Andric // See https://llvm.org/LICENSE.txt for license information. 55ffd83dbSDimitry Andric // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 65ffd83dbSDimitry Andric // 75ffd83dbSDimitry Andric //===----------------------------------------------------------------------===// 85ffd83dbSDimitry Andric 95ffd83dbSDimitry Andric #include <thread> 105ffd83dbSDimitry Andric #include <unordered_set> 115ffd83dbSDimitry Andric 125ffd83dbSDimitry Andric #include "llvm/DebugInfo/DIContext.h" 135ffd83dbSDimitry Andric #include "llvm/DebugInfo/DWARF/DWARFContext.h" 145ffd83dbSDimitry Andric #include "llvm/Support/Error.h" 155ffd83dbSDimitry Andric #include "llvm/Support/ThreadPool.h" 165ffd83dbSDimitry Andric #include "llvm/Support/raw_ostream.h" 175ffd83dbSDimitry Andric 185ffd83dbSDimitry Andric #include "llvm/DebugInfo/GSYM/DwarfTransformer.h" 195ffd83dbSDimitry Andric #include "llvm/DebugInfo/GSYM/FunctionInfo.h" 205ffd83dbSDimitry Andric #include "llvm/DebugInfo/GSYM/GsymCreator.h" 215ffd83dbSDimitry Andric #include "llvm/DebugInfo/GSYM/GsymReader.h" 225ffd83dbSDimitry Andric #include "llvm/DebugInfo/GSYM/InlineInfo.h" 235ffd83dbSDimitry Andric 245ffd83dbSDimitry Andric using namespace llvm; 255ffd83dbSDimitry Andric using namespace gsym; 265ffd83dbSDimitry Andric 275ffd83dbSDimitry Andric struct llvm::gsym::CUInfo { 285ffd83dbSDimitry Andric const DWARFDebugLine::LineTable *LineTable; 295ffd83dbSDimitry Andric const char *CompDir; 305ffd83dbSDimitry Andric std::vector<uint32_t> FileCache; 315ffd83dbSDimitry Andric uint64_t Language = 0; 325ffd83dbSDimitry Andric uint8_t AddrSize = 0; 335ffd83dbSDimitry Andric 345ffd83dbSDimitry Andric CUInfo(DWARFContext &DICtx, DWARFCompileUnit *CU) { 355ffd83dbSDimitry Andric LineTable = DICtx.getLineTableForUnit(CU); 365ffd83dbSDimitry Andric CompDir = CU->getCompilationDir(); 375ffd83dbSDimitry Andric FileCache.clear(); 385ffd83dbSDimitry Andric if (LineTable) 395ffd83dbSDimitry Andric FileCache.assign(LineTable->Prologue.FileNames.size() + 1, UINT32_MAX); 405ffd83dbSDimitry Andric DWARFDie Die = CU->getUnitDIE(); 415ffd83dbSDimitry Andric Language = dwarf::toUnsigned(Die.find(dwarf::DW_AT_language), 0); 425ffd83dbSDimitry Andric AddrSize = CU->getAddressByteSize(); 435ffd83dbSDimitry Andric } 445ffd83dbSDimitry Andric 455ffd83dbSDimitry Andric /// Return true if Addr is the highest address for a given compile unit. The 465ffd83dbSDimitry Andric /// highest address is encoded as -1, of all ones in the address. These high 475ffd83dbSDimitry Andric /// addresses are used by some linkers to indicate that a function has been 485ffd83dbSDimitry Andric /// dead stripped or didn't end up in the linked executable. 495ffd83dbSDimitry Andric bool isHighestAddress(uint64_t Addr) const { 505ffd83dbSDimitry Andric if (AddrSize == 4) 515ffd83dbSDimitry Andric return Addr == UINT32_MAX; 525ffd83dbSDimitry Andric else if (AddrSize == 8) 535ffd83dbSDimitry Andric return Addr == UINT64_MAX; 545ffd83dbSDimitry Andric return false; 555ffd83dbSDimitry Andric } 565ffd83dbSDimitry Andric 575ffd83dbSDimitry Andric /// Convert a DWARF compile unit file index into a GSYM global file index. 585ffd83dbSDimitry Andric /// 595ffd83dbSDimitry Andric /// Each compile unit in DWARF has its own file table in the line table 605ffd83dbSDimitry Andric /// prologue. GSYM has a single large file table that applies to all files 615ffd83dbSDimitry Andric /// from all of the info in a GSYM file. This function converts between the 625ffd83dbSDimitry Andric /// two and caches and DWARF CU file index that has already been converted so 635ffd83dbSDimitry Andric /// the first client that asks for a compile unit file index will end up 645ffd83dbSDimitry Andric /// doing the conversion, and subsequent clients will get the cached GSYM 655ffd83dbSDimitry Andric /// index. 665ffd83dbSDimitry Andric uint32_t DWARFToGSYMFileIndex(GsymCreator &Gsym, uint32_t DwarfFileIdx) { 675ffd83dbSDimitry Andric if (!LineTable) 685ffd83dbSDimitry Andric return 0; 695ffd83dbSDimitry Andric assert(DwarfFileIdx < FileCache.size()); 705ffd83dbSDimitry Andric uint32_t &GsymFileIdx = FileCache[DwarfFileIdx]; 715ffd83dbSDimitry Andric if (GsymFileIdx != UINT32_MAX) 725ffd83dbSDimitry Andric return GsymFileIdx; 735ffd83dbSDimitry Andric std::string File; 745ffd83dbSDimitry Andric if (LineTable->getFileNameByIndex( 755ffd83dbSDimitry Andric DwarfFileIdx, CompDir, 765ffd83dbSDimitry Andric DILineInfoSpecifier::FileLineInfoKind::AbsoluteFilePath, File)) 775ffd83dbSDimitry Andric GsymFileIdx = Gsym.insertFile(File); 785ffd83dbSDimitry Andric else 795ffd83dbSDimitry Andric GsymFileIdx = 0; 805ffd83dbSDimitry Andric return GsymFileIdx; 815ffd83dbSDimitry Andric } 825ffd83dbSDimitry Andric }; 835ffd83dbSDimitry Andric 845ffd83dbSDimitry Andric 855ffd83dbSDimitry Andric static DWARFDie GetParentDeclContextDIE(DWARFDie &Die) { 865ffd83dbSDimitry Andric if (DWARFDie SpecDie = 875ffd83dbSDimitry Andric Die.getAttributeValueAsReferencedDie(dwarf::DW_AT_specification)) { 885ffd83dbSDimitry Andric if (DWARFDie SpecParent = GetParentDeclContextDIE(SpecDie)) 895ffd83dbSDimitry Andric return SpecParent; 905ffd83dbSDimitry Andric } 915ffd83dbSDimitry Andric if (DWARFDie AbstDie = 925ffd83dbSDimitry Andric Die.getAttributeValueAsReferencedDie(dwarf::DW_AT_abstract_origin)) { 935ffd83dbSDimitry Andric if (DWARFDie AbstParent = GetParentDeclContextDIE(AbstDie)) 945ffd83dbSDimitry Andric return AbstParent; 955ffd83dbSDimitry Andric } 965ffd83dbSDimitry Andric 975ffd83dbSDimitry Andric // We never want to follow parent for inlined subroutine - that would 985ffd83dbSDimitry Andric // give us information about where the function is inlined, not what 995ffd83dbSDimitry Andric // function is inlined 1005ffd83dbSDimitry Andric if (Die.getTag() == dwarf::DW_TAG_inlined_subroutine) 1015ffd83dbSDimitry Andric return DWARFDie(); 1025ffd83dbSDimitry Andric 1035ffd83dbSDimitry Andric DWARFDie ParentDie = Die.getParent(); 1045ffd83dbSDimitry Andric if (!ParentDie) 1055ffd83dbSDimitry Andric return DWARFDie(); 1065ffd83dbSDimitry Andric 1075ffd83dbSDimitry Andric switch (ParentDie.getTag()) { 1085ffd83dbSDimitry Andric case dwarf::DW_TAG_namespace: 1095ffd83dbSDimitry Andric case dwarf::DW_TAG_structure_type: 1105ffd83dbSDimitry Andric case dwarf::DW_TAG_union_type: 1115ffd83dbSDimitry Andric case dwarf::DW_TAG_class_type: 1125ffd83dbSDimitry Andric case dwarf::DW_TAG_subprogram: 1135ffd83dbSDimitry Andric return ParentDie; // Found parent decl context DIE 1145ffd83dbSDimitry Andric case dwarf::DW_TAG_lexical_block: 1155ffd83dbSDimitry Andric return GetParentDeclContextDIE(ParentDie); 1165ffd83dbSDimitry Andric default: 1175ffd83dbSDimitry Andric break; 1185ffd83dbSDimitry Andric } 1195ffd83dbSDimitry Andric 1205ffd83dbSDimitry Andric return DWARFDie(); 1215ffd83dbSDimitry Andric } 1225ffd83dbSDimitry Andric 1235ffd83dbSDimitry Andric /// Get the GsymCreator string table offset for the qualified name for the 1245ffd83dbSDimitry Andric /// DIE passed in. This function will avoid making copies of any strings in 1255ffd83dbSDimitry Andric /// the GsymCreator when possible. We don't need to copy a string when the 1265ffd83dbSDimitry Andric /// string comes from our .debug_str section or is an inlined string in the 1275ffd83dbSDimitry Andric /// .debug_info. If we create a qualified name string in this function by 1285ffd83dbSDimitry Andric /// combining multiple strings in the DWARF string table or info, we will make 1295ffd83dbSDimitry Andric /// a copy of the string when we add it to the string table. 1305ffd83dbSDimitry Andric static Optional<uint32_t> getQualifiedNameIndex(DWARFDie &Die, 1315ffd83dbSDimitry Andric uint64_t Language, 1325ffd83dbSDimitry Andric GsymCreator &Gsym) { 1335ffd83dbSDimitry Andric // If the dwarf has mangled name, use mangled name 1345ffd83dbSDimitry Andric if (auto LinkageName = 1355ffd83dbSDimitry Andric dwarf::toString(Die.findRecursively({dwarf::DW_AT_MIPS_linkage_name, 1365ffd83dbSDimitry Andric dwarf::DW_AT_linkage_name}), 1375ffd83dbSDimitry Andric nullptr)) 1385ffd83dbSDimitry Andric return Gsym.insertString(LinkageName, /* Copy */ false); 1395ffd83dbSDimitry Andric 1405ffd83dbSDimitry Andric StringRef ShortName(Die.getName(DINameKind::ShortName)); 1415ffd83dbSDimitry Andric if (ShortName.empty()) 1425ffd83dbSDimitry Andric return llvm::None; 1435ffd83dbSDimitry Andric 1445ffd83dbSDimitry Andric // For C++ and ObjC, prepend names of all parent declaration contexts 1455ffd83dbSDimitry Andric if (!(Language == dwarf::DW_LANG_C_plus_plus || 1465ffd83dbSDimitry Andric Language == dwarf::DW_LANG_C_plus_plus_03 || 1475ffd83dbSDimitry Andric Language == dwarf::DW_LANG_C_plus_plus_11 || 1485ffd83dbSDimitry Andric Language == dwarf::DW_LANG_C_plus_plus_14 || 1495ffd83dbSDimitry Andric Language == dwarf::DW_LANG_ObjC_plus_plus || 1505ffd83dbSDimitry Andric // This should not be needed for C, but we see C++ code marked as C 1515ffd83dbSDimitry Andric // in some binaries. This should hurt, so let's do it for C as well 1525ffd83dbSDimitry Andric Language == dwarf::DW_LANG_C)) 1535ffd83dbSDimitry Andric return Gsym.insertString(ShortName, /* Copy */ false); 1545ffd83dbSDimitry Andric 1555ffd83dbSDimitry Andric // Some GCC optimizations create functions with names ending with .isra.<num> 1565ffd83dbSDimitry Andric // or .part.<num> and those names are just DW_AT_name, not DW_AT_linkage_name 1575ffd83dbSDimitry Andric // If it looks like it could be the case, don't add any prefix 1585ffd83dbSDimitry Andric if (ShortName.startswith("_Z") && 1595ffd83dbSDimitry Andric (ShortName.contains(".isra.") || ShortName.contains(".part."))) 1605ffd83dbSDimitry Andric return Gsym.insertString(ShortName, /* Copy */ false); 1615ffd83dbSDimitry Andric 1625ffd83dbSDimitry Andric DWARFDie ParentDeclCtxDie = GetParentDeclContextDIE(Die); 1635ffd83dbSDimitry Andric if (ParentDeclCtxDie) { 1645ffd83dbSDimitry Andric std::string Name = ShortName.str(); 1655ffd83dbSDimitry Andric while (ParentDeclCtxDie) { 1665ffd83dbSDimitry Andric StringRef ParentName(ParentDeclCtxDie.getName(DINameKind::ShortName)); 1675ffd83dbSDimitry Andric if (!ParentName.empty()) { 1685ffd83dbSDimitry Andric // "lambda" names are wrapped in < >. Replace with { } 1695ffd83dbSDimitry Andric // to be consistent with demangled names and not to confuse with 1705ffd83dbSDimitry Andric // templates 1715ffd83dbSDimitry Andric if (ParentName.front() == '<' && ParentName.back() == '>') 1725ffd83dbSDimitry Andric Name = "{" + ParentName.substr(1, ParentName.size() - 2).str() + "}" + 1735ffd83dbSDimitry Andric "::" + Name; 1745ffd83dbSDimitry Andric else 1755ffd83dbSDimitry Andric Name = ParentName.str() + "::" + Name; 1765ffd83dbSDimitry Andric } 1775ffd83dbSDimitry Andric ParentDeclCtxDie = GetParentDeclContextDIE(ParentDeclCtxDie); 1785ffd83dbSDimitry Andric } 1795ffd83dbSDimitry Andric // Copy the name since we created a new name in a std::string. 1805ffd83dbSDimitry Andric return Gsym.insertString(Name, /* Copy */ true); 1815ffd83dbSDimitry Andric } 1825ffd83dbSDimitry Andric // Don't copy the name since it exists in the DWARF object file. 1835ffd83dbSDimitry Andric return Gsym.insertString(ShortName, /* Copy */ false); 1845ffd83dbSDimitry Andric } 1855ffd83dbSDimitry Andric 1865ffd83dbSDimitry Andric static bool hasInlineInfo(DWARFDie Die, uint32_t Depth) { 1875ffd83dbSDimitry Andric bool CheckChildren = true; 1885ffd83dbSDimitry Andric switch (Die.getTag()) { 1895ffd83dbSDimitry Andric case dwarf::DW_TAG_subprogram: 1905ffd83dbSDimitry Andric // Don't look into functions within functions. 1915ffd83dbSDimitry Andric CheckChildren = Depth == 0; 1925ffd83dbSDimitry Andric break; 1935ffd83dbSDimitry Andric case dwarf::DW_TAG_inlined_subroutine: 1945ffd83dbSDimitry Andric return true; 1955ffd83dbSDimitry Andric default: 1965ffd83dbSDimitry Andric break; 1975ffd83dbSDimitry Andric } 1985ffd83dbSDimitry Andric if (!CheckChildren) 1995ffd83dbSDimitry Andric return false; 2005ffd83dbSDimitry Andric for (DWARFDie ChildDie : Die.children()) { 2015ffd83dbSDimitry Andric if (hasInlineInfo(ChildDie, Depth + 1)) 2025ffd83dbSDimitry Andric return true; 2035ffd83dbSDimitry Andric } 2045ffd83dbSDimitry Andric return false; 2055ffd83dbSDimitry Andric } 2065ffd83dbSDimitry Andric 2075ffd83dbSDimitry Andric static void parseInlineInfo(GsymCreator &Gsym, CUInfo &CUI, DWARFDie Die, 2085ffd83dbSDimitry Andric uint32_t Depth, FunctionInfo &FI, 2095ffd83dbSDimitry Andric InlineInfo &parent) { 2105ffd83dbSDimitry Andric if (!hasInlineInfo(Die, Depth)) 2115ffd83dbSDimitry Andric return; 2125ffd83dbSDimitry Andric 2135ffd83dbSDimitry Andric dwarf::Tag Tag = Die.getTag(); 2145ffd83dbSDimitry Andric if (Tag == dwarf::DW_TAG_inlined_subroutine) { 2155ffd83dbSDimitry Andric // create new InlineInfo and append to parent.children 2165ffd83dbSDimitry Andric InlineInfo II; 2175ffd83dbSDimitry Andric DWARFAddressRange FuncRange = 2185ffd83dbSDimitry Andric DWARFAddressRange(FI.startAddress(), FI.endAddress()); 2195ffd83dbSDimitry Andric Expected<DWARFAddressRangesVector> RangesOrError = Die.getAddressRanges(); 2205ffd83dbSDimitry Andric if (RangesOrError) { 2215ffd83dbSDimitry Andric for (const DWARFAddressRange &Range : RangesOrError.get()) { 2225ffd83dbSDimitry Andric // Check that the inlined function is within the range of the function 2235ffd83dbSDimitry Andric // info, it might not be in case of split functions 2245ffd83dbSDimitry Andric if (FuncRange.LowPC <= Range.LowPC && Range.HighPC <= FuncRange.HighPC) 2255ffd83dbSDimitry Andric II.Ranges.insert(AddressRange(Range.LowPC, Range.HighPC)); 2265ffd83dbSDimitry Andric } 2275ffd83dbSDimitry Andric } 2285ffd83dbSDimitry Andric if (II.Ranges.empty()) 2295ffd83dbSDimitry Andric return; 2305ffd83dbSDimitry Andric 2315ffd83dbSDimitry Andric if (auto NameIndex = getQualifiedNameIndex(Die, CUI.Language, Gsym)) 2325ffd83dbSDimitry Andric II.Name = *NameIndex; 2335ffd83dbSDimitry Andric II.CallFile = CUI.DWARFToGSYMFileIndex( 2345ffd83dbSDimitry Andric Gsym, dwarf::toUnsigned(Die.find(dwarf::DW_AT_call_file), 0)); 2355ffd83dbSDimitry Andric II.CallLine = dwarf::toUnsigned(Die.find(dwarf::DW_AT_call_line), 0); 2365ffd83dbSDimitry Andric // parse all children and append to parent 2375ffd83dbSDimitry Andric for (DWARFDie ChildDie : Die.children()) 2385ffd83dbSDimitry Andric parseInlineInfo(Gsym, CUI, ChildDie, Depth + 1, FI, II); 2395ffd83dbSDimitry Andric parent.Children.emplace_back(std::move(II)); 2405ffd83dbSDimitry Andric return; 2415ffd83dbSDimitry Andric } 2425ffd83dbSDimitry Andric if (Tag == dwarf::DW_TAG_subprogram || Tag == dwarf::DW_TAG_lexical_block) { 2435ffd83dbSDimitry Andric // skip this Die and just recurse down 2445ffd83dbSDimitry Andric for (DWARFDie ChildDie : Die.children()) 2455ffd83dbSDimitry Andric parseInlineInfo(Gsym, CUI, ChildDie, Depth + 1, FI, parent); 2465ffd83dbSDimitry Andric } 2475ffd83dbSDimitry Andric } 2485ffd83dbSDimitry Andric 2495ffd83dbSDimitry Andric static void convertFunctionLineTable(raw_ostream &Log, CUInfo &CUI, 2505ffd83dbSDimitry Andric DWARFDie Die, GsymCreator &Gsym, 2515ffd83dbSDimitry Andric FunctionInfo &FI) { 2525ffd83dbSDimitry Andric std::vector<uint32_t> RowVector; 2535ffd83dbSDimitry Andric const uint64_t StartAddress = FI.startAddress(); 2545ffd83dbSDimitry Andric const uint64_t EndAddress = FI.endAddress(); 2555ffd83dbSDimitry Andric const uint64_t RangeSize = EndAddress - StartAddress; 2565ffd83dbSDimitry Andric const object::SectionedAddress SecAddress{ 2575ffd83dbSDimitry Andric StartAddress, object::SectionedAddress::UndefSection}; 2585ffd83dbSDimitry Andric 2595ffd83dbSDimitry Andric 2605ffd83dbSDimitry Andric if (!CUI.LineTable->lookupAddressRange(SecAddress, RangeSize, RowVector)) { 2615ffd83dbSDimitry Andric // If we have a DW_TAG_subprogram but no line entries, fall back to using 2625ffd83dbSDimitry Andric // the DW_AT_decl_file an d DW_AT_decl_line if we have both attributes. 263349cc55cSDimitry Andric std::string FilePath = Die.getDeclFile( 264349cc55cSDimitry Andric DILineInfoSpecifier::FileLineInfoKind::AbsoluteFilePath); 265349cc55cSDimitry Andric if (FilePath.empty()) 266349cc55cSDimitry Andric return; 2675ffd83dbSDimitry Andric if (auto Line = 2685ffd83dbSDimitry Andric dwarf::toUnsigned(Die.findRecursively({dwarf::DW_AT_decl_line}))) { 269349cc55cSDimitry Andric LineEntry LE(StartAddress, Gsym.insertFile(FilePath), *Line); 2705ffd83dbSDimitry Andric FI.OptLineTable = LineTable(); 2715ffd83dbSDimitry Andric FI.OptLineTable->push(LE); 2725ffd83dbSDimitry Andric } 2735ffd83dbSDimitry Andric return; 2745ffd83dbSDimitry Andric } 2755ffd83dbSDimitry Andric 2765ffd83dbSDimitry Andric FI.OptLineTable = LineTable(); 2775ffd83dbSDimitry Andric DWARFDebugLine::Row PrevRow; 2785ffd83dbSDimitry Andric for (uint32_t RowIndex : RowVector) { 2795ffd83dbSDimitry Andric // Take file number and line/column from the row. 2805ffd83dbSDimitry Andric const DWARFDebugLine::Row &Row = CUI.LineTable->Rows[RowIndex]; 2815ffd83dbSDimitry Andric const uint32_t FileIdx = CUI.DWARFToGSYMFileIndex(Gsym, Row.File); 2825ffd83dbSDimitry Andric uint64_t RowAddress = Row.Address.Address; 2835ffd83dbSDimitry Andric // Watch out for a RowAddress that is in the middle of a line table entry 2845ffd83dbSDimitry Andric // in the DWARF. If we pass an address in between two line table entries 2855ffd83dbSDimitry Andric // we will get a RowIndex for the previous valid line table row which won't 2865ffd83dbSDimitry Andric // be contained in our function. This is usually a bug in the DWARF due to 2875ffd83dbSDimitry Andric // linker problems or LTO or other DWARF re-linking so it is worth emitting 2885ffd83dbSDimitry Andric // an error, but not worth stopping the creation of the GSYM. 2895ffd83dbSDimitry Andric if (!FI.Range.contains(RowAddress)) { 2905ffd83dbSDimitry Andric if (RowAddress < FI.Range.Start) { 2915ffd83dbSDimitry Andric Log << "error: DIE has a start address whose LowPC is between the " 2925ffd83dbSDimitry Andric "line table Row[" << RowIndex << "] with address " 2935ffd83dbSDimitry Andric << HEX64(RowAddress) << " and the next one.\n"; 2945ffd83dbSDimitry Andric Die.dump(Log, 0, DIDumpOptions::getForSingleDIE()); 2955ffd83dbSDimitry Andric RowAddress = FI.Range.Start; 2965ffd83dbSDimitry Andric } else { 2975ffd83dbSDimitry Andric continue; 2985ffd83dbSDimitry Andric } 2995ffd83dbSDimitry Andric } 3005ffd83dbSDimitry Andric 3015ffd83dbSDimitry Andric LineEntry LE(RowAddress, FileIdx, Row.Line); 3025ffd83dbSDimitry Andric if (RowIndex != RowVector[0] && Row.Address < PrevRow.Address) { 3035ffd83dbSDimitry Andric // We have seen full duplicate line tables for functions in some 3045ffd83dbSDimitry Andric // DWARF files. Watch for those here by checking the the last 3055ffd83dbSDimitry Andric // row was the function's end address (HighPC) and that the 3065ffd83dbSDimitry Andric // current line table entry's address is the same as the first 3075ffd83dbSDimitry Andric // line entry we already have in our "function_info.Lines". If 3085ffd83dbSDimitry Andric // so break out after printing a warning. 3095ffd83dbSDimitry Andric auto FirstLE = FI.OptLineTable->first(); 3105ffd83dbSDimitry Andric if (FirstLE && *FirstLE == LE) { 311fe6060f1SDimitry Andric if (!Gsym.isQuiet()) { 3125ffd83dbSDimitry Andric Log << "warning: duplicate line table detected for DIE:\n"; 3135ffd83dbSDimitry Andric Die.dump(Log, 0, DIDumpOptions::getForSingleDIE()); 314fe6060f1SDimitry Andric } 3155ffd83dbSDimitry Andric } else { 3165ffd83dbSDimitry Andric // Print out (ignore if os == nulls as this is expensive) 3175ffd83dbSDimitry Andric Log << "error: line table has addresses that do not " 3185ffd83dbSDimitry Andric << "monotonically increase:\n"; 3195ffd83dbSDimitry Andric for (uint32_t RowIndex2 : RowVector) { 3205ffd83dbSDimitry Andric CUI.LineTable->Rows[RowIndex2].dump(Log); 3215ffd83dbSDimitry Andric } 3225ffd83dbSDimitry Andric Die.dump(Log, 0, DIDumpOptions::getForSingleDIE()); 3235ffd83dbSDimitry Andric } 3245ffd83dbSDimitry Andric break; 3255ffd83dbSDimitry Andric } 3265ffd83dbSDimitry Andric 3275ffd83dbSDimitry Andric // Skip multiple line entries for the same file and line. 3285ffd83dbSDimitry Andric auto LastLE = FI.OptLineTable->last(); 3295ffd83dbSDimitry Andric if (LastLE && LastLE->File == FileIdx && LastLE->Line == Row.Line) 3305ffd83dbSDimitry Andric continue; 3315ffd83dbSDimitry Andric // Only push a row if it isn't an end sequence. End sequence markers are 3325ffd83dbSDimitry Andric // included for the last address in a function or the last contiguous 3335ffd83dbSDimitry Andric // address in a sequence. 3345ffd83dbSDimitry Andric if (Row.EndSequence) { 3355ffd83dbSDimitry Andric // End sequence means that the next line entry could have a lower address 3365ffd83dbSDimitry Andric // that the previous entries. So we clear the previous row so we don't 3375ffd83dbSDimitry Andric // trigger the line table error about address that do not monotonically 3385ffd83dbSDimitry Andric // increase. 3395ffd83dbSDimitry Andric PrevRow = DWARFDebugLine::Row(); 3405ffd83dbSDimitry Andric } else { 3415ffd83dbSDimitry Andric FI.OptLineTable->push(LE); 3425ffd83dbSDimitry Andric PrevRow = Row; 3435ffd83dbSDimitry Andric } 3445ffd83dbSDimitry Andric } 3455ffd83dbSDimitry Andric // If not line table rows were added, clear the line table so we don't encode 3465ffd83dbSDimitry Andric // on in the GSYM file. 3475ffd83dbSDimitry Andric if (FI.OptLineTable->empty()) 3485ffd83dbSDimitry Andric FI.OptLineTable = llvm::None; 3495ffd83dbSDimitry Andric } 3505ffd83dbSDimitry Andric 3515ffd83dbSDimitry Andric void DwarfTransformer::handleDie(raw_ostream &OS, CUInfo &CUI, DWARFDie Die) { 3525ffd83dbSDimitry Andric switch (Die.getTag()) { 3535ffd83dbSDimitry Andric case dwarf::DW_TAG_subprogram: { 3545ffd83dbSDimitry Andric Expected<DWARFAddressRangesVector> RangesOrError = Die.getAddressRanges(); 3555ffd83dbSDimitry Andric if (!RangesOrError) { 3565ffd83dbSDimitry Andric consumeError(RangesOrError.takeError()); 3575ffd83dbSDimitry Andric break; 3585ffd83dbSDimitry Andric } 3595ffd83dbSDimitry Andric const DWARFAddressRangesVector &Ranges = RangesOrError.get(); 3605ffd83dbSDimitry Andric if (Ranges.empty()) 3615ffd83dbSDimitry Andric break; 3625ffd83dbSDimitry Andric auto NameIndex = getQualifiedNameIndex(Die, CUI.Language, Gsym); 3635ffd83dbSDimitry Andric if (!NameIndex) { 3645ffd83dbSDimitry Andric OS << "error: function at " << HEX64(Die.getOffset()) 3655ffd83dbSDimitry Andric << " has no name\n "; 3665ffd83dbSDimitry Andric Die.dump(OS, 0, DIDumpOptions::getForSingleDIE()); 3675ffd83dbSDimitry Andric break; 3685ffd83dbSDimitry Andric } 3695ffd83dbSDimitry Andric 3705ffd83dbSDimitry Andric // Create a function_info for each range 3715ffd83dbSDimitry Andric for (const DWARFAddressRange &Range : Ranges) { 3725ffd83dbSDimitry Andric // The low PC must be less than the high PC. Many linkers don't remove 3735ffd83dbSDimitry Andric // DWARF for functions that don't get linked into the final executable. 3745ffd83dbSDimitry Andric // If both the high and low pc have relocations, linkers will often set 3755ffd83dbSDimitry Andric // the address values for both to the same value to indicate the function 3765ffd83dbSDimitry Andric // has been remove. Other linkers have been known to set the one or both 3775ffd83dbSDimitry Andric // PC values to a UINT32_MAX for 4 byte addresses and UINT64_MAX for 8 3785ffd83dbSDimitry Andric // byte addresses to indicate the function isn't valid. The check below 3795ffd83dbSDimitry Andric // tries to watch for these cases and abort if it runs into them. 3805ffd83dbSDimitry Andric if (Range.LowPC >= Range.HighPC || CUI.isHighestAddress(Range.LowPC)) 3815ffd83dbSDimitry Andric break; 3825ffd83dbSDimitry Andric 3835ffd83dbSDimitry Andric // Many linkers can't remove DWARF and might set the LowPC to zero. Since 3845ffd83dbSDimitry Andric // high PC can be an offset from the low PC in more recent DWARF versions 3855ffd83dbSDimitry Andric // we need to watch for a zero'ed low pc which we do using 3865ffd83dbSDimitry Andric // ValidTextRanges below. 3875ffd83dbSDimitry Andric if (!Gsym.IsValidTextAddress(Range.LowPC)) { 3885ffd83dbSDimitry Andric // We expect zero and -1 to be invalid addresses in DWARF depending 3895ffd83dbSDimitry Andric // on the linker of the DWARF. This indicates a function was stripped 3905ffd83dbSDimitry Andric // and the debug info wasn't able to be stripped from the DWARF. If 3915ffd83dbSDimitry Andric // the LowPC isn't zero or -1, then we should emit an error. 3925ffd83dbSDimitry Andric if (Range.LowPC != 0) { 393fe6060f1SDimitry Andric if (!Gsym.isQuiet()) { 394fe6060f1SDimitry Andric // Unexpected invalid address, emit a warning 395349cc55cSDimitry Andric OS << "warning: DIE has an address range whose start address is " 396fe6060f1SDimitry Andric "not in any executable sections (" 397fe6060f1SDimitry Andric << *Gsym.GetValidTextRanges() 398fe6060f1SDimitry Andric << ") and will not be processed:\n"; 399349cc55cSDimitry Andric Die.dump(OS, 0, DIDumpOptions::getForSingleDIE()); 4005ffd83dbSDimitry Andric } 401fe6060f1SDimitry Andric } 4025ffd83dbSDimitry Andric break; 4035ffd83dbSDimitry Andric } 4045ffd83dbSDimitry Andric 4055ffd83dbSDimitry Andric FunctionInfo FI; 4065ffd83dbSDimitry Andric FI.setStartAddress(Range.LowPC); 4075ffd83dbSDimitry Andric FI.setEndAddress(Range.HighPC); 4085ffd83dbSDimitry Andric FI.Name = *NameIndex; 4095ffd83dbSDimitry Andric if (CUI.LineTable) { 4105ffd83dbSDimitry Andric convertFunctionLineTable(OS, CUI, Die, Gsym, FI); 4115ffd83dbSDimitry Andric } 4125ffd83dbSDimitry Andric if (hasInlineInfo(Die, 0)) { 4135ffd83dbSDimitry Andric FI.Inline = InlineInfo(); 4145ffd83dbSDimitry Andric FI.Inline->Name = *NameIndex; 4155ffd83dbSDimitry Andric FI.Inline->Ranges.insert(FI.Range); 4165ffd83dbSDimitry Andric parseInlineInfo(Gsym, CUI, Die, 0, FI, *FI.Inline); 4175ffd83dbSDimitry Andric } 4185ffd83dbSDimitry Andric Gsym.addFunctionInfo(std::move(FI)); 4195ffd83dbSDimitry Andric } 4205ffd83dbSDimitry Andric } break; 4215ffd83dbSDimitry Andric default: 4225ffd83dbSDimitry Andric break; 4235ffd83dbSDimitry Andric } 4245ffd83dbSDimitry Andric for (DWARFDie ChildDie : Die.children()) 4255ffd83dbSDimitry Andric handleDie(OS, CUI, ChildDie); 4265ffd83dbSDimitry Andric } 4275ffd83dbSDimitry Andric 4285ffd83dbSDimitry Andric Error DwarfTransformer::convert(uint32_t NumThreads) { 4295ffd83dbSDimitry Andric size_t NumBefore = Gsym.getNumFunctionInfos(); 4305ffd83dbSDimitry Andric if (NumThreads == 1) { 4315ffd83dbSDimitry Andric // Parse all DWARF data from this thread, use the same string/file table 4325ffd83dbSDimitry Andric // for everything 4335ffd83dbSDimitry Andric for (const auto &CU : DICtx.compile_units()) { 4345ffd83dbSDimitry Andric DWARFDie Die = CU->getUnitDIE(false); 4355ffd83dbSDimitry Andric CUInfo CUI(DICtx, dyn_cast<DWARFCompileUnit>(CU.get())); 4365ffd83dbSDimitry Andric handleDie(Log, CUI, Die); 4375ffd83dbSDimitry Andric } 4385ffd83dbSDimitry Andric } else { 4395ffd83dbSDimitry Andric // LLVM Dwarf parser is not thread-safe and we need to parse all DWARF up 4405ffd83dbSDimitry Andric // front before we start accessing any DIEs since there might be 4415ffd83dbSDimitry Andric // cross compile unit references in the DWARF. If we don't do this we can 4425ffd83dbSDimitry Andric // end up crashing. 4435ffd83dbSDimitry Andric 4445ffd83dbSDimitry Andric // We need to call getAbbreviations sequentially first so that getUnitDIE() 4455ffd83dbSDimitry Andric // only works with its local data. 4465ffd83dbSDimitry Andric for (const auto &CU : DICtx.compile_units()) 4475ffd83dbSDimitry Andric CU->getAbbreviations(); 4485ffd83dbSDimitry Andric 4495ffd83dbSDimitry Andric // Now parse all DIEs in case we have cross compile unit references in a 4505ffd83dbSDimitry Andric // thread pool. 4515ffd83dbSDimitry Andric ThreadPool pool(hardware_concurrency(NumThreads)); 4525ffd83dbSDimitry Andric for (const auto &CU : DICtx.compile_units()) 4535ffd83dbSDimitry Andric pool.async([&CU]() { CU->getUnitDIE(false /*CUDieOnly*/); }); 4545ffd83dbSDimitry Andric pool.wait(); 4555ffd83dbSDimitry Andric 4565ffd83dbSDimitry Andric // Now convert all DWARF to GSYM in a thread pool. 4575ffd83dbSDimitry Andric std::mutex LogMutex; 4585ffd83dbSDimitry Andric for (const auto &CU : DICtx.compile_units()) { 4595ffd83dbSDimitry Andric DWARFDie Die = CU->getUnitDIE(false /*CUDieOnly*/); 4605ffd83dbSDimitry Andric if (Die) { 4615ffd83dbSDimitry Andric CUInfo CUI(DICtx, dyn_cast<DWARFCompileUnit>(CU.get())); 4625ffd83dbSDimitry Andric pool.async([this, CUI, &LogMutex, Die]() mutable { 4635ffd83dbSDimitry Andric std::string ThreadLogStorage; 4645ffd83dbSDimitry Andric raw_string_ostream ThreadOS(ThreadLogStorage); 4655ffd83dbSDimitry Andric handleDie(ThreadOS, CUI, Die); 4665ffd83dbSDimitry Andric ThreadOS.flush(); 4675ffd83dbSDimitry Andric if (!ThreadLogStorage.empty()) { 4685ffd83dbSDimitry Andric // Print ThreadLogStorage lines into an actual stream under a lock 4695ffd83dbSDimitry Andric std::lock_guard<std::mutex> guard(LogMutex); 4705ffd83dbSDimitry Andric Log << ThreadLogStorage; 4715ffd83dbSDimitry Andric } 4725ffd83dbSDimitry Andric }); 4735ffd83dbSDimitry Andric } 4745ffd83dbSDimitry Andric } 4755ffd83dbSDimitry Andric pool.wait(); 4765ffd83dbSDimitry Andric } 4775ffd83dbSDimitry Andric size_t FunctionsAddedCount = Gsym.getNumFunctionInfos() - NumBefore; 4785ffd83dbSDimitry Andric Log << "Loaded " << FunctionsAddedCount << " functions from DWARF.\n"; 4795ffd83dbSDimitry Andric return Error::success(); 4805ffd83dbSDimitry Andric } 4815ffd83dbSDimitry Andric 4825ffd83dbSDimitry Andric llvm::Error DwarfTransformer::verify(StringRef GsymPath) { 4835ffd83dbSDimitry Andric Log << "Verifying GSYM file \"" << GsymPath << "\":\n"; 4845ffd83dbSDimitry Andric 4855ffd83dbSDimitry Andric auto Gsym = GsymReader::openFile(GsymPath); 4865ffd83dbSDimitry Andric if (!Gsym) 4875ffd83dbSDimitry Andric return Gsym.takeError(); 4885ffd83dbSDimitry Andric 4895ffd83dbSDimitry Andric auto NumAddrs = Gsym->getNumAddresses(); 4905ffd83dbSDimitry Andric DILineInfoSpecifier DLIS( 4915ffd83dbSDimitry Andric DILineInfoSpecifier::FileLineInfoKind::AbsoluteFilePath, 4925ffd83dbSDimitry Andric DILineInfoSpecifier::FunctionNameKind::LinkageName); 4935ffd83dbSDimitry Andric std::string gsymFilename; 4945ffd83dbSDimitry Andric for (uint32_t I = 0; I < NumAddrs; ++I) { 4955ffd83dbSDimitry Andric auto FuncAddr = Gsym->getAddress(I); 4965ffd83dbSDimitry Andric if (!FuncAddr) 4975ffd83dbSDimitry Andric return createStringError(std::errc::invalid_argument, 4985ffd83dbSDimitry Andric "failed to extract address[%i]", I); 4995ffd83dbSDimitry Andric 5005ffd83dbSDimitry Andric auto FI = Gsym->getFunctionInfo(*FuncAddr); 5015ffd83dbSDimitry Andric if (!FI) 5025ffd83dbSDimitry Andric return createStringError(std::errc::invalid_argument, 5035ffd83dbSDimitry Andric "failed to extract function info for address 0x%" 5045ffd83dbSDimitry Andric PRIu64, *FuncAddr); 5055ffd83dbSDimitry Andric 5065ffd83dbSDimitry Andric for (auto Addr = *FuncAddr; Addr < *FuncAddr + FI->size(); ++Addr) { 5075ffd83dbSDimitry Andric const object::SectionedAddress SectAddr{ 5085ffd83dbSDimitry Andric Addr, object::SectionedAddress::UndefSection}; 5095ffd83dbSDimitry Andric auto LR = Gsym->lookup(Addr); 5105ffd83dbSDimitry Andric if (!LR) 5115ffd83dbSDimitry Andric return LR.takeError(); 5125ffd83dbSDimitry Andric 5135ffd83dbSDimitry Andric auto DwarfInlineInfos = 5145ffd83dbSDimitry Andric DICtx.getInliningInfoForAddress(SectAddr, DLIS); 5155ffd83dbSDimitry Andric uint32_t NumDwarfInlineInfos = DwarfInlineInfos.getNumberOfFrames(); 5165ffd83dbSDimitry Andric if (NumDwarfInlineInfos == 0) { 5175ffd83dbSDimitry Andric DwarfInlineInfos.addFrame( 5185ffd83dbSDimitry Andric DICtx.getLineInfoForAddress(SectAddr, DLIS)); 5195ffd83dbSDimitry Andric } 5205ffd83dbSDimitry Andric 5215ffd83dbSDimitry Andric // Check for 1 entry that has no file and line info 5225ffd83dbSDimitry Andric if (NumDwarfInlineInfos == 1 && 5235ffd83dbSDimitry Andric DwarfInlineInfos.getFrame(0).FileName == "<invalid>") { 5245ffd83dbSDimitry Andric DwarfInlineInfos = DIInliningInfo(); 5255ffd83dbSDimitry Andric NumDwarfInlineInfos = 0; 5265ffd83dbSDimitry Andric } 5275ffd83dbSDimitry Andric if (NumDwarfInlineInfos > 0 && 5285ffd83dbSDimitry Andric NumDwarfInlineInfos != LR->Locations.size()) { 5295ffd83dbSDimitry Andric Log << "error: address " << HEX64(Addr) << " has " 5305ffd83dbSDimitry Andric << NumDwarfInlineInfos << " DWARF inline frames and GSYM has " 5315ffd83dbSDimitry Andric << LR->Locations.size() << "\n"; 5325ffd83dbSDimitry Andric Log << " " << NumDwarfInlineInfos << " DWARF frames:\n"; 5335ffd83dbSDimitry Andric for (size_t Idx = 0; Idx < NumDwarfInlineInfos; ++Idx) { 534*0eae32dcSDimitry Andric const auto &dii = DwarfInlineInfos.getFrame(Idx); 5355ffd83dbSDimitry Andric Log << " [" << Idx << "]: " << dii.FunctionName << " @ " 5365ffd83dbSDimitry Andric << dii.FileName << ':' << dii.Line << '\n'; 5375ffd83dbSDimitry Andric } 5385ffd83dbSDimitry Andric Log << " " << LR->Locations.size() << " GSYM frames:\n"; 5395ffd83dbSDimitry Andric for (size_t Idx = 0, count = LR->Locations.size(); 5405ffd83dbSDimitry Andric Idx < count; ++Idx) { 5415ffd83dbSDimitry Andric const auto &gii = LR->Locations[Idx]; 5425ffd83dbSDimitry Andric Log << " [" << Idx << "]: " << gii.Name << " @ " << gii.Dir 5435ffd83dbSDimitry Andric << '/' << gii.Base << ':' << gii.Line << '\n'; 5445ffd83dbSDimitry Andric } 5455ffd83dbSDimitry Andric DwarfInlineInfos = DICtx.getInliningInfoForAddress(SectAddr, DLIS); 5465ffd83dbSDimitry Andric Gsym->dump(Log, *FI); 5475ffd83dbSDimitry Andric continue; 5485ffd83dbSDimitry Andric } 5495ffd83dbSDimitry Andric 5505ffd83dbSDimitry Andric for (size_t Idx = 0, count = LR->Locations.size(); Idx < count; 5515ffd83dbSDimitry Andric ++Idx) { 5525ffd83dbSDimitry Andric const auto &gii = LR->Locations[Idx]; 5535ffd83dbSDimitry Andric if (Idx < NumDwarfInlineInfos) { 554*0eae32dcSDimitry Andric const auto &dii = DwarfInlineInfos.getFrame(Idx); 5555ffd83dbSDimitry Andric gsymFilename = LR->getSourceFile(Idx); 5565ffd83dbSDimitry Andric // Verify function name 5575ffd83dbSDimitry Andric if (dii.FunctionName.find(gii.Name.str()) != 0) 5585ffd83dbSDimitry Andric Log << "error: address " << HEX64(Addr) << " DWARF function \"" 5595ffd83dbSDimitry Andric << dii.FunctionName.c_str() 5605ffd83dbSDimitry Andric << "\" doesn't match GSYM function \"" << gii.Name << "\"\n"; 5615ffd83dbSDimitry Andric // Verify source file path 5625ffd83dbSDimitry Andric if (dii.FileName != gsymFilename) 5635ffd83dbSDimitry Andric Log << "error: address " << HEX64(Addr) << " DWARF path \"" 5645ffd83dbSDimitry Andric << dii.FileName.c_str() << "\" doesn't match GSYM path \"" 5655ffd83dbSDimitry Andric << gsymFilename.c_str() << "\"\n"; 5665ffd83dbSDimitry Andric // Verify source file line 5675ffd83dbSDimitry Andric if (dii.Line != gii.Line) 5685ffd83dbSDimitry Andric Log << "error: address " << HEX64(Addr) << " DWARF line " 5695ffd83dbSDimitry Andric << dii.Line << " != GSYM line " << gii.Line << "\n"; 5705ffd83dbSDimitry Andric } 5715ffd83dbSDimitry Andric } 5725ffd83dbSDimitry Andric } 5735ffd83dbSDimitry Andric } 5745ffd83dbSDimitry Andric return Error::success(); 5755ffd83dbSDimitry Andric } 576