xref: /openbsd-src/gnu/llvm/lldb/source/Plugins/SymbolFile/DWARF/DWARFUnit.cpp (revision f6aab3d83b51b91c24247ad2c2573574de475a82)
1dda28197Spatrick //===-- DWARFUnit.cpp -----------------------------------------------------===//
2061da546Spatrick //
3061da546Spatrick // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4061da546Spatrick // See https://llvm.org/LICENSE.txt for license information.
5061da546Spatrick // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6061da546Spatrick //
7061da546Spatrick //===----------------------------------------------------------------------===//
8061da546Spatrick 
9061da546Spatrick #include "DWARFUnit.h"
10061da546Spatrick 
11061da546Spatrick #include "lldb/Core/Module.h"
12061da546Spatrick #include "lldb/Symbol/ObjectFile.h"
13061da546Spatrick #include "lldb/Utility/LLDBAssert.h"
14061da546Spatrick #include "lldb/Utility/StreamString.h"
15061da546Spatrick #include "lldb/Utility/Timer.h"
16*f6aab3d8Srobert #include "llvm/DebugInfo/DWARF/DWARFDebugLoc.h"
17061da546Spatrick #include "llvm/Object/Error.h"
18061da546Spatrick 
19061da546Spatrick #include "DWARFCompileUnit.h"
20061da546Spatrick #include "DWARFDebugAranges.h"
21061da546Spatrick #include "DWARFDebugInfo.h"
22061da546Spatrick #include "DWARFTypeUnit.h"
23061da546Spatrick #include "LogChannelDWARF.h"
24061da546Spatrick #include "SymbolFileDWARFDwo.h"
25*f6aab3d8Srobert #include <optional>
26061da546Spatrick 
27061da546Spatrick using namespace lldb;
28061da546Spatrick using namespace lldb_private;
29*f6aab3d8Srobert using namespace lldb_private::dwarf;
30061da546Spatrick 
31061da546Spatrick extern int g_verbose;
32061da546Spatrick 
DWARFUnit(SymbolFileDWARF & dwarf,lldb::user_id_t uid,const DWARFUnitHeader & header,const DWARFAbbreviationDeclarationSet & abbrevs,DIERef::Section section,bool is_dwo)33061da546Spatrick DWARFUnit::DWARFUnit(SymbolFileDWARF &dwarf, lldb::user_id_t uid,
34061da546Spatrick                      const DWARFUnitHeader &header,
35061da546Spatrick                      const DWARFAbbreviationDeclarationSet &abbrevs,
36061da546Spatrick                      DIERef::Section section, bool is_dwo)
37061da546Spatrick     : UserID(uid), m_dwarf(dwarf), m_header(header), m_abbrevs(&abbrevs),
38be691f3bSpatrick       m_cancel_scopes(false), m_section(section), m_is_dwo(is_dwo),
39*f6aab3d8Srobert       m_has_parsed_non_skeleton_unit(false), m_dwo_id(header.GetDWOId()) {}
40061da546Spatrick 
41061da546Spatrick DWARFUnit::~DWARFUnit() = default;
42061da546Spatrick 
43*f6aab3d8Srobert // Parses first DIE of a compile unit, excluding DWO.
ExtractUnitDIENoDwoIfNeeded()44*f6aab3d8Srobert void DWARFUnit::ExtractUnitDIENoDwoIfNeeded() {
45061da546Spatrick   {
46061da546Spatrick     llvm::sys::ScopedReader lock(m_first_die_mutex);
47061da546Spatrick     if (m_first_die)
48061da546Spatrick       return; // Already parsed
49061da546Spatrick   }
50061da546Spatrick   llvm::sys::ScopedWriter lock(m_first_die_mutex);
51061da546Spatrick   if (m_first_die)
52061da546Spatrick     return; // Already parsed
53061da546Spatrick 
54*f6aab3d8Srobert   ElapsedTime elapsed(m_dwarf.GetDebugInfoParseTimeRef());
55061da546Spatrick 
56061da546Spatrick   // Set the offset to that of the first DIE and calculate the start of the
57061da546Spatrick   // next compilation unit header.
58061da546Spatrick   lldb::offset_t offset = GetFirstDIEOffset();
59061da546Spatrick 
60061da546Spatrick   // We are in our compile unit, parse starting at the offset we were told to
61061da546Spatrick   // parse
62061da546Spatrick   const DWARFDataExtractor &data = GetData();
63061da546Spatrick   if (offset < GetNextUnitOffset() &&
64061da546Spatrick       m_first_die.Extract(data, this, &offset)) {
65061da546Spatrick     AddUnitDIE(m_first_die);
66061da546Spatrick     return;
67061da546Spatrick   }
68061da546Spatrick }
69061da546Spatrick 
70*f6aab3d8Srobert // Parses first DIE of a compile unit including DWO.
ExtractUnitDIEIfNeeded()71*f6aab3d8Srobert void DWARFUnit::ExtractUnitDIEIfNeeded() {
72*f6aab3d8Srobert   ExtractUnitDIENoDwoIfNeeded();
73*f6aab3d8Srobert 
74*f6aab3d8Srobert   if (m_has_parsed_non_skeleton_unit)
75*f6aab3d8Srobert     return;
76*f6aab3d8Srobert 
77*f6aab3d8Srobert   m_has_parsed_non_skeleton_unit = true;
78*f6aab3d8Srobert   m_dwo_error.Clear();
79*f6aab3d8Srobert 
80*f6aab3d8Srobert   if (!m_dwo_id)
81*f6aab3d8Srobert     return; // No DWO file.
82*f6aab3d8Srobert 
83*f6aab3d8Srobert   std::shared_ptr<SymbolFileDWARFDwo> dwo_symbol_file =
84*f6aab3d8Srobert       m_dwarf.GetDwoSymbolFileForCompileUnit(*this, m_first_die);
85*f6aab3d8Srobert   if (!dwo_symbol_file)
86*f6aab3d8Srobert     return;
87*f6aab3d8Srobert 
88*f6aab3d8Srobert   DWARFUnit *dwo_cu = dwo_symbol_file->GetDWOCompileUnitForHash(*m_dwo_id);
89*f6aab3d8Srobert 
90*f6aab3d8Srobert   if (!dwo_cu) {
91*f6aab3d8Srobert     SetDwoError(Status::createWithFormat(
92*f6aab3d8Srobert         "unable to load .dwo file from \"{0}\" due to ID ({1:x16}) mismatch "
93*f6aab3d8Srobert         "for skeleton DIE at {2:x8}",
94*f6aab3d8Srobert         dwo_symbol_file->GetObjectFile()->GetFileSpec().GetPath().c_str(),
95*f6aab3d8Srobert         *m_dwo_id, m_first_die.GetOffset()));
96*f6aab3d8Srobert     return; // Can't fetch the compile unit from the dwo file.
97*f6aab3d8Srobert   }
98*f6aab3d8Srobert   dwo_cu->SetUserData(this);
99*f6aab3d8Srobert 
100*f6aab3d8Srobert   DWARFBaseDIE dwo_cu_die = dwo_cu->GetUnitDIEOnly();
101*f6aab3d8Srobert   if (!dwo_cu_die.IsValid()) {
102*f6aab3d8Srobert     // Can't fetch the compile unit DIE from the dwo file.
103*f6aab3d8Srobert     SetDwoError(Status::createWithFormat(
104*f6aab3d8Srobert         "unable to extract compile unit DIE from .dwo file for skeleton "
105*f6aab3d8Srobert         "DIE at {0:x16}",
106*f6aab3d8Srobert         m_first_die.GetOffset()));
107*f6aab3d8Srobert     return;
108*f6aab3d8Srobert   }
109*f6aab3d8Srobert 
110*f6aab3d8Srobert   // Here for DWO CU we want to use the address base set in the skeleton unit
111*f6aab3d8Srobert   // (DW_AT_addr_base) if it is available and use the DW_AT_GNU_addr_base
112*f6aab3d8Srobert   // otherwise. We do that because pre-DWARF v5 could use the DW_AT_GNU_*
113*f6aab3d8Srobert   // attributes which were applicable to the DWO units. The corresponding
114*f6aab3d8Srobert   // DW_AT_* attributes standardized in DWARF v5 are also applicable to the
115*f6aab3d8Srobert   // main unit in contrast.
116*f6aab3d8Srobert   if (m_addr_base)
117*f6aab3d8Srobert     dwo_cu->SetAddrBase(*m_addr_base);
118*f6aab3d8Srobert   else if (m_gnu_addr_base)
119*f6aab3d8Srobert     dwo_cu->SetAddrBase(*m_gnu_addr_base);
120*f6aab3d8Srobert 
121*f6aab3d8Srobert   if (GetVersion() <= 4 && m_gnu_ranges_base)
122*f6aab3d8Srobert     dwo_cu->SetRangesBase(*m_gnu_ranges_base);
123*f6aab3d8Srobert   else if (dwo_symbol_file->GetDWARFContext()
124*f6aab3d8Srobert                .getOrLoadRngListsData()
125*f6aab3d8Srobert                .GetByteSize() > 0)
126*f6aab3d8Srobert     dwo_cu->SetRangesBase(llvm::DWARFListTableHeader::getHeaderSize(DWARF32));
127*f6aab3d8Srobert 
128*f6aab3d8Srobert   if (GetVersion() >= 5 &&
129*f6aab3d8Srobert       dwo_symbol_file->GetDWARFContext().getOrLoadLocListsData().GetByteSize() >
130*f6aab3d8Srobert           0)
131*f6aab3d8Srobert     dwo_cu->SetLoclistsBase(llvm::DWARFListTableHeader::getHeaderSize(DWARF32));
132*f6aab3d8Srobert 
133*f6aab3d8Srobert   dwo_cu->SetBaseAddress(GetBaseAddress());
134*f6aab3d8Srobert 
135*f6aab3d8Srobert   m_dwo = std::shared_ptr<DWARFUnit>(std::move(dwo_symbol_file), dwo_cu);
136*f6aab3d8Srobert }
137*f6aab3d8Srobert 
138061da546Spatrick // Parses a compile unit and indexes its DIEs if it hasn't already been done.
139061da546Spatrick // It will leave this compile unit extracted forever.
ExtractDIEsIfNeeded()140061da546Spatrick void DWARFUnit::ExtractDIEsIfNeeded() {
141061da546Spatrick   m_cancel_scopes = true;
142061da546Spatrick 
143061da546Spatrick   {
144061da546Spatrick     llvm::sys::ScopedReader lock(m_die_array_mutex);
145061da546Spatrick     if (!m_die_array.empty())
146061da546Spatrick       return; // Already parsed
147061da546Spatrick   }
148061da546Spatrick   llvm::sys::ScopedWriter lock(m_die_array_mutex);
149061da546Spatrick   if (!m_die_array.empty())
150061da546Spatrick     return; // Already parsed
151061da546Spatrick 
152061da546Spatrick   ExtractDIEsRWLocked();
153061da546Spatrick }
154061da546Spatrick 
155061da546Spatrick // Parses a compile unit and indexes its DIEs if it hasn't already been done.
156061da546Spatrick // It will clear this compile unit after returned instance gets out of scope,
157061da546Spatrick // no other ScopedExtractDIEs instance is running for this compile unit
158061da546Spatrick // and no ExtractDIEsIfNeeded() has been executed during this ScopedExtractDIEs
159061da546Spatrick // lifetime.
ExtractDIEsScoped()160061da546Spatrick DWARFUnit::ScopedExtractDIEs DWARFUnit::ExtractDIEsScoped() {
161061da546Spatrick   ScopedExtractDIEs scoped(*this);
162061da546Spatrick 
163061da546Spatrick   {
164061da546Spatrick     llvm::sys::ScopedReader lock(m_die_array_mutex);
165061da546Spatrick     if (!m_die_array.empty())
166061da546Spatrick       return scoped; // Already parsed
167061da546Spatrick   }
168061da546Spatrick   llvm::sys::ScopedWriter lock(m_die_array_mutex);
169061da546Spatrick   if (!m_die_array.empty())
170061da546Spatrick     return scoped; // Already parsed
171061da546Spatrick 
172061da546Spatrick   // Otherwise m_die_array would be already populated.
173061da546Spatrick   lldbassert(!m_cancel_scopes);
174061da546Spatrick 
175061da546Spatrick   ExtractDIEsRWLocked();
176061da546Spatrick   scoped.m_clear_dies = true;
177061da546Spatrick   return scoped;
178061da546Spatrick }
179061da546Spatrick 
ScopedExtractDIEs(DWARFUnit & cu)180061da546Spatrick DWARFUnit::ScopedExtractDIEs::ScopedExtractDIEs(DWARFUnit &cu) : m_cu(&cu) {
181061da546Spatrick   m_cu->m_die_array_scoped_mutex.lock_shared();
182061da546Spatrick }
183061da546Spatrick 
~ScopedExtractDIEs()184061da546Spatrick DWARFUnit::ScopedExtractDIEs::~ScopedExtractDIEs() {
185061da546Spatrick   if (!m_cu)
186061da546Spatrick     return;
187061da546Spatrick   m_cu->m_die_array_scoped_mutex.unlock_shared();
188061da546Spatrick   if (!m_clear_dies || m_cu->m_cancel_scopes)
189061da546Spatrick     return;
190061da546Spatrick   // Be sure no other ScopedExtractDIEs is running anymore.
191061da546Spatrick   llvm::sys::ScopedWriter lock_scoped(m_cu->m_die_array_scoped_mutex);
192061da546Spatrick   llvm::sys::ScopedWriter lock(m_cu->m_die_array_mutex);
193061da546Spatrick   if (m_cu->m_cancel_scopes)
194061da546Spatrick     return;
195061da546Spatrick   m_cu->ClearDIEsRWLocked();
196061da546Spatrick }
197061da546Spatrick 
ScopedExtractDIEs(ScopedExtractDIEs && rhs)198061da546Spatrick DWARFUnit::ScopedExtractDIEs::ScopedExtractDIEs(ScopedExtractDIEs &&rhs)
199061da546Spatrick     : m_cu(rhs.m_cu), m_clear_dies(rhs.m_clear_dies) {
200061da546Spatrick   rhs.m_cu = nullptr;
201061da546Spatrick }
202061da546Spatrick 
operator =(DWARFUnit::ScopedExtractDIEs && rhs)203061da546Spatrick DWARFUnit::ScopedExtractDIEs &DWARFUnit::ScopedExtractDIEs::operator=(
204061da546Spatrick     DWARFUnit::ScopedExtractDIEs &&rhs) {
205061da546Spatrick   m_cu = rhs.m_cu;
206061da546Spatrick   rhs.m_cu = nullptr;
207061da546Spatrick   m_clear_dies = rhs.m_clear_dies;
208061da546Spatrick   return *this;
209061da546Spatrick }
210061da546Spatrick 
211061da546Spatrick // Parses a compile unit and indexes its DIEs, m_die_array_mutex must be
212061da546Spatrick // held R/W and m_die_array must be empty.
ExtractDIEsRWLocked()213061da546Spatrick void DWARFUnit::ExtractDIEsRWLocked() {
214061da546Spatrick   llvm::sys::ScopedWriter first_die_lock(m_first_die_mutex);
215061da546Spatrick 
216*f6aab3d8Srobert   ElapsedTime elapsed(m_dwarf.GetDebugInfoParseTimeRef());
217*f6aab3d8Srobert   LLDB_SCOPED_TIMERF(
218*f6aab3d8Srobert       "%s",
219*f6aab3d8Srobert       llvm::formatv("{0:x16}: DWARFUnit::ExtractDIEsIfNeeded()", GetOffset())
220*f6aab3d8Srobert           .str()
221*f6aab3d8Srobert           .c_str());
222061da546Spatrick 
223061da546Spatrick   // Set the offset to that of the first DIE and calculate the start of the
224061da546Spatrick   // next compilation unit header.
225061da546Spatrick   lldb::offset_t offset = GetFirstDIEOffset();
226061da546Spatrick   lldb::offset_t next_cu_offset = GetNextUnitOffset();
227061da546Spatrick 
228061da546Spatrick   DWARFDebugInfoEntry die;
229061da546Spatrick 
230061da546Spatrick   uint32_t depth = 0;
231061da546Spatrick   // We are in our compile unit, parse starting at the offset we were told to
232061da546Spatrick   // parse
233061da546Spatrick   const DWARFDataExtractor &data = GetData();
234061da546Spatrick   std::vector<uint32_t> die_index_stack;
235061da546Spatrick   die_index_stack.reserve(32);
236061da546Spatrick   die_index_stack.push_back(0);
237061da546Spatrick   bool prev_die_had_children = false;
238061da546Spatrick   while (offset < next_cu_offset && die.Extract(data, this, &offset)) {
239061da546Spatrick     const bool null_die = die.IsNULL();
240061da546Spatrick     if (depth == 0) {
241061da546Spatrick       assert(m_die_array.empty() && "Compile unit DIE already added");
242061da546Spatrick 
243061da546Spatrick       // The average bytes per DIE entry has been seen to be around 14-20 so
244061da546Spatrick       // lets pre-reserve half of that since we are now stripping the NULL
245061da546Spatrick       // tags.
246061da546Spatrick 
247061da546Spatrick       // Only reserve the memory if we are adding children of the main
248061da546Spatrick       // compile unit DIE. The compile unit DIE is always the first entry, so
249061da546Spatrick       // if our size is 1, then we are adding the first compile unit child
250061da546Spatrick       // DIE and should reserve the memory.
251061da546Spatrick       m_die_array.reserve(GetDebugInfoSize() / 24);
252061da546Spatrick       m_die_array.push_back(die);
253061da546Spatrick 
254061da546Spatrick       if (!m_first_die)
255061da546Spatrick         AddUnitDIE(m_die_array.front());
256061da546Spatrick 
257061da546Spatrick       // With -fsplit-dwarf-inlining, clang will emit non-empty skeleton compile
258061da546Spatrick       // units. We are not able to access these DIE *and* the dwo file
259061da546Spatrick       // simultaneously. We also don't need to do that as the dwo file will
260061da546Spatrick       // contain a superset of information. So, we don't even attempt to parse
261061da546Spatrick       // any remaining DIEs.
262dda28197Spatrick       if (m_dwo) {
263061da546Spatrick         m_die_array.front().SetHasChildren(false);
264061da546Spatrick         break;
265061da546Spatrick       }
266061da546Spatrick 
267061da546Spatrick     } else {
268061da546Spatrick       if (null_die) {
269061da546Spatrick         if (prev_die_had_children) {
270061da546Spatrick           // This will only happen if a DIE says is has children but all it
271061da546Spatrick           // contains is a NULL tag. Since we are removing the NULL DIEs from
272061da546Spatrick           // the list (saves up to 25% in C++ code), we need a way to let the
273061da546Spatrick           // DIE know that it actually doesn't have children.
274061da546Spatrick           if (!m_die_array.empty())
275061da546Spatrick             m_die_array.back().SetHasChildren(false);
276061da546Spatrick         }
277061da546Spatrick       } else {
278061da546Spatrick         die.SetParentIndex(m_die_array.size() - die_index_stack[depth - 1]);
279061da546Spatrick 
280061da546Spatrick         if (die_index_stack.back())
281061da546Spatrick           m_die_array[die_index_stack.back()].SetSiblingIndex(
282061da546Spatrick               m_die_array.size() - die_index_stack.back());
283061da546Spatrick 
284061da546Spatrick         // Only push the DIE if it isn't a NULL DIE
285061da546Spatrick         m_die_array.push_back(die);
286061da546Spatrick       }
287061da546Spatrick     }
288061da546Spatrick 
289061da546Spatrick     if (null_die) {
290061da546Spatrick       // NULL DIE.
291061da546Spatrick       if (!die_index_stack.empty())
292061da546Spatrick         die_index_stack.pop_back();
293061da546Spatrick 
294061da546Spatrick       if (depth > 0)
295061da546Spatrick         --depth;
296061da546Spatrick       prev_die_had_children = false;
297061da546Spatrick     } else {
298061da546Spatrick       die_index_stack.back() = m_die_array.size() - 1;
299061da546Spatrick       // Normal DIE
300061da546Spatrick       const bool die_has_children = die.HasChildren();
301061da546Spatrick       if (die_has_children) {
302061da546Spatrick         die_index_stack.push_back(0);
303061da546Spatrick         ++depth;
304061da546Spatrick       }
305061da546Spatrick       prev_die_had_children = die_has_children;
306061da546Spatrick     }
307061da546Spatrick 
308061da546Spatrick     if (depth == 0)
309061da546Spatrick       break; // We are done with this compile unit!
310061da546Spatrick   }
311061da546Spatrick 
312061da546Spatrick   if (!m_die_array.empty()) {
313be691f3bSpatrick     // The last die cannot have children (if it did, it wouldn't be the last one).
314be691f3bSpatrick     // This only makes a difference for malformed dwarf that does not have a
315be691f3bSpatrick     // terminating null die.
316be691f3bSpatrick     m_die_array.back().SetHasChildren(false);
317be691f3bSpatrick 
318061da546Spatrick     if (m_first_die) {
319061da546Spatrick       // Only needed for the assertion.
320061da546Spatrick       m_first_die.SetHasChildren(m_die_array.front().HasChildren());
321061da546Spatrick       lldbassert(m_first_die == m_die_array.front());
322061da546Spatrick     }
323061da546Spatrick     m_first_die = m_die_array.front();
324061da546Spatrick   }
325061da546Spatrick 
326061da546Spatrick   m_die_array.shrink_to_fit();
327061da546Spatrick 
328dda28197Spatrick   if (m_dwo)
329dda28197Spatrick     m_dwo->ExtractDIEsIfNeeded();
330061da546Spatrick }
331061da546Spatrick 
332061da546Spatrick // This is used when a split dwarf is enabled.
333061da546Spatrick // A skeleton compilation unit may contain the DW_AT_str_offsets_base attribute
334061da546Spatrick // that points to the first string offset of the CU contribution to the
335061da546Spatrick // .debug_str_offsets. At the same time, the corresponding split debug unit also
336061da546Spatrick // may use DW_FORM_strx* forms pointing to its own .debug_str_offsets.dwo and
337061da546Spatrick // for that case, we should find the offset (skip the section header).
SetDwoStrOffsetsBase()338dda28197Spatrick void DWARFUnit::SetDwoStrOffsetsBase() {
339061da546Spatrick   lldb::offset_t baseOffset = 0;
340061da546Spatrick 
341dda28197Spatrick   if (const llvm::DWARFUnitIndex::Entry *entry = m_header.GetIndexEntry()) {
342dda28197Spatrick     if (const auto *contribution =
343dda28197Spatrick             entry->getContribution(llvm::DW_SECT_STR_OFFSETS))
344*f6aab3d8Srobert       baseOffset = contribution->getOffset32();
345dda28197Spatrick     else
346dda28197Spatrick       return;
347dda28197Spatrick   }
348dda28197Spatrick 
349dda28197Spatrick   if (GetVersion() >= 5) {
350061da546Spatrick     const DWARFDataExtractor &strOffsets =
351dda28197Spatrick         GetSymbolFileDWARF().GetDWARFContext().getOrLoadStrOffsetsData();
352061da546Spatrick     uint64_t length = strOffsets.GetU32(&baseOffset);
353061da546Spatrick     if (length == 0xffffffff)
354061da546Spatrick       length = strOffsets.GetU64(&baseOffset);
355061da546Spatrick 
356061da546Spatrick     // Check version.
357061da546Spatrick     if (strOffsets.GetU16(&baseOffset) < 5)
358061da546Spatrick       return;
359061da546Spatrick 
360061da546Spatrick     // Skip padding.
361061da546Spatrick     baseOffset += 2;
362dda28197Spatrick   }
363061da546Spatrick 
364dda28197Spatrick   SetStrOffsetsBase(baseOffset);
365061da546Spatrick }
366061da546Spatrick 
GetDWOId()367*f6aab3d8Srobert std::optional<uint64_t> DWARFUnit::GetDWOId() {
368*f6aab3d8Srobert   ExtractUnitDIENoDwoIfNeeded();
369be691f3bSpatrick   return m_dwo_id;
370be691f3bSpatrick }
371be691f3bSpatrick 
372061da546Spatrick // m_die_array_mutex must be already held as read/write.
AddUnitDIE(const DWARFDebugInfoEntry & cu_die)373061da546Spatrick void DWARFUnit::AddUnitDIE(const DWARFDebugInfoEntry &cu_die) {
374061da546Spatrick   DWARFAttributes attributes;
375061da546Spatrick   size_t num_attributes = cu_die.GetAttributes(this, attributes);
376061da546Spatrick 
377061da546Spatrick   // Extract DW_AT_addr_base first, as other attributes may need it.
378061da546Spatrick   for (size_t i = 0; i < num_attributes; ++i) {
379061da546Spatrick     if (attributes.AttributeAtIndex(i) != DW_AT_addr_base)
380061da546Spatrick       continue;
381061da546Spatrick     DWARFFormValue form_value;
382061da546Spatrick     if (attributes.ExtractFormValueAtIndex(i, form_value)) {
383*f6aab3d8Srobert       SetAddrBase(form_value.Unsigned());
384061da546Spatrick       break;
385061da546Spatrick     }
386061da546Spatrick   }
387061da546Spatrick 
388061da546Spatrick   for (size_t i = 0; i < num_attributes; ++i) {
389061da546Spatrick     dw_attr_t attr = attributes.AttributeAtIndex(i);
390061da546Spatrick     DWARFFormValue form_value;
391061da546Spatrick     if (!attributes.ExtractFormValueAtIndex(i, form_value))
392061da546Spatrick       continue;
393061da546Spatrick     switch (attr) {
394061da546Spatrick     case DW_AT_loclists_base:
395061da546Spatrick       SetLoclistsBase(form_value.Unsigned());
396061da546Spatrick       break;
397061da546Spatrick     case DW_AT_rnglists_base:
398be691f3bSpatrick       SetRangesBase(form_value.Unsigned());
399061da546Spatrick       break;
400061da546Spatrick     case DW_AT_str_offsets_base:
401061da546Spatrick       SetStrOffsetsBase(form_value.Unsigned());
402061da546Spatrick       break;
403061da546Spatrick     case DW_AT_low_pc:
404061da546Spatrick       SetBaseAddress(form_value.Address());
405061da546Spatrick       break;
406061da546Spatrick     case DW_AT_entry_pc:
407061da546Spatrick       // If the value was already set by DW_AT_low_pc, don't update it.
408061da546Spatrick       if (m_base_addr == LLDB_INVALID_ADDRESS)
409061da546Spatrick         SetBaseAddress(form_value.Address());
410061da546Spatrick       break;
411061da546Spatrick     case DW_AT_stmt_list:
412061da546Spatrick       m_line_table_offset = form_value.Unsigned();
413061da546Spatrick       break;
414061da546Spatrick     case DW_AT_GNU_addr_base:
415*f6aab3d8Srobert       m_gnu_addr_base = form_value.Unsigned();
416061da546Spatrick       break;
417061da546Spatrick     case DW_AT_GNU_ranges_base:
418*f6aab3d8Srobert       m_gnu_ranges_base = form_value.Unsigned();
419061da546Spatrick       break;
420be691f3bSpatrick     case DW_AT_GNU_dwo_id:
421be691f3bSpatrick       m_dwo_id = form_value.Unsigned();
422be691f3bSpatrick       break;
423061da546Spatrick     }
424061da546Spatrick   }
425061da546Spatrick 
426dda28197Spatrick   if (m_is_dwo) {
427*f6aab3d8Srobert     m_has_parsed_non_skeleton_unit = true;
428dda28197Spatrick     SetDwoStrOffsetsBase();
429061da546Spatrick     return;
430dda28197Spatrick   }
431061da546Spatrick }
432061da546Spatrick 
GetDebugInfoSize() const433061da546Spatrick size_t DWARFUnit::GetDebugInfoSize() const {
434061da546Spatrick   return GetLengthByteSize() + GetLength() - GetHeaderByteSize();
435061da546Spatrick }
436061da546Spatrick 
GetAbbreviations() const437061da546Spatrick const DWARFAbbreviationDeclarationSet *DWARFUnit::GetAbbreviations() const {
438061da546Spatrick   return m_abbrevs;
439061da546Spatrick }
440061da546Spatrick 
GetAbbrevOffset() const441061da546Spatrick dw_offset_t DWARFUnit::GetAbbrevOffset() const {
442061da546Spatrick   return m_abbrevs ? m_abbrevs->GetOffset() : DW_INVALID_OFFSET;
443061da546Spatrick }
444061da546Spatrick 
GetLineTableOffset()445061da546Spatrick dw_offset_t DWARFUnit::GetLineTableOffset() {
446*f6aab3d8Srobert   ExtractUnitDIENoDwoIfNeeded();
447061da546Spatrick   return m_line_table_offset;
448061da546Spatrick }
449061da546Spatrick 
SetAddrBase(dw_addr_t addr_base)450061da546Spatrick void DWARFUnit::SetAddrBase(dw_addr_t addr_base) { m_addr_base = addr_base; }
451061da546Spatrick 
452061da546Spatrick // Parse the rangelist table header, including the optional array of offsets
453061da546Spatrick // following it (DWARF v5 and later).
454061da546Spatrick template <typename ListTableType>
455061da546Spatrick static llvm::Expected<ListTableType>
ParseListTableHeader(const llvm::DWARFDataExtractor & data,uint64_t offset,DwarfFormat format)456061da546Spatrick ParseListTableHeader(const llvm::DWARFDataExtractor &data, uint64_t offset,
457061da546Spatrick                      DwarfFormat format) {
458061da546Spatrick   // We are expected to be called with Offset 0 or pointing just past the table
459061da546Spatrick   // header. Correct Offset in the latter case so that it points to the start
460061da546Spatrick   // of the header.
461*f6aab3d8Srobert   if (offset == 0) {
462*f6aab3d8Srobert     // This means DW_AT_rnglists_base is missing and therefore DW_FORM_rnglistx
463*f6aab3d8Srobert     // cannot be handled. Returning a default-constructed ListTableType allows
464*f6aab3d8Srobert     // DW_FORM_sec_offset to be supported.
465*f6aab3d8Srobert     return ListTableType();
466*f6aab3d8Srobert   }
467*f6aab3d8Srobert 
468061da546Spatrick   uint64_t HeaderSize = llvm::DWARFListTableHeader::getHeaderSize(format);
469061da546Spatrick   if (offset < HeaderSize)
470*f6aab3d8Srobert     return llvm::createStringError(std::errc::invalid_argument,
471061da546Spatrick                                    "did not detect a valid"
472061da546Spatrick                                    " list table with base = 0x%" PRIx64 "\n",
473061da546Spatrick                                    offset);
474061da546Spatrick   offset -= HeaderSize;
475061da546Spatrick   ListTableType Table;
476061da546Spatrick   if (llvm::Error E = Table.extractHeaderAndOffsets(data, &offset))
477061da546Spatrick     return std::move(E);
478061da546Spatrick   return Table;
479061da546Spatrick }
480061da546Spatrick 
SetLoclistsBase(dw_addr_t loclists_base)481061da546Spatrick void DWARFUnit::SetLoclistsBase(dw_addr_t loclists_base) {
482*f6aab3d8Srobert   uint64_t offset = 0;
483*f6aab3d8Srobert   if (const llvm::DWARFUnitIndex::Entry *entry = m_header.GetIndexEntry()) {
484*f6aab3d8Srobert     const auto *contribution = entry->getContribution(llvm::DW_SECT_LOCLISTS);
485*f6aab3d8Srobert     if (!contribution) {
486*f6aab3d8Srobert       GetSymbolFileDWARF().GetObjectFile()->GetModule()->ReportError(
487*f6aab3d8Srobert           "Failed to find location list contribution for CU with DWO Id "
488*f6aab3d8Srobert           "{0:x16}",
489*f6aab3d8Srobert           *GetDWOId());
490*f6aab3d8Srobert       return;
491*f6aab3d8Srobert     }
492*f6aab3d8Srobert     offset += contribution->getOffset32();
493*f6aab3d8Srobert   }
494061da546Spatrick   m_loclists_base = loclists_base;
495061da546Spatrick 
496061da546Spatrick   uint64_t header_size = llvm::DWARFListTableHeader::getHeaderSize(DWARF32);
497061da546Spatrick   if (loclists_base < header_size)
498061da546Spatrick     return;
499061da546Spatrick 
500061da546Spatrick   m_loclist_table_header.emplace(".debug_loclists", "locations");
501*f6aab3d8Srobert   offset += loclists_base - header_size;
502061da546Spatrick   if (llvm::Error E = m_loclist_table_header->extract(
503061da546Spatrick           m_dwarf.GetDWARFContext().getOrLoadLocListsData().GetAsLLVM(),
504061da546Spatrick           &offset)) {
505061da546Spatrick     GetSymbolFileDWARF().GetObjectFile()->GetModule()->ReportError(
506*f6aab3d8Srobert         "Failed to extract location list table at offset {0:x16} (location "
507*f6aab3d8Srobert         "list base: {1:x16}): {2}",
508*f6aab3d8Srobert         offset, loclists_base, toString(std::move(E)).c_str());
509061da546Spatrick   }
510061da546Spatrick }
511061da546Spatrick 
512061da546Spatrick std::unique_ptr<llvm::DWARFLocationTable>
GetLocationTable(const DataExtractor & data) const513061da546Spatrick DWARFUnit::GetLocationTable(const DataExtractor &data) const {
514061da546Spatrick   llvm::DWARFDataExtractor llvm_data(
515dda28197Spatrick       data.GetData(), data.GetByteOrder() == lldb::eByteOrderLittle,
516dda28197Spatrick       data.GetAddressByteSize());
517061da546Spatrick 
518061da546Spatrick   if (m_is_dwo || GetVersion() >= 5)
519061da546Spatrick     return std::make_unique<llvm::DWARFDebugLoclists>(llvm_data, GetVersion());
520061da546Spatrick   return std::make_unique<llvm::DWARFDebugLoc>(llvm_data);
521061da546Spatrick }
522061da546Spatrick 
GetLocationData() const523dda28197Spatrick DWARFDataExtractor DWARFUnit::GetLocationData() const {
524061da546Spatrick   DWARFContext &Ctx = GetSymbolFileDWARF().GetDWARFContext();
525dda28197Spatrick   const DWARFDataExtractor &data =
526dda28197Spatrick       GetVersion() >= 5 ? Ctx.getOrLoadLocListsData() : Ctx.getOrLoadLocData();
527dda28197Spatrick   if (const llvm::DWARFUnitIndex::Entry *entry = m_header.GetIndexEntry()) {
528*f6aab3d8Srobert     if (const auto *contribution = entry->getContribution(
529*f6aab3d8Srobert             GetVersion() >= 5 ? llvm::DW_SECT_LOCLISTS : llvm::DW_SECT_EXT_LOC))
530*f6aab3d8Srobert       return DWARFDataExtractor(data, contribution->getOffset32(),
531*f6aab3d8Srobert                                 contribution->getLength32());
532*f6aab3d8Srobert     return DWARFDataExtractor();
533*f6aab3d8Srobert   }
534*f6aab3d8Srobert   return data;
535*f6aab3d8Srobert }
536*f6aab3d8Srobert 
GetRnglistData() const537*f6aab3d8Srobert DWARFDataExtractor DWARFUnit::GetRnglistData() const {
538*f6aab3d8Srobert   DWARFContext &Ctx = GetSymbolFileDWARF().GetDWARFContext();
539*f6aab3d8Srobert   const DWARFDataExtractor &data = Ctx.getOrLoadRngListsData();
540*f6aab3d8Srobert   if (const llvm::DWARFUnitIndex::Entry *entry = m_header.GetIndexEntry()) {
541*f6aab3d8Srobert     if (const auto *contribution =
542*f6aab3d8Srobert             entry->getContribution(llvm::DW_SECT_RNGLISTS))
543*f6aab3d8Srobert       return DWARFDataExtractor(data, contribution->getOffset32(),
544*f6aab3d8Srobert                                 contribution->getLength32());
545*f6aab3d8Srobert     GetSymbolFileDWARF().GetObjectFile()->GetModule()->ReportError(
546*f6aab3d8Srobert         "Failed to find range list contribution for CU with signature {0:x16}",
547*f6aab3d8Srobert         entry->getSignature());
548*f6aab3d8Srobert 
549dda28197Spatrick     return DWARFDataExtractor();
550dda28197Spatrick   }
551dda28197Spatrick   return data;
552061da546Spatrick }
553061da546Spatrick 
SetRangesBase(dw_addr_t ranges_base)554061da546Spatrick void DWARFUnit::SetRangesBase(dw_addr_t ranges_base) {
555be691f3bSpatrick   lldbassert(!m_rnglist_table_done);
556be691f3bSpatrick 
557061da546Spatrick   m_ranges_base = ranges_base;
558be691f3bSpatrick }
559061da546Spatrick 
560*f6aab3d8Srobert const std::optional<llvm::DWARFDebugRnglistTable> &
GetRnglistTable()561be691f3bSpatrick DWARFUnit::GetRnglistTable() {
562be691f3bSpatrick   if (GetVersion() >= 5 && !m_rnglist_table_done) {
563be691f3bSpatrick     m_rnglist_table_done = true;
564be691f3bSpatrick     if (auto table_or_error =
565be691f3bSpatrick             ParseListTableHeader<llvm::DWARFDebugRnglistTable>(
566*f6aab3d8Srobert                 GetRnglistData().GetAsLLVM(), m_ranges_base, DWARF32))
567061da546Spatrick       m_rnglist_table = std::move(table_or_error.get());
568061da546Spatrick     else
569061da546Spatrick       GetSymbolFileDWARF().GetObjectFile()->GetModule()->ReportError(
570*f6aab3d8Srobert           "Failed to extract range list table at offset {0:x16}: {1}",
571be691f3bSpatrick           m_ranges_base, toString(table_or_error.takeError()).c_str());
572be691f3bSpatrick   }
573be691f3bSpatrick   return m_rnglist_table;
574be691f3bSpatrick }
575be691f3bSpatrick 
576be691f3bSpatrick // This function is called only for DW_FORM_rnglistx.
GetRnglistOffset(uint32_t Index)577be691f3bSpatrick llvm::Expected<uint64_t> DWARFUnit::GetRnglistOffset(uint32_t Index) {
578be691f3bSpatrick   if (!GetRnglistTable())
579*f6aab3d8Srobert     return llvm::createStringError(std::errc::invalid_argument,
580be691f3bSpatrick                                    "missing or invalid range list table");
581be691f3bSpatrick   if (!m_ranges_base)
582*f6aab3d8Srobert     return llvm::createStringError(
583*f6aab3d8Srobert         std::errc::invalid_argument,
584*f6aab3d8Srobert         llvm::formatv("DW_FORM_rnglistx cannot be used without "
585*f6aab3d8Srobert                       "DW_AT_rnglists_base for CU at {0:x16}",
586*f6aab3d8Srobert                       GetOffset())
587*f6aab3d8Srobert             .str()
588*f6aab3d8Srobert             .c_str());
589*f6aab3d8Srobert   if (std::optional<uint64_t> off = GetRnglistTable()->getOffsetEntry(
590*f6aab3d8Srobert           GetRnglistData().GetAsLLVM(), Index))
591be691f3bSpatrick     return *off + m_ranges_base;
592be691f3bSpatrick   return llvm::createStringError(
593*f6aab3d8Srobert       std::errc::invalid_argument,
594be691f3bSpatrick       "invalid range list table index %u; OffsetEntryCount is %u, "
595be691f3bSpatrick       "DW_AT_rnglists_base is %" PRIu64,
596be691f3bSpatrick       Index, GetRnglistTable()->getOffsetEntryCount(), m_ranges_base);
597061da546Spatrick }
598061da546Spatrick 
SetStrOffsetsBase(dw_offset_t str_offsets_base)599061da546Spatrick void DWARFUnit::SetStrOffsetsBase(dw_offset_t str_offsets_base) {
600061da546Spatrick   m_str_offsets_base = str_offsets_base;
601061da546Spatrick }
602061da546Spatrick 
ReadAddressFromDebugAddrSection(uint32_t index) const603*f6aab3d8Srobert dw_addr_t DWARFUnit::ReadAddressFromDebugAddrSection(uint32_t index) const {
604*f6aab3d8Srobert   uint32_t index_size = GetAddressByteSize();
605*f6aab3d8Srobert   dw_offset_t addr_base = GetAddrBase();
606*f6aab3d8Srobert   dw_addr_t offset = addr_base + static_cast<dw_addr_t>(index) * index_size;
607*f6aab3d8Srobert   const DWARFDataExtractor &data =
608*f6aab3d8Srobert       m_dwarf.GetDWARFContext().getOrLoadAddrData();
609*f6aab3d8Srobert   if (data.ValidOffsetForDataOfSize(offset, index_size))
610*f6aab3d8Srobert     return data.GetMaxU64_unchecked(&offset, index_size);
611*f6aab3d8Srobert   return LLDB_INVALID_ADDRESS;
612*f6aab3d8Srobert }
613*f6aab3d8Srobert 
614061da546Spatrick // It may be called only with m_die_array_mutex held R/W.
ClearDIEsRWLocked()615061da546Spatrick void DWARFUnit::ClearDIEsRWLocked() {
616061da546Spatrick   m_die_array.clear();
617061da546Spatrick   m_die_array.shrink_to_fit();
618061da546Spatrick 
619*f6aab3d8Srobert   if (m_dwo && !m_dwo->m_cancel_scopes)
620dda28197Spatrick     m_dwo->ClearDIEsRWLocked();
621061da546Spatrick }
622061da546Spatrick 
GetByteOrder() const623061da546Spatrick lldb::ByteOrder DWARFUnit::GetByteOrder() const {
624061da546Spatrick   return m_dwarf.GetObjectFile()->GetByteOrder();
625061da546Spatrick }
626061da546Spatrick 
SetBaseAddress(dw_addr_t base_addr)627061da546Spatrick void DWARFUnit::SetBaseAddress(dw_addr_t base_addr) { m_base_addr = base_addr; }
628061da546Spatrick 
629061da546Spatrick // Compare function DWARFDebugAranges::Range structures
CompareDIEOffset(const DWARFDebugInfoEntry & die,const dw_offset_t die_offset)630061da546Spatrick static bool CompareDIEOffset(const DWARFDebugInfoEntry &die,
631061da546Spatrick                              const dw_offset_t die_offset) {
632061da546Spatrick   return die.GetOffset() < die_offset;
633061da546Spatrick }
634061da546Spatrick 
635061da546Spatrick // GetDIE()
636061da546Spatrick //
637061da546Spatrick // Get the DIE (Debug Information Entry) with the specified offset by first
638061da546Spatrick // checking if the DIE is contained within this compile unit and grabbing the
639061da546Spatrick // DIE from this compile unit. Otherwise we grab the DIE from the DWARF file.
640061da546Spatrick DWARFDIE
GetDIE(dw_offset_t die_offset)641061da546Spatrick DWARFUnit::GetDIE(dw_offset_t die_offset) {
642be691f3bSpatrick   if (die_offset == DW_INVALID_OFFSET)
643be691f3bSpatrick     return DWARFDIE(); // Not found
644be691f3bSpatrick 
645be691f3bSpatrick   if (!ContainsDIEOffset(die_offset)) {
646be691f3bSpatrick     GetSymbolFileDWARF().GetObjectFile()->GetModule()->ReportError(
647*f6aab3d8Srobert         "GetDIE for DIE {0:x16} is outside of its CU {0:x16}", die_offset,
648*f6aab3d8Srobert         GetOffset());
649be691f3bSpatrick     return DWARFDIE(); // Not found
650be691f3bSpatrick   }
651be691f3bSpatrick 
652061da546Spatrick   ExtractDIEsIfNeeded();
653061da546Spatrick   DWARFDebugInfoEntry::const_iterator end = m_die_array.cend();
654061da546Spatrick   DWARFDebugInfoEntry::const_iterator pos =
655061da546Spatrick       lower_bound(m_die_array.cbegin(), end, die_offset, CompareDIEOffset);
656be691f3bSpatrick 
657be691f3bSpatrick   if (pos != end && die_offset == (*pos).GetOffset())
658061da546Spatrick     return DWARFDIE(this, &(*pos));
659061da546Spatrick   return DWARFDIE(); // Not found
660061da546Spatrick }
661061da546Spatrick 
GetNonSkeletonUnit()662061da546Spatrick DWARFUnit &DWARFUnit::GetNonSkeletonUnit() {
663dda28197Spatrick   ExtractUnitDIEIfNeeded();
664dda28197Spatrick   if (m_dwo)
665dda28197Spatrick     return *m_dwo;
666061da546Spatrick   return *this;
667061da546Spatrick }
668061da546Spatrick 
GetAddressByteSize(const DWARFUnit * cu)669061da546Spatrick uint8_t DWARFUnit::GetAddressByteSize(const DWARFUnit *cu) {
670061da546Spatrick   if (cu)
671061da546Spatrick     return cu->GetAddressByteSize();
672061da546Spatrick   return DWARFUnit::GetDefaultAddressSize();
673061da546Spatrick }
674061da546Spatrick 
GetDefaultAddressSize()675061da546Spatrick uint8_t DWARFUnit::GetDefaultAddressSize() { return 4; }
676061da546Spatrick 
GetUserData() const677061da546Spatrick void *DWARFUnit::GetUserData() const { return m_user_data; }
678061da546Spatrick 
SetUserData(void * d)679dda28197Spatrick void DWARFUnit::SetUserData(void *d) { m_user_data = d; }
680061da546Spatrick 
Supports_DW_AT_APPLE_objc_complete_type()681061da546Spatrick bool DWARFUnit::Supports_DW_AT_APPLE_objc_complete_type() {
682061da546Spatrick   return GetProducer() != eProducerLLVMGCC;
683061da546Spatrick }
684061da546Spatrick 
DW_AT_decl_file_attributes_are_invalid()685061da546Spatrick bool DWARFUnit::DW_AT_decl_file_attributes_are_invalid() {
686061da546Spatrick   // llvm-gcc makes completely invalid decl file attributes and won't ever be
687061da546Spatrick   // fixed, so we need to know to ignore these.
688061da546Spatrick   return GetProducer() == eProducerLLVMGCC;
689061da546Spatrick }
690061da546Spatrick 
Supports_unnamed_objc_bitfields()691061da546Spatrick bool DWARFUnit::Supports_unnamed_objc_bitfields() {
692*f6aab3d8Srobert   if (GetProducer() == eProducerClang)
693*f6aab3d8Srobert     return GetProducerVersion() >= llvm::VersionTuple(425, 0, 13);
694*f6aab3d8Srobert   // Assume all other compilers didn't have incorrect ObjC bitfield info.
695*f6aab3d8Srobert   return true;
696061da546Spatrick }
697061da546Spatrick 
ParseProducerInfo()698061da546Spatrick void DWARFUnit::ParseProducerInfo() {
699*f6aab3d8Srobert   m_producer = eProducerOther;
700061da546Spatrick   const DWARFDebugInfoEntry *die = GetUnitDIEPtrOnly();
701*f6aab3d8Srobert   if (!die)
702*f6aab3d8Srobert     return;
703061da546Spatrick 
704*f6aab3d8Srobert   llvm::StringRef producer(
705*f6aab3d8Srobert       die->GetAttributeValueAsString(this, DW_AT_producer, nullptr));
706*f6aab3d8Srobert   if (producer.empty())
707*f6aab3d8Srobert     return;
708*f6aab3d8Srobert 
709*f6aab3d8Srobert   static const RegularExpression g_swiftlang_version_regex(
710*f6aab3d8Srobert       llvm::StringRef(R"(swiftlang-([0-9]+\.[0-9]+\.[0-9]+(\.[0-9]+)?))"));
711*f6aab3d8Srobert   static const RegularExpression g_clang_version_regex(
712*f6aab3d8Srobert       llvm::StringRef(R"(clang-([0-9]+\.[0-9]+\.[0-9]+(\.[0-9]+)?))"));
713*f6aab3d8Srobert   static const RegularExpression g_llvm_gcc_regex(
714*f6aab3d8Srobert       llvm::StringRef(R"(4\.[012]\.[01] )"
715*f6aab3d8Srobert                       R"(\(Based on Apple Inc\. build [0-9]+\) )"
716*f6aab3d8Srobert                       R"(\(LLVM build [\.0-9]+\)$)"));
717*f6aab3d8Srobert 
718*f6aab3d8Srobert   llvm::SmallVector<llvm::StringRef, 3> matches;
719*f6aab3d8Srobert   if (g_swiftlang_version_regex.Execute(producer, &matches)) {
720*f6aab3d8Srobert       m_producer_version.tryParse(matches[1]);
721*f6aab3d8Srobert     m_producer = eProducerSwift;
722*f6aab3d8Srobert   } else if (producer.contains("clang")) {
723*f6aab3d8Srobert     if (g_clang_version_regex.Execute(producer, &matches))
724*f6aab3d8Srobert       m_producer_version.tryParse(matches[1]);
725061da546Spatrick     m_producer = eProducerClang;
726*f6aab3d8Srobert   } else if (producer.contains("GNU")) {
727061da546Spatrick     m_producer = eProducerGCC;
728*f6aab3d8Srobert   } else if (g_llvm_gcc_regex.Execute(producer)) {
729*f6aab3d8Srobert     m_producer = eProducerLLVMGCC;
730061da546Spatrick   }
731061da546Spatrick }
732061da546Spatrick 
GetProducer()733061da546Spatrick DWARFProducer DWARFUnit::GetProducer() {
734061da546Spatrick   if (m_producer == eProducerInvalid)
735061da546Spatrick     ParseProducerInfo();
736061da546Spatrick   return m_producer;
737061da546Spatrick }
738061da546Spatrick 
GetProducerVersion()739*f6aab3d8Srobert llvm::VersionTuple DWARFUnit::GetProducerVersion() {
740*f6aab3d8Srobert   if (m_producer_version.empty())
741061da546Spatrick     ParseProducerInfo();
742*f6aab3d8Srobert   return m_producer_version;
743061da546Spatrick }
744061da546Spatrick 
GetDWARFLanguageType()745dda28197Spatrick uint64_t DWARFUnit::GetDWARFLanguageType() {
746dda28197Spatrick   if (m_language_type)
747dda28197Spatrick     return *m_language_type;
748061da546Spatrick 
749061da546Spatrick   const DWARFDebugInfoEntry *die = GetUnitDIEPtrOnly();
750dda28197Spatrick   if (!die)
751dda28197Spatrick     m_language_type = 0;
752dda28197Spatrick   else
753dda28197Spatrick     m_language_type = die->GetAttributeValueAsUnsigned(this, DW_AT_language, 0);
754dda28197Spatrick   return *m_language_type;
755061da546Spatrick }
756061da546Spatrick 
GetIsOptimized()757061da546Spatrick bool DWARFUnit::GetIsOptimized() {
758061da546Spatrick   if (m_is_optimized == eLazyBoolCalculate) {
759061da546Spatrick     const DWARFDebugInfoEntry *die = GetUnitDIEPtrOnly();
760061da546Spatrick     if (die) {
761061da546Spatrick       m_is_optimized = eLazyBoolNo;
762061da546Spatrick       if (die->GetAttributeValueAsUnsigned(this, DW_AT_APPLE_optimized, 0) ==
763061da546Spatrick           1) {
764061da546Spatrick         m_is_optimized = eLazyBoolYes;
765061da546Spatrick       }
766061da546Spatrick     }
767061da546Spatrick   }
768061da546Spatrick   return m_is_optimized == eLazyBoolYes;
769061da546Spatrick }
770061da546Spatrick 
GetPathStyle()771061da546Spatrick FileSpec::Style DWARFUnit::GetPathStyle() {
772061da546Spatrick   if (!m_comp_dir)
773061da546Spatrick     ComputeCompDirAndGuessPathStyle();
774061da546Spatrick   return m_comp_dir->GetPathStyle();
775061da546Spatrick }
776061da546Spatrick 
GetCompilationDirectory()777061da546Spatrick const FileSpec &DWARFUnit::GetCompilationDirectory() {
778061da546Spatrick   if (!m_comp_dir)
779061da546Spatrick     ComputeCompDirAndGuessPathStyle();
780061da546Spatrick   return *m_comp_dir;
781061da546Spatrick }
782061da546Spatrick 
GetAbsolutePath()783061da546Spatrick const FileSpec &DWARFUnit::GetAbsolutePath() {
784061da546Spatrick   if (!m_file_spec)
785061da546Spatrick     ComputeAbsolutePath();
786061da546Spatrick   return *m_file_spec;
787061da546Spatrick }
788061da546Spatrick 
GetFile(size_t file_idx)789061da546Spatrick FileSpec DWARFUnit::GetFile(size_t file_idx) {
790061da546Spatrick   return m_dwarf.GetFile(*this, file_idx);
791061da546Spatrick }
792061da546Spatrick 
793061da546Spatrick // DWARF2/3 suggests the form hostname:pathname for compilation directory.
794061da546Spatrick // Remove the host part if present.
795061da546Spatrick static llvm::StringRef
removeHostnameFromPathname(llvm::StringRef path_from_dwarf)796061da546Spatrick removeHostnameFromPathname(llvm::StringRef path_from_dwarf) {
797061da546Spatrick   if (!path_from_dwarf.contains(':'))
798061da546Spatrick     return path_from_dwarf;
799061da546Spatrick   llvm::StringRef host, path;
800061da546Spatrick   std::tie(host, path) = path_from_dwarf.split(':');
801061da546Spatrick 
802061da546Spatrick   if (host.contains('/'))
803061da546Spatrick     return path_from_dwarf;
804061da546Spatrick 
805061da546Spatrick   // check whether we have a windows path, and so the first character is a
806061da546Spatrick   // drive-letter not a hostname.
807*f6aab3d8Srobert   if (host.size() == 1 && llvm::isAlpha(host[0]) &&
808*f6aab3d8Srobert       (path.startswith("\\") || path.startswith("/")))
809061da546Spatrick     return path_from_dwarf;
810061da546Spatrick 
811061da546Spatrick   return path;
812061da546Spatrick }
813061da546Spatrick 
ComputeCompDirAndGuessPathStyle()814061da546Spatrick void DWARFUnit::ComputeCompDirAndGuessPathStyle() {
815061da546Spatrick   m_comp_dir = FileSpec();
816061da546Spatrick   const DWARFDebugInfoEntry *die = GetUnitDIEPtrOnly();
817061da546Spatrick   if (!die)
818061da546Spatrick     return;
819061da546Spatrick 
820061da546Spatrick   llvm::StringRef comp_dir = removeHostnameFromPathname(
821061da546Spatrick       die->GetAttributeValueAsString(this, DW_AT_comp_dir, nullptr));
822061da546Spatrick   if (!comp_dir.empty()) {
823061da546Spatrick     FileSpec::Style comp_dir_style =
824*f6aab3d8Srobert         FileSpec::GuessPathStyle(comp_dir).value_or(FileSpec::Style::native);
825dda28197Spatrick     m_comp_dir = FileSpec(comp_dir, comp_dir_style);
826061da546Spatrick   } else {
827061da546Spatrick     // Try to detect the style based on the DW_AT_name attribute, but just store
828061da546Spatrick     // the detected style in the m_comp_dir field.
829061da546Spatrick     const char *name =
830061da546Spatrick         die->GetAttributeValueAsString(this, DW_AT_name, nullptr);
831061da546Spatrick     m_comp_dir = FileSpec(
832*f6aab3d8Srobert         "", FileSpec::GuessPathStyle(name).value_or(FileSpec::Style::native));
833061da546Spatrick   }
834061da546Spatrick }
835061da546Spatrick 
ComputeAbsolutePath()836061da546Spatrick void DWARFUnit::ComputeAbsolutePath() {
837061da546Spatrick   m_file_spec = FileSpec();
838061da546Spatrick   const DWARFDebugInfoEntry *die = GetUnitDIEPtrOnly();
839061da546Spatrick   if (!die)
840061da546Spatrick     return;
841061da546Spatrick 
842061da546Spatrick   m_file_spec =
843061da546Spatrick       FileSpec(die->GetAttributeValueAsString(this, DW_AT_name, nullptr),
844061da546Spatrick                GetPathStyle());
845061da546Spatrick 
846061da546Spatrick   if (m_file_spec->IsRelative())
847061da546Spatrick     m_file_spec->MakeAbsolute(GetCompilationDirectory());
848061da546Spatrick }
849061da546Spatrick 
GetDwoSymbolFile()850061da546Spatrick SymbolFileDWARFDwo *DWARFUnit::GetDwoSymbolFile() {
851061da546Spatrick   ExtractUnitDIEIfNeeded();
852dda28197Spatrick   if (m_dwo)
853dda28197Spatrick     return &llvm::cast<SymbolFileDWARFDwo>(m_dwo->GetSymbolFileDWARF());
854dda28197Spatrick   return nullptr;
855061da546Spatrick }
856061da546Spatrick 
GetFunctionAranges()857061da546Spatrick const DWARFDebugAranges &DWARFUnit::GetFunctionAranges() {
858061da546Spatrick   if (m_func_aranges_up == nullptr) {
859dda28197Spatrick     m_func_aranges_up = std::make_unique<DWARFDebugAranges>();
860061da546Spatrick     const DWARFDebugInfoEntry *die = DIEPtr();
861061da546Spatrick     if (die)
862061da546Spatrick       die->BuildFunctionAddressRangeTable(this, m_func_aranges_up.get());
863061da546Spatrick 
864dda28197Spatrick     if (m_dwo) {
865dda28197Spatrick       const DWARFDebugInfoEntry *dwo_die = m_dwo->DIEPtr();
866061da546Spatrick       if (dwo_die)
867dda28197Spatrick         dwo_die->BuildFunctionAddressRangeTable(m_dwo.get(),
868061da546Spatrick                                                 m_func_aranges_up.get());
869061da546Spatrick     }
870061da546Spatrick 
871061da546Spatrick     const bool minimize = false;
872061da546Spatrick     m_func_aranges_up->Sort(minimize);
873061da546Spatrick   }
874061da546Spatrick   return *m_func_aranges_up;
875061da546Spatrick }
876061da546Spatrick 
877061da546Spatrick llvm::Expected<DWARFUnitHeader>
extract(const DWARFDataExtractor & data,DIERef::Section section,lldb_private::DWARFContext & context,lldb::offset_t * offset_ptr)878dda28197Spatrick DWARFUnitHeader::extract(const DWARFDataExtractor &data,
879be691f3bSpatrick                          DIERef::Section section,
880be691f3bSpatrick                          lldb_private::DWARFContext &context,
881be691f3bSpatrick                          lldb::offset_t *offset_ptr) {
882061da546Spatrick   DWARFUnitHeader header;
883061da546Spatrick   header.m_offset = *offset_ptr;
884061da546Spatrick   header.m_length = data.GetDWARFInitialLength(offset_ptr);
885061da546Spatrick   header.m_version = data.GetU16(offset_ptr);
886061da546Spatrick   if (header.m_version == 5) {
887061da546Spatrick     header.m_unit_type = data.GetU8(offset_ptr);
888061da546Spatrick     header.m_addr_size = data.GetU8(offset_ptr);
889061da546Spatrick     header.m_abbr_offset = data.GetDWARFOffset(offset_ptr);
890be691f3bSpatrick     if (header.m_unit_type == llvm::dwarf::DW_UT_skeleton ||
891be691f3bSpatrick         header.m_unit_type == llvm::dwarf::DW_UT_split_compile)
892061da546Spatrick       header.m_dwo_id = data.GetU64(offset_ptr);
893061da546Spatrick   } else {
894061da546Spatrick     header.m_abbr_offset = data.GetDWARFOffset(offset_ptr);
895061da546Spatrick     header.m_addr_size = data.GetU8(offset_ptr);
896061da546Spatrick     header.m_unit_type =
897061da546Spatrick         section == DIERef::Section::DebugTypes ? DW_UT_type : DW_UT_compile;
898061da546Spatrick   }
899061da546Spatrick 
900be691f3bSpatrick   if (header.IsTypeUnit()) {
901*f6aab3d8Srobert     header.m_type_hash = data.GetU64(offset_ptr);
902*f6aab3d8Srobert     header.m_type_offset = data.GetDWARFOffset(offset_ptr);
903be691f3bSpatrick   }
904*f6aab3d8Srobert 
905*f6aab3d8Srobert   if (context.isDwo()) {
906*f6aab3d8Srobert     const llvm::DWARFUnitIndex *Index;
907*f6aab3d8Srobert     if (header.IsTypeUnit()) {
908*f6aab3d8Srobert       Index = &context.GetAsLLVM().getTUIndex();
909*f6aab3d8Srobert       if (*Index)
910*f6aab3d8Srobert         header.m_index_entry = Index->getFromHash(header.m_type_hash);
911*f6aab3d8Srobert     } else {
912*f6aab3d8Srobert       Index = &context.GetAsLLVM().getCUIndex();
913*f6aab3d8Srobert       if (*Index && header.m_version >= 5 && header.m_dwo_id)
914*f6aab3d8Srobert         header.m_index_entry = Index->getFromHash(*header.m_dwo_id);
915*f6aab3d8Srobert     }
916*f6aab3d8Srobert     if (!header.m_index_entry)
917*f6aab3d8Srobert       header.m_index_entry = Index->getFromOffset(header.m_offset);
918be691f3bSpatrick   }
919be691f3bSpatrick 
920dda28197Spatrick   if (header.m_index_entry) {
921dda28197Spatrick     if (header.m_abbr_offset) {
922dda28197Spatrick       return llvm::createStringError(
923dda28197Spatrick           llvm::inconvertibleErrorCode(),
924dda28197Spatrick           "Package unit with a non-zero abbreviation offset");
925dda28197Spatrick     }
926dda28197Spatrick     auto *unit_contrib = header.m_index_entry->getContribution();
927*f6aab3d8Srobert     if (!unit_contrib || unit_contrib->getLength32() != header.m_length + 4) {
928dda28197Spatrick       return llvm::createStringError(llvm::inconvertibleErrorCode(),
929dda28197Spatrick                                      "Inconsistent DWARF package unit index");
930dda28197Spatrick     }
931dda28197Spatrick     auto *abbr_entry =
932dda28197Spatrick         header.m_index_entry->getContribution(llvm::DW_SECT_ABBREV);
933dda28197Spatrick     if (!abbr_entry) {
934dda28197Spatrick       return llvm::createStringError(
935dda28197Spatrick           llvm::inconvertibleErrorCode(),
936dda28197Spatrick           "DWARF package index missing abbreviation column");
937dda28197Spatrick     }
938*f6aab3d8Srobert     header.m_abbr_offset = abbr_entry->getOffset32();
939061da546Spatrick   }
940061da546Spatrick 
941061da546Spatrick   bool length_OK = data.ValidOffset(header.GetNextUnitOffset() - 1);
942061da546Spatrick   bool version_OK = SymbolFileDWARF::SupportedVersion(header.m_version);
943061da546Spatrick   bool addr_size_OK = (header.m_addr_size == 4) || (header.m_addr_size == 8);
944061da546Spatrick   bool type_offset_OK =
945061da546Spatrick       !header.IsTypeUnit() || (header.m_type_offset <= header.GetLength());
946061da546Spatrick 
947061da546Spatrick   if (!length_OK)
948061da546Spatrick     return llvm::make_error<llvm::object::GenericBinaryError>(
949061da546Spatrick         "Invalid unit length");
950061da546Spatrick   if (!version_OK)
951061da546Spatrick     return llvm::make_error<llvm::object::GenericBinaryError>(
952061da546Spatrick         "Unsupported unit version");
953061da546Spatrick   if (!addr_size_OK)
954061da546Spatrick     return llvm::make_error<llvm::object::GenericBinaryError>(
955061da546Spatrick         "Invalid unit address size");
956061da546Spatrick   if (!type_offset_OK)
957061da546Spatrick     return llvm::make_error<llvm::object::GenericBinaryError>(
958061da546Spatrick         "Type offset out of range");
959061da546Spatrick 
960061da546Spatrick   return header;
961061da546Spatrick }
962061da546Spatrick 
963061da546Spatrick llvm::Expected<DWARFUnitSP>
extract(SymbolFileDWARF & dwarf,user_id_t uid,const DWARFDataExtractor & debug_info,DIERef::Section section,lldb::offset_t * offset_ptr)964061da546Spatrick DWARFUnit::extract(SymbolFileDWARF &dwarf, user_id_t uid,
965061da546Spatrick                    const DWARFDataExtractor &debug_info,
966be691f3bSpatrick                    DIERef::Section section, lldb::offset_t *offset_ptr) {
967061da546Spatrick   assert(debug_info.ValidOffset(*offset_ptr));
968061da546Spatrick 
969be691f3bSpatrick   auto expected_header = DWARFUnitHeader::extract(
970be691f3bSpatrick       debug_info, section, dwarf.GetDWARFContext(), offset_ptr);
971061da546Spatrick   if (!expected_header)
972061da546Spatrick     return expected_header.takeError();
973061da546Spatrick 
974061da546Spatrick   const DWARFDebugAbbrev *abbr = dwarf.DebugAbbrev();
975061da546Spatrick   if (!abbr)
976061da546Spatrick     return llvm::make_error<llvm::object::GenericBinaryError>(
977061da546Spatrick         "No debug_abbrev data");
978061da546Spatrick 
979061da546Spatrick   bool abbr_offset_OK =
980061da546Spatrick       dwarf.GetDWARFContext().getOrLoadAbbrevData().ValidOffset(
981061da546Spatrick           expected_header->GetAbbrOffset());
982061da546Spatrick   if (!abbr_offset_OK)
983061da546Spatrick     return llvm::make_error<llvm::object::GenericBinaryError>(
984061da546Spatrick         "Abbreviation offset for unit is not valid");
985061da546Spatrick 
986061da546Spatrick   const DWARFAbbreviationDeclarationSet *abbrevs =
987061da546Spatrick       abbr->GetAbbreviationDeclarationSet(expected_header->GetAbbrOffset());
988061da546Spatrick   if (!abbrevs)
989061da546Spatrick     return llvm::make_error<llvm::object::GenericBinaryError>(
990061da546Spatrick         "No abbrev exists at the specified offset.");
991061da546Spatrick 
992061da546Spatrick   bool is_dwo = dwarf.GetDWARFContext().isDwo();
993061da546Spatrick   if (expected_header->IsTypeUnit())
994061da546Spatrick     return DWARFUnitSP(new DWARFTypeUnit(dwarf, uid, *expected_header, *abbrevs,
995061da546Spatrick                                          section, is_dwo));
996061da546Spatrick   return DWARFUnitSP(new DWARFCompileUnit(dwarf, uid, *expected_header,
997061da546Spatrick                                           *abbrevs, section, is_dwo));
998061da546Spatrick }
999061da546Spatrick 
GetData() const1000061da546Spatrick const lldb_private::DWARFDataExtractor &DWARFUnit::GetData() const {
1001061da546Spatrick   return m_section == DIERef::Section::DebugTypes
1002061da546Spatrick              ? m_dwarf.GetDWARFContext().getOrLoadDebugTypesData()
1003061da546Spatrick              : m_dwarf.GetDWARFContext().getOrLoadDebugInfoData();
1004061da546Spatrick }
1005061da546Spatrick 
GetHeaderByteSize() const1006061da546Spatrick uint32_t DWARFUnit::GetHeaderByteSize() const {
1007061da546Spatrick   switch (m_header.GetUnitType()) {
1008061da546Spatrick   case llvm::dwarf::DW_UT_compile:
1009061da546Spatrick   case llvm::dwarf::DW_UT_partial:
1010061da546Spatrick     return GetVersion() < 5 ? 11 : 12;
1011061da546Spatrick   case llvm::dwarf::DW_UT_skeleton:
1012061da546Spatrick   case llvm::dwarf::DW_UT_split_compile:
1013061da546Spatrick     return 20;
1014061da546Spatrick   case llvm::dwarf::DW_UT_type:
1015061da546Spatrick   case llvm::dwarf::DW_UT_split_type:
1016061da546Spatrick     return GetVersion() < 5 ? 23 : 24;
1017061da546Spatrick   }
1018061da546Spatrick   llvm_unreachable("invalid UnitType.");
1019061da546Spatrick }
1020061da546Spatrick 
1021*f6aab3d8Srobert std::optional<uint64_t>
GetStringOffsetSectionItem(uint32_t index) const1022dda28197Spatrick DWARFUnit::GetStringOffsetSectionItem(uint32_t index) const {
1023dda28197Spatrick   offset_t offset = GetStrOffsetsBase() + index * 4;
1024dda28197Spatrick   return m_dwarf.GetDWARFContext().getOrLoadStrOffsetsData().GetU32(&offset);
1025dda28197Spatrick }
1026dda28197Spatrick 
1027061da546Spatrick llvm::Expected<DWARFRangeList>
FindRnglistFromOffset(dw_offset_t offset)1028061da546Spatrick DWARFUnit::FindRnglistFromOffset(dw_offset_t offset) {
1029061da546Spatrick   if (GetVersion() <= 4) {
1030061da546Spatrick     const DWARFDebugRanges *debug_ranges = m_dwarf.GetDebugRanges();
1031061da546Spatrick     if (!debug_ranges)
1032061da546Spatrick       return llvm::make_error<llvm::object::GenericBinaryError>(
1033061da546Spatrick           "No debug_ranges section");
1034061da546Spatrick     DWARFRangeList ranges;
1035061da546Spatrick     debug_ranges->FindRanges(this, offset, ranges);
1036061da546Spatrick     return ranges;
1037061da546Spatrick   }
1038061da546Spatrick 
1039be691f3bSpatrick   if (!GetRnglistTable())
1040*f6aab3d8Srobert     return llvm::createStringError(std::errc::invalid_argument,
1041061da546Spatrick                                    "missing or invalid range list table");
1042061da546Spatrick 
1043*f6aab3d8Srobert   llvm::DWARFDataExtractor data = GetRnglistData().GetAsLLVM();
1044*f6aab3d8Srobert 
1045*f6aab3d8Srobert   // As DW_AT_rnglists_base may be missing we need to call setAddressSize.
1046*f6aab3d8Srobert   data.setAddressSize(m_header.GetAddressByteSize());
1047*f6aab3d8Srobert   auto range_list_or_error = GetRnglistTable()->findList(data, offset);
1048061da546Spatrick   if (!range_list_or_error)
1049061da546Spatrick     return range_list_or_error.takeError();
1050061da546Spatrick 
1051061da546Spatrick   llvm::Expected<llvm::DWARFAddressRangesVector> llvm_ranges =
1052061da546Spatrick       range_list_or_error->getAbsoluteRanges(
1053061da546Spatrick           llvm::object::SectionedAddress{GetBaseAddress()},
1054be691f3bSpatrick           GetAddressByteSize(), [&](uint32_t index) {
1055061da546Spatrick             uint32_t index_size = GetAddressByteSize();
1056061da546Spatrick             dw_offset_t addr_base = GetAddrBase();
1057*f6aab3d8Srobert             lldb::offset_t offset =
1058*f6aab3d8Srobert                 addr_base + static_cast<lldb::offset_t>(index) * index_size;
1059061da546Spatrick             return llvm::object::SectionedAddress{
1060061da546Spatrick                 m_dwarf.GetDWARFContext().getOrLoadAddrData().GetMaxU64(
1061061da546Spatrick                     &offset, index_size)};
1062061da546Spatrick           });
1063061da546Spatrick   if (!llvm_ranges)
1064061da546Spatrick     return llvm_ranges.takeError();
1065061da546Spatrick 
1066061da546Spatrick   DWARFRangeList ranges;
1067061da546Spatrick   for (const llvm::DWARFAddressRange &llvm_range : *llvm_ranges) {
1068061da546Spatrick     ranges.Append(DWARFRangeList::Entry(llvm_range.LowPC,
1069061da546Spatrick                                         llvm_range.HighPC - llvm_range.LowPC));
1070061da546Spatrick   }
1071061da546Spatrick   return ranges;
1072061da546Spatrick }
1073061da546Spatrick 
1074061da546Spatrick llvm::Expected<DWARFRangeList>
FindRnglistFromIndex(uint32_t index)1075061da546Spatrick DWARFUnit::FindRnglistFromIndex(uint32_t index) {
1076be691f3bSpatrick   llvm::Expected<uint64_t> maybe_offset = GetRnglistOffset(index);
1077be691f3bSpatrick   if (!maybe_offset)
1078be691f3bSpatrick     return maybe_offset.takeError();
1079be691f3bSpatrick   return FindRnglistFromOffset(*maybe_offset);
1080061da546Spatrick }
1081*f6aab3d8Srobert 
1082*f6aab3d8Srobert 
HasAny(llvm::ArrayRef<dw_tag_t> tags)1083*f6aab3d8Srobert bool DWARFUnit::HasAny(llvm::ArrayRef<dw_tag_t> tags) {
1084*f6aab3d8Srobert   ExtractUnitDIEIfNeeded();
1085*f6aab3d8Srobert   if (m_dwo)
1086*f6aab3d8Srobert     return m_dwo->HasAny(tags);
1087*f6aab3d8Srobert 
1088*f6aab3d8Srobert   for (const auto &die: m_die_array) {
1089*f6aab3d8Srobert     for (const auto tag: tags) {
1090*f6aab3d8Srobert       if (tag == die.Tag())
1091*f6aab3d8Srobert         return true;
1092*f6aab3d8Srobert     }
1093*f6aab3d8Srobert   }
1094*f6aab3d8Srobert   return false;
1095*f6aab3d8Srobert }
1096