xref: /openbsd-src/gnu/llvm/lldb/source/Plugins/SymbolFile/DWARF/DWARFDebugArangeSet.cpp (revision f6aab3d83b51b91c24247ad2c2573574de475a82)
1dda28197Spatrick //===-- DWARFDebugArangeSet.cpp -------------------------------------------===//
2061da546Spatrick //
3061da546Spatrick // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4061da546Spatrick // See https://llvm.org/LICENSE.txt for license information.
5061da546Spatrick // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6061da546Spatrick //
7061da546Spatrick //===----------------------------------------------------------------------===//
8061da546Spatrick 
9061da546Spatrick #include "DWARFDebugArangeSet.h"
10061da546Spatrick #include "DWARFDataExtractor.h"
11be691f3bSpatrick #include "LogChannelDWARF.h"
12061da546Spatrick #include "llvm/Object/Error.h"
13061da546Spatrick #include <cassert>
14061da546Spatrick 
15061da546Spatrick using namespace lldb_private;
16061da546Spatrick 
DWARFDebugArangeSet()17061da546Spatrick DWARFDebugArangeSet::DWARFDebugArangeSet()
18be691f3bSpatrick     : m_offset(DW_INVALID_OFFSET), m_next_offset(DW_INVALID_OFFSET) {}
19061da546Spatrick 
Clear()20061da546Spatrick void DWARFDebugArangeSet::Clear() {
21061da546Spatrick   m_offset = DW_INVALID_OFFSET;
22be691f3bSpatrick   m_next_offset = DW_INVALID_OFFSET;
23061da546Spatrick   m_header.length = 0;
24061da546Spatrick   m_header.version = 0;
25061da546Spatrick   m_header.cu_offset = 0;
26061da546Spatrick   m_header.addr_size = 0;
27061da546Spatrick   m_header.seg_size = 0;
28061da546Spatrick   m_arange_descriptors.clear();
29061da546Spatrick }
30061da546Spatrick 
extract(const DWARFDataExtractor & data,lldb::offset_t * offset_ptr)31061da546Spatrick llvm::Error DWARFDebugArangeSet::extract(const DWARFDataExtractor &data,
32061da546Spatrick                                          lldb::offset_t *offset_ptr) {
33061da546Spatrick   assert(data.ValidOffset(*offset_ptr));
34061da546Spatrick 
35061da546Spatrick   m_arange_descriptors.clear();
36061da546Spatrick   m_offset = *offset_ptr;
37061da546Spatrick 
38061da546Spatrick   // 7.20 Address Range Table
39061da546Spatrick   //
40061da546Spatrick   // Each set of entries in the table of address ranges contained in the
41061da546Spatrick   // .debug_aranges section begins with a header consisting of: a 4-byte
42061da546Spatrick   // length containing the length of the set of entries for this compilation
43061da546Spatrick   // unit, not including the length field itself; a 2-byte version identifier
44061da546Spatrick   // containing the value 2 for DWARF Version 2; a 4-byte offset into
45061da546Spatrick   // the.debug_infosection; a 1-byte unsigned integer containing the size in
46061da546Spatrick   // bytes of an address (or the offset portion of an address for segmented
47061da546Spatrick   // addressing) on the target system; and a 1-byte unsigned integer
48061da546Spatrick   // containing the size in bytes of a segment descriptor on the target
49061da546Spatrick   // system. This header is followed by a series of tuples. Each tuple
50061da546Spatrick   // consists of an address and a length, each in the size appropriate for an
51061da546Spatrick   // address on the target architecture.
52061da546Spatrick   m_header.length = data.GetDWARFInitialLength(offset_ptr);
53be691f3bSpatrick   // The length could be 4 bytes or 12 bytes, so use the current offset to
54be691f3bSpatrick   // determine the next offset correctly.
55be691f3bSpatrick   if (m_header.length > 0)
56be691f3bSpatrick     m_next_offset = *offset_ptr + m_header.length;
57be691f3bSpatrick   else
58be691f3bSpatrick     m_next_offset = DW_INVALID_OFFSET;
59061da546Spatrick   m_header.version = data.GetU16(offset_ptr);
60061da546Spatrick   m_header.cu_offset = data.GetDWARFOffset(offset_ptr);
61061da546Spatrick   m_header.addr_size = data.GetU8(offset_ptr);
62061da546Spatrick   m_header.seg_size = data.GetU8(offset_ptr);
63061da546Spatrick 
64061da546Spatrick   // Try to avoid reading invalid arange sets by making sure:
65061da546Spatrick   // 1 - the version looks good
66061da546Spatrick   // 2 - the address byte size looks plausible
67061da546Spatrick   // 3 - the length seems to make sense
68dda28197Spatrick   // 4 - size looks plausible
69dda28197Spatrick   // 5 - the arange tuples do not contain a segment field
70061da546Spatrick   if (m_header.version < 2 || m_header.version > 5)
71061da546Spatrick     return llvm::make_error<llvm::object::GenericBinaryError>(
72061da546Spatrick         "Invalid arange header version");
73061da546Spatrick 
74061da546Spatrick   if (m_header.addr_size != 4 && m_header.addr_size != 8)
75061da546Spatrick     return llvm::make_error<llvm::object::GenericBinaryError>(
76061da546Spatrick         "Invalid arange header address size");
77061da546Spatrick 
78061da546Spatrick   if (m_header.length == 0)
79061da546Spatrick     return llvm::make_error<llvm::object::GenericBinaryError>(
80061da546Spatrick         "Invalid arange header length");
81061da546Spatrick 
82061da546Spatrick   if (!data.ValidOffset(m_offset + sizeof(m_header.length) + m_header.length -
83061da546Spatrick                         1))
84061da546Spatrick     return llvm::make_error<llvm::object::GenericBinaryError>(
85061da546Spatrick         "Invalid arange header length");
86061da546Spatrick 
87dda28197Spatrick   if (m_header.seg_size)
88dda28197Spatrick     return llvm::make_error<llvm::object::GenericBinaryError>(
89dda28197Spatrick         "segmented arange entries are not supported");
90dda28197Spatrick 
91061da546Spatrick   // The first tuple following the header in each set begins at an offset
92061da546Spatrick   // that is a multiple of the size of a single tuple (that is, twice the
93061da546Spatrick   // size of an address). The header is padded, if necessary, to the
94061da546Spatrick   // appropriate boundary.
95061da546Spatrick   const uint32_t header_size = *offset_ptr - m_offset;
96061da546Spatrick   const uint32_t tuple_size = m_header.addr_size << 1;
97061da546Spatrick   uint32_t first_tuple_offset = 0;
98061da546Spatrick   while (first_tuple_offset < header_size)
99061da546Spatrick     first_tuple_offset += tuple_size;
100061da546Spatrick 
101061da546Spatrick   *offset_ptr = m_offset + first_tuple_offset;
102061da546Spatrick 
103061da546Spatrick   Descriptor arangeDescriptor;
104061da546Spatrick 
105061da546Spatrick   static_assert(sizeof(arangeDescriptor.address) ==
106061da546Spatrick                     sizeof(arangeDescriptor.length),
107061da546Spatrick                 "DWARFDebugArangeSet::Descriptor.address and "
108061da546Spatrick                 "DWARFDebugArangeSet::Descriptor.length must have same size");
109061da546Spatrick 
110be691f3bSpatrick   const lldb::offset_t next_offset = GetNextOffset();
111be691f3bSpatrick   assert(next_offset != DW_INVALID_OFFSET);
112be691f3bSpatrick   uint32_t num_terminators = 0;
113be691f3bSpatrick   bool last_was_terminator = false;
114be691f3bSpatrick   while (*offset_ptr < next_offset) {
115061da546Spatrick     arangeDescriptor.address = data.GetMaxU64(offset_ptr, m_header.addr_size);
116061da546Spatrick     arangeDescriptor.length = data.GetMaxU64(offset_ptr, m_header.addr_size);
117061da546Spatrick 
118061da546Spatrick     // Each set of tuples is terminated by a 0 for the address and 0 for
119be691f3bSpatrick     // the length. Some linkers can emit .debug_aranges with multiple
120be691f3bSpatrick     // terminator pair entries that are still withing the length of the
121be691f3bSpatrick     // DWARFDebugArangeSet. We want to be sure to parse all entries for
122be691f3bSpatrick     // this DWARFDebugArangeSet so that we don't stop parsing early and end up
123be691f3bSpatrick     // treating addresses as a header of the next DWARFDebugArangeSet. We also
124be691f3bSpatrick     // need to make sure we parse all valid address pairs so we don't omit them
125be691f3bSpatrick     // from the aranges result, so we can't stop at the first terminator entry
126be691f3bSpatrick     // we find.
127be691f3bSpatrick     if (arangeDescriptor.address == 0 && arangeDescriptor.length == 0) {
128be691f3bSpatrick       ++num_terminators;
129be691f3bSpatrick       last_was_terminator = true;
130be691f3bSpatrick     } else {
131be691f3bSpatrick       last_was_terminator = false;
132be691f3bSpatrick       // Only add .debug_aranges address entries that have a non zero size.
133be691f3bSpatrick       // Some linkers will zero out the length field for some .debug_aranges
134be691f3bSpatrick       // entries if they were stripped. We also could watch out for multiple
135be691f3bSpatrick       // entries at address zero and remove those as well.
136be691f3bSpatrick       if (arangeDescriptor.length > 0)
137061da546Spatrick         m_arange_descriptors.push_back(arangeDescriptor);
138061da546Spatrick     }
139be691f3bSpatrick   }
140be691f3bSpatrick   if (num_terminators > 1) {
141*f6aab3d8Srobert     Log *log = GetLog(DWARFLog::DebugInfo);
142be691f3bSpatrick     LLDB_LOG(log,
143be691f3bSpatrick              "warning: DWARFDebugArangeSet at %#" PRIx64 " contains %u "
144be691f3bSpatrick              "terminator entries",
145be691f3bSpatrick              m_offset, num_terminators);
146be691f3bSpatrick   }
147be691f3bSpatrick   if (last_was_terminator)
148be691f3bSpatrick     return llvm::ErrorSuccess();
149061da546Spatrick 
150061da546Spatrick   return llvm::make_error<llvm::object::GenericBinaryError>(
151061da546Spatrick       "arange descriptors not terminated by null entry");
152061da546Spatrick }
153061da546Spatrick 
154061da546Spatrick class DescriptorContainsAddress {
155061da546Spatrick public:
DescriptorContainsAddress(dw_addr_t address)156061da546Spatrick   DescriptorContainsAddress(dw_addr_t address) : m_address(address) {}
operator ()(const DWARFDebugArangeSet::Descriptor & desc) const157061da546Spatrick   bool operator()(const DWARFDebugArangeSet::Descriptor &desc) const {
158061da546Spatrick     return (m_address >= desc.address) &&
159061da546Spatrick            (m_address < (desc.address + desc.length));
160061da546Spatrick   }
161061da546Spatrick 
162061da546Spatrick private:
163061da546Spatrick   const dw_addr_t m_address;
164061da546Spatrick };
165061da546Spatrick 
FindAddress(dw_addr_t address) const166061da546Spatrick dw_offset_t DWARFDebugArangeSet::FindAddress(dw_addr_t address) const {
167061da546Spatrick   DescriptorConstIter end = m_arange_descriptors.end();
168061da546Spatrick   DescriptorConstIter pos =
169061da546Spatrick       std::find_if(m_arange_descriptors.begin(), end,   // Range
170061da546Spatrick                    DescriptorContainsAddress(address)); // Predicate
171061da546Spatrick   if (pos != end)
172061da546Spatrick     return m_header.cu_offset;
173061da546Spatrick 
174061da546Spatrick   return DW_INVALID_OFFSET;
175061da546Spatrick }
176