1dda28197Spatrick //===-- DWARFDebugArangeSet.cpp -------------------------------------------===// 2061da546Spatrick // 3061da546Spatrick // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 4061da546Spatrick // See https://llvm.org/LICENSE.txt for license information. 5061da546Spatrick // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 6061da546Spatrick // 7061da546Spatrick //===----------------------------------------------------------------------===// 8061da546Spatrick 9061da546Spatrick #include "DWARFDebugArangeSet.h" 10061da546Spatrick #include "DWARFDataExtractor.h" 11*be691f3bSpatrick #include "LogChannelDWARF.h" 12061da546Spatrick #include "llvm/Object/Error.h" 13061da546Spatrick #include <cassert> 14061da546Spatrick 15061da546Spatrick using namespace lldb_private; 16061da546Spatrick 17061da546Spatrick DWARFDebugArangeSet::DWARFDebugArangeSet() 18*be691f3bSpatrick : m_offset(DW_INVALID_OFFSET), m_next_offset(DW_INVALID_OFFSET) {} 19061da546Spatrick 20061da546Spatrick void DWARFDebugArangeSet::Clear() { 21061da546Spatrick m_offset = DW_INVALID_OFFSET; 22*be691f3bSpatrick m_next_offset = DW_INVALID_OFFSET; 23061da546Spatrick m_header.length = 0; 24061da546Spatrick m_header.version = 0; 25061da546Spatrick m_header.cu_offset = 0; 26061da546Spatrick m_header.addr_size = 0; 27061da546Spatrick m_header.seg_size = 0; 28061da546Spatrick m_arange_descriptors.clear(); 29061da546Spatrick } 30061da546Spatrick 31061da546Spatrick llvm::Error DWARFDebugArangeSet::extract(const DWARFDataExtractor &data, 32061da546Spatrick lldb::offset_t *offset_ptr) { 33061da546Spatrick assert(data.ValidOffset(*offset_ptr)); 34061da546Spatrick 35061da546Spatrick m_arange_descriptors.clear(); 36061da546Spatrick m_offset = *offset_ptr; 37061da546Spatrick 38061da546Spatrick // 7.20 Address Range Table 39061da546Spatrick // 40061da546Spatrick // Each set of entries in the table of address ranges contained in the 41061da546Spatrick // .debug_aranges section begins with a header consisting of: a 4-byte 42061da546Spatrick // length containing the length of the set of entries for this compilation 43061da546Spatrick // unit, not including the length field itself; a 2-byte version identifier 44061da546Spatrick // containing the value 2 for DWARF Version 2; a 4-byte offset into 45061da546Spatrick // the.debug_infosection; a 1-byte unsigned integer containing the size in 46061da546Spatrick // bytes of an address (or the offset portion of an address for segmented 47061da546Spatrick // addressing) on the target system; and a 1-byte unsigned integer 48061da546Spatrick // containing the size in bytes of a segment descriptor on the target 49061da546Spatrick // system. This header is followed by a series of tuples. Each tuple 50061da546Spatrick // consists of an address and a length, each in the size appropriate for an 51061da546Spatrick // address on the target architecture. 52061da546Spatrick m_header.length = data.GetDWARFInitialLength(offset_ptr); 53*be691f3bSpatrick // The length could be 4 bytes or 12 bytes, so use the current offset to 54*be691f3bSpatrick // determine the next offset correctly. 55*be691f3bSpatrick if (m_header.length > 0) 56*be691f3bSpatrick m_next_offset = *offset_ptr + m_header.length; 57*be691f3bSpatrick else 58*be691f3bSpatrick m_next_offset = DW_INVALID_OFFSET; 59061da546Spatrick m_header.version = data.GetU16(offset_ptr); 60061da546Spatrick m_header.cu_offset = data.GetDWARFOffset(offset_ptr); 61061da546Spatrick m_header.addr_size = data.GetU8(offset_ptr); 62061da546Spatrick m_header.seg_size = data.GetU8(offset_ptr); 63061da546Spatrick 64061da546Spatrick // Try to avoid reading invalid arange sets by making sure: 65061da546Spatrick // 1 - the version looks good 66061da546Spatrick // 2 - the address byte size looks plausible 67061da546Spatrick // 3 - the length seems to make sense 68dda28197Spatrick // 4 - size looks plausible 69dda28197Spatrick // 5 - the arange tuples do not contain a segment field 70061da546Spatrick if (m_header.version < 2 || m_header.version > 5) 71061da546Spatrick return llvm::make_error<llvm::object::GenericBinaryError>( 72061da546Spatrick "Invalid arange header version"); 73061da546Spatrick 74061da546Spatrick if (m_header.addr_size != 4 && m_header.addr_size != 8) 75061da546Spatrick return llvm::make_error<llvm::object::GenericBinaryError>( 76061da546Spatrick "Invalid arange header address size"); 77061da546Spatrick 78061da546Spatrick if (m_header.length == 0) 79061da546Spatrick return llvm::make_error<llvm::object::GenericBinaryError>( 80061da546Spatrick "Invalid arange header length"); 81061da546Spatrick 82061da546Spatrick if (!data.ValidOffset(m_offset + sizeof(m_header.length) + m_header.length - 83061da546Spatrick 1)) 84061da546Spatrick return llvm::make_error<llvm::object::GenericBinaryError>( 85061da546Spatrick "Invalid arange header length"); 86061da546Spatrick 87dda28197Spatrick if (m_header.seg_size) 88dda28197Spatrick return llvm::make_error<llvm::object::GenericBinaryError>( 89dda28197Spatrick "segmented arange entries are not supported"); 90dda28197Spatrick 91061da546Spatrick // The first tuple following the header in each set begins at an offset 92061da546Spatrick // that is a multiple of the size of a single tuple (that is, twice the 93061da546Spatrick // size of an address). The header is padded, if necessary, to the 94061da546Spatrick // appropriate boundary. 95061da546Spatrick const uint32_t header_size = *offset_ptr - m_offset; 96061da546Spatrick const uint32_t tuple_size = m_header.addr_size << 1; 97061da546Spatrick uint32_t first_tuple_offset = 0; 98061da546Spatrick while (first_tuple_offset < header_size) 99061da546Spatrick first_tuple_offset += tuple_size; 100061da546Spatrick 101061da546Spatrick *offset_ptr = m_offset + first_tuple_offset; 102061da546Spatrick 103061da546Spatrick Descriptor arangeDescriptor; 104061da546Spatrick 105061da546Spatrick static_assert(sizeof(arangeDescriptor.address) == 106061da546Spatrick sizeof(arangeDescriptor.length), 107061da546Spatrick "DWARFDebugArangeSet::Descriptor.address and " 108061da546Spatrick "DWARFDebugArangeSet::Descriptor.length must have same size"); 109061da546Spatrick 110*be691f3bSpatrick const lldb::offset_t next_offset = GetNextOffset(); 111*be691f3bSpatrick assert(next_offset != DW_INVALID_OFFSET); 112*be691f3bSpatrick uint32_t num_terminators = 0; 113*be691f3bSpatrick bool last_was_terminator = false; 114*be691f3bSpatrick while (*offset_ptr < next_offset) { 115061da546Spatrick arangeDescriptor.address = data.GetMaxU64(offset_ptr, m_header.addr_size); 116061da546Spatrick arangeDescriptor.length = data.GetMaxU64(offset_ptr, m_header.addr_size); 117061da546Spatrick 118061da546Spatrick // Each set of tuples is terminated by a 0 for the address and 0 for 119*be691f3bSpatrick // the length. Some linkers can emit .debug_aranges with multiple 120*be691f3bSpatrick // terminator pair entries that are still withing the length of the 121*be691f3bSpatrick // DWARFDebugArangeSet. We want to be sure to parse all entries for 122*be691f3bSpatrick // this DWARFDebugArangeSet so that we don't stop parsing early and end up 123*be691f3bSpatrick // treating addresses as a header of the next DWARFDebugArangeSet. We also 124*be691f3bSpatrick // need to make sure we parse all valid address pairs so we don't omit them 125*be691f3bSpatrick // from the aranges result, so we can't stop at the first terminator entry 126*be691f3bSpatrick // we find. 127*be691f3bSpatrick if (arangeDescriptor.address == 0 && arangeDescriptor.length == 0) { 128*be691f3bSpatrick ++num_terminators; 129*be691f3bSpatrick last_was_terminator = true; 130*be691f3bSpatrick } else { 131*be691f3bSpatrick last_was_terminator = false; 132*be691f3bSpatrick // Only add .debug_aranges address entries that have a non zero size. 133*be691f3bSpatrick // Some linkers will zero out the length field for some .debug_aranges 134*be691f3bSpatrick // entries if they were stripped. We also could watch out for multiple 135*be691f3bSpatrick // entries at address zero and remove those as well. 136*be691f3bSpatrick if (arangeDescriptor.length > 0) 137061da546Spatrick m_arange_descriptors.push_back(arangeDescriptor); 138061da546Spatrick } 139*be691f3bSpatrick } 140*be691f3bSpatrick if (num_terminators > 1) { 141*be691f3bSpatrick Log *log = LogChannelDWARF::GetLogIfAll(DWARF_LOG_DEBUG_INFO); 142*be691f3bSpatrick LLDB_LOG(log, 143*be691f3bSpatrick "warning: DWARFDebugArangeSet at %#" PRIx64 " contains %u " 144*be691f3bSpatrick "terminator entries", 145*be691f3bSpatrick m_offset, num_terminators); 146*be691f3bSpatrick } 147*be691f3bSpatrick if (last_was_terminator) 148*be691f3bSpatrick return llvm::ErrorSuccess(); 149061da546Spatrick 150061da546Spatrick return llvm::make_error<llvm::object::GenericBinaryError>( 151061da546Spatrick "arange descriptors not terminated by null entry"); 152061da546Spatrick } 153061da546Spatrick 154061da546Spatrick class DescriptorContainsAddress { 155061da546Spatrick public: 156061da546Spatrick DescriptorContainsAddress(dw_addr_t address) : m_address(address) {} 157061da546Spatrick bool operator()(const DWARFDebugArangeSet::Descriptor &desc) const { 158061da546Spatrick return (m_address >= desc.address) && 159061da546Spatrick (m_address < (desc.address + desc.length)); 160061da546Spatrick } 161061da546Spatrick 162061da546Spatrick private: 163061da546Spatrick const dw_addr_t m_address; 164061da546Spatrick }; 165061da546Spatrick 166061da546Spatrick dw_offset_t DWARFDebugArangeSet::FindAddress(dw_addr_t address) const { 167061da546Spatrick DescriptorConstIter end = m_arange_descriptors.end(); 168061da546Spatrick DescriptorConstIter pos = 169061da546Spatrick std::find_if(m_arange_descriptors.begin(), end, // Range 170061da546Spatrick DescriptorContainsAddress(address)); // Predicate 171061da546Spatrick if (pos != end) 172061da546Spatrick return m_header.cu_offset; 173061da546Spatrick 174061da546Spatrick return DW_INVALID_OFFSET; 175061da546Spatrick } 176