1 //===-- DWARFDebugArangeSet.cpp -------------------------------------------===// 2 // 3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 4 // See https://llvm.org/LICENSE.txt for license information. 5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 6 // 7 //===----------------------------------------------------------------------===// 8 9 #include "DWARFDebugArangeSet.h" 10 #include "DWARFDataExtractor.h" 11 #include "LogChannelDWARF.h" 12 #include "llvm/Object/Error.h" 13 #include <cassert> 14 15 using namespace lldb_private; 16 17 DWARFDebugArangeSet::DWARFDebugArangeSet() 18 : m_offset(DW_INVALID_OFFSET), m_next_offset(DW_INVALID_OFFSET) {} 19 20 void DWARFDebugArangeSet::Clear() { 21 m_offset = DW_INVALID_OFFSET; 22 m_next_offset = DW_INVALID_OFFSET; 23 m_header.length = 0; 24 m_header.version = 0; 25 m_header.cu_offset = 0; 26 m_header.addr_size = 0; 27 m_header.seg_size = 0; 28 m_arange_descriptors.clear(); 29 } 30 31 llvm::Error DWARFDebugArangeSet::extract(const DWARFDataExtractor &data, 32 lldb::offset_t *offset_ptr) { 33 assert(data.ValidOffset(*offset_ptr)); 34 35 m_arange_descriptors.clear(); 36 m_offset = *offset_ptr; 37 38 // 7.20 Address Range Table 39 // 40 // Each set of entries in the table of address ranges contained in the 41 // .debug_aranges section begins with a header consisting of: a 4-byte 42 // length containing the length of the set of entries for this compilation 43 // unit, not including the length field itself; a 2-byte version identifier 44 // containing the value 2 for DWARF Version 2; a 4-byte offset into 45 // the.debug_infosection; a 1-byte unsigned integer containing the size in 46 // bytes of an address (or the offset portion of an address for segmented 47 // addressing) on the target system; and a 1-byte unsigned integer 48 // containing the size in bytes of a segment descriptor on the target 49 // system. This header is followed by a series of tuples. Each tuple 50 // consists of an address and a length, each in the size appropriate for an 51 // address on the target architecture. 52 m_header.length = data.GetDWARFInitialLength(offset_ptr); 53 // The length could be 4 bytes or 12 bytes, so use the current offset to 54 // determine the next offset correctly. 55 if (m_header.length > 0) 56 m_next_offset = *offset_ptr + m_header.length; 57 else 58 m_next_offset = DW_INVALID_OFFSET; 59 m_header.version = data.GetU16(offset_ptr); 60 m_header.cu_offset = data.GetDWARFOffset(offset_ptr); 61 m_header.addr_size = data.GetU8(offset_ptr); 62 m_header.seg_size = data.GetU8(offset_ptr); 63 64 // Try to avoid reading invalid arange sets by making sure: 65 // 1 - the version looks good 66 // 2 - the address byte size looks plausible 67 // 3 - the length seems to make sense 68 // 4 - size looks plausible 69 // 5 - the arange tuples do not contain a segment field 70 if (m_header.version < 2 || m_header.version > 5) 71 return llvm::make_error<llvm::object::GenericBinaryError>( 72 "Invalid arange header version"); 73 74 if (m_header.addr_size != 4 && m_header.addr_size != 8) 75 return llvm::make_error<llvm::object::GenericBinaryError>( 76 "Invalid arange header address size"); 77 78 if (m_header.length == 0) 79 return llvm::make_error<llvm::object::GenericBinaryError>( 80 "Invalid arange header length"); 81 82 if (!data.ValidOffset(m_offset + sizeof(m_header.length) + m_header.length - 83 1)) 84 return llvm::make_error<llvm::object::GenericBinaryError>( 85 "Invalid arange header length"); 86 87 if (m_header.seg_size) 88 return llvm::make_error<llvm::object::GenericBinaryError>( 89 "segmented arange entries are not supported"); 90 91 // The first tuple following the header in each set begins at an offset 92 // that is a multiple of the size of a single tuple (that is, twice the 93 // size of an address). The header is padded, if necessary, to the 94 // appropriate boundary. 95 const uint32_t header_size = *offset_ptr - m_offset; 96 const uint32_t tuple_size = m_header.addr_size << 1; 97 uint32_t first_tuple_offset = 0; 98 while (first_tuple_offset < header_size) 99 first_tuple_offset += tuple_size; 100 101 *offset_ptr = m_offset + first_tuple_offset; 102 103 Descriptor arangeDescriptor; 104 105 static_assert(sizeof(arangeDescriptor.address) == 106 sizeof(arangeDescriptor.length), 107 "DWARFDebugArangeSet::Descriptor.address and " 108 "DWARFDebugArangeSet::Descriptor.length must have same size"); 109 110 const lldb::offset_t next_offset = GetNextOffset(); 111 assert(next_offset != DW_INVALID_OFFSET); 112 uint32_t num_terminators = 0; 113 bool last_was_terminator = false; 114 while (*offset_ptr < next_offset) { 115 arangeDescriptor.address = data.GetMaxU64(offset_ptr, m_header.addr_size); 116 arangeDescriptor.length = data.GetMaxU64(offset_ptr, m_header.addr_size); 117 118 // Each set of tuples is terminated by a 0 for the address and 0 for 119 // the length. Some linkers can emit .debug_aranges with multiple 120 // terminator pair entries that are still withing the length of the 121 // DWARFDebugArangeSet. We want to be sure to parse all entries for 122 // this DWARFDebugArangeSet so that we don't stop parsing early and end up 123 // treating addresses as a header of the next DWARFDebugArangeSet. We also 124 // need to make sure we parse all valid address pairs so we don't omit them 125 // from the aranges result, so we can't stop at the first terminator entry 126 // we find. 127 if (arangeDescriptor.address == 0 && arangeDescriptor.length == 0) { 128 ++num_terminators; 129 last_was_terminator = true; 130 } else { 131 last_was_terminator = false; 132 // Only add .debug_aranges address entries that have a non zero size. 133 // Some linkers will zero out the length field for some .debug_aranges 134 // entries if they were stripped. We also could watch out for multiple 135 // entries at address zero and remove those as well. 136 if (arangeDescriptor.length > 0) 137 m_arange_descriptors.push_back(arangeDescriptor); 138 } 139 } 140 if (num_terminators > 1) { 141 Log *log = LogChannelDWARF::GetLogIfAll(DWARF_LOG_DEBUG_INFO); 142 LLDB_LOG(log, 143 "warning: DWARFDebugArangeSet at %#" PRIx64 " contains %u " 144 "terminator entries", 145 m_offset, num_terminators); 146 } 147 if (last_was_terminator) 148 return llvm::ErrorSuccess(); 149 150 return llvm::make_error<llvm::object::GenericBinaryError>( 151 "arange descriptors not terminated by null entry"); 152 } 153 154 class DescriptorContainsAddress { 155 public: 156 DescriptorContainsAddress(dw_addr_t address) : m_address(address) {} 157 bool operator()(const DWARFDebugArangeSet::Descriptor &desc) const { 158 return (m_address >= desc.address) && 159 (m_address < (desc.address + desc.length)); 160 } 161 162 private: 163 const dw_addr_t m_address; 164 }; 165 166 dw_offset_t DWARFDebugArangeSet::FindAddress(dw_addr_t address) const { 167 DescriptorConstIter end = m_arange_descriptors.end(); 168 DescriptorConstIter pos = 169 std::find_if(m_arange_descriptors.begin(), end, // Range 170 DescriptorContainsAddress(address)); // Predicate 171 if (pos != end) 172 return m_header.cu_offset; 173 174 return DW_INVALID_OFFSET; 175 } 176