1 //===-- Address.h -----------------------------------------------*- C++ -*-===//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8 
9 #ifndef LLDB_CORE_ADDRESS_H
10 #define LLDB_CORE_ADDRESS_H
11 
12 #include "lldb/Utility/Stream.h"
13 #include "lldb/lldb-defines.h"
14 #include "lldb/lldb-forward.h"
15 #include "lldb/lldb-private-enumerations.h"
16 #include "lldb/lldb-types.h"
17 
18 #include "llvm/ADT/StringRef.h"
19 
20 #include <cstddef>
21 #include <cstdint>
22 
23 namespace lldb_private {
24 class Block;
25 class CompileUnit;
26 class ExecutionContextScope;
27 class Function;
28 class SectionList;
29 class Stream;
30 class Symbol;
31 class SymbolContext;
32 class Target;
33 struct LineEntry;
34 
35 /// \class Address Address.h "lldb/Core/Address.h"
36 /// A section + offset based address class.
37 ///
38 /// The Address class allows addresses to be relative to a section that can
39 /// move during runtime due to images (executables, shared libraries, bundles,
40 /// frameworks) being loaded at different addresses than the addresses found
41 /// in the object file that represents them on disk. There are currently two
42 /// types of addresses for a section:
43 ///     \li file addresses
44 ///     \li load addresses
45 ///
46 /// File addresses represent the virtual addresses that are in the "on disk"
47 /// object files. These virtual addresses are converted to be relative to
48 /// unique sections scoped to the object file so that when/if the addresses
49 /// slide when the images are loaded/unloaded in memory, we can easily track
50 /// these changes without having to update every object (compile unit ranges,
51 /// line tables, function address ranges, lexical block and inlined subroutine
52 /// address ranges, global and static variables) each time an image is loaded
53 /// or unloaded.
54 ///
55 /// Load addresses represent the virtual addresses where each section ends up
56 /// getting loaded at runtime. Before executing a program, it is common for
57 /// all of the load addresses to be unresolved. When a DynamicLoader plug-in
58 /// receives notification that shared libraries have been loaded/unloaded, the
59 /// load addresses of the main executable and any images (shared libraries)
60 /// will be  resolved/unresolved. When this happens, breakpoints that are in
61 /// one of these sections can be set/cleared.
62 class Address {
63 public:
64   /// Dump styles allow the Address::Dump(Stream *,DumpStyle) const function
65   /// to display Address contents in a variety of ways.
66   enum DumpStyle {
67     /// Invalid dump style.
68     DumpStyleInvalid,
69     /// Display as the section name + offset.
70     /// \code
71     /// // address for printf in libSystem.B.dylib as a section name + offset
72     /// libSystem.B.dylib.__TEXT.__text + 0x0005cfdf
73     /// \endcode
74     DumpStyleSectionNameOffset,
75     /// Display as the section pointer + offset (debug output).
76     /// \code
77     /// // address for printf in libSystem.B.dylib as a section pointer +
78     /// offset (lldb::Section *)0x35cc50 + 0x000000000005cfdf
79     /// \endcode
80     DumpStyleSectionPointerOffset,
81     /// Display as the file address (if any).
82     /// \code
83     /// // address for printf in libSystem.B.dylib as a file address
84     /// 0x000000000005dcff
85     /// \endcode
86     ///
87     DumpStyleFileAddress,
88     /// Display as the file address with the module name prepended (if any).
89     /// \code
90     /// // address for printf in libSystem.B.dylib as a file address
91     /// libSystem.B.dylib[0x000000000005dcff]
92     /// \endcode
93     DumpStyleModuleWithFileAddress,
94     /// Display as the load address (if resolved).
95     /// \code
96     /// // address for printf in libSystem.B.dylib as a load address
97     /// 0x00007fff8306bcff
98     /// \endcode
99     DumpStyleLoadAddress,
100     /// Display the details about what an address resolves to. This can be
101     /// anything from a symbol context summary (module, function/symbol, and
102     /// file and line), to information about what the pointer points to if the
103     /// address is in a section (section of pointers, c strings, etc).
104     DumpStyleResolvedDescription,
105     DumpStyleResolvedDescriptionNoModule,
106     DumpStyleResolvedDescriptionNoFunctionArguments,
107     /// Elide the function name; display an offset into the current function.
108     /// Used primarily in disassembly symbolication
109     DumpStyleNoFunctionName,
110     /// Detailed symbol context information for an address for all symbol
111     /// context members.
112     DumpStyleDetailedSymbolContext,
113     /// Dereference a pointer at the current address and then lookup the
114     /// dereferenced address using DumpStyleResolvedDescription
115     DumpStyleResolvedPointerDescription
116   };
117 
118   /// Default constructor.
119   ///
120   /// Initialize with a invalid section (NULL) and an invalid offset
121   /// (LLDB_INVALID_ADDRESS).
122   Address() = default;
123 
124   /// Copy constructor
125   ///
126   /// Makes a copy of the another Address object \a rhs.
127   ///
128   /// \param[in] rhs
129   ///     A const Address object reference to copy.
Address(const Address & rhs)130   Address(const Address &rhs)
131       : m_section_wp(rhs.m_section_wp), m_offset(rhs.m_offset) {}
132 
133   /// Construct with a section pointer and offset.
134   ///
135   /// Initialize the address with the supplied \a section and \a offset.
136   ///
137   /// \param[in] section_sp
138   ///     A section pointer to a valid lldb::Section, or NULL if the
139   ///     address doesn't have a section or will get resolved later.
140   ///
141   /// \param[in] offset
142   ///     The offset in bytes into \a section.
Address(const lldb::SectionSP & section_sp,lldb::addr_t offset)143   Address(const lldb::SectionSP &section_sp, lldb::addr_t offset)
144       : m_section_wp(), // Don't init with section_sp in case section_sp is
145                         // invalid (the weak_ptr will throw)
146         m_offset(offset) {
147     if (section_sp)
148       m_section_wp = section_sp;
149   }
150 
151   /// Construct with a virtual address and section list.
152   ///
153   /// Initialize and resolve the address with the supplied virtual address \a
154   /// file_addr.
155   ///
156   /// \param[in] file_addr
157   ///     A virtual file address.
158   ///
159   /// \param[in] section_list
160   ///     A list of sections, one of which may contain the \a file_addr.
161   Address(lldb::addr_t file_addr, const SectionList *section_list);
162 
163   Address(lldb::addr_t abs_addr);
164 
165 /// Assignment operator.
166 ///
167 /// Copies the address value from another Address object \a rhs into \a this
168 /// object.
169 ///
170 /// \param[in] rhs
171 ///     A const Address object reference to copy.
172 ///
173 /// \return
174 ///     A const Address object reference to \a this.
175   const Address &operator=(const Address &rhs);
176 
177   /// Clear the object's state.
178   ///
179   /// Sets the section to an invalid value (NULL) and an invalid offset
180   /// (LLDB_INVALID_ADDRESS).
Clear()181   void Clear() {
182     m_section_wp.reset();
183     m_offset = LLDB_INVALID_ADDRESS;
184   }
185 
186   /// Compare two Address objects.
187   ///
188   /// \param[in] lhs
189   ///     The Left Hand Side const Address object reference.
190   ///
191   /// \param[in] rhs
192   ///     The Right Hand Side const Address object reference.
193   ///
194   /// \return
195   ///     -1 if lhs < rhs
196   ///     0 if lhs == rhs
197   ///     1 if lhs > rhs
198   static int CompareFileAddress(const Address &lhs, const Address &rhs);
199 
200   static int CompareLoadAddress(const Address &lhs, const Address &rhs,
201                                 Target *target);
202 
203   static int CompareModulePointerAndOffset(const Address &lhs,
204                                            const Address &rhs);
205 
206   // For use with std::map, std::multi_map
207   class ModulePointerAndOffsetLessThanFunctionObject {
208   public:
209     ModulePointerAndOffsetLessThanFunctionObject() = default;
210 
operator()211     bool operator()(const Address &a, const Address &b) const {
212       return Address::CompareModulePointerAndOffset(a, b) < 0;
213     }
214   };
215 
216   /// Write a description of this object to a Stream.
217   bool GetDescription(Stream &s, Target &target,
218                       lldb::DescriptionLevel level) const;
219 
220   /// Dump a description of this object to a Stream.
221   ///
222   /// Dump a description of the contents of this object to the supplied stream
223   /// \a s. There are many ways to display a section offset based address, and
224   /// \a style lets the user choose.
225   ///
226   /// \param[in] s
227   ///     The stream to which to dump the object description.
228   ///
229   /// \param[in] style
230   ///     The display style for the address.
231   ///
232   /// \param[in] fallback_style
233   ///     The display style for the address.
234   ///
235   /// \param[in] addr_byte_size
236   ///     The address byte size for the address.
237   ///
238   /// \param[in] all_ranges
239   ///     If true, dump all valid ranges and value ranges for the variable that
240   ///     contains the address, otherwise dumping the range that contains the
241   ///     address.
242   ///
243   /// \param[in] pattern
244   ///     An optional regex pattern to match against the description. If
245   ///     specified, parts of the description matching this pattern may be
246   ///     highlighted or processed differently. If this parameter is an empty
247   ///     string or not provided, no highlighting is applied.
248   ///
249   /// \return
250   ///     Returns \b true if the address was able to be displayed.
251   ///     File and load addresses may be unresolved and it may not be
252   ///     possible to display a valid value, \b false will be returned
253   ///     in such cases.
254   ///
255   /// \see Address::DumpStyle
256   bool
257   Dump(Stream *s, ExecutionContextScope *exe_scope, DumpStyle style,
258        DumpStyle fallback_style = DumpStyleInvalid,
259        uint32_t addr_byte_size = UINT32_MAX, bool all_ranges = false,
260        std::optional<Stream::HighlightSettings> settings = std::nullopt) const;
261 
262   AddressClass GetAddressClass() const;
263 
264   /// Get the file address.
265   ///
266   /// If an address comes from a file on disk that has section relative
267   /// addresses, then it has a virtual address that is relative to unique
268   /// section in the object file.
269   ///
270   /// \return
271   ///     The valid file virtual address, or LLDB_INVALID_ADDRESS if
272   ///     the address doesn't have a file virtual address (image is
273   ///     from memory only with no representation on disk).
274   lldb::addr_t GetFileAddress() const;
275 
276   /// Get the load address.
277   ///
278   /// If an address comes from a file on disk that has section relative
279   /// addresses, then it has a virtual address that is relative to unique
280   /// section in the object file. Sections get resolved at runtime by
281   /// DynamicLoader plug-ins as images (executables and shared libraries) get
282   /// loaded/unloaded. If a section is loaded, then the load address can be
283   /// resolved.
284   ///
285   /// \return
286   ///     The valid load virtual address, or LLDB_INVALID_ADDRESS if
287   ///     the address is currently not loaded.
288   lldb::addr_t GetLoadAddress(Target *target) const;
289 
290   /// Get the load address as a callable code load address.
291   ///
292   /// This function will first resolve its address to a load address. Then, if
293   /// the address turns out to be in code address, return the load address
294   /// that would be required to call or return to. The address might have
295   /// extra bits set (bit zero will be set to Thumb functions for an ARM
296   /// target) that are required when changing the program counter to setting a
297   /// return address.
298   ///
299   /// \return
300   ///     The valid load virtual address, or LLDB_INVALID_ADDRESS if
301   ///     the address is currently not loaded.
302   lldb::addr_t GetCallableLoadAddress(Target *target,
303                                       bool is_indirect = false) const;
304 
305   /// Get the load address as an opcode load address.
306   ///
307   /// This function will first resolve its address to a load address. Then, if
308   /// the address turns out to be in code address, return the load address for
309   /// an opcode. This address object might have extra bits set (bit zero will
310   /// be set to Thumb functions for an
311   /// ARM target) that are required for changing the program counter
312   /// and this function will remove any bits that are intended for these
313   /// special purposes. The result of this function can be used to safely
314   /// write a software breakpoint trap to memory.
315   ///
316   /// \return
317   ///     The valid load virtual address with extra callable bits
318   ///     removed, or LLDB_INVALID_ADDRESS if the address is currently
319   ///     not loaded.
320   lldb::addr_t GetOpcodeLoadAddress(
321       Target *target,
322       AddressClass addr_class = AddressClass::eInvalid) const;
323 
324   /// Get the section relative offset value.
325   ///
326   /// \return
327   ///     The current offset, or LLDB_INVALID_ADDRESS if this address
328   ///     doesn't contain a valid offset.
GetOffset()329   lldb::addr_t GetOffset() const { return m_offset; }
330 
331   /// Check if an address is section offset.
332   ///
333   /// When converting a virtual file or load address into a section offset
334   /// based address, we often need to know if, given a section list, if the
335   /// address was able to be converted to section offset. This function
336   /// returns true if the current value contained in this object is section
337   /// offset based.
338   ///
339   /// \return
340   ///     Returns \b true if the address has a valid section and
341   ///     offset, \b false otherwise.
IsSectionOffset()342   bool IsSectionOffset() const {
343     return IsValid() && (GetSection().get() != nullptr);
344   }
345 
346   /// Check if the object state is valid.
347   ///
348   /// A valid Address object contains either a section pointer and
349   /// offset (for section offset based addresses), or just a valid offset
350   /// (for absolute addresses that have no section).
351   ///
352   /// \return
353   ///     Returns \b true if the offset is valid, \b false
354   ///     otherwise.
IsValid()355   bool IsValid() const { return m_offset != LLDB_INVALID_ADDRESS; }
356 
357   /// Get the memory cost of this object.
358   ///
359   /// \return
360   ///     The number of bytes that this object occupies in memory.
361   size_t MemorySize() const;
362 
363   /// Resolve a file virtual address using a section list.
364   ///
365   /// Given a list of sections, attempt to resolve \a addr as an offset into
366   /// one of the file sections.
367   ///
368   /// \return
369   ///     Returns \b true if \a addr was able to be resolved, \b false
370   ///     otherwise.
371   bool ResolveAddressUsingFileSections(lldb::addr_t addr,
372                                        const SectionList *sections);
373 
374   /// Resolve this address to its containing function and optionally get
375   /// that function's address range.
376   ///
377   /// \param[out] sym_ctx
378   ///     The symbol context describing the function in which this address lies
379   ///
380   /// \parm[out] addr_range_ptr
381   ///     Pointer to the AddressRange to fill in with the function's address
382   ///     range.  Caller may pass null if they don't need the address range.
383   ///
384   /// \return
385   ///     Returns \b false if the function/symbol could not be resolved
386   ///     or if the address range was requested and could not be resolved;
387   ///     returns \b true otherwise.
388   bool ResolveFunctionScope(lldb_private::SymbolContext &sym_ctx,
389                             lldb_private::AddressRange *addr_range_ptr = nullptr);
390 
391   /// Set the address to represent \a load_addr.
392   ///
393   /// The address will attempt to find a loaded section within \a target that
394   /// contains \a load_addr. If successful, this address object will have a
395   /// valid section and offset. Else this address object will have no section
396   /// (NULL) and the offset will be \a load_addr.
397   ///
398   /// \param[in] load_addr
399   ///     A load address from a current process.
400   ///
401   /// \param[in] target
402   ///     The target to use when trying resolve the address into
403   ///     a section + offset. The Target's SectionLoadList object
404   ///     is used to resolve the address.
405   ///
406   /// \param[in] allow_section_end
407   ///     If true, treat an address pointing to the end of the module as
408   ///     belonging to that module.
409   ///
410   /// \return
411   ///     Returns \b true if the load address was resolved to be
412   ///     section/offset, \b false otherwise. It is often ok for an
413   ///     address to not resolve to a section in a module, this often
414   ///     happens for JIT'ed code, or any load addresses on the stack
415   ///     or heap.
416   bool SetLoadAddress(lldb::addr_t load_addr, Target *target,
417                       bool allow_section_end = false);
418 
419   bool SetOpcodeLoadAddress(
420       lldb::addr_t load_addr, Target *target,
421       AddressClass addr_class = AddressClass::eInvalid,
422       bool allow_section_end = false);
423 
424   bool SetCallableLoadAddress(lldb::addr_t load_addr, Target *target);
425 
426   /// Get accessor for the module for this address.
427   ///
428   /// \return
429   ///     Returns the Module pointer that this address is an offset
430   ///     in, or NULL if this address doesn't belong in a module, or
431   ///     isn't resolved yet.
432   lldb::ModuleSP GetModule() const;
433 
434   /// Get const accessor for the section.
435   ///
436   /// \return
437   ///     Returns the const lldb::Section pointer that this address is an
438   ///     offset in, or NULL if this address is absolute.
GetSection()439   lldb::SectionSP GetSection() const { return m_section_wp.lock(); }
440 
441   /// Set accessor for the offset.
442   ///
443   /// \param[in] offset
444   ///     A new offset value for this object.
445   ///
446   /// \return
447   ///     Returns \b true if the offset changed, \b false otherwise.
SetOffset(lldb::addr_t offset)448   bool SetOffset(lldb::addr_t offset) {
449     bool changed = m_offset != offset;
450     m_offset = offset;
451     return changed;
452   }
453 
SetRawAddress(lldb::addr_t addr)454   void SetRawAddress(lldb::addr_t addr) {
455     m_section_wp.reset();
456     m_offset = addr;
457   }
458 
Slide(int64_t offset)459   bool Slide(int64_t offset) {
460     if (m_offset != LLDB_INVALID_ADDRESS) {
461       m_offset += offset;
462       return true;
463     }
464     return false;
465   }
466 
467   /// Set accessor for the section.
468   ///
469   /// \param[in] section_sp
470   ///     A new lldb::Section pointer to use as the section base. Can
471   ///     be NULL for absolute addresses that are not relative to
472   ///     any section.
SetSection(const lldb::SectionSP & section_sp)473   void SetSection(const lldb::SectionSP &section_sp) {
474     m_section_wp = section_sp;
475   }
476 
ClearSection()477   void ClearSection() { m_section_wp.reset(); }
478 
479   /// Reconstruct a symbol context from an address.
480   ///
481   /// This class doesn't inherit from SymbolContextScope because many address
482   /// objects have short lifespans. Address objects that are section offset
483   /// can reconstruct their symbol context by looking up the address in the
484   /// module found in the section.
485   ///
486   /// \see SymbolContextScope::CalculateSymbolContext(SymbolContext*)
487   uint32_t CalculateSymbolContext(SymbolContext *sc,
488                                   lldb::SymbolContextItem resolve_scope =
489                                       lldb::eSymbolContextEverything) const;
490 
491   lldb::ModuleSP CalculateSymbolContextModule() const;
492 
493   CompileUnit *CalculateSymbolContextCompileUnit() const;
494 
495   Function *CalculateSymbolContextFunction() const;
496 
497   Block *CalculateSymbolContextBlock() const;
498 
499   Symbol *CalculateSymbolContextSymbol() const;
500 
501   bool CalculateSymbolContextLineEntry(LineEntry &line_entry) const;
502 
503   // Returns true if the section should be valid, but isn't because the shared
504   // pointer to the section can't be reconstructed from a weak pointer that
505   // contains a valid weak reference to a section. Returns false if the section
506   // weak pointer has no reference to a section, or if the section is still
507   // valid
508   bool SectionWasDeleted() const;
509 
510 protected:
511   // Member variables.
512   lldb::SectionWP m_section_wp; ///< The section for the address, can be NULL.
513   lldb::addr_t m_offset = LLDB_INVALID_ADDRESS; ///< Offset into section if \a
514                                                 ///< m_section_wp is valid...
515 
516   // Returns true if the m_section_wp once had a reference to a valid section
517   // shared pointer, but no longer does. This can happen if we have an address
518   // from a module that gets unloaded and deleted. This function should only be
519   // called if GetSection() returns an empty shared pointer and you want to
520   // know if this address used to have a valid section.
521   bool SectionWasDeletedPrivate() const;
522 };
523 
524 // NOTE: Be careful using this operator. It can correctly compare two
525 // addresses from the same Module correctly. It can't compare two addresses
526 // from different modules in any meaningful way, but it will compare the module
527 // pointers.
528 //
529 // To sum things up:
530 // - works great for addresses within the same module - it works for addresses
531 // across multiple modules, but don't expect the
532 //   address results to make much sense
533 //
534 // This basically lets Address objects be used in ordered collection classes.
535 bool operator<(const Address &lhs, const Address &rhs);
536 bool operator>(const Address &lhs, const Address &rhs);
537 bool operator==(const Address &lhs, const Address &rhs);
538 bool operator!=(const Address &lhs, const Address &rhs);
539 
540 } // namespace lldb_private
541 
542 #endif // LLDB_CORE_ADDRESS_H
543