1 //===-- Module.h ------------------------------------------------*- C++ -*-===//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8 
9 #ifndef LLDB_CORE_MODULE_H
10 #define LLDB_CORE_MODULE_H
11 
12 #include "lldb/Core/Address.h"
13 #include "lldb/Core/ModuleList.h"
14 #include "lldb/Core/ModuleSpec.h"
15 #include "lldb/Symbol/ObjectFile.h"
16 #include "lldb/Symbol/SymbolContextScope.h"
17 #include "lldb/Symbol/TypeSystem.h"
18 #include "lldb/Target/PathMappingList.h"
19 #include "lldb/Target/Statistics.h"
20 #include "lldb/Utility/ArchSpec.h"
21 #include "lldb/Utility/ConstString.h"
22 #include "lldb/Utility/FileSpec.h"
23 #include "lldb/Utility/Status.h"
24 #include "lldb/Utility/UUID.h"
25 #include "lldb/Utility/XcodeSDK.h"
26 #include "lldb/lldb-defines.h"
27 #include "lldb/lldb-enumerations.h"
28 #include "lldb/lldb-forward.h"
29 #include "lldb/lldb-types.h"
30 
31 #include "llvm/ADT/DenseSet.h"
32 #include "llvm/ADT/STLFunctionalExtras.h"
33 #include "llvm/ADT/StringRef.h"
34 #include "llvm/Support/Chrono.h"
35 
36 #include <atomic>
37 #include <cstddef>
38 #include <cstdint>
39 #include <memory>
40 #include <mutex>
41 #include <optional>
42 #include <string>
43 #include <vector>
44 
45 namespace lldb_private {
46 class CompilerDeclContext;
47 class Function;
48 class Log;
49 class ObjectFile;
50 class RegularExpression;
51 class SectionList;
52 class Stream;
53 class Symbol;
54 class SymbolContext;
55 class SymbolContextList;
56 class SymbolFile;
57 class Symtab;
58 class Target;
59 class TypeList;
60 class TypeMap;
61 class VariableList;
62 
63 /// Options used by Module::FindFunctions. This cannot be a nested class
64 /// because it must be forward-declared in ModuleList.h.
65 struct ModuleFunctionSearchOptions {
66   /// Include the symbol table.
67   bool include_symbols = false;
68   /// Include inlined functions.
69   bool include_inlines = false;
70 };
71 
72 /// \class Module Module.h "lldb/Core/Module.h"
73 /// A class that describes an executable image and its associated
74 ///        object and symbol files.
75 ///
76 /// The module is designed to be able to select a single slice of an
77 /// executable image as it would appear on disk and during program execution.
78 ///
79 /// Modules control when and if information is parsed according to which
80 /// accessors are called. For example the object file (ObjectFile)
81 /// representation will only be parsed if the object file is requested using
82 /// the Module::GetObjectFile() is called. The debug symbols will only be
83 /// parsed if the symbol file (SymbolFile) is requested using the
84 /// Module::GetSymbolFile() method.
85 ///
86 /// The module will parse more detailed information as more queries are made.
87 class Module : public std::enable_shared_from_this<Module>,
88                public SymbolContextScope {
89 public:
90   class LookupInfo;
91   // Static functions that can track the lifetime of module objects. This is
92   // handy because we might have Module objects that are in shared pointers
93   // that aren't in the global module list (from ModuleList). If this is the
94   // case we need to know about it. The modules in the global list maintained
95   // by these functions can be viewed using the "target modules list" command
96   // using the "--global" (-g for short).
97   static size_t GetNumberAllocatedModules();
98 
99   static Module *GetAllocatedModuleAtIndex(size_t idx);
100 
101   static std::recursive_mutex &GetAllocationModuleCollectionMutex();
102 
103   /// Construct with file specification and architecture.
104   ///
105   /// Clients that wish to share modules with other targets should use
106   /// ModuleList::GetSharedModule().
107   ///
108   /// \param[in] file_spec
109   ///     The file specification for the on disk representation of
110   ///     this executable image.
111   ///
112   /// \param[in] arch
113   ///     The architecture to set as the current architecture in
114   ///     this module.
115   ///
116   /// \param[in] object_name
117   ///     The name of an object in a module used to extract a module
118   ///     within a module (.a files and modules that contain multiple
119   ///     architectures).
120   ///
121   /// \param[in] object_offset
122   ///     The offset within an existing module used to extract a
123   ///     module within a module (.a files and modules that contain
124   ///     multiple architectures).
125   Module(
126       const FileSpec &file_spec, const ArchSpec &arch,
127       ConstString object_name = ConstString(), lldb::offset_t object_offset = 0,
128       const llvm::sys::TimePoint<> &object_mod_time = llvm::sys::TimePoint<>());
129 
130   Module(const ModuleSpec &module_spec);
131 
132   template <typename ObjFilePlugin, typename... Args>
CreateModuleFromObjectFile(Args &&...args)133   static lldb::ModuleSP CreateModuleFromObjectFile(Args &&...args) {
134     // Must create a module and place it into a shared pointer before we can
135     // create an object file since it has a std::weak_ptr back to the module,
136     // so we need to control the creation carefully in this static function
137     lldb::ModuleSP module_sp(new Module());
138     module_sp->m_objfile_sp =
139         std::make_shared<ObjFilePlugin>(module_sp, std::forward<Args>(args)...);
140     module_sp->m_did_load_objfile.store(true, std::memory_order_relaxed);
141 
142     // Once we get the object file, set module ArchSpec to the one we get from
143     // the object file. If the object file does not have an architecture, we
144     // consider the creation a failure.
145     ArchSpec arch = module_sp->m_objfile_sp->GetArchitecture();
146     if (!arch)
147       return nullptr;
148     module_sp->m_arch = arch;
149 
150     // Also copy the object file's FileSpec.
151     module_sp->m_file = module_sp->m_objfile_sp->GetFileSpec();
152     return module_sp;
153   }
154 
155   /// Destructor.
156   ~Module() override;
157 
158   bool MatchesModuleSpec(const ModuleSpec &module_ref);
159 
160   /// Set the load address for all sections in a module to be the file address
161   /// plus \a slide.
162   ///
163   /// Many times a module will be loaded in a target with a constant offset
164   /// applied to all top level sections. This function can set the load
165   /// address for all top level sections to be the section file address +
166   /// offset.
167   ///
168   /// \param[in] target
169   ///     The target in which to apply the section load addresses.
170   ///
171   /// \param[in] value
172   ///     if \a value_is_offset is true, then value is the offset to
173   ///     apply to all file addresses for all top level sections in
174   ///     the object file as each section load address is being set.
175   ///     If \a value_is_offset is false, then "value" is the new
176   ///     absolute base address for the image.
177   ///
178   /// \param[in] value_is_offset
179   ///     If \b true, then \a value is an offset to apply to each
180   ///     file address of each top level section.
181   ///     If \b false, then \a value is the image base address that
182   ///     will be used to rigidly slide all loadable sections.
183   ///
184   /// \param[out] changed
185   ///     If any section load addresses were changed in \a target,
186   ///     then \a changed will be set to \b true. Else \a changed
187   ///     will be set to false. This allows this function to be
188   ///     called multiple times on the same module for the same
189   ///     target. If the module hasn't moved, then \a changed will
190   ///     be false and no module updated notification will need to
191   ///     be sent out.
192   ///
193   /// \return
194   ///     /b True if any sections were successfully loaded in \a target,
195   ///     /b false otherwise.
196   bool SetLoadAddress(Target &target, lldb::addr_t value, bool value_is_offset,
197                       bool &changed);
198 
199   /// \copydoc SymbolContextScope::CalculateSymbolContext(SymbolContext*)
200   ///
201   /// \see SymbolContextScope
202   void CalculateSymbolContext(SymbolContext *sc) override;
203 
204   lldb::ModuleSP CalculateSymbolContextModule() override;
205 
206   void
207   GetDescription(llvm::raw_ostream &s,
208                  lldb::DescriptionLevel level = lldb::eDescriptionLevelFull);
209 
210   /// Get the module path and object name.
211   ///
212   /// Modules can refer to object files. In this case the specification is
213   /// simple and would return the path to the file:
214   ///
215   ///     "/usr/lib/foo.dylib"
216   ///
217   /// Modules can be .o files inside of a BSD archive (.a file). In this case,
218   /// the object specification will look like:
219   ///
220   ///     "/usr/lib/foo.a(bar.o)"
221   ///
222   /// There are many places where logging wants to log this fully qualified
223   /// specification, so we centralize this functionality here.
224   ///
225   /// \return
226   ///     The object path + object name if there is one.
227   std::string GetSpecificationDescription() const;
228 
229   /// Dump a description of this object to a Stream.
230   ///
231   /// Dump a description of the contents of this object to the supplied stream
232   /// \a s. The dumped content will be only what has been loaded or parsed up
233   /// to this point at which this function is called, so this is a good way to
234   /// see what has been parsed in a module.
235   ///
236   /// \param[in] s
237   ///     The stream to which to dump the object description.
238   void Dump(Stream *s);
239 
240   /// \copydoc SymbolContextScope::DumpSymbolContext(Stream*)
241   ///
242   /// \see SymbolContextScope
243   void DumpSymbolContext(Stream *s) override;
244 
245   /// Find a symbol in the object file's symbol table.
246   ///
247   /// \param[in] name
248   ///     The name of the symbol that we are looking for.
249   ///
250   /// \param[in] symbol_type
251   ///     If set to eSymbolTypeAny, find a symbol of any type that
252   ///     has a name that matches \a name. If set to any other valid
253   ///     SymbolType enumeration value, then search only for
254   ///     symbols that match \a symbol_type.
255   ///
256   /// \return
257   ///     Returns a valid symbol pointer if a symbol was found,
258   ///     nullptr otherwise.
259   const Symbol *FindFirstSymbolWithNameAndType(
260       ConstString name, lldb::SymbolType symbol_type = lldb::eSymbolTypeAny);
261 
262   void FindSymbolsWithNameAndType(ConstString name,
263                                   lldb::SymbolType symbol_type,
264                                   SymbolContextList &sc_list);
265 
266   void FindSymbolsMatchingRegExAndType(
267       const RegularExpression &regex, lldb::SymbolType symbol_type,
268       SymbolContextList &sc_list,
269       Mangled::NamePreference mangling_preference = Mangled::ePreferDemangled);
270 
271   /// Find a function symbols in the object file's symbol table.
272   ///
273   /// \param[in] name
274   ///     The name of the symbol that we are looking for.
275   ///
276   /// \param[in] name_type_mask
277   ///     A mask that has one or more bitwise OR'ed values from the
278   ///     lldb::FunctionNameType enumeration type that indicate what
279   ///     kind of names we are looking for.
280   ///
281   /// \param[out] sc_list
282   ///     A list to append any matching symbol contexts to.
283   void FindFunctionSymbols(ConstString name, uint32_t name_type_mask,
284                            SymbolContextList &sc_list);
285 
286   /// Find compile units by partial or full path.
287   ///
288   /// Finds all compile units that match \a path in all of the modules and
289   /// returns the results in \a sc_list.
290   ///
291   /// \param[in] path
292   ///     The name of the function we are looking for.
293   ///
294   /// \param[out] sc_list
295   ///     A symbol context list that gets filled in with all of the
296   ///     matches.
297   void FindCompileUnits(const FileSpec &path, SymbolContextList &sc_list);
298 
299   /// Find functions by lookup info.
300   ///
301   /// If the function is an inlined function, it will have a block,
302   /// representing the inlined function, and the function will be the
303   /// containing function.  If it is not inlined, then the block will be NULL.
304   ///
305   /// \param[in] lookup_info
306   ///     The lookup info of the function we are looking for.
307   ///
308   /// \param[out] sc_list
309   ///     A symbol context list that gets filled in with all of the
310   ///     matches.
311   void FindFunctions(const LookupInfo &lookup_info,
312                      const CompilerDeclContext &parent_decl_ctx,
313                      const ModuleFunctionSearchOptions &options,
314                      SymbolContextList &sc_list);
315 
316   /// Find functions by name.
317   ///
318   /// If the function is an inlined function, it will have a block,
319   /// representing the inlined function, and the function will be the
320   /// containing function.  If it is not inlined, then the block will be NULL.
321   ///
322   /// \param[in] name
323   ///     The name of the function we are looking for.
324   ///
325   /// \param[in] name_type_mask
326   ///     A bit mask of bits that indicate what kind of names should
327   ///     be used when doing the lookup. Bits include fully qualified
328   ///     names, base names, C++ methods, or ObjC selectors.
329   ///     See FunctionNameType for more details.
330   ///
331   /// \param[out] sc_list
332   ///     A symbol context list that gets filled in with all of the
333   ///     matches.
334   void FindFunctions(ConstString name,
335                      const CompilerDeclContext &parent_decl_ctx,
336                      lldb::FunctionNameType name_type_mask,
337                      const ModuleFunctionSearchOptions &options,
338                      SymbolContextList &sc_list);
339 
340   /// Find functions by compiler context.
341   void FindFunctions(llvm::ArrayRef<CompilerContext> compiler_ctx,
342                      lldb::FunctionNameType name_type_mask,
343                      const ModuleFunctionSearchOptions &options,
344                      SymbolContextList &sc_list);
345 
346   /// Find functions by name.
347   ///
348   /// If the function is an inlined function, it will have a block,
349   /// representing the inlined function, and the function will be the
350   /// containing function.  If it is not inlined, then the block will be NULL.
351   ///
352   /// \param[in] regex
353   ///     A regular expression to use when matching the name.
354   ///
355   /// \param[out] sc_list
356   ///     A symbol context list that gets filled in with all of the
357   ///     matches.
358   void FindFunctions(const RegularExpression &regex,
359                      const ModuleFunctionSearchOptions &options,
360                      SymbolContextList &sc_list);
361 
362   /// Find addresses by file/line
363   ///
364   /// \param[in] target_sp
365   ///     The target the addresses are desired for.
366   ///
367   /// \param[in] file
368   ///     Source file to locate.
369   ///
370   /// \param[in] line
371   ///     Source line to locate.
372   ///
373   /// \param[in] function
374   ///	    Optional filter function. Addresses within this function will be
375   ///     added to the 'local' list. All others will be added to the 'extern'
376   ///     list.
377   ///
378   /// \param[out] output_local
379   ///     All matching addresses within 'function'
380   ///
381   /// \param[out] output_extern
382   ///     All matching addresses not within 'function'
383   void FindAddressesForLine(const lldb::TargetSP target_sp,
384                             const FileSpec &file, uint32_t line,
385                             Function *function,
386                             std::vector<Address> &output_local,
387                             std::vector<Address> &output_extern);
388 
389   /// Find global and static variables by name.
390   ///
391   /// \param[in] name
392   ///     The name of the global or static variable we are looking
393   ///     for.
394   ///
395   /// \param[in] parent_decl_ctx
396   ///     If valid, a decl context that results must exist within
397   ///
398   /// \param[in] max_matches
399   ///     Allow the number of matches to be limited to \a
400   ///     max_matches. Specify UINT32_MAX to get all possible matches.
401   ///
402   /// \param[in] variable_list
403   ///     A list of variables that gets the matches appended to.
404   ///
405   void FindGlobalVariables(ConstString name,
406                            const CompilerDeclContext &parent_decl_ctx,
407                            size_t max_matches, VariableList &variable_list);
408 
409   /// Find global and static variables by regular expression.
410   ///
411   /// \param[in] regex
412   ///     A regular expression to use when matching the name.
413   ///
414   /// \param[in] max_matches
415   ///     Allow the number of matches to be limited to \a
416   ///     max_matches. Specify UINT32_MAX to get all possible matches.
417   ///
418   /// \param[in] variable_list
419   ///     A list of variables that gets the matches appended to.
420   ///
421   void FindGlobalVariables(const RegularExpression &regex, size_t max_matches,
422                            VariableList &variable_list);
423 
424   /// Find types using a type-matching object that contains all search
425   /// parameters.
426   ///
427   /// \see lldb_private::TypeQuery
428   ///
429   /// \param[in] query
430   ///     A type matching object that contains all of the details of the type
431   ///     search.
432   ///
433   /// \param[in] results
434   ///     Any matching types will be populated into the \a results object using
435   ///     TypeMap::InsertUnique(...).
436   void FindTypes(const TypeQuery &query, TypeResults &results);
437 
438   /// Get const accessor for the module architecture.
439   ///
440   /// \return
441   ///     A const reference to the architecture object.
442   const ArchSpec &GetArchitecture() const;
443 
444   /// Get const accessor for the module file specification.
445   ///
446   /// This function returns the file for the module on the host system that is
447   /// running LLDB. This can differ from the path on the platform since we
448   /// might be doing remote debugging.
449   ///
450   /// \return
451   ///     A const reference to the file specification object.
GetFileSpec()452   const FileSpec &GetFileSpec() const { return m_file; }
453 
454   /// Get accessor for the module platform file specification.
455   ///
456   /// Platform file refers to the path of the module as it is known on the
457   /// remote system on which it is being debugged. For local debugging this is
458   /// always the same as Module::GetFileSpec(). But remote debugging might
459   /// mention a file "/usr/lib/liba.dylib" which might be locally downloaded
460   /// and cached. In this case the platform file could be something like:
461   /// "/tmp/lldb/platform-cache/remote.host.computer/usr/lib/liba.dylib" The
462   /// file could also be cached in a local developer kit directory.
463   ///
464   /// \return
465   ///     A const reference to the file specification object.
GetPlatformFileSpec()466   const FileSpec &GetPlatformFileSpec() const {
467     if (m_platform_file)
468       return m_platform_file;
469     return m_file;
470   }
471 
SetPlatformFileSpec(const FileSpec & file)472   void SetPlatformFileSpec(const FileSpec &file) { m_platform_file = file; }
473 
GetRemoteInstallFileSpec()474   const FileSpec &GetRemoteInstallFileSpec() const {
475     return m_remote_install_file;
476   }
477 
SetRemoteInstallFileSpec(const FileSpec & file)478   void SetRemoteInstallFileSpec(const FileSpec &file) {
479     m_remote_install_file = file;
480   }
481 
GetSymbolFileFileSpec()482   const FileSpec &GetSymbolFileFileSpec() const { return m_symfile_spec; }
483 
484   void PreloadSymbols();
485 
486   void SetSymbolFileFileSpec(const FileSpec &file);
487 
GetModificationTime()488   const llvm::sys::TimePoint<> &GetModificationTime() const {
489     return m_mod_time;
490   }
491 
GetObjectModificationTime()492   const llvm::sys::TimePoint<> &GetObjectModificationTime() const {
493     return m_object_mod_time;
494   }
495 
496   /// This callback will be called by SymbolFile implementations when
497   /// parsing a compile unit that contains SDK information.
498   /// \param sysroot will be added to the path remapping dictionary.
499   void RegisterXcodeSDK(llvm::StringRef sdk, llvm::StringRef sysroot);
500 
501   /// Tells whether this module is capable of being the main executable for a
502   /// process.
503   ///
504   /// \return
505   ///     \b true if it is, \b false otherwise.
506   bool IsExecutable();
507 
508   /// Tells whether this module has been loaded in the target passed in. This
509   /// call doesn't distinguish between whether the module is loaded by the
510   /// dynamic loader, or by a "target module add" type call.
511   ///
512   /// \param[in] target
513   ///    The target to check whether this is loaded in.
514   ///
515   /// \return
516   ///     \b true if it is, \b false otherwise.
517   bool IsLoadedInTarget(Target *target);
518 
519   bool LoadScriptingResourceInTarget(Target *target, Status &error,
520                                      Stream &feedback_stream);
521 
522   /// Get the number of compile units for this module.
523   ///
524   /// \return
525   ///     The number of compile units that the symbol vendor plug-in
526   ///     finds.
527   size_t GetNumCompileUnits();
528 
529   lldb::CompUnitSP GetCompileUnitAtIndex(size_t idx);
530 
531   ConstString GetObjectName() const;
532 
GetObjectOffset()533   uint64_t GetObjectOffset() const { return m_object_offset; }
534 
535   /// Get the object file representation for the current architecture.
536   ///
537   /// If the object file has not been located or parsed yet, this function
538   /// will find the best ObjectFile plug-in that can parse Module::m_file.
539   ///
540   /// \return
541   ///     If Module::m_file does not exist, or no plug-in was found
542   ///     that can parse the file, or the object file doesn't contain
543   ///     the current architecture in Module::m_arch, nullptr will be
544   ///     returned, else a valid object file interface will be
545   ///     returned. The returned pointer is owned by this object and
546   ///     remains valid as long as the object is around.
547   virtual ObjectFile *GetObjectFile();
548 
549   /// Get the unified section list for the module. This is the section list
550   /// created by the module's object file and any debug info and symbol files
551   /// created by the symbol vendor.
552   ///
553   /// If the symbol vendor has not been loaded yet, this function will return
554   /// the section list for the object file.
555   ///
556   /// \return
557   ///     Unified module section list.
558   virtual SectionList *GetSectionList();
559 
560   /// Notify the module that the file addresses for the Sections have been
561   /// updated.
562   ///
563   /// If the Section file addresses for a module are updated, this method
564   /// should be called.  Any parts of the module, object file, or symbol file
565   /// that has cached those file addresses must invalidate or update its
566   /// cache.
567   virtual void SectionFileAddressesChanged();
568 
569   /// Returns a reference to the UnwindTable for this Module
570   ///
571   /// The UnwindTable contains FuncUnwinders objects for any function in this
572   /// Module.  If a FuncUnwinders object hasn't been created yet (i.e. the
573   /// function has yet to be unwound in a stack walk), it will be created when
574   /// requested.  Specifically, we do not create FuncUnwinders objects for
575   /// functions until they are needed.
576   ///
577   /// \return
578   ///     Returns the unwind table for this module. If this object has no
579   ///     associated object file, an empty UnwindTable is returned.
580   UnwindTable &GetUnwindTable();
581 
582   llvm::VersionTuple GetVersion();
583 
584   /// Load an object file from memory.
585   ///
586   /// If available, the size of the object file in memory may be passed to
587   /// avoid additional round trips to process memory. If the size is not
588   /// provided, a default value is used. This value should be large enough to
589   /// enable the ObjectFile plugins to read the header of the object file
590   /// without going back to the process.
591   ///
592   /// \return
593   ///     The object file loaded from memory or nullptr, if the operation
594   ///     failed (see the `error` for more information in that case).
595   ObjectFile *GetMemoryObjectFile(const lldb::ProcessSP &process_sp,
596                                   lldb::addr_t header_addr, Status &error,
597                                   size_t size_to_read = 512);
598 
599   /// Get the module's symbol file
600   ///
601   /// If the symbol file has already been loaded, this function returns it. All
602   /// arguments are ignored. If the symbol file has not been located yet, and
603   /// the can_create argument is false, the function returns nullptr. If
604   /// can_create is true, this function will find the best SymbolFile plug-in
605   /// that can use the current object file. feedback_strm, if not null, is used
606   /// to report the details of the search process.
607   virtual SymbolFile *GetSymbolFile(bool can_create = true,
608                                     Stream *feedback_strm = nullptr);
609 
610   Symtab *GetSymtab();
611 
612   /// Get a reference to the UUID value contained in this object.
613   ///
614   /// If the executable image file doesn't not have a UUID value built into
615   /// the file format, an MD5 checksum of the entire file, or slice of the
616   /// file for the current architecture should be used.
617   ///
618   /// \return
619   ///     A const pointer to the internal copy of the UUID value in
620   ///     this module if this module has a valid UUID value, NULL
621   ///     otherwise.
622   const lldb_private::UUID &GetUUID();
623 
624   /// A debugging function that will cause everything in a module to
625   /// be parsed.
626   ///
627   /// All compile units will be parsed, along with all globals and static
628   /// variables and all functions for those compile units. All types, scopes,
629   /// local variables, static variables, global variables, and line tables
630   /// will be parsed. This can be used prior to dumping a module to see a
631   /// complete list of the resulting debug information that gets parsed, or as
632   /// a debug function to ensure that the module can consume all of the debug
633   /// data the symbol vendor provides.
634   void ParseAllDebugSymbols();
635 
636   bool ResolveFileAddress(lldb::addr_t vm_addr, Address &so_addr);
637 
638   /// Resolve the symbol context for the given address.
639   ///
640   /// Tries to resolve the matching symbol context based on a lookup from the
641   /// current symbol vendor.  If the lazy lookup fails, an attempt is made to
642   /// parse the eh_frame section to handle stripped symbols.  If this fails,
643   /// an attempt is made to resolve the symbol to the previous address to
644   /// handle the case of a function with a tail call.
645   ///
646   /// Use properties of the modified SymbolContext to inspect any resolved
647   /// target, module, compilation unit, symbol, function, function block or
648   /// line entry.  Use the return value to determine which of these properties
649   /// have been modified.
650   ///
651   /// \param[in] so_addr
652   ///     A load address to resolve.
653   ///
654   /// \param[in] resolve_scope
655   ///     The scope that should be resolved (see SymbolContext::Scope).
656   ///     A combination of flags from the enumeration SymbolContextItem
657   ///     requesting a resolution depth.  Note that the flags that are
658   ///     actually resolved may be a superset of the requested flags.
659   ///     For instance, eSymbolContextSymbol requires resolution of
660   ///     eSymbolContextModule, and eSymbolContextFunction requires
661   ///     eSymbolContextSymbol.
662   ///
663   /// \param[out] sc
664   ///     The SymbolContext that is modified based on symbol resolution.
665   ///
666   /// \param[in] resolve_tail_call_address
667   ///     Determines if so_addr should resolve to a symbol in the case
668   ///     of a function whose last instruction is a call.  In this case,
669   ///     the PC can be one past the address range of the function.
670   ///
671   /// \return
672   ///     The scope that has been resolved (see SymbolContext::Scope).
673   ///
674   /// \see SymbolContext::Scope
675   uint32_t ResolveSymbolContextForAddress(
676       const Address &so_addr, lldb::SymbolContextItem resolve_scope,
677       SymbolContext &sc, bool resolve_tail_call_address = false);
678 
679   /// Resolve items in the symbol context for a given file and line.
680   ///
681   /// Tries to resolve \a file_path and \a line to a list of matching symbol
682   /// contexts.
683   ///
684   /// The line table entries contains addresses that can be used to further
685   /// resolve the values in each match: the function, block, symbol. Care
686   /// should be taken to minimize the amount of information that is requested
687   /// to only what is needed -- typically the module, compile unit, line table
688   /// and line table entry are sufficient.
689   ///
690   /// \param[in] file_path
691   ///     A path to a source file to match. If \a file_path does not
692   ///     specify a directory, then this query will match all files
693   ///     whose base filename matches. If \a file_path does specify
694   ///     a directory, the fullpath to the file must match.
695   ///
696   /// \param[in] line
697   ///     The source line to match, or zero if just the compile unit
698   ///     should be resolved.
699   ///
700   /// \param[in] check_inlines
701   ///     Check for inline file and line number matches. This option
702   ///     should be used sparingly as it will cause all line tables
703   ///     for every compile unit to be parsed and searched for
704   ///     matching inline file entries.
705   ///
706   /// \param[in] resolve_scope
707   ///     The scope that should be resolved (see
708   ///     SymbolContext::Scope).
709   ///
710   /// \param[out] sc_list
711   ///     A symbol context list that gets matching symbols contexts
712   ///     appended to.
713   ///
714   /// \return
715   ///     The number of matches that were added to \a sc_list.
716   ///
717   /// \see SymbolContext::Scope
718   uint32_t ResolveSymbolContextForFilePath(
719       const char *file_path, uint32_t line, bool check_inlines,
720       lldb::SymbolContextItem resolve_scope, SymbolContextList &sc_list);
721 
722   /// Resolve items in the symbol context for a given file and line.
723   ///
724   /// Tries to resolve \a file_spec and \a line to a list of matching symbol
725   /// contexts.
726   ///
727   /// The line table entries contains addresses that can be used to further
728   /// resolve the values in each match: the function, block, symbol. Care
729   /// should be taken to minimize the amount of information that is requested
730   /// to only what is needed -- typically the module, compile unit, line table
731   /// and line table entry are sufficient.
732   ///
733   /// \param[in] file_spec
734   ///     A file spec to a source file to match. If \a file_path does
735   ///     not specify a directory, then this query will match all
736   ///     files whose base filename matches. If \a file_path does
737   ///     specify a directory, the fullpath to the file must match.
738   ///
739   /// \param[in] line
740   ///     The source line to match, or zero if just the compile unit
741   ///     should be resolved.
742   ///
743   /// \param[in] check_inlines
744   ///     Check for inline file and line number matches. This option
745   ///     should be used sparingly as it will cause all line tables
746   ///     for every compile unit to be parsed and searched for
747   ///     matching inline file entries.
748   ///
749   /// \param[in] resolve_scope
750   ///     The scope that should be resolved (see
751   ///     SymbolContext::Scope).
752   ///
753   /// \param[out] sc_list
754   ///     A symbol context list that gets filled in with all of the
755   ///     matches.
756   ///
757   /// \return
758   ///     A integer that contains SymbolContext::Scope bits set for
759   ///     each item that was successfully resolved.
760   ///
761   /// \see SymbolContext::Scope
762   uint32_t ResolveSymbolContextsForFileSpec(
763       const FileSpec &file_spec, uint32_t line, bool check_inlines,
764       lldb::SymbolContextItem resolve_scope, SymbolContextList &sc_list);
765 
766   void SetFileSpecAndObjectName(const FileSpec &file, ConstString object_name);
767 
768   bool GetIsDynamicLinkEditor();
769 
770   llvm::Expected<lldb::TypeSystemSP>
771   GetTypeSystemForLanguage(lldb::LanguageType language);
772 
773   /// Call \p callback for each \p TypeSystem in this \p Module.
774   /// Return true from callback to keep iterating, false to stop iterating.
775   void ForEachTypeSystem(llvm::function_ref<bool(lldb::TypeSystemSP)> callback);
776 
777   // Special error functions that can do printf style formatting that will
778   // prepend the message with something appropriate for this module (like the
779   // architecture, path and object name (if any)). This centralizes code so
780   // that everyone doesn't need to format their error and log messages on their
781   // own and keeps the output a bit more consistent.
782   template <typename... Args>
LogMessage(Log * log,const char * format,Args &&...args)783   void LogMessage(Log *log, const char *format, Args &&...args) {
784     LogMessage(log, llvm::formatv(format, std::forward<Args>(args)...));
785   }
786 
787   template <typename... Args>
LogMessageVerboseBacktrace(Log * log,const char * format,Args &&...args)788   void LogMessageVerboseBacktrace(Log *log, const char *format,
789                                   Args &&...args) {
790     LogMessageVerboseBacktrace(
791         log, llvm::formatv(format, std::forward<Args>(args)...));
792   }
793 
794   template <typename... Args>
ReportWarning(const char * format,Args &&...args)795   void ReportWarning(const char *format, Args &&...args) {
796     ReportWarning(llvm::formatv(format, std::forward<Args>(args)...));
797   }
798 
799   template <typename... Args>
ReportError(const char * format,Args &&...args)800   void ReportError(const char *format, Args &&...args) {
801     ReportError(llvm::formatv(format, std::forward<Args>(args)...));
802   }
803 
804   // Only report an error once when the module is first detected to be modified
805   // so we don't spam the console with many messages.
806   template <typename... Args>
ReportErrorIfModifyDetected(const char * format,Args &&...args)807   void ReportErrorIfModifyDetected(const char *format, Args &&...args) {
808     ReportErrorIfModifyDetected(
809         llvm::formatv(format, std::forward<Args>(args)...));
810   }
811 
812   void ReportWarningOptimization(std::optional<lldb::user_id_t> debugger_id);
813 
814   void
815   ReportWarningUnsupportedLanguage(lldb::LanguageType language,
816                                    std::optional<lldb::user_id_t> debugger_id);
817 
818   // Return true if the file backing this module has changed since the module
819   // was originally created  since we saved the initial file modification time
820   // when the module first gets created.
821   bool FileHasChanged() const;
822 
823   // SymbolFile and ObjectFile member objects should lock the
824   // module mutex to avoid deadlocks.
GetMutex()825   std::recursive_mutex &GetMutex() const { return m_mutex; }
826 
GetSourceMappingList()827   PathMappingList &GetSourceMappingList() { return m_source_mappings; }
828 
GetSourceMappingList()829   const PathMappingList &GetSourceMappingList() const {
830     return m_source_mappings;
831   }
832 
833   /// Finds a source file given a file spec using the module source path
834   /// remappings (if any).
835   ///
836   /// Tries to resolve \a orig_spec by checking the module source path
837   /// remappings. It makes sure the file exists, so this call can be expensive
838   /// if the remappings are on a network file system, so use this function
839   /// sparingly (not in a tight debug info parsing loop).
840   ///
841   /// \param[in] orig_spec
842   ///     The original source file path to try and remap.
843   ///
844   /// \param[out] new_spec
845   ///     The newly remapped filespec that is guaranteed to exist.
846   ///
847   /// \return
848   ///     /b true if \a orig_spec was successfully located and
849   ///     \a new_spec is filled in with an existing file spec,
850   ///     \b false otherwise.
851   bool FindSourceFile(const FileSpec &orig_spec, FileSpec &new_spec) const;
852 
853   /// Remaps a source file given \a path into \a new_path.
854   ///
855   /// Remaps \a path if any source remappings match. This function does NOT
856   /// stat the file system so it can be used in tight loops where debug info
857   /// is being parsed.
858   ///
859   /// \param[in] path
860   ///     The original source file path to try and remap.
861   ///
862   /// \return
863   ///     The newly remapped filespec that is may or may not exist if
864   ///     \a path was successfully located.
865   std::optional<std::string> RemapSourceFile(llvm::StringRef path) const;
866   bool RemapSourceFile(const char *, std::string &) const = delete;
867 
868   /// Update the ArchSpec to a more specific variant.
869   bool MergeArchitecture(const ArchSpec &arch_spec);
870 
871   /// Accessor for the symbol table parse time metric.
872   ///
873   /// The value is returned as a reference to allow it to be updated by the
874   /// ElapsedTime RAII object.
GetSymtabParseTime()875   StatsDuration &GetSymtabParseTime() { return m_symtab_parse_time; }
876 
877   /// Accessor for the symbol table index time metric.
878   ///
879   /// The value is returned as a reference to allow it to be updated by the
880   /// ElapsedTime RAII object.
GetSymtabIndexTime()881   StatsDuration &GetSymtabIndexTime() { return m_symtab_index_time; }
882 
883   /// \class LookupInfo Module.h "lldb/Core/Module.h"
884   /// A class that encapsulates name lookup information.
885   ///
886   /// Users can type a wide variety of partial names when setting breakpoints
887   /// by name or when looking for functions by name. The SymbolFile object is
888   /// only required to implement name lookup for function basenames and for
889   /// fully mangled names. This means if the user types in a partial name, we
890   /// must reduce this to a name lookup that will work with all SymbolFile
891   /// objects. So we might reduce a name lookup to look for a basename, and then
892   /// prune out any results that don't match.
893   ///
894   /// The "m_name" member variable represents the name as it was typed by the
895   /// user. "m_lookup_name" will be the name we actually search for through
896   /// the symbol or objects files. Lanaguage is included in case we need to
897   /// filter results by language at a later date. The "m_name_type_mask"
898   /// member variable tells us what kinds of names we are looking for and can
899   /// help us prune out unwanted results.
900   ///
901   /// Function lookups are done in Module.cpp, ModuleList.cpp and in
902   /// BreakpointResolverName.cpp and they all now use this class to do lookups
903   /// correctly.
904   class LookupInfo {
905   public:
906     LookupInfo() = default;
907 
908     LookupInfo(ConstString name, lldb::FunctionNameType name_type_mask,
909                lldb::LanguageType language);
910 
GetName()911     ConstString GetName() const { return m_name; }
912 
SetName(ConstString name)913     void SetName(ConstString name) { m_name = name; }
914 
GetLookupName()915     ConstString GetLookupName() const { return m_lookup_name; }
916 
SetLookupName(ConstString name)917     void SetLookupName(ConstString name) { m_lookup_name = name; }
918 
GetNameTypeMask()919     lldb::FunctionNameType GetNameTypeMask() const { return m_name_type_mask; }
920 
SetNameTypeMask(lldb::FunctionNameType mask)921     void SetNameTypeMask(lldb::FunctionNameType mask) {
922       m_name_type_mask = mask;
923     }
924 
GetLanguageType()925     lldb::LanguageType GetLanguageType() const { return m_language; }
926 
927     bool NameMatchesLookupInfo(
928         ConstString function_name,
929         lldb::LanguageType language_type = lldb::eLanguageTypeUnknown) const;
930 
931     void Prune(SymbolContextList &sc_list, size_t start_idx) const;
932 
933   protected:
934     /// What the user originally typed
935     ConstString m_name;
936 
937     /// The actual name will lookup when calling in the object or symbol file
938     ConstString m_lookup_name;
939 
940     /// Limit matches to only be for this language
941     lldb::LanguageType m_language = lldb::eLanguageTypeUnknown;
942 
943     /// One or more bits from lldb::FunctionNameType that indicate what kind of
944     /// names we are looking for
945     lldb::FunctionNameType m_name_type_mask = lldb::eFunctionNameTypeNone;
946 
947     ///< If \b true, then demangled names that match will need to contain
948     ///< "m_name" in order to be considered a match
949     bool m_match_name_after_lookup = false;
950   };
951 
952   /// Get a unique hash for this module.
953   ///
954   /// The hash should be enough to identify the file on disk and the
955   /// architecture of the file. If the module represents an object inside of a
956   /// file, then the hash should include the object name and object offset to
957   /// ensure a unique hash. Some examples:
958   /// - just a regular object file (mach-o, elf, coff, etc) should create a hash
959   /// - a universal mach-o file that contains to multiple architectures,
960   ///   each architecture slice should have a unique hash even though they come
961   ///   from the same file
962   /// - a .o file inside of a BSD archive. Each .o file will have an object name
963   ///   and object offset that should produce a unique hash. The object offset
964   ///   is needed as BSD archive files can contain multiple .o files that have
965   ///   the same name.
966   uint32_t Hash();
967 
968   /// Get a unique cache key for the current module.
969   ///
970   /// The cache key must be unique for a file on disk and not change if the file
971   /// is updated. This allows cache data to use this key as a prefix and as
972   /// files are modified in disk, we will overwrite the cache files. If one file
973   /// can contain multiple files, like a universal mach-o file or like a BSD
974   /// archive, the cache key must contain enough information to differentiate
975   /// these different files.
976   std::string GetCacheKey();
977 
978   /// Get the global index file cache.
979   ///
980   /// LLDB can cache data for a module between runs. This cache directory can be
981   /// used to stored data that previously was manually created each time you debug.
982   /// Examples include debug information indexes, symbol tables, symbol table
983   /// indexes, and more.
984   ///
985   /// \returns
986   ///   If caching is enabled in the lldb settings, return a pointer to the data
987   ///   file cache. If caching is not enabled, return NULL.
988   static DataFileCache *GetIndexCache();
989 protected:
990   // Member Variables
991   mutable std::recursive_mutex m_mutex; ///< A mutex to keep this object happy
992                                         /// in multi-threaded environments.
993 
994   /// The modification time for this module when it was created.
995   llvm::sys::TimePoint<> m_mod_time;
996 
997   ArchSpec m_arch; ///< The architecture for this module.
998   UUID m_uuid; ///< Each module is assumed to have a unique identifier to help
999                /// match it up to debug symbols.
1000   FileSpec m_file; ///< The file representation on disk for this module (if
1001                    /// there is one).
1002   FileSpec m_platform_file; ///< The path to the module on the platform on which
1003                             /// it is being debugged
1004   FileSpec m_remote_install_file; ///< If set when debugging on remote
1005                                   /// platforms, this module will be installed
1006                                   /// at this location
1007   FileSpec m_symfile_spec;   ///< If this path is valid, then this is the file
1008                              /// that _will_ be used as the symbol file for this
1009                              /// module
1010   ConstString m_object_name; ///< The name an object within this module that is
1011                              /// selected, or empty of the module is represented
1012                              /// by \a m_file.
1013   uint64_t m_object_offset = 0;
1014   llvm::sys::TimePoint<> m_object_mod_time;
1015 
1016   /// DataBuffer containing the module image, if it was provided at
1017   /// construction time. Otherwise the data will be retrieved by mapping
1018   /// one of the FileSpec members above.
1019   lldb::DataBufferSP m_data_sp;
1020 
1021   lldb::ObjectFileSP m_objfile_sp; ///< A shared pointer to the object file
1022                                    /// parser for this module as it may or may
1023                                    /// not be shared with the SymbolFile
1024   std::optional<UnwindTable> m_unwind_table; ///< Table of FuncUnwinders
1025                                              /// objects created for this
1026                                              /// Module's functions
1027   lldb::SymbolVendorUP
1028       m_symfile_up; ///< A pointer to the symbol vendor for this module.
1029   std::vector<lldb::SymbolVendorUP>
1030       m_old_symfiles; ///< If anyone calls Module::SetSymbolFileFileSpec() and
1031                       /// changes the symbol file,
1032   ///< we need to keep all old symbol files around in case anyone has type
1033   /// references to them
1034   TypeSystemMap m_type_system_map; ///< A map of any type systems associated
1035                                    /// with this module
1036   /// Module specific source remappings for when you have debug info for a
1037   /// module that doesn't match where the sources currently are.
1038   PathMappingList m_source_mappings =
1039       ModuleList::GetGlobalModuleListProperties().GetSymlinkMappings();
1040 
1041   lldb::SectionListUP m_sections_up; ///< Unified section list for module that
1042                                      /// is used by the ObjectFile and
1043                                      /// ObjectFile instances for the debug info
1044 
1045   std::atomic<bool> m_did_load_objfile{false};
1046   std::atomic<bool> m_did_load_symfile{false};
1047   std::atomic<bool> m_did_set_uuid{false};
1048   mutable bool m_file_has_changed : 1,
1049       m_first_file_changed_log : 1; /// See if the module was modified after it
1050                                     /// was initially opened.
1051   /// We store a symbol table parse time duration here because we might have
1052   /// an object file and a symbol file which both have symbol tables. The parse
1053   /// time for the symbol tables can be aggregated here.
1054   StatsDuration m_symtab_parse_time;
1055   /// We store a symbol named index time duration here because we might have
1056   /// an object file and a symbol file which both have symbol tables. The parse
1057   /// time for the symbol tables can be aggregated here.
1058   StatsDuration m_symtab_index_time;
1059 
1060   std::once_flag m_optimization_warning;
1061   std::once_flag m_language_warning;
1062 
1063   void SymbolIndicesToSymbolContextList(Symtab *symtab,
1064                                         std::vector<uint32_t> &symbol_indexes,
1065                                         SymbolContextList &sc_list);
1066 
1067   bool SetArchitecture(const ArchSpec &new_arch);
1068 
1069   void SetUUID(const lldb_private::UUID &uuid);
1070 
1071   SectionList *GetUnifiedSectionList();
1072 
1073   friend class ModuleList;
1074   friend class ObjectFile;
1075   friend class SymbolFile;
1076 
1077 private:
1078   Module(); // Only used internally by CreateJITModule ()
1079 
1080   Module(const Module &) = delete;
1081   const Module &operator=(const Module &) = delete;
1082 
1083   void LogMessage(Log *log, const llvm::formatv_object_base &payload);
1084   void LogMessageVerboseBacktrace(Log *log,
1085                                   const llvm::formatv_object_base &payload);
1086   void ReportWarning(const llvm::formatv_object_base &payload);
1087   void ReportError(const llvm::formatv_object_base &payload);
1088   void ReportErrorIfModifyDetected(const llvm::formatv_object_base &payload);
1089 };
1090 
1091 } // namespace lldb_private
1092 
1093 #endif // LLDB_CORE_MODULE_H
1094