1 //===- RuntimeDyld.h - Run-time dynamic linker for MC-JIT -------*- C++ -*-===//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8 //
9 // Interface for the runtime dynamic linker facilities of the MC-JIT.
10 //
11 //===----------------------------------------------------------------------===//
12 
13 #ifndef LLVM_EXECUTIONENGINE_RUNTIMEDYLD_H
14 #define LLVM_EXECUTIONENGINE_RUNTIMEDYLD_H
15 
16 #include "llvm/ADT/FunctionExtras.h"
17 #include "llvm/ADT/STLExtras.h"
18 #include "llvm/ADT/StringRef.h"
19 #include "llvm/DebugInfo/DIContext.h"
20 #include "llvm/ExecutionEngine/JITSymbol.h"
21 #include "llvm/Object/ObjectFile.h"
22 #include "llvm/Support/Error.h"
23 #include <algorithm>
24 #include <cassert>
25 #include <cstddef>
26 #include <cstdint>
27 #include <map>
28 #include <memory>
29 #include <string>
30 #include <system_error>
31 
32 namespace llvm {
33 
namespace object {

// Forward declaration: within this header OwningBinary is only named in
// function declarations (as a parameter or return type).
template <class T> class OwningBinary;

} // end namespace object
39 
40 /// Base class for errors originating in RuntimeDyld, e.g. missing relocation
41 /// support.
42 class RuntimeDyldError : public ErrorInfo<RuntimeDyldError> {
43 public:
44   static char ID;
45 
46   RuntimeDyldError(std::string ErrMsg) : ErrMsg(std::move(ErrMsg)) {}
47 
48   void log(raw_ostream &OS) const override;
49   const std::string &getErrorMessage() const { return ErrMsg; }
50   std::error_code convertToErrorCode() const override;
51 
52 private:
53   std::string ErrMsg;
54 };
55 
56 class RuntimeDyldImpl;
57 
58 class RuntimeDyld {
59 public:
60   // Change the address associated with a section when resolving relocations.
61   // Any relocations already associated with the symbol will be re-resolved.
62   void reassignSectionAddress(unsigned SectionID, uint64_t Addr);
63 
64   using NotifyStubEmittedFunction = std::function<void(
65       StringRef FileName, StringRef SectionName, StringRef SymbolName,
66       unsigned SectionID, uint32_t StubOffset)>;
67 
68   /// Information about the loaded object.
69   class LoadedObjectInfo : public llvm::LoadedObjectInfo {
70     friend class RuntimeDyldImpl;
71 
72   public:
73     using ObjSectionToIDMap = std::map<object::SectionRef, unsigned>;
74 
75     LoadedObjectInfo(RuntimeDyldImpl &RTDyld, ObjSectionToIDMap ObjSecToIDMap)
76         : RTDyld(RTDyld), ObjSecToIDMap(std::move(ObjSecToIDMap)) {}
77 
78     virtual object::OwningBinary<object::ObjectFile>
79     getObjectForDebug(const object::ObjectFile &Obj) const = 0;
80 
81     uint64_t
82     getSectionLoadAddress(const object::SectionRef &Sec) const override;
83 
84   protected:
85     virtual void anchor();
86 
87     RuntimeDyldImpl &RTDyld;
88     ObjSectionToIDMap ObjSecToIDMap;
89   };
90 
91   /// Memory Management.
92   class MemoryManager {
93     friend class RuntimeDyld;
94 
95   public:
96     MemoryManager() = default;
97     virtual ~MemoryManager() = default;
98 
99     /// Allocate a memory block of (at least) the given size suitable for
100     /// executable code. The SectionID is a unique identifier assigned by the
101     /// RuntimeDyld instance, and optionally recorded by the memory manager to
102     /// access a loaded section.
103     virtual uint8_t *allocateCodeSection(uintptr_t Size, unsigned Alignment,
104                                          unsigned SectionID,
105                                          StringRef SectionName) = 0;
106 
107     /// Allocate a memory block of (at least) the given size suitable for data.
108     /// The SectionID is a unique identifier assigned by the JIT engine, and
109     /// optionally recorded by the memory manager to access a loaded section.
110     virtual uint8_t *allocateDataSection(uintptr_t Size, unsigned Alignment,
111                                          unsigned SectionID,
112                                          StringRef SectionName,
113                                          bool IsReadOnly) = 0;
114 
115     /// An allocated TLS section
116     struct TLSSection {
117       /// The pointer to the initialization image
118       uint8_t *InitializationImage;
119       /// The TLS offset
120       intptr_t Offset;
121     };
122 
123     /// Allocate a memory block of (at least) the given size to be used for
124     /// thread-local storage (TLS).
125     virtual TLSSection allocateTLSSection(uintptr_t Size, unsigned Alignment,
126                                           unsigned SectionID,
127                                           StringRef SectionName);
128 
129     /// Inform the memory manager about the total amount of memory required to
130     /// allocate all sections to be loaded:
131     /// \p CodeSize - the total size of all code sections
132     /// \p DataSizeRO - the total size of all read-only data sections
133     /// \p DataSizeRW - the total size of all read-write data sections
134     ///
135     /// Note that by default the callback is disabled. To enable it
136     /// redefine the method needsToReserveAllocationSpace to return true.
137     virtual void reserveAllocationSpace(uintptr_t CodeSize, uint32_t CodeAlign,
138                                         uintptr_t RODataSize,
139                                         uint32_t RODataAlign,
140                                         uintptr_t RWDataSize,
141                                         uint32_t RWDataAlign) {}
142 
143     /// Override to return true to enable the reserveAllocationSpace callback.
144     virtual bool needsToReserveAllocationSpace() { return false; }
145 
146     /// Override to return false to tell LLVM no stub space will be needed.
147     /// This requires some guarantees depending on architecuture, but when
148     /// you know what you are doing it saves allocated space.
149     virtual bool allowStubAllocation() const { return true; }
150 
151     /// Register the EH frames with the runtime so that c++ exceptions work.
152     ///
153     /// \p Addr parameter provides the local address of the EH frame section
154     /// data, while \p LoadAddr provides the address of the data in the target
155     /// address space.  If the section has not been remapped (which will usually
156     /// be the case for local execution) these two values will be the same.
157     virtual void registerEHFrames(uint8_t *Addr, uint64_t LoadAddr,
158                                   size_t Size) = 0;
159     virtual void deregisterEHFrames() = 0;
160 
161     /// This method is called when object loading is complete and section page
162     /// permissions can be applied.  It is up to the memory manager implementation
163     /// to decide whether or not to act on this method.  The memory manager will
164     /// typically allocate all sections as read-write and then apply specific
165     /// permissions when this method is called.  Code sections cannot be executed
166     /// until this function has been called.  In addition, any cache coherency
167     /// operations needed to reliably use the memory are also performed.
168     ///
169     /// Returns true if an error occurred, false otherwise.
170     virtual bool finalizeMemory(std::string *ErrMsg = nullptr) = 0;
171 
172     /// This method is called after an object has been loaded into memory but
173     /// before relocations are applied to the loaded sections.
174     ///
175     /// Memory managers which are preparing code for execution in an external
176     /// address space can use this call to remap the section addresses for the
177     /// newly loaded object.
178     ///
179     /// For clients that do not need access to an ExecutionEngine instance this
180     /// method should be preferred to its cousin
181     /// MCJITMemoryManager::notifyObjectLoaded as this method is compatible with
182     /// ORC JIT stacks.
183     virtual void notifyObjectLoaded(RuntimeDyld &RTDyld,
184                                     const object::ObjectFile &Obj) {}
185 
186   private:
187     virtual void anchor();
188 
189     bool FinalizationLocked = false;
190   };
191 
192   /// Construct a RuntimeDyld instance.
193   RuntimeDyld(MemoryManager &MemMgr, JITSymbolResolver &Resolver);
194   RuntimeDyld(const RuntimeDyld &) = delete;
195   RuntimeDyld &operator=(const RuntimeDyld &) = delete;
196   ~RuntimeDyld();
197 
198   /// Add the referenced object file to the list of objects to be loaded and
199   /// relocated.
200   std::unique_ptr<LoadedObjectInfo> loadObject(const object::ObjectFile &O);
201 
202   /// Get the address of our local copy of the symbol. This may or may not
203   /// be the address used for relocation (clients can copy the data around
204   /// and resolve relocatons based on where they put it).
205   void *getSymbolLocalAddress(StringRef Name) const;
206 
207   /// Get the section ID for the section containing the given symbol.
208   unsigned getSymbolSectionID(StringRef Name) const;
209 
210   /// Get the target address and flags for the named symbol.
211   /// This address is the one used for relocation.
212   JITEvaluatedSymbol getSymbol(StringRef Name) const;
213 
214   /// Returns a copy of the symbol table. This can be used by on-finalized
215   /// callbacks to extract the symbol table before throwing away the
216   /// RuntimeDyld instance. Because the map keys (StringRefs) are backed by
217   /// strings inside the RuntimeDyld instance, the map should be processed
218   /// before the RuntimeDyld instance is discarded.
219   std::map<StringRef, JITEvaluatedSymbol> getSymbolTable() const;
220 
221   /// Resolve the relocations for all symbols we currently know about.
222   void resolveRelocations();
223 
224   /// Map a section to its target address space value.
225   /// Map the address of a JIT section as returned from the memory manager
226   /// to the address in the target process as the running code will see it.
227   /// This is the address which will be used for relocation resolution.
228   void mapSectionAddress(const void *LocalAddress, uint64_t TargetAddress);
229 
230   /// Returns the section's working memory.
231   StringRef getSectionContent(unsigned SectionID) const;
232 
233   /// If the section was loaded, return the section's load address,
234   /// otherwise return None.
235   uint64_t getSectionLoadAddress(unsigned SectionID) const;
236 
237   /// Set the NotifyStubEmitted callback. This is used for debugging
238   /// purposes. A callback is made for each stub that is generated.
239   void setNotifyStubEmitted(NotifyStubEmittedFunction NotifyStubEmitted) {
240     this->NotifyStubEmitted = std::move(NotifyStubEmitted);
241   }
242 
243   /// Register any EH frame sections that have been loaded but not previously
244   /// registered with the memory manager.  Note, RuntimeDyld is responsible
245   /// for identifying the EH frame and calling the memory manager with the
246   /// EH frame section data.  However, the memory manager itself will handle
247   /// the actual target-specific EH frame registration.
248   void registerEHFrames();
249 
250   void deregisterEHFrames();
251 
252   bool hasError();
253   StringRef getErrorString();
254 
255   /// By default, only sections that are "required for execution" are passed to
256   /// the RTDyldMemoryManager, and other sections are discarded. Passing 'true'
257   /// to this method will cause RuntimeDyld to pass all sections to its
258   /// memory manager regardless of whether they are "required to execute" in the
259   /// usual sense. This is useful for inspecting metadata sections that may not
260   /// contain relocations, E.g. Debug info, stackmaps.
261   ///
262   /// Must be called before the first object file is loaded.
263   void setProcessAllSections(bool ProcessAllSections) {
264     assert(!Dyld && "setProcessAllSections must be called before loadObject.");
265     this->ProcessAllSections = ProcessAllSections;
266   }
267 
268   /// Perform all actions needed to make the code owned by this RuntimeDyld
269   /// instance executable:
270   ///
271   /// 1) Apply relocations.
272   /// 2) Register EH frames.
273   /// 3) Update memory permissions*.
274   ///
275   /// * Finalization is potentially recursive**, and the 3rd step will only be
276   ///   applied by the outermost call to finalize. This allows different
277   ///   RuntimeDyld instances to share a memory manager without the innermost
278   ///   finalization locking the memory and causing relocation fixup errors in
279   ///   outer instances.
280   ///
281   /// ** Recursive finalization occurs when one RuntimeDyld instances needs the
282   ///   address of a symbol owned by some other instance in order to apply
283   ///   relocations.
284   ///
285   void finalizeWithMemoryManagerLocking();
286 
287 private:
288   friend void jitLinkForORC(
289       object::OwningBinary<object::ObjectFile> O,
290       RuntimeDyld::MemoryManager &MemMgr, JITSymbolResolver &Resolver,
291       bool ProcessAllSections,
292       unique_function<Error(const object::ObjectFile &Obj, LoadedObjectInfo &,
293                             std::map<StringRef, JITEvaluatedSymbol>)>
294           OnLoaded,
295       unique_function<void(object::OwningBinary<object::ObjectFile> O,
296                            std::unique_ptr<LoadedObjectInfo>, Error)>
297           OnEmitted);
298 
299   // RuntimeDyldImpl is the actual class. RuntimeDyld is just the public
300   // interface.
301   std::unique_ptr<RuntimeDyldImpl> Dyld;
302   MemoryManager &MemMgr;
303   JITSymbolResolver &Resolver;
304   bool ProcessAllSections;
305   NotifyStubEmittedFunction NotifyStubEmitted;
306 };
307 
308 // Asynchronous JIT link for ORC.
309 //
310 // Warning: This API is experimental and probably should not be used by anyone
311 // but ORC's RTDyldObjectLinkingLayer2. Internally it constructs a RuntimeDyld
312 // instance and uses continuation passing to perform the fix-up and finalize
313 // steps asynchronously.
314 void jitLinkForORC(
315     object::OwningBinary<object::ObjectFile> O,
316     RuntimeDyld::MemoryManager &MemMgr, JITSymbolResolver &Resolver,
317     bool ProcessAllSections,
318     unique_function<Error(const object::ObjectFile &Obj,
319                           RuntimeDyld::LoadedObjectInfo &,
320                           std::map<StringRef, JITEvaluatedSymbol>)>
321         OnLoaded,
322     unique_function<void(object::OwningBinary<object::ObjectFile>,
323                          std::unique_ptr<RuntimeDyld::LoadedObjectInfo>, Error)>
324         OnEmitted);
325 
326 } // end namespace llvm
327 
328 #endif // LLVM_EXECUTIONENGINE_RUNTIMEDYLD_H
329