1 //===- RuntimeDyld.h - Run-time dynamic linker for MC-JIT -------*- C++ -*-===// 2 // 3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 4 // See https://llvm.org/LICENSE.txt for license information. 5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 6 // 7 //===----------------------------------------------------------------------===// 8 // 9 // Interface for the runtime dynamic linker facilities of the MC-JIT. 10 // 11 //===----------------------------------------------------------------------===// 12 13 #ifndef LLVM_EXECUTIONENGINE_RUNTIMEDYLD_H 14 #define LLVM_EXECUTIONENGINE_RUNTIMEDYLD_H 15 16 #include "llvm/ADT/FunctionExtras.h" 17 #include "llvm/ADT/STLExtras.h" 18 #include "llvm/ADT/StringRef.h" 19 #include "llvm/DebugInfo/DIContext.h" 20 #include "llvm/ExecutionEngine/JITSymbol.h" 21 #include "llvm/Object/ObjectFile.h" 22 #include "llvm/Support/Error.h" 23 #include <algorithm> 24 #include <cassert> 25 #include <cstddef> 26 #include <cstdint> 27 #include <map> 28 #include <memory> 29 #include <string> 30 #include <system_error> 31 32 namespace llvm { 33 34 namespace object { 35 36 template <typename T> class OwningBinary; 37 38 } // end namespace object 39 40 /// Base class for errors originating in RuntimeDyld, e.g. missing relocation 41 /// support. 42 class RuntimeDyldError : public ErrorInfo<RuntimeDyldError> { 43 public: 44 static char ID; 45 46 RuntimeDyldError(std::string ErrMsg) : ErrMsg(std::move(ErrMsg)) {} 47 48 void log(raw_ostream &OS) const override; 49 const std::string &getErrorMessage() const { return ErrMsg; } 50 std::error_code convertToErrorCode() const override; 51 52 private: 53 std::string ErrMsg; 54 }; 55 56 class RuntimeDyldImpl; 57 58 class RuntimeDyld { 59 public: 60 // Change the address associated with a section when resolving relocations. 61 // Any relocations already associated with the symbol will be re-resolved. 62 void reassignSectionAddress(unsigned SectionID, uint64_t Addr); 63 64 using NotifyStubEmittedFunction = std::function<void( 65 StringRef FileName, StringRef SectionName, StringRef SymbolName, 66 unsigned SectionID, uint32_t StubOffset)>; 67 68 /// Information about the loaded object. 69 class LoadedObjectInfo : public llvm::LoadedObjectInfo { 70 friend class RuntimeDyldImpl; 71 72 public: 73 using ObjSectionToIDMap = std::map<object::SectionRef, unsigned>; 74 75 LoadedObjectInfo(RuntimeDyldImpl &RTDyld, ObjSectionToIDMap ObjSecToIDMap) 76 : RTDyld(RTDyld), ObjSecToIDMap(std::move(ObjSecToIDMap)) {} 77 78 virtual object::OwningBinary<object::ObjectFile> 79 getObjectForDebug(const object::ObjectFile &Obj) const = 0; 80 81 uint64_t 82 getSectionLoadAddress(const object::SectionRef &Sec) const override; 83 84 protected: 85 virtual void anchor(); 86 87 RuntimeDyldImpl &RTDyld; 88 ObjSectionToIDMap ObjSecToIDMap; 89 }; 90 91 /// Memory Management. 92 class MemoryManager { 93 friend class RuntimeDyld; 94 95 public: 96 MemoryManager() = default; 97 virtual ~MemoryManager() = default; 98 99 /// Allocate a memory block of (at least) the given size suitable for 100 /// executable code. The SectionID is a unique identifier assigned by the 101 /// RuntimeDyld instance, and optionally recorded by the memory manager to 102 /// access a loaded section. 103 virtual uint8_t *allocateCodeSection(uintptr_t Size, unsigned Alignment, 104 unsigned SectionID, 105 StringRef SectionName) = 0; 106 107 /// Allocate a memory block of (at least) the given size suitable for data. 108 /// The SectionID is a unique identifier assigned by the JIT engine, and 109 /// optionally recorded by the memory manager to access a loaded section. 110 virtual uint8_t *allocateDataSection(uintptr_t Size, unsigned Alignment, 111 unsigned SectionID, 112 StringRef SectionName, 113 bool IsReadOnly) = 0; 114 115 /// An allocated TLS section 116 struct TLSSection { 117 /// The pointer to the initialization image 118 uint8_t *InitializationImage; 119 /// The TLS offset 120 intptr_t Offset; 121 }; 122 123 /// Allocate a memory block of (at least) the given size to be used for 124 /// thread-local storage (TLS). 125 virtual TLSSection allocateTLSSection(uintptr_t Size, unsigned Alignment, 126 unsigned SectionID, 127 StringRef SectionName); 128 129 /// Inform the memory manager about the total amount of memory required to 130 /// allocate all sections to be loaded: 131 /// \p CodeSize - the total size of all code sections 132 /// \p DataSizeRO - the total size of all read-only data sections 133 /// \p DataSizeRW - the total size of all read-write data sections 134 /// 135 /// Note that by default the callback is disabled. To enable it 136 /// redefine the method needsToReserveAllocationSpace to return true. 137 virtual void reserveAllocationSpace(uintptr_t CodeSize, uint32_t CodeAlign, 138 uintptr_t RODataSize, 139 uint32_t RODataAlign, 140 uintptr_t RWDataSize, 141 uint32_t RWDataAlign) {} 142 143 /// Override to return true to enable the reserveAllocationSpace callback. 144 virtual bool needsToReserveAllocationSpace() { return false; } 145 146 /// Override to return false to tell LLVM no stub space will be needed. 147 /// This requires some guarantees depending on architecuture, but when 148 /// you know what you are doing it saves allocated space. 149 virtual bool allowStubAllocation() const { return true; } 150 151 /// Register the EH frames with the runtime so that c++ exceptions work. 152 /// 153 /// \p Addr parameter provides the local address of the EH frame section 154 /// data, while \p LoadAddr provides the address of the data in the target 155 /// address space. If the section has not been remapped (which will usually 156 /// be the case for local execution) these two values will be the same. 157 virtual void registerEHFrames(uint8_t *Addr, uint64_t LoadAddr, 158 size_t Size) = 0; 159 virtual void deregisterEHFrames() = 0; 160 161 /// This method is called when object loading is complete and section page 162 /// permissions can be applied. It is up to the memory manager implementation 163 /// to decide whether or not to act on this method. The memory manager will 164 /// typically allocate all sections as read-write and then apply specific 165 /// permissions when this method is called. Code sections cannot be executed 166 /// until this function has been called. In addition, any cache coherency 167 /// operations needed to reliably use the memory are also performed. 168 /// 169 /// Returns true if an error occurred, false otherwise. 170 virtual bool finalizeMemory(std::string *ErrMsg = nullptr) = 0; 171 172 /// This method is called after an object has been loaded into memory but 173 /// before relocations are applied to the loaded sections. 174 /// 175 /// Memory managers which are preparing code for execution in an external 176 /// address space can use this call to remap the section addresses for the 177 /// newly loaded object. 178 /// 179 /// For clients that do not need access to an ExecutionEngine instance this 180 /// method should be preferred to its cousin 181 /// MCJITMemoryManager::notifyObjectLoaded as this method is compatible with 182 /// ORC JIT stacks. 183 virtual void notifyObjectLoaded(RuntimeDyld &RTDyld, 184 const object::ObjectFile &Obj) {} 185 186 private: 187 virtual void anchor(); 188 189 bool FinalizationLocked = false; 190 }; 191 192 /// Construct a RuntimeDyld instance. 193 RuntimeDyld(MemoryManager &MemMgr, JITSymbolResolver &Resolver); 194 RuntimeDyld(const RuntimeDyld &) = delete; 195 RuntimeDyld &operator=(const RuntimeDyld &) = delete; 196 ~RuntimeDyld(); 197 198 /// Add the referenced object file to the list of objects to be loaded and 199 /// relocated. 200 std::unique_ptr<LoadedObjectInfo> loadObject(const object::ObjectFile &O); 201 202 /// Get the address of our local copy of the symbol. This may or may not 203 /// be the address used for relocation (clients can copy the data around 204 /// and resolve relocatons based on where they put it). 205 void *getSymbolLocalAddress(StringRef Name) const; 206 207 /// Get the section ID for the section containing the given symbol. 208 unsigned getSymbolSectionID(StringRef Name) const; 209 210 /// Get the target address and flags for the named symbol. 211 /// This address is the one used for relocation. 212 JITEvaluatedSymbol getSymbol(StringRef Name) const; 213 214 /// Returns a copy of the symbol table. This can be used by on-finalized 215 /// callbacks to extract the symbol table before throwing away the 216 /// RuntimeDyld instance. Because the map keys (StringRefs) are backed by 217 /// strings inside the RuntimeDyld instance, the map should be processed 218 /// before the RuntimeDyld instance is discarded. 219 std::map<StringRef, JITEvaluatedSymbol> getSymbolTable() const; 220 221 /// Resolve the relocations for all symbols we currently know about. 222 void resolveRelocations(); 223 224 /// Map a section to its target address space value. 225 /// Map the address of a JIT section as returned from the memory manager 226 /// to the address in the target process as the running code will see it. 227 /// This is the address which will be used for relocation resolution. 228 void mapSectionAddress(const void *LocalAddress, uint64_t TargetAddress); 229 230 /// Returns the section's working memory. 231 StringRef getSectionContent(unsigned SectionID) const; 232 233 /// If the section was loaded, return the section's load address, 234 /// otherwise return None. 235 uint64_t getSectionLoadAddress(unsigned SectionID) const; 236 237 /// Set the NotifyStubEmitted callback. This is used for debugging 238 /// purposes. A callback is made for each stub that is generated. 239 void setNotifyStubEmitted(NotifyStubEmittedFunction NotifyStubEmitted) { 240 this->NotifyStubEmitted = std::move(NotifyStubEmitted); 241 } 242 243 /// Register any EH frame sections that have been loaded but not previously 244 /// registered with the memory manager. Note, RuntimeDyld is responsible 245 /// for identifying the EH frame and calling the memory manager with the 246 /// EH frame section data. However, the memory manager itself will handle 247 /// the actual target-specific EH frame registration. 248 void registerEHFrames(); 249 250 void deregisterEHFrames(); 251 252 bool hasError(); 253 StringRef getErrorString(); 254 255 /// By default, only sections that are "required for execution" are passed to 256 /// the RTDyldMemoryManager, and other sections are discarded. Passing 'true' 257 /// to this method will cause RuntimeDyld to pass all sections to its 258 /// memory manager regardless of whether they are "required to execute" in the 259 /// usual sense. This is useful for inspecting metadata sections that may not 260 /// contain relocations, E.g. Debug info, stackmaps. 261 /// 262 /// Must be called before the first object file is loaded. 263 void setProcessAllSections(bool ProcessAllSections) { 264 assert(!Dyld && "setProcessAllSections must be called before loadObject."); 265 this->ProcessAllSections = ProcessAllSections; 266 } 267 268 /// Perform all actions needed to make the code owned by this RuntimeDyld 269 /// instance executable: 270 /// 271 /// 1) Apply relocations. 272 /// 2) Register EH frames. 273 /// 3) Update memory permissions*. 274 /// 275 /// * Finalization is potentially recursive**, and the 3rd step will only be 276 /// applied by the outermost call to finalize. This allows different 277 /// RuntimeDyld instances to share a memory manager without the innermost 278 /// finalization locking the memory and causing relocation fixup errors in 279 /// outer instances. 280 /// 281 /// ** Recursive finalization occurs when one RuntimeDyld instances needs the 282 /// address of a symbol owned by some other instance in order to apply 283 /// relocations. 284 /// 285 void finalizeWithMemoryManagerLocking(); 286 287 private: 288 friend void jitLinkForORC( 289 object::OwningBinary<object::ObjectFile> O, 290 RuntimeDyld::MemoryManager &MemMgr, JITSymbolResolver &Resolver, 291 bool ProcessAllSections, 292 unique_function<Error(const object::ObjectFile &Obj, LoadedObjectInfo &, 293 std::map<StringRef, JITEvaluatedSymbol>)> 294 OnLoaded, 295 unique_function<void(object::OwningBinary<object::ObjectFile> O, 296 std::unique_ptr<LoadedObjectInfo>, Error)> 297 OnEmitted); 298 299 // RuntimeDyldImpl is the actual class. RuntimeDyld is just the public 300 // interface. 301 std::unique_ptr<RuntimeDyldImpl> Dyld; 302 MemoryManager &MemMgr; 303 JITSymbolResolver &Resolver; 304 bool ProcessAllSections; 305 NotifyStubEmittedFunction NotifyStubEmitted; 306 }; 307 308 // Asynchronous JIT link for ORC. 309 // 310 // Warning: This API is experimental and probably should not be used by anyone 311 // but ORC's RTDyldObjectLinkingLayer2. Internally it constructs a RuntimeDyld 312 // instance and uses continuation passing to perform the fix-up and finalize 313 // steps asynchronously. 314 void jitLinkForORC( 315 object::OwningBinary<object::ObjectFile> O, 316 RuntimeDyld::MemoryManager &MemMgr, JITSymbolResolver &Resolver, 317 bool ProcessAllSections, 318 unique_function<Error(const object::ObjectFile &Obj, 319 RuntimeDyld::LoadedObjectInfo &, 320 std::map<StringRef, JITEvaluatedSymbol>)> 321 OnLoaded, 322 unique_function<void(object::OwningBinary<object::ObjectFile>, 323 std::unique_ptr<RuntimeDyld::LoadedObjectInfo>, Error)> 324 OnEmitted); 325 326 } // end namespace llvm 327 328 #endif // LLVM_EXECUTIONENGINE_RUNTIMEDYLD_H 329