1//===-- MCJIT.h - Class definition for the MCJIT ----------------*- C++ -*-===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8
9#ifndef LLVM_LIB_EXECUTIONENGINE_MCJIT_MCJIT_H
10#define LLVM_LIB_EXECUTIONENGINE_MCJIT_MCJIT_H
11
12#include "llvm/ADT/SmallPtrSet.h"
13#include "llvm/ADT/SmallVector.h"
14#include "llvm/ExecutionEngine/ExecutionEngine.h"
15#include "llvm/ExecutionEngine/ObjectCache.h"
16#include "llvm/ExecutionEngine/RTDyldMemoryManager.h"
17#include "llvm/ExecutionEngine/RuntimeDyld.h"
18#include "llvm/IR/Module.h"
19#include "llvm/Support/SmallVectorMemoryBuffer.h"
20
21namespace llvm {
22class MCJIT;
23
24// This is a helper class that the MCJIT execution engine uses for linking
25// functions across modules that it owns.  It aggregates the memory manager
26// that is passed in to the MCJIT constructor and defers most functionality
27// to that object.
28class LinkingSymbolResolver : public LegacyJITSymbolResolver {
29public:
30  LinkingSymbolResolver(MCJIT &Parent,
31                        std::shared_ptr<LegacyJITSymbolResolver> Resolver)
32      : ParentEngine(Parent), ClientResolver(std::move(Resolver)) {}
33
34  JITSymbol findSymbol(const std::string &Name) override;
35
36  // MCJIT doesn't support logical dylibs.
37  JITSymbol findSymbolInLogicalDylib(const std::string &Name) override {
38    return nullptr;
39  }
40
41private:
42  MCJIT &ParentEngine;
43  std::shared_ptr<LegacyJITSymbolResolver> ClientResolver;
44  void anchor() override;
45};
46
47// About Module states: added->loaded->finalized.
48//
49// The purpose of the "added" state is having modules in standby. (added=known
50// but not compiled). The idea is that you can add a module to provide function
51// definitions but if nothing in that module is referenced by a module in which
52// a function is executed (note the wording here because it's not exactly the
53// ideal case) then the module never gets compiled. This is sort of lazy
54// compilation.
55//
56// The purpose of the "loaded" state (loaded=compiled and required sections
57// copied into local memory but not yet ready for execution) is to have an
58// intermediate state wherein clients can remap the addresses of sections, using
59// MCJIT::mapSectionAddress, (in preparation for later copying to a new location
60// or an external process) before relocations and page permissions are applied.
61//
62// It might not be obvious at first glance, but the "remote-mcjit" case in the
63// lli tool does this.  In that case, the intermediate action is taken by the
64// RemoteMemoryManager in response to the notifyObjectLoaded function being
65// called.
66
67class MCJIT : public ExecutionEngine {
68  MCJIT(std::unique_ptr<Module> M, std::unique_ptr<TargetMachine> tm,
69        std::shared_ptr<MCJITMemoryManager> MemMgr,
70        std::shared_ptr<LegacyJITSymbolResolver> Resolver);
71
72  typedef llvm::SmallPtrSet<Module *, 4> ModulePtrSet;
73
74  class OwningModuleContainer {
75  public:
76    OwningModuleContainer() {
77    }
78    ~OwningModuleContainer() {
79      freeModulePtrSet(AddedModules);
80      freeModulePtrSet(LoadedModules);
81      freeModulePtrSet(FinalizedModules);
82    }
83
84    ModulePtrSet::iterator begin_added() { return AddedModules.begin(); }
85    ModulePtrSet::iterator end_added() { return AddedModules.end(); }
86    iterator_range<ModulePtrSet::iterator> added() {
87      return make_range(begin_added(), end_added());
88    }
89
90    ModulePtrSet::iterator begin_loaded() { return LoadedModules.begin(); }
91    ModulePtrSet::iterator end_loaded() { return LoadedModules.end(); }
92
93    ModulePtrSet::iterator begin_finalized() { return FinalizedModules.begin(); }
94    ModulePtrSet::iterator end_finalized() { return FinalizedModules.end(); }
95
96    void addModule(std::unique_ptr<Module> M) {
97      AddedModules.insert(M.release());
98    }
99
100    bool removeModule(Module *M) {
101      return AddedModules.erase(M) || LoadedModules.erase(M) ||
102             FinalizedModules.erase(M);
103    }
104
105    bool hasModuleBeenAddedButNotLoaded(Module *M) {
106      return AddedModules.count(M) != 0;
107    }
108
109    bool hasModuleBeenLoaded(Module *M) {
110      // If the module is in either the "loaded" or "finalized" sections it
111      // has been loaded.
112      return (LoadedModules.count(M) != 0 ) || (FinalizedModules.count(M) != 0);
113    }
114
115    bool hasModuleBeenFinalized(Module *M) {
116      return FinalizedModules.count(M) != 0;
117    }
118
119    bool ownsModule(Module* M) {
120      return (AddedModules.count(M) != 0) || (LoadedModules.count(M) != 0) ||
121             (FinalizedModules.count(M) != 0);
122    }
123
124    void markModuleAsLoaded(Module *M) {
125      // This checks against logic errors in the MCJIT implementation.
126      // This function should never be called with either a Module that MCJIT
127      // does not own or a Module that has already been loaded and/or finalized.
128      assert(AddedModules.count(M) &&
129             "markModuleAsLoaded: Module not found in AddedModules");
130
131      // Remove the module from the "Added" set.
132      AddedModules.erase(M);
133
134      // Add the Module to the "Loaded" set.
135      LoadedModules.insert(M);
136    }
137
138    void markModuleAsFinalized(Module *M) {
139      // This checks against logic errors in the MCJIT implementation.
140      // This function should never be called with either a Module that MCJIT
141      // does not own, a Module that has not been loaded or a Module that has
142      // already been finalized.
143      assert(LoadedModules.count(M) &&
144             "markModuleAsFinalized: Module not found in LoadedModules");
145
146      // Remove the module from the "Loaded" section of the list.
147      LoadedModules.erase(M);
148
149      // Add the Module to the "Finalized" section of the list by inserting it
150      // before the 'end' iterator.
151      FinalizedModules.insert(M);
152    }
153
154    void markAllLoadedModulesAsFinalized() {
155      for (ModulePtrSet::iterator I = LoadedModules.begin(),
156                                  E = LoadedModules.end();
157           I != E; ++I) {
158        Module *M = *I;
159        FinalizedModules.insert(M);
160      }
161      LoadedModules.clear();
162    }
163
164  private:
165    ModulePtrSet AddedModules;
166    ModulePtrSet LoadedModules;
167    ModulePtrSet FinalizedModules;
168
169    void freeModulePtrSet(ModulePtrSet& MPS) {
170      // Go through the module set and delete everything.
171      for (ModulePtrSet::iterator I = MPS.begin(), E = MPS.end(); I != E; ++I) {
172        Module *M = *I;
173        delete M;
174      }
175      MPS.clear();
176    }
177  };
178
179  std::unique_ptr<TargetMachine> TM;
180  MCContext *Ctx;
181  std::shared_ptr<MCJITMemoryManager> MemMgr;
182  LinkingSymbolResolver Resolver;
183  RuntimeDyld Dyld;
184  std::vector<JITEventListener*> EventListeners;
185
186  OwningModuleContainer OwnedModules;
187
188  SmallVector<object::OwningBinary<object::Archive>, 2> Archives;
189  SmallVector<std::unique_ptr<MemoryBuffer>, 2> Buffers;
190
191  SmallVector<std::unique_ptr<object::ObjectFile>, 2> LoadedObjects;
192
193  // An optional ObjectCache to be notified of compiled objects and used to
194  // perform lookup of pre-compiled code to avoid re-compilation.
195  ObjectCache *ObjCache;
196
197  Function *FindFunctionNamedInModulePtrSet(StringRef FnName,
198                                            ModulePtrSet::iterator I,
199                                            ModulePtrSet::iterator E);
200
201  GlobalVariable *FindGlobalVariableNamedInModulePtrSet(StringRef Name,
202                                                        bool AllowInternal,
203                                                        ModulePtrSet::iterator I,
204                                                        ModulePtrSet::iterator E);
205
206  void runStaticConstructorsDestructorsInModulePtrSet(bool isDtors,
207                                                      ModulePtrSet::iterator I,
208                                                      ModulePtrSet::iterator E);
209
210public:
211  ~MCJIT() override;
212
213  /// @name ExecutionEngine interface implementation
214  /// @{
215  void addModule(std::unique_ptr<Module> M) override;
216  void addObjectFile(std::unique_ptr<object::ObjectFile> O) override;
217  void addObjectFile(object::OwningBinary<object::ObjectFile> O) override;
218  void addArchive(object::OwningBinary<object::Archive> O) override;
219  bool removeModule(Module *M) override;
220
221  /// FindFunctionNamed - Search all of the active modules to find the function that
222  /// defines FnName.  This is very slow operation and shouldn't be used for
223  /// general code.
224  Function *FindFunctionNamed(StringRef FnName) override;
225
226  /// FindGlobalVariableNamed - Search all of the active modules to find the
227  /// global variable that defines Name.  This is very slow operation and
228  /// shouldn't be used for general code.
229  GlobalVariable *FindGlobalVariableNamed(StringRef Name,
230                                          bool AllowInternal = false) override;
231
232  /// Sets the object manager that MCJIT should use to avoid compilation.
233  void setObjectCache(ObjectCache *manager) override;
234
235  void setProcessAllSections(bool ProcessAllSections) override {
236    Dyld.setProcessAllSections(ProcessAllSections);
237  }
238
239  void generateCodeForModule(Module *M) override;
240
241  /// finalizeObject - ensure the module is fully processed and is usable.
242  ///
243  /// It is the user-level function for completing the process of making the
244  /// object usable for execution. It should be called after sections within an
245  /// object have been relocated using mapSectionAddress.  When this method is
246  /// called the MCJIT execution engine will reapply relocations for a loaded
247  /// object.
248  /// Is it OK to finalize a set of modules, add modules and finalize again.
249  // FIXME: Do we really need both of these?
250  void finalizeObject() override;
251  virtual void finalizeModule(Module *);
252  void finalizeLoadedModules();
253
254  /// runStaticConstructorsDestructors - This method is used to execute all of
255  /// the static constructors or destructors for a program.
256  ///
257  /// \param isDtors - Run the destructors instead of constructors.
258  void runStaticConstructorsDestructors(bool isDtors) override;
259
260  void *getPointerToFunction(Function *F) override;
261
262  GenericValue runFunction(Function *F,
263                           ArrayRef<GenericValue> ArgValues) override;
264
265  /// getPointerToNamedFunction - This method returns the address of the
266  /// specified function by using the dlsym function call.  As such it is only
267  /// useful for resolving library symbols, not code generated symbols.
268  ///
269  /// If AbortOnFailure is false and no function with the given name is
270  /// found, this function silently returns a null pointer. Otherwise,
271  /// it prints a message to stderr and aborts.
272  ///
273  void *getPointerToNamedFunction(StringRef Name,
274                                  bool AbortOnFailure = true) override;
275
276  /// mapSectionAddress - map a section to its target address space value.
277  /// Map the address of a JIT section as returned from the memory manager
278  /// to the address in the target process as the running code will see it.
279  /// This is the address which will be used for relocation resolution.
280  void mapSectionAddress(const void *LocalAddress,
281                         uint64_t TargetAddress) override {
282    Dyld.mapSectionAddress(LocalAddress, TargetAddress);
283  }
284  void RegisterJITEventListener(JITEventListener *L) override;
285  void UnregisterJITEventListener(JITEventListener *L) override;
286
287  // If successful, these function will implicitly finalize all loaded objects.
288  // To get a function address within MCJIT without causing a finalize, use
289  // getSymbolAddress.
290  uint64_t getGlobalValueAddress(const std::string &Name) override;
291  uint64_t getFunctionAddress(const std::string &Name) override;
292
293  TargetMachine *getTargetMachine() override { return TM.get(); }
294
295  /// @}
296  /// @name (Private) Registration Interfaces
297  /// @{
298
299  static void Register() {
300    MCJITCtor = createJIT;
301  }
302
303  static ExecutionEngine *
304  createJIT(std::unique_ptr<Module> M, std::string *ErrorStr,
305            std::shared_ptr<MCJITMemoryManager> MemMgr,
306            std::shared_ptr<LegacyJITSymbolResolver> Resolver,
307            std::unique_ptr<TargetMachine> TM);
308
309  // @}
310
311  // Takes a mangled name and returns the corresponding JITSymbol (if a
312  // definition of that mangled name has been added to the JIT).
313  JITSymbol findSymbol(const std::string &Name, bool CheckFunctionsOnly);
314
315  // DEPRECATED - Please use findSymbol instead.
316  //
317  // This is not directly exposed via the ExecutionEngine API, but it is
318  // used by the LinkingMemoryManager.
319  //
320  // getSymbolAddress takes an unmangled name and returns the corresponding
321  // JITSymbol if a definition of the name has been added to the JIT.
322  uint64_t getSymbolAddress(const std::string &Name,
323                            bool CheckFunctionsOnly);
324
325protected:
326  /// emitObject -- Generate a JITed object in memory from the specified module
327  /// Currently, MCJIT only supports a single module and the module passed to
328  /// this function call is expected to be the contained module.  The module
329  /// is passed as a parameter here to prepare for multiple module support in
330  /// the future.
331  std::unique_ptr<MemoryBuffer> emitObject(Module *M);
332
333  void notifyObjectLoaded(const object::ObjectFile &Obj,
334                          const RuntimeDyld::LoadedObjectInfo &L);
335  void notifyFreeingObject(const object::ObjectFile &Obj);
336
337  JITSymbol findExistingSymbol(const std::string &Name);
338  Module *findModuleForSymbol(const std::string &Name, bool CheckFunctionsOnly);
339};
340
341} // end llvm namespace
342
343#endif // LLVM_LIB_EXECUTIONENGINE_MCJIT_MCJIT_H
344