1 //===- JITSymbol.h - JIT symbol abstraction ---------------------*- C++ -*-===//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8 //
9 // Abstraction for target process addresses.
10 //
11 //===----------------------------------------------------------------------===//
12
13 #ifndef LLVM_EXECUTIONENGINE_JITSYMBOL_H
14 #define LLVM_EXECUTIONENGINE_JITSYMBOL_H
15
#include <algorithm>
#include <cassert>
#include <cstddef>
#include <cstdint>
#include <functional>
#include <map>
#include <new>
#include <set>
#include <string>
#include <type_traits>
#include <utility>

#include "llvm/ADT/BitmaskEnum.h"
#include "llvm/ADT/FunctionExtras.h"
#include "llvm/ADT/StringRef.h"
#include "llvm/Support/Error.h"
29
30 namespace llvm {
31
32 class GlobalValue;
33 class GlobalValueSummary;
34
35 namespace object {
36
37 class SymbolRef;
38
39 } // end namespace object
40
/// Integer type used to hold an address in the target process's address
/// space.
using JITTargetAddress = uint64_t;

/// Reinterpret a JITTargetAddress as a pointer of type \p T.
///
/// The address is first narrowed to uintptr_t and then reinterpret_cast to
/// \p T, so the result carries exactly the bit pattern of \p Addr. In builds
/// with assertions enabled, an address that does not survive the narrowing
/// to uintptr_t triggers an assertion failure.
///
/// \tparam T  Destination type; must be a pointer type (checked at compile
///            time).
/// \param Addr  The target address to convert.
/// \returns \p Addr viewed as a \p T.
template <typename T> T jitTargetAddressToPointer(JITTargetAddress Addr) {
  static_assert(std::is_pointer<T>::value, "T must be a pointer type");
  // Narrow first so that a truncating conversion can be detected below.
  const auto Narrowed = static_cast<uintptr_t>(Addr);
  assert(Narrowed == Addr && "JITTargetAddress value out of range for uintptr_t");
  return reinterpret_cast<T>(Narrowed);
}
56
57 /// Convert a JITTargetAddress to a callable function pointer.
58 ///
59 /// Casts the given address to a callable function pointer. This operation
60 /// will perform pointer signing for platforms that require it (e.g. arm64e).
jitTargetAddressToFunction(JITTargetAddress Addr)61 template <typename T> T jitTargetAddressToFunction(JITTargetAddress Addr) {
62 static_assert(std::is_pointer<T>::value &&
63 std::is_function<std::remove_pointer_t<T>>::value,
64 "T must be a function pointer type");
65 return jitTargetAddressToPointer<T>(Addr);
66 }
67
68 /// Convert a pointer to a JITTargetAddress.
pointerToJITTargetAddress(T * Ptr)69 template <typename T> JITTargetAddress pointerToJITTargetAddress(T *Ptr) {
70 return static_cast<JITTargetAddress>(reinterpret_cast<uintptr_t>(Ptr));
71 }
72
73 /// Flags for symbols in the JIT.
74 class JITSymbolFlags {
75 public:
76 using UnderlyingType = uint8_t;
77 using TargetFlagsType = uint8_t;
78
79 enum FlagNames : UnderlyingType {
80 None = 0,
81 HasError = 1U << 0,
82 Weak = 1U << 1,
83 Common = 1U << 2,
84 Absolute = 1U << 3,
85 Exported = 1U << 4,
86 Callable = 1U << 5,
87 MaterializationSideEffectsOnly = 1U << 6,
88 LLVM_MARK_AS_BITMASK_ENUM( // LargestValue =
89 MaterializationSideEffectsOnly)
90 };
91
92 /// Default-construct a JITSymbolFlags instance.
93 JITSymbolFlags() = default;
94
95 /// Construct a JITSymbolFlags instance from the given flags.
JITSymbolFlags(FlagNames Flags)96 JITSymbolFlags(FlagNames Flags) : Flags(Flags) {}
97
98 /// Construct a JITSymbolFlags instance from the given flags and target
99 /// flags.
JITSymbolFlags(FlagNames Flags,TargetFlagsType TargetFlags)100 JITSymbolFlags(FlagNames Flags, TargetFlagsType TargetFlags)
101 : TargetFlags(TargetFlags), Flags(Flags) {}
102
103 /// Implicitly convert to bool. Returs true if any flag is set.
104 explicit operator bool() const { return Flags != None || TargetFlags != 0; }
105
106 /// Compare for equality.
107 bool operator==(const JITSymbolFlags &RHS) const {
108 return Flags == RHS.Flags && TargetFlags == RHS.TargetFlags;
109 }
110
111 /// Bitwise AND-assignment for FlagNames.
112 JITSymbolFlags &operator&=(const FlagNames &RHS) {
113 Flags &= RHS;
114 return *this;
115 }
116
117 /// Bitwise OR-assignment for FlagNames.
118 JITSymbolFlags &operator|=(const FlagNames &RHS) {
119 Flags |= RHS;
120 return *this;
121 }
122
123 /// Return true if there was an error retrieving this symbol.
hasError()124 bool hasError() const {
125 return (Flags & HasError) == HasError;
126 }
127
128 /// Returns true if the Weak flag is set.
isWeak()129 bool isWeak() const {
130 return (Flags & Weak) == Weak;
131 }
132
133 /// Returns true if the Common flag is set.
isCommon()134 bool isCommon() const {
135 return (Flags & Common) == Common;
136 }
137
138 /// Returns true if the symbol isn't weak or common.
isStrong()139 bool isStrong() const {
140 return !isWeak() && !isCommon();
141 }
142
143 /// Returns true if the Exported flag is set.
isExported()144 bool isExported() const {
145 return (Flags & Exported) == Exported;
146 }
147
148 /// Returns true if the given symbol is known to be callable.
isCallable()149 bool isCallable() const { return (Flags & Callable) == Callable; }
150
151 /// Returns true if this symbol is a materialization-side-effects-only
152 /// symbol. Such symbols do not have a real address. They exist to trigger
153 /// and support synchronization of materialization side effects, e.g. for
154 /// collecting initialization information. These symbols will vanish from
155 /// the symbol table immediately upon reaching the ready state, and will
156 /// appear to queries as if they were never defined (except that query
157 /// callback execution will be delayed until they reach the ready state).
158 /// MaterializationSideEffectOnly symbols should only be queried using the
159 /// SymbolLookupFlags::WeaklyReferencedSymbol flag (see
160 /// llvm/include/llvm/ExecutionEngine/Orc/Core.h).
hasMaterializationSideEffectsOnly()161 bool hasMaterializationSideEffectsOnly() const {
162 return (Flags & MaterializationSideEffectsOnly) ==
163 MaterializationSideEffectsOnly;
164 }
165
166 /// Get the underlying flags value as an integer.
getRawFlagsValue()167 UnderlyingType getRawFlagsValue() const {
168 return static_cast<UnderlyingType>(Flags);
169 }
170
171 /// Return a reference to the target-specific flags.
getTargetFlags()172 TargetFlagsType& getTargetFlags() { return TargetFlags; }
173
174 /// Return a reference to the target-specific flags.
getTargetFlags()175 const TargetFlagsType& getTargetFlags() const { return TargetFlags; }
176
177 /// Construct a JITSymbolFlags value based on the flags of the given global
178 /// value.
179 static JITSymbolFlags fromGlobalValue(const GlobalValue &GV);
180
181 /// Construct a JITSymbolFlags value based on the flags of the given global
182 /// value summary.
183 static JITSymbolFlags fromSummary(GlobalValueSummary *S);
184
185 /// Construct a JITSymbolFlags value based on the flags of the given libobject
186 /// symbol.
187 static Expected<JITSymbolFlags>
188 fromObjectSymbol(const object::SymbolRef &Symbol);
189
190 private:
191 TargetFlagsType TargetFlags = 0;
192 FlagNames Flags = None;
193 };
194
195 inline JITSymbolFlags operator&(const JITSymbolFlags &LHS,
196 const JITSymbolFlags::FlagNames &RHS) {
197 JITSymbolFlags Tmp = LHS;
198 Tmp &= RHS;
199 return Tmp;
200 }
201
202 inline JITSymbolFlags operator|(const JITSymbolFlags &LHS,
203 const JITSymbolFlags::FlagNames &RHS) {
204 JITSymbolFlags Tmp = LHS;
205 Tmp |= RHS;
206 return Tmp;
207 }
208
209 /// ARM-specific JIT symbol flags.
210 /// FIXME: This should be moved into a target-specific header.
211 class ARMJITSymbolFlags {
212 public:
213 ARMJITSymbolFlags() = default;
214
215 enum FlagNames {
216 None = 0,
217 Thumb = 1 << 0
218 };
219
220 operator JITSymbolFlags::TargetFlagsType&() { return Flags; }
221
222 static ARMJITSymbolFlags fromObjectSymbol(const object::SymbolRef &Symbol);
223
224 private:
225 JITSymbolFlags::TargetFlagsType Flags = 0;
226 };
227
228 /// Represents a symbol that has been evaluated to an address already.
229 class JITEvaluatedSymbol {
230 public:
231 JITEvaluatedSymbol() = default;
232
233 /// Create a 'null' symbol.
JITEvaluatedSymbol(std::nullptr_t)234 JITEvaluatedSymbol(std::nullptr_t) {}
235
236 /// Create a symbol for the given address and flags.
JITEvaluatedSymbol(JITTargetAddress Address,JITSymbolFlags Flags)237 JITEvaluatedSymbol(JITTargetAddress Address, JITSymbolFlags Flags)
238 : Address(Address), Flags(Flags) {}
239
240 /// Create a symbol from the given pointer with the given flags.
241 template <typename T>
242 static JITEvaluatedSymbol
243 fromPointer(T *P, JITSymbolFlags Flags = JITSymbolFlags::Exported) {
244 return JITEvaluatedSymbol(pointerToJITTargetAddress(P), Flags);
245 }
246
247 /// An evaluated symbol converts to 'true' if its address is non-zero.
248 explicit operator bool() const { return Address != 0; }
249
250 /// Return the address of this symbol.
getAddress()251 JITTargetAddress getAddress() const { return Address; }
252
253 /// Return the flags for this symbol.
getFlags()254 JITSymbolFlags getFlags() const { return Flags; }
255
256 /// Set the flags for this symbol.
setFlags(JITSymbolFlags Flags)257 void setFlags(JITSymbolFlags Flags) { this->Flags = std::move(Flags); }
258
259 private:
260 JITTargetAddress Address = 0;
261 JITSymbolFlags Flags;
262 };
263
264 /// Represents a symbol in the JIT.
265 class JITSymbol {
266 public:
267 using GetAddressFtor = unique_function<Expected<JITTargetAddress>()>;
268
269 /// Create a 'null' symbol, used to represent a "symbol not found"
270 /// result from a successful (non-erroneous) lookup.
JITSymbol(std::nullptr_t)271 JITSymbol(std::nullptr_t)
272 : CachedAddr(0) {}
273
274 /// Create a JITSymbol representing an error in the symbol lookup
275 /// process (e.g. a network failure during a remote lookup).
JITSymbol(Error Err)276 JITSymbol(Error Err)
277 : Err(std::move(Err)), Flags(JITSymbolFlags::HasError) {}
278
279 /// Create a symbol for a definition with a known address.
JITSymbol(JITTargetAddress Addr,JITSymbolFlags Flags)280 JITSymbol(JITTargetAddress Addr, JITSymbolFlags Flags)
281 : CachedAddr(Addr), Flags(Flags) {}
282
283 /// Construct a JITSymbol from a JITEvaluatedSymbol.
JITSymbol(JITEvaluatedSymbol Sym)284 JITSymbol(JITEvaluatedSymbol Sym)
285 : CachedAddr(Sym.getAddress()), Flags(Sym.getFlags()) {}
286
287 /// Create a symbol for a definition that doesn't have a known address
288 /// yet.
289 /// @param GetAddress A functor to materialize a definition (fixing the
290 /// address) on demand.
291 ///
292 /// This constructor allows a JIT layer to provide a reference to a symbol
293 /// definition without actually materializing the definition up front. The
294 /// user can materialize the definition at any time by calling the getAddress
295 /// method.
JITSymbol(GetAddressFtor GetAddress,JITSymbolFlags Flags)296 JITSymbol(GetAddressFtor GetAddress, JITSymbolFlags Flags)
297 : GetAddress(std::move(GetAddress)), CachedAddr(0), Flags(Flags) {}
298
299 JITSymbol(const JITSymbol&) = delete;
300 JITSymbol& operator=(const JITSymbol&) = delete;
301
JITSymbol(JITSymbol && Other)302 JITSymbol(JITSymbol &&Other)
303 : GetAddress(std::move(Other.GetAddress)), Flags(std::move(Other.Flags)) {
304 if (Flags.hasError())
305 Err = std::move(Other.Err);
306 else
307 CachedAddr = std::move(Other.CachedAddr);
308 }
309
310 JITSymbol& operator=(JITSymbol &&Other) {
311 GetAddress = std::move(Other.GetAddress);
312 Flags = std::move(Other.Flags);
313 if (Flags.hasError())
314 Err = std::move(Other.Err);
315 else
316 CachedAddr = std::move(Other.CachedAddr);
317 return *this;
318 }
319
~JITSymbol()320 ~JITSymbol() {
321 if (Flags.hasError())
322 Err.~Error();
323 else
324 CachedAddr.~JITTargetAddress();
325 }
326
327 /// Returns true if the symbol exists, false otherwise.
328 explicit operator bool() const {
329 return !Flags.hasError() && (CachedAddr || GetAddress);
330 }
331
332 /// Move the error field value out of this JITSymbol.
takeError()333 Error takeError() {
334 if (Flags.hasError())
335 return std::move(Err);
336 return Error::success();
337 }
338
339 /// Get the address of the symbol in the target address space. Returns
340 /// '0' if the symbol does not exist.
getAddress()341 Expected<JITTargetAddress> getAddress() {
342 assert(!Flags.hasError() && "getAddress called on error value");
343 if (GetAddress) {
344 if (auto CachedAddrOrErr = GetAddress()) {
345 GetAddress = nullptr;
346 CachedAddr = *CachedAddrOrErr;
347 assert(CachedAddr && "Symbol could not be materialized.");
348 } else
349 return CachedAddrOrErr.takeError();
350 }
351 return CachedAddr;
352 }
353
getFlags()354 JITSymbolFlags getFlags() const { return Flags; }
355
356 private:
357 GetAddressFtor GetAddress;
358 union {
359 JITTargetAddress CachedAddr;
360 Error Err;
361 };
362 JITSymbolFlags Flags;
363 };
364
365 /// Symbol resolution interface.
366 ///
367 /// Allows symbol flags and addresses to be looked up by name.
368 /// Symbol queries are done in bulk (i.e. you request resolution of a set of
369 /// symbols, rather than a single one) to reduce IPC overhead in the case of
370 /// remote JITing, and expose opportunities for parallel compilation.
371 class JITSymbolResolver {
372 public:
373 using LookupSet = std::set<StringRef>;
374 using LookupResult = std::map<StringRef, JITEvaluatedSymbol>;
375 using OnResolvedFunction = unique_function<void(Expected<LookupResult>)>;
376
377 virtual ~JITSymbolResolver() = default;
378
379 /// Returns the fully resolved address and flags for each of the given
380 /// symbols.
381 ///
382 /// This method will return an error if any of the given symbols can not be
383 /// resolved, or if the resolution process itself triggers an error.
384 virtual void lookup(const LookupSet &Symbols,
385 OnResolvedFunction OnResolved) = 0;
386
387 /// Returns the subset of the given symbols that should be materialized by
388 /// the caller. Only weak/common symbols should be looked up, as strong
389 /// definitions are implicitly always part of the caller's responsibility.
390 virtual Expected<LookupSet>
391 getResponsibilitySet(const LookupSet &Symbols) = 0;
392
393 private:
394 virtual void anchor();
395 };
396
397 /// Legacy symbol resolution interface.
398 class LegacyJITSymbolResolver : public JITSymbolResolver {
399 public:
400 /// Performs lookup by, for each symbol, first calling
401 /// findSymbolInLogicalDylib and if that fails calling
402 /// findSymbol.
403 void lookup(const LookupSet &Symbols, OnResolvedFunction OnResolved) final;
404
405 /// Performs flags lookup by calling findSymbolInLogicalDylib and
406 /// returning the flags value for that symbol.
407 Expected<LookupSet> getResponsibilitySet(const LookupSet &Symbols) final;
408
409 /// This method returns the address of the specified symbol if it exists
410 /// within the logical dynamic library represented by this JITSymbolResolver.
411 /// Unlike findSymbol, queries through this interface should return addresses
412 /// for hidden symbols.
413 ///
414 /// This is of particular importance for the Orc JIT APIs, which support lazy
415 /// compilation by breaking up modules: Each of those broken out modules
416 /// must be able to resolve hidden symbols provided by the others. Clients
417 /// writing memory managers for MCJIT can usually ignore this method.
418 ///
419 /// This method will be queried by RuntimeDyld when checking for previous
420 /// definitions of common symbols.
421 virtual JITSymbol findSymbolInLogicalDylib(const std::string &Name) = 0;
422
423 /// This method returns the address of the specified function or variable.
424 /// It is used to resolve symbols during module linking.
425 ///
426 /// If the returned symbol's address is equal to ~0ULL then RuntimeDyld will
427 /// skip all relocations for that symbol, and the client will be responsible
428 /// for handling them manually.
429 virtual JITSymbol findSymbol(const std::string &Name) = 0;
430
431 private:
432 void anchor() override;
433 };
434
435 } // end namespace llvm
436
437 #endif // LLVM_EXECUTIONENGINE_JITSYMBOL_H
438