1 //===- ObjectFile.h - File format independent object file -------*- C++ -*-===//
2 //
3 // The LLVM Compiler Infrastructure
4 //
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
7 //
8 //===----------------------------------------------------------------------===//
9 //
10 // This file declares a file format independent ObjectFile class.
11 //
12 //===----------------------------------------------------------------------===//
13
14 #ifndef LLVM_OBJECT_OBJECT_FILE_H
15 #define LLVM_OBJECT_OBJECT_FILE_H
16
17 #include "llvm/Object/Binary.h"
18 #include "llvm/ADT/StringRef.h"
19 #include "llvm/Support/DataTypes.h"
20 #include "llvm/Support/ErrorHandling.h"
21 #include "llvm/Support/MemoryBuffer.h"
22 #include <cstring>
23
24 namespace llvm {
25 namespace object {
26
27 class ObjectFile;
28
29 union DataRefImpl {
30 struct {
31 // ELF needs this for relocations. This entire union should probably be a
32 // char[max(8, sizeof(uintptr_t))] and require the impl to cast.
33 uint16_t a, b;
34 uint32_t c;
35 } w;
36 struct {
37 uint32_t a, b;
38 } d;
39 uintptr_t p;
40 };
41
42 template<class content_type>
43 class content_iterator {
44 content_type Current;
45 public:
content_iterator(content_type symb)46 content_iterator(content_type symb)
47 : Current(symb) {}
48
49 const content_type* operator->() const {
50 return &Current;
51 }
52
53 const content_type &operator*() const {
54 return Current;
55 }
56
57 bool operator==(const content_iterator &other) const {
58 return Current == other.Current;
59 }
60
61 bool operator!=(const content_iterator &other) const {
62 return !(*this == other);
63 }
64
increment(error_code & err)65 content_iterator& increment(error_code &err) {
66 content_type next;
67 if (error_code ec = Current.getNext(next))
68 err = ec;
69 else
70 Current = next;
71 return *this;
72 }
73 };
74
75 static bool operator ==(const DataRefImpl &a, const DataRefImpl &b) {
76 // Check bitwise identical. This is the only legal way to compare a union w/o
77 // knowing which member is in use.
78 return std::memcmp(&a, &b, sizeof(DataRefImpl)) == 0;
79 }
80
81 /// SymbolRef - This is a value type class that represents a single symbol in
82 /// the list of symbols in the object file.
83 class SymbolRef {
84 friend class SectionRef;
85 DataRefImpl SymbolPimpl;
86 const ObjectFile *OwningObject;
87
88 public:
SymbolRef()89 SymbolRef() : OwningObject(NULL) {
90 std::memset(&SymbolPimpl, 0, sizeof(SymbolPimpl));
91 }
92
93 enum SymbolType {
94 ST_Function,
95 ST_Data,
96 ST_External, // Defined in another object file
97 ST_Other
98 };
99
100 SymbolRef(DataRefImpl SymbolP, const ObjectFile *Owner);
101
102 bool operator==(const SymbolRef &Other) const;
103
104 error_code getNext(SymbolRef &Result) const;
105
106 error_code getName(StringRef &Result) const;
107 error_code getAddress(uint64_t &Result) const;
108 error_code getOffset(uint64_t &Result) const;
109 error_code getSize(uint64_t &Result) const;
110 error_code getSymbolType(SymbolRef::SymbolType &Result) const;
111
112 /// Returns the ascii char that should be displayed in a symbol table dump via
113 /// nm for this symbol.
114 error_code getNMTypeChar(char &Result) const;
115
116 /// Returns true for symbols that are internal to the object file format such
117 /// as section symbols.
118 error_code isInternal(bool &Result) const;
119
120 /// Returns true for symbols that can be used in another objects,
121 /// such as library functions
122 error_code isGlobal(bool &Result) const;
123
124 DataRefImpl getRawDataRefImpl() const;
125 };
126 typedef content_iterator<SymbolRef> symbol_iterator;
127
128 /// RelocationRef - This is a value type class that represents a single
129 /// relocation in the list of relocations in the object file.
130 class RelocationRef {
131 DataRefImpl RelocationPimpl;
132 const ObjectFile *OwningObject;
133
134 public:
RelocationRef()135 RelocationRef() : OwningObject(NULL) {
136 std::memset(&RelocationPimpl, 0, sizeof(RelocationPimpl));
137 }
138
139 RelocationRef(DataRefImpl RelocationP, const ObjectFile *Owner);
140
141 bool operator==(const RelocationRef &Other) const;
142
143 error_code getNext(RelocationRef &Result) const;
144
145 error_code getAddress(uint64_t &Result) const;
146 error_code getSymbol(SymbolRef &Result) const;
147 error_code getType(uint32_t &Result) const;
148
149 /// @brief Get a string that represents the type of this relocation.
150 ///
151 /// This is for display purposes only.
152 error_code getTypeName(SmallVectorImpl<char> &Result) const;
153 error_code getAdditionalInfo(int64_t &Result) const;
154
155 /// @brief Get a string that represents the calculation of the value of this
156 /// relocation.
157 ///
158 /// This is for display purposes only.
159 error_code getValueString(SmallVectorImpl<char> &Result) const;
160 };
161 typedef content_iterator<RelocationRef> relocation_iterator;
162
163 /// SectionRef - This is a value type class that represents a single section in
164 /// the list of sections in the object file.
165 class SectionRef {
166 friend class SymbolRef;
167 DataRefImpl SectionPimpl;
168 const ObjectFile *OwningObject;
169
170 public:
SectionRef()171 SectionRef() : OwningObject(NULL) {
172 std::memset(&SectionPimpl, 0, sizeof(SectionPimpl));
173 }
174
175 SectionRef(DataRefImpl SectionP, const ObjectFile *Owner);
176
177 bool operator==(const SectionRef &Other) const;
178
179 error_code getNext(SectionRef &Result) const;
180
181 error_code getName(StringRef &Result) const;
182 error_code getAddress(uint64_t &Result) const;
183 error_code getSize(uint64_t &Result) const;
184 error_code getContents(StringRef &Result) const;
185
186 /// @brief Get the alignment of this section as the actual value (not log 2).
187 error_code getAlignment(uint64_t &Result) const;
188
189 // FIXME: Move to the normalization layer when it's created.
190 error_code isText(bool &Result) const;
191 error_code isData(bool &Result) const;
192 error_code isBSS(bool &Result) const;
193
194 error_code containsSymbol(SymbolRef S, bool &Result) const;
195
196 relocation_iterator begin_relocations() const;
197 relocation_iterator end_relocations() const;
198 };
199 typedef content_iterator<SectionRef> section_iterator;
200
201 const uint64_t UnknownAddressOrSize = ~0ULL;
202
203 /// ObjectFile - This class is the base class for all object file types.
204 /// Concrete instances of this object are created by createObjectFile, which
205 /// figure out which type to create.
206 class ObjectFile : public Binary {
207 private:
208 ObjectFile(); // = delete
209 ObjectFile(const ObjectFile &other); // = delete
210
211 protected:
212 ObjectFile(unsigned int Type, MemoryBuffer *source, error_code &ec);
213
base()214 const uint8_t *base() const {
215 return reinterpret_cast<const uint8_t *>(Data->getBufferStart());
216 }
217
218 // These functions are for SymbolRef to call internally. The main goal of
219 // this is to allow SymbolRef::SymbolPimpl to point directly to the symbol
220 // entry in the memory mapped object file. SymbolPimpl cannot contain any
221 // virtual functions because then it could not point into the memory mapped
222 // file.
223 //
224 // Implementations assume that the DataRefImpl is valid and has not been
225 // modified externally. It's UB otherwise.
226 friend class SymbolRef;
227 virtual error_code getSymbolNext(DataRefImpl Symb, SymbolRef &Res) const = 0;
228 virtual error_code getSymbolName(DataRefImpl Symb, StringRef &Res) const = 0;
229 virtual error_code getSymbolAddress(DataRefImpl Symb, uint64_t &Res) const =0;
230 virtual error_code getSymbolOffset(DataRefImpl Symb, uint64_t &Res) const =0;
231 virtual error_code getSymbolSize(DataRefImpl Symb, uint64_t &Res) const = 0;
232 virtual error_code getSymbolNMTypeChar(DataRefImpl Symb, char &Res) const = 0;
233 virtual error_code isSymbolInternal(DataRefImpl Symb, bool &Res) const = 0;
234 virtual error_code isSymbolGlobal(DataRefImpl Symb, bool &Res) const = 0;
235 virtual error_code getSymbolType(DataRefImpl Symb, SymbolRef::SymbolType &Res) const = 0;
236
237 // Same as above for SectionRef.
238 friend class SectionRef;
239 virtual error_code getSectionNext(DataRefImpl Sec, SectionRef &Res) const = 0;
240 virtual error_code getSectionName(DataRefImpl Sec, StringRef &Res) const = 0;
241 virtual error_code getSectionAddress(DataRefImpl Sec, uint64_t &Res) const =0;
242 virtual error_code getSectionSize(DataRefImpl Sec, uint64_t &Res) const = 0;
243 virtual error_code getSectionContents(DataRefImpl Sec, StringRef &Res)const=0;
244 virtual error_code getSectionAlignment(DataRefImpl Sec, uint64_t &Res)const=0;
245 virtual error_code isSectionText(DataRefImpl Sec, bool &Res) const = 0;
246 virtual error_code isSectionData(DataRefImpl Sec, bool &Res) const = 0;
247 virtual error_code isSectionBSS(DataRefImpl Sec, bool &Res) const = 0;
248 virtual error_code sectionContainsSymbol(DataRefImpl Sec, DataRefImpl Symb,
249 bool &Result) const = 0;
250 virtual relocation_iterator getSectionRelBegin(DataRefImpl Sec) const = 0;
251 virtual relocation_iterator getSectionRelEnd(DataRefImpl Sec) const = 0;
252
253
254 // Same as above for RelocationRef.
255 friend class RelocationRef;
256 virtual error_code getRelocationNext(DataRefImpl Rel,
257 RelocationRef &Res) const = 0;
258 virtual error_code getRelocationAddress(DataRefImpl Rel,
259 uint64_t &Res) const =0;
260 virtual error_code getRelocationSymbol(DataRefImpl Rel,
261 SymbolRef &Res) const = 0;
262 virtual error_code getRelocationType(DataRefImpl Rel,
263 uint32_t &Res) const = 0;
264 virtual error_code getRelocationTypeName(DataRefImpl Rel,
265 SmallVectorImpl<char> &Result) const = 0;
266 virtual error_code getRelocationAdditionalInfo(DataRefImpl Rel,
267 int64_t &Res) const = 0;
268 virtual error_code getRelocationValueString(DataRefImpl Rel,
269 SmallVectorImpl<char> &Result) const = 0;
270
271 public:
272
273 virtual symbol_iterator begin_symbols() const = 0;
274 virtual symbol_iterator end_symbols() const = 0;
275
276 virtual section_iterator begin_sections() const = 0;
277 virtual section_iterator end_sections() const = 0;
278
279 /// @brief The number of bytes used to represent an address in this object
280 /// file format.
281 virtual uint8_t getBytesInAddress() const = 0;
282
283 virtual StringRef getFileFormatName() const = 0;
284 virtual /* Triple::ArchType */ unsigned getArch() const = 0;
285
286 /// @returns Pointer to ObjectFile subclass to handle this type of object.
287 /// @param ObjectPath The path to the object file. ObjectPath.isObject must
288 /// return true.
289 /// @brief Create ObjectFile from path.
290 static ObjectFile *createObjectFile(StringRef ObjectPath);
291 static ObjectFile *createObjectFile(MemoryBuffer *Object);
292
classof(const Binary * v)293 static inline bool classof(const Binary *v) {
294 return v->getType() >= isObject &&
295 v->getType() < lastObject;
296 }
classof(const ObjectFile * v)297 static inline bool classof(const ObjectFile *v) { return true; }
298
299 public:
300 static ObjectFile *createCOFFObjectFile(MemoryBuffer *Object);
301 static ObjectFile *createELFObjectFile(MemoryBuffer *Object);
302 static ObjectFile *createMachOObjectFile(MemoryBuffer *Object);
303 };
304
305 // Inline function definitions.
SymbolRef(DataRefImpl SymbolP,const ObjectFile * Owner)306 inline SymbolRef::SymbolRef(DataRefImpl SymbolP, const ObjectFile *Owner)
307 : SymbolPimpl(SymbolP)
308 , OwningObject(Owner) {}
309
310 inline bool SymbolRef::operator==(const SymbolRef &Other) const {
311 return SymbolPimpl == Other.SymbolPimpl;
312 }
313
getNext(SymbolRef & Result)314 inline error_code SymbolRef::getNext(SymbolRef &Result) const {
315 return OwningObject->getSymbolNext(SymbolPimpl, Result);
316 }
317
getName(StringRef & Result)318 inline error_code SymbolRef::getName(StringRef &Result) const {
319 return OwningObject->getSymbolName(SymbolPimpl, Result);
320 }
321
getAddress(uint64_t & Result)322 inline error_code SymbolRef::getAddress(uint64_t &Result) const {
323 return OwningObject->getSymbolAddress(SymbolPimpl, Result);
324 }
325
getOffset(uint64_t & Result)326 inline error_code SymbolRef::getOffset(uint64_t &Result) const {
327 return OwningObject->getSymbolOffset(SymbolPimpl, Result);
328 }
329
getSize(uint64_t & Result)330 inline error_code SymbolRef::getSize(uint64_t &Result) const {
331 return OwningObject->getSymbolSize(SymbolPimpl, Result);
332 }
333
getNMTypeChar(char & Result)334 inline error_code SymbolRef::getNMTypeChar(char &Result) const {
335 return OwningObject->getSymbolNMTypeChar(SymbolPimpl, Result);
336 }
337
isInternal(bool & Result)338 inline error_code SymbolRef::isInternal(bool &Result) const {
339 return OwningObject->isSymbolInternal(SymbolPimpl, Result);
340 }
341
isGlobal(bool & Result)342 inline error_code SymbolRef::isGlobal(bool &Result) const {
343 return OwningObject->isSymbolGlobal(SymbolPimpl, Result);
344 }
345
getSymbolType(SymbolRef::SymbolType & Result)346 inline error_code SymbolRef::getSymbolType(SymbolRef::SymbolType &Result) const {
347 return OwningObject->getSymbolType(SymbolPimpl, Result);
348 }
349
getRawDataRefImpl()350 inline DataRefImpl SymbolRef::getRawDataRefImpl() const {
351 return SymbolPimpl;
352 }
353
354
355 /// SectionRef
SectionRef(DataRefImpl SectionP,const ObjectFile * Owner)356 inline SectionRef::SectionRef(DataRefImpl SectionP,
357 const ObjectFile *Owner)
358 : SectionPimpl(SectionP)
359 , OwningObject(Owner) {}
360
361 inline bool SectionRef::operator==(const SectionRef &Other) const {
362 return SectionPimpl == Other.SectionPimpl;
363 }
364
getNext(SectionRef & Result)365 inline error_code SectionRef::getNext(SectionRef &Result) const {
366 return OwningObject->getSectionNext(SectionPimpl, Result);
367 }
368
getName(StringRef & Result)369 inline error_code SectionRef::getName(StringRef &Result) const {
370 return OwningObject->getSectionName(SectionPimpl, Result);
371 }
372
getAddress(uint64_t & Result)373 inline error_code SectionRef::getAddress(uint64_t &Result) const {
374 return OwningObject->getSectionAddress(SectionPimpl, Result);
375 }
376
getSize(uint64_t & Result)377 inline error_code SectionRef::getSize(uint64_t &Result) const {
378 return OwningObject->getSectionSize(SectionPimpl, Result);
379 }
380
getContents(StringRef & Result)381 inline error_code SectionRef::getContents(StringRef &Result) const {
382 return OwningObject->getSectionContents(SectionPimpl, Result);
383 }
384
getAlignment(uint64_t & Result)385 inline error_code SectionRef::getAlignment(uint64_t &Result) const {
386 return OwningObject->getSectionAlignment(SectionPimpl, Result);
387 }
388
isText(bool & Result)389 inline error_code SectionRef::isText(bool &Result) const {
390 return OwningObject->isSectionText(SectionPimpl, Result);
391 }
392
isData(bool & Result)393 inline error_code SectionRef::isData(bool &Result) const {
394 return OwningObject->isSectionData(SectionPimpl, Result);
395 }
396
isBSS(bool & Result)397 inline error_code SectionRef::isBSS(bool &Result) const {
398 return OwningObject->isSectionBSS(SectionPimpl, Result);
399 }
400
containsSymbol(SymbolRef S,bool & Result)401 inline error_code SectionRef::containsSymbol(SymbolRef S, bool &Result) const {
402 return OwningObject->sectionContainsSymbol(SectionPimpl, S.SymbolPimpl,
403 Result);
404 }
405
begin_relocations()406 inline relocation_iterator SectionRef::begin_relocations() const {
407 return OwningObject->getSectionRelBegin(SectionPimpl);
408 }
409
end_relocations()410 inline relocation_iterator SectionRef::end_relocations() const {
411 return OwningObject->getSectionRelEnd(SectionPimpl);
412 }
413
414
415 /// RelocationRef
RelocationRef(DataRefImpl RelocationP,const ObjectFile * Owner)416 inline RelocationRef::RelocationRef(DataRefImpl RelocationP,
417 const ObjectFile *Owner)
418 : RelocationPimpl(RelocationP)
419 , OwningObject(Owner) {}
420
421 inline bool RelocationRef::operator==(const RelocationRef &Other) const {
422 return RelocationPimpl == Other.RelocationPimpl;
423 }
424
getNext(RelocationRef & Result)425 inline error_code RelocationRef::getNext(RelocationRef &Result) const {
426 return OwningObject->getRelocationNext(RelocationPimpl, Result);
427 }
428
getAddress(uint64_t & Result)429 inline error_code RelocationRef::getAddress(uint64_t &Result) const {
430 return OwningObject->getRelocationAddress(RelocationPimpl, Result);
431 }
432
getSymbol(SymbolRef & Result)433 inline error_code RelocationRef::getSymbol(SymbolRef &Result) const {
434 return OwningObject->getRelocationSymbol(RelocationPimpl, Result);
435 }
436
getType(uint32_t & Result)437 inline error_code RelocationRef::getType(uint32_t &Result) const {
438 return OwningObject->getRelocationType(RelocationPimpl, Result);
439 }
440
getTypeName(SmallVectorImpl<char> & Result)441 inline error_code RelocationRef::getTypeName(SmallVectorImpl<char> &Result)
442 const {
443 return OwningObject->getRelocationTypeName(RelocationPimpl, Result);
444 }
445
getAdditionalInfo(int64_t & Result)446 inline error_code RelocationRef::getAdditionalInfo(int64_t &Result) const {
447 return OwningObject->getRelocationAdditionalInfo(RelocationPimpl, Result);
448 }
449
getValueString(SmallVectorImpl<char> & Result)450 inline error_code RelocationRef::getValueString(SmallVectorImpl<char> &Result)
451 const {
452 return OwningObject->getRelocationValueString(RelocationPimpl, Result);
453 }
454
455 } // end namespace object
456 } // end namespace llvm
457
458 #endif
459