1 //===- MachOObjectFile.cpp - Mach-O object file binding ---------*- C++ -*-===//
2 //
3 // The LLVM Compiler Infrastructure
4 //
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
7 //
8 //===----------------------------------------------------------------------===//
9 //
10 // This file defines the MachOObjectFile class, which binds the MachOObject
11 // class to the generic ObjectFile wrapper.
12 //
13 //===----------------------------------------------------------------------===//
14
15 #include "llvm/Object/MachO.h"
16 #include "llvm/ADT/Triple.h"
17 #include "llvm/Object/MachOFormat.h"
18 #include "llvm/Support/DataExtractor.h"
19 #include "llvm/Support/Format.h"
20 #include "llvm/Support/Host.h"
21 #include "llvm/Support/MemoryBuffer.h"
22 #include <cctype>
23 #include <cstring>
24 #include <limits>
25
26 using namespace llvm;
27 using namespace object;
28
29 namespace llvm {
30 namespace object {
31
// Leading fields of a symbol table entry, as read by getSymbolTableEntryBase().
// The layout is copied byte-for-byte from the file, so field order and widths
// must not change.
struct SymbolTableEntryBase {
  uint32_t StringIndex;  // Offset of the symbol name in the string table.
  uint8_t Type;          // Type bits (tested against the Nlist*/STF_* masks).
  uint8_t SectionIndex;  // 1-based section number; 0 means "no section".
  uint16_t Flags;        // Descriptor bits (weak flags, common alignment).
};
38
// Two fixed-width 16-byte name fields: a section name followed by a segment
// name. NOTE(review): presumably the common prefix of macho::Section and
// macho::Section64 -- confirm against MachOFormat.h.
struct SectionBase {
  char Name[16];         // Section name (may lack a terminating NUL).
  char SegmentName[16];  // Segment name (may lack a terminating NUL).
};
43
44 template<typename T>
SwapValue(T & Value)45 static void SwapValue(T &Value) {
46 Value = sys::SwapByteOrder(Value);
47 }
48
// Byte-swaps every multi-byte field of a Mach-O structure in place. Only
// declared here; each supported structure provides an explicit specialization.
template<class T>
static void SwapStruct(T &Value);
51
52 template<>
SwapStruct(macho::RelocationEntry & H)53 void SwapStruct(macho::RelocationEntry &H) {
54 SwapValue(H.Word0);
55 SwapValue(H.Word1);
56 }
57
58 template<>
SwapStruct(macho::LoadCommand & L)59 void SwapStruct(macho::LoadCommand &L) {
60 SwapValue(L.Type);
61 SwapValue(L.Size);
62 }
63
64 template<>
SwapStruct(SymbolTableEntryBase & S)65 void SwapStruct(SymbolTableEntryBase &S) {
66 SwapValue(S.StringIndex);
67 SwapValue(S.Flags);
68 }
69
70 template<>
SwapStruct(macho::Section & S)71 void SwapStruct(macho::Section &S) {
72 SwapValue(S.Address);
73 SwapValue(S.Size);
74 SwapValue(S.Offset);
75 SwapValue(S.Align);
76 SwapValue(S.RelocationTableOffset);
77 SwapValue(S.NumRelocationTableEntries);
78 SwapValue(S.Flags);
79 SwapValue(S.Reserved1);
80 SwapValue(S.Reserved2);
81 }
82
83 template<>
SwapStruct(macho::Section64 & S)84 void SwapStruct(macho::Section64 &S) {
85 SwapValue(S.Address);
86 SwapValue(S.Size);
87 SwapValue(S.Offset);
88 SwapValue(S.Align);
89 SwapValue(S.RelocationTableOffset);
90 SwapValue(S.NumRelocationTableEntries);
91 SwapValue(S.Flags);
92 SwapValue(S.Reserved1);
93 SwapValue(S.Reserved2);
94 SwapValue(S.Reserved3);
95 }
96
97 template<>
SwapStruct(macho::SymbolTableEntry & S)98 void SwapStruct(macho::SymbolTableEntry &S) {
99 SwapValue(S.StringIndex);
100 SwapValue(S.Flags);
101 SwapValue(S.Value);
102 }
103
104 template<>
SwapStruct(macho::Symbol64TableEntry & S)105 void SwapStruct(macho::Symbol64TableEntry &S) {
106 SwapValue(S.StringIndex);
107 SwapValue(S.Flags);
108 SwapValue(S.Value);
109 }
110
111 template<>
SwapStruct(macho::Header & H)112 void SwapStruct(macho::Header &H) {
113 SwapValue(H.Magic);
114 SwapValue(H.CPUType);
115 SwapValue(H.CPUSubtype);
116 SwapValue(H.FileType);
117 SwapValue(H.NumLoadCommands);
118 SwapValue(H.SizeOfLoadCommands);
119 SwapValue(H.Flags);
120 }
121
122 template<>
SwapStruct(macho::Header64Ext & E)123 void SwapStruct(macho::Header64Ext &E) {
124 SwapValue(E.Reserved);
125 }
126
127 template<>
SwapStruct(macho::SymtabLoadCommand & C)128 void SwapStruct(macho::SymtabLoadCommand &C) {
129 SwapValue(C.Type);
130 SwapValue(C.Size);
131 SwapValue(C.SymbolTableOffset);
132 SwapValue(C.NumSymbolTableEntries);
133 SwapValue(C.StringTableOffset);
134 SwapValue(C.StringTableSize);
135 }
136
137 template<>
SwapStruct(macho::DysymtabLoadCommand & C)138 void SwapStruct(macho::DysymtabLoadCommand &C) {
139 SwapValue(C.Type);
140 SwapValue(C.Size);
141 SwapValue(C.LocalSymbolsIndex);
142 SwapValue(C.NumLocalSymbols);
143 SwapValue(C.ExternalSymbolsIndex);
144 SwapValue(C.NumExternalSymbols);
145 SwapValue(C.UndefinedSymbolsIndex);
146 SwapValue(C.NumUndefinedSymbols);
147 SwapValue(C.TOCOffset);
148 SwapValue(C.NumTOCEntries);
149 SwapValue(C.ModuleTableOffset);
150 SwapValue(C.NumModuleTableEntries);
151 SwapValue(C.ReferenceSymbolTableOffset);
152 SwapValue(C.NumReferencedSymbolTableEntries);
153 SwapValue(C.IndirectSymbolTableOffset);
154 SwapValue(C.NumIndirectSymbolTableEntries);
155 SwapValue(C.ExternalRelocationTableOffset);
156 SwapValue(C.NumExternalRelocationTableEntries);
157 SwapValue(C.LocalRelocationTableOffset);
158 SwapValue(C.NumLocalRelocationTableEntries);
159 }
160
161 template<>
SwapStruct(macho::LinkeditDataLoadCommand & C)162 void SwapStruct(macho::LinkeditDataLoadCommand &C) {
163 SwapValue(C.Type);
164 SwapValue(C.Size);
165 SwapValue(C.DataOffset);
166 SwapValue(C.DataSize);
167 }
168
169 template<>
SwapStruct(macho::SegmentLoadCommand & C)170 void SwapStruct(macho::SegmentLoadCommand &C) {
171 SwapValue(C.Type);
172 SwapValue(C.Size);
173 SwapValue(C.VMAddress);
174 SwapValue(C.VMSize);
175 SwapValue(C.FileOffset);
176 SwapValue(C.FileSize);
177 SwapValue(C.MaxVMProtection);
178 SwapValue(C.InitialVMProtection);
179 SwapValue(C.NumSections);
180 SwapValue(C.Flags);
181 }
182
183 template<>
SwapStruct(macho::Segment64LoadCommand & C)184 void SwapStruct(macho::Segment64LoadCommand &C) {
185 SwapValue(C.Type);
186 SwapValue(C.Size);
187 SwapValue(C.VMAddress);
188 SwapValue(C.VMSize);
189 SwapValue(C.FileOffset);
190 SwapValue(C.FileSize);
191 SwapValue(C.MaxVMProtection);
192 SwapValue(C.InitialVMProtection);
193 SwapValue(C.NumSections);
194 SwapValue(C.Flags);
195 }
196
197 template<>
SwapStruct(macho::IndirectSymbolTableEntry & C)198 void SwapStruct(macho::IndirectSymbolTableEntry &C) {
199 SwapValue(C.Index);
200 }
201
202 template<>
SwapStruct(macho::LinkerOptionsLoadCommand & C)203 void SwapStruct(macho::LinkerOptionsLoadCommand &C) {
204 SwapValue(C.Type);
205 SwapValue(C.Size);
206 SwapValue(C.Count);
207 }
208
209 template<>
SwapStruct(macho::DataInCodeTableEntry & C)210 void SwapStruct(macho::DataInCodeTableEntry &C) {
211 SwapValue(C.Offset);
212 SwapValue(C.Length);
213 SwapValue(C.Kind);
214 }
215
216 template<typename T>
getStruct(const MachOObjectFile * O,const char * P)217 T getStruct(const MachOObjectFile *O, const char *P) {
218 T Cmd;
219 memcpy(&Cmd, P, sizeof(T));
220 if (O->isLittleEndian() != sys::IsLittleEndianHost)
221 SwapStruct(Cmd);
222 return Cmd;
223 }
224
225 static uint32_t
getSegmentLoadCommandNumSections(const MachOObjectFile * O,const MachOObjectFile::LoadCommandInfo & L)226 getSegmentLoadCommandNumSections(const MachOObjectFile *O,
227 const MachOObjectFile::LoadCommandInfo &L) {
228 if (O->is64Bit()) {
229 macho::Segment64LoadCommand S = O->getSegment64LoadCommand(L);
230 return S.NumSections;
231 }
232 macho::SegmentLoadCommand S = O->getSegmentLoadCommand(L);
233 return S.NumSections;
234 }
235
236 static const char *
getSectionPtr(const MachOObjectFile * O,MachOObjectFile::LoadCommandInfo L,unsigned Sec)237 getSectionPtr(const MachOObjectFile *O, MachOObjectFile::LoadCommandInfo L,
238 unsigned Sec) {
239 uintptr_t CommandAddr = reinterpret_cast<uintptr_t>(L.Ptr);
240
241 bool Is64 = O->is64Bit();
242 unsigned SegmentLoadSize = Is64 ? sizeof(macho::Segment64LoadCommand) :
243 sizeof(macho::SegmentLoadCommand);
244 unsigned SectionSize = Is64 ? sizeof(macho::Section64) :
245 sizeof(macho::Section);
246
247 uintptr_t SectionAddr = CommandAddr + SegmentLoadSize + Sec * SectionSize;
248 return reinterpret_cast<const char*>(SectionAddr);
249 }
250
getPtr(const MachOObjectFile * O,size_t Offset)251 static const char *getPtr(const MachOObjectFile *O, size_t Offset) {
252 return O->getData().substr(Offset, 1).data();
253 }
254
255 static SymbolTableEntryBase
getSymbolTableEntryBase(const MachOObjectFile * O,DataRefImpl DRI)256 getSymbolTableEntryBase(const MachOObjectFile *O, DataRefImpl DRI) {
257 const char *P = reinterpret_cast<const char *>(DRI.p);
258 return getStruct<SymbolTableEntryBase>(O, P);
259 }
260
parseSegmentOrSectionName(const char * P)261 static StringRef parseSegmentOrSectionName(const char *P) {
262 if (P[15] == 0)
263 // Null terminated.
264 return P;
265 // Not null terminated, so this is a 16 char string.
266 return StringRef(P, 16);
267 }
268
269 // Helper to advance a section or symbol iterator multiple increments at a time.
270 template<class T>
advance(T & it,size_t Val)271 static error_code advance(T &it, size_t Val) {
272 error_code ec;
273 while (Val--) {
274 it.increment(ec);
275 }
276 return ec;
277 }
278
279 template<class T>
advanceTo(T & it,size_t Val)280 static void advanceTo(T &it, size_t Val) {
281 if (error_code ec = advance(it, Val))
282 report_fatal_error(ec.message());
283 }
284
getCPUType(const MachOObjectFile * O)285 static unsigned getCPUType(const MachOObjectFile *O) {
286 return O->getHeader().CPUType;
287 }
288
printRelocationTargetName(const MachOObjectFile * O,const macho::RelocationEntry & RE,raw_string_ostream & fmt)289 static void printRelocationTargetName(const MachOObjectFile *O,
290 const macho::RelocationEntry &RE,
291 raw_string_ostream &fmt) {
292 bool IsScattered = O->isRelocationScattered(RE);
293
294 // Target of a scattered relocation is an address. In the interest of
295 // generating pretty output, scan through the symbol table looking for a
296 // symbol that aligns with that address. If we find one, print it.
297 // Otherwise, we just print the hex address of the target.
298 if (IsScattered) {
299 uint32_t Val = O->getPlainRelocationSymbolNum(RE);
300
301 error_code ec;
302 for (symbol_iterator SI = O->begin_symbols(), SE = O->end_symbols();
303 SI != SE; SI.increment(ec)) {
304 if (ec) report_fatal_error(ec.message());
305
306 uint64_t Addr;
307 StringRef Name;
308
309 if ((ec = SI->getAddress(Addr)))
310 report_fatal_error(ec.message());
311 if (Addr != Val) continue;
312 if ((ec = SI->getName(Name)))
313 report_fatal_error(ec.message());
314 fmt << Name;
315 return;
316 }
317
318 // If we couldn't find a symbol that this relocation refers to, try
319 // to find a section beginning instead.
320 for (section_iterator SI = O->begin_sections(), SE = O->end_sections();
321 SI != SE; SI.increment(ec)) {
322 if (ec) report_fatal_error(ec.message());
323
324 uint64_t Addr;
325 StringRef Name;
326
327 if ((ec = SI->getAddress(Addr)))
328 report_fatal_error(ec.message());
329 if (Addr != Val) continue;
330 if ((ec = SI->getName(Name)))
331 report_fatal_error(ec.message());
332 fmt << Name;
333 return;
334 }
335
336 fmt << format("0x%x", Val);
337 return;
338 }
339
340 StringRef S;
341 bool isExtern = O->getPlainRelocationExternal(RE);
342 uint64_t Val = O->getPlainRelocationSymbolNum(RE);
343
344 if (isExtern) {
345 symbol_iterator SI = O->begin_symbols();
346 advanceTo(SI, Val);
347 SI->getName(S);
348 } else {
349 section_iterator SI = O->begin_sections();
350 // Adjust for the fact that sections are 1-indexed.
351 advanceTo(SI, Val - 1);
352 SI->getName(S);
353 }
354
355 fmt << S;
356 }
357
getPlainRelocationAddress(const macho::RelocationEntry & RE)358 static uint32_t getPlainRelocationAddress(const macho::RelocationEntry &RE) {
359 return RE.Word0;
360 }
361
362 static unsigned
getScatteredRelocationAddress(const macho::RelocationEntry & RE)363 getScatteredRelocationAddress(const macho::RelocationEntry &RE) {
364 return RE.Word0 & 0xffffff;
365 }
366
getPlainRelocationPCRel(const MachOObjectFile * O,const macho::RelocationEntry & RE)367 static bool getPlainRelocationPCRel(const MachOObjectFile *O,
368 const macho::RelocationEntry &RE) {
369 if (O->isLittleEndian())
370 return (RE.Word1 >> 24) & 1;
371 return (RE.Word1 >> 7) & 1;
372 }
373
374 static bool
getScatteredRelocationPCRel(const MachOObjectFile * O,const macho::RelocationEntry & RE)375 getScatteredRelocationPCRel(const MachOObjectFile *O,
376 const macho::RelocationEntry &RE) {
377 return (RE.Word0 >> 30) & 1;
378 }
379
getPlainRelocationLength(const MachOObjectFile * O,const macho::RelocationEntry & RE)380 static unsigned getPlainRelocationLength(const MachOObjectFile *O,
381 const macho::RelocationEntry &RE) {
382 if (O->isLittleEndian())
383 return (RE.Word1 >> 25) & 3;
384 return (RE.Word1 >> 5) & 3;
385 }
386
387 static unsigned
getScatteredRelocationLength(const macho::RelocationEntry & RE)388 getScatteredRelocationLength(const macho::RelocationEntry &RE) {
389 return (RE.Word0 >> 28) & 3;
390 }
391
getPlainRelocationType(const MachOObjectFile * O,const macho::RelocationEntry & RE)392 static unsigned getPlainRelocationType(const MachOObjectFile *O,
393 const macho::RelocationEntry &RE) {
394 if (O->isLittleEndian())
395 return RE.Word1 >> 28;
396 return RE.Word1 & 0xf;
397 }
398
getScatteredRelocationType(const macho::RelocationEntry & RE)399 static unsigned getScatteredRelocationType(const macho::RelocationEntry &RE) {
400 return (RE.Word0 >> 24) & 0xf;
401 }
402
getSectionFlags(const MachOObjectFile * O,DataRefImpl Sec)403 static uint32_t getSectionFlags(const MachOObjectFile *O,
404 DataRefImpl Sec) {
405 if (O->is64Bit()) {
406 macho::Section64 Sect = O->getSection64(Sec);
407 return Sect.Flags;
408 }
409 macho::Section Sect = O->getSection(Sec);
410 return Sect.Flags;
411 }
412
MachOObjectFile(MemoryBuffer * Object,bool IsLittleEndian,bool Is64bits,error_code & ec)413 MachOObjectFile::MachOObjectFile(MemoryBuffer *Object,
414 bool IsLittleEndian, bool Is64bits,
415 error_code &ec)
416 : ObjectFile(getMachOType(IsLittleEndian, Is64bits), Object),
417 SymtabLoadCmd(NULL), DysymtabLoadCmd(NULL), DataInCodeLoadCmd(NULL) {
418 uint32_t LoadCommandCount = this->getHeader().NumLoadCommands;
419 macho::LoadCommandType SegmentLoadType = is64Bit() ?
420 macho::LCT_Segment64 : macho::LCT_Segment;
421
422 MachOObjectFile::LoadCommandInfo Load = getFirstLoadCommandInfo();
423 for (unsigned I = 0; ; ++I) {
424 if (Load.C.Type == macho::LCT_Symtab) {
425 assert(!SymtabLoadCmd && "Multiple symbol tables");
426 SymtabLoadCmd = Load.Ptr;
427 } else if (Load.C.Type == macho::LCT_Dysymtab) {
428 assert(!DysymtabLoadCmd && "Multiple dynamic symbol tables");
429 DysymtabLoadCmd = Load.Ptr;
430 } else if (Load.C.Type == macho::LCT_DataInCode) {
431 assert(!DataInCodeLoadCmd && "Multiple data in code tables");
432 DataInCodeLoadCmd = Load.Ptr;
433 } else if (Load.C.Type == SegmentLoadType) {
434 uint32_t NumSections = getSegmentLoadCommandNumSections(this, Load);
435 for (unsigned J = 0; J < NumSections; ++J) {
436 const char *Sec = getSectionPtr(this, Load, J);
437 Sections.push_back(Sec);
438 }
439 }
440
441 if (I == LoadCommandCount - 1)
442 break;
443 else
444 Load = getNextLoadCommandInfo(Load);
445 }
446 }
447
getSymbolNext(DataRefImpl Symb,SymbolRef & Res) const448 error_code MachOObjectFile::getSymbolNext(DataRefImpl Symb,
449 SymbolRef &Res) const {
450 unsigned SymbolTableEntrySize = is64Bit() ?
451 sizeof(macho::Symbol64TableEntry) :
452 sizeof(macho::SymbolTableEntry);
453 Symb.p += SymbolTableEntrySize;
454 Res = SymbolRef(Symb, this);
455 return object_error::success;
456 }
457
getSymbolName(DataRefImpl Symb,StringRef & Res) const458 error_code MachOObjectFile::getSymbolName(DataRefImpl Symb,
459 StringRef &Res) const {
460 StringRef StringTable = getStringTableData();
461 SymbolTableEntryBase Entry = getSymbolTableEntryBase(this, Symb);
462 const char *Start = &StringTable.data()[Entry.StringIndex];
463 Res = StringRef(Start);
464 return object_error::success;
465 }
466
getSymbolAddress(DataRefImpl Symb,uint64_t & Res) const467 error_code MachOObjectFile::getSymbolAddress(DataRefImpl Symb,
468 uint64_t &Res) const {
469 if (is64Bit()) {
470 macho::Symbol64TableEntry Entry = getSymbol64TableEntry(Symb);
471 Res = Entry.Value;
472 } else {
473 macho::SymbolTableEntry Entry = getSymbolTableEntry(Symb);
474 Res = Entry.Value;
475 }
476 return object_error::success;
477 }
478
479 error_code
getSymbolFileOffset(DataRefImpl Symb,uint64_t & Res) const480 MachOObjectFile::getSymbolFileOffset(DataRefImpl Symb,
481 uint64_t &Res) const {
482 SymbolTableEntryBase Entry = getSymbolTableEntryBase(this, Symb);
483 getSymbolAddress(Symb, Res);
484 if (Entry.SectionIndex) {
485 uint64_t Delta;
486 DataRefImpl SecRel;
487 SecRel.d.a = Entry.SectionIndex-1;
488 if (is64Bit()) {
489 macho::Section64 Sec = getSection64(SecRel);
490 Delta = Sec.Offset - Sec.Address;
491 } else {
492 macho::Section Sec = getSection(SecRel);
493 Delta = Sec.Offset - Sec.Address;
494 }
495
496 Res += Delta;
497 }
498
499 return object_error::success;
500 }
501
getSymbolAlignment(DataRefImpl DRI,uint32_t & Result) const502 error_code MachOObjectFile::getSymbolAlignment(DataRefImpl DRI,
503 uint32_t &Result) const {
504 uint32_t flags;
505 this->getSymbolFlags(DRI, flags);
506 if (flags & SymbolRef::SF_Common) {
507 SymbolTableEntryBase Entry = getSymbolTableEntryBase(this, DRI);
508 Result = 1 << MachO::GET_COMM_ALIGN(Entry.Flags);
509 } else {
510 Result = 0;
511 }
512 return object_error::success;
513 }
514
getSymbolSize(DataRefImpl DRI,uint64_t & Result) const515 error_code MachOObjectFile::getSymbolSize(DataRefImpl DRI,
516 uint64_t &Result) const {
517 uint64_t BeginOffset;
518 uint64_t EndOffset = 0;
519 uint8_t SectionIndex;
520
521 SymbolTableEntryBase Entry = getSymbolTableEntryBase(this, DRI);
522 uint64_t Value;
523 getSymbolAddress(DRI, Value);
524
525 BeginOffset = Value;
526
527 SectionIndex = Entry.SectionIndex;
528 if (!SectionIndex) {
529 uint32_t flags = SymbolRef::SF_None;
530 this->getSymbolFlags(DRI, flags);
531 if (flags & SymbolRef::SF_Common)
532 Result = Value;
533 else
534 Result = UnknownAddressOrSize;
535 return object_error::success;
536 }
537 // Unfortunately symbols are unsorted so we need to touch all
538 // symbols from load command
539 error_code ec;
540 for (symbol_iterator I = begin_symbols(), E = end_symbols(); I != E;
541 I.increment(ec)) {
542 DataRefImpl DRI = I->getRawDataRefImpl();
543 Entry = getSymbolTableEntryBase(this, DRI);
544 getSymbolAddress(DRI, Value);
545 if (Entry.SectionIndex == SectionIndex && Value > BeginOffset)
546 if (!EndOffset || Value < EndOffset)
547 EndOffset = Value;
548 }
549 if (!EndOffset) {
550 uint64_t Size;
551 DataRefImpl Sec;
552 Sec.d.a = SectionIndex-1;
553 getSectionSize(Sec, Size);
554 getSectionAddress(Sec, EndOffset);
555 EndOffset += Size;
556 }
557 Result = EndOffset - BeginOffset;
558 return object_error::success;
559 }
560
getSymbolType(DataRefImpl Symb,SymbolRef::Type & Res) const561 error_code MachOObjectFile::getSymbolType(DataRefImpl Symb,
562 SymbolRef::Type &Res) const {
563 SymbolTableEntryBase Entry = getSymbolTableEntryBase(this, Symb);
564 uint8_t n_type = Entry.Type;
565
566 Res = SymbolRef::ST_Other;
567
568 // If this is a STAB debugging symbol, we can do nothing more.
569 if (n_type & MachO::NlistMaskStab) {
570 Res = SymbolRef::ST_Debug;
571 return object_error::success;
572 }
573
574 switch (n_type & MachO::NlistMaskType) {
575 case MachO::NListTypeUndefined :
576 Res = SymbolRef::ST_Unknown;
577 break;
578 case MachO::NListTypeSection :
579 Res = SymbolRef::ST_Function;
580 break;
581 }
582 return object_error::success;
583 }
584
getSymbolNMTypeChar(DataRefImpl Symb,char & Res) const585 error_code MachOObjectFile::getSymbolNMTypeChar(DataRefImpl Symb,
586 char &Res) const {
587 SymbolTableEntryBase Entry = getSymbolTableEntryBase(this, Symb);
588 uint8_t Type = Entry.Type;
589 uint16_t Flags = Entry.Flags;
590
591 char Char;
592 switch (Type & macho::STF_TypeMask) {
593 case macho::STT_Undefined:
594 Char = 'u';
595 break;
596 case macho::STT_Absolute:
597 case macho::STT_Section:
598 Char = 's';
599 break;
600 default:
601 Char = '?';
602 break;
603 }
604
605 if (Flags & (macho::STF_External | macho::STF_PrivateExtern))
606 Char = toupper(static_cast<unsigned char>(Char));
607 Res = Char;
608 return object_error::success;
609 }
610
getSymbolFlags(DataRefImpl DRI,uint32_t & Result) const611 error_code MachOObjectFile::getSymbolFlags(DataRefImpl DRI,
612 uint32_t &Result) const {
613 SymbolTableEntryBase Entry = getSymbolTableEntryBase(this, DRI);
614
615 uint8_t MachOType = Entry.Type;
616 uint16_t MachOFlags = Entry.Flags;
617
618 // TODO: Correctly set SF_ThreadLocal
619 Result = SymbolRef::SF_None;
620
621 if ((MachOType & MachO::NlistMaskType) == MachO::NListTypeUndefined)
622 Result |= SymbolRef::SF_Undefined;
623
624 if (MachOFlags & macho::STF_StabsEntryMask)
625 Result |= SymbolRef::SF_FormatSpecific;
626
627 if (MachOType & MachO::NlistMaskExternal) {
628 Result |= SymbolRef::SF_Global;
629 if ((MachOType & MachO::NlistMaskType) == MachO::NListTypeUndefined) {
630 uint64_t Value;
631 getSymbolAddress(DRI, Value);
632 if (Value)
633 Result |= SymbolRef::SF_Common;
634 }
635 }
636
637 if (MachOFlags & (MachO::NListDescWeakRef | MachO::NListDescWeakDef))
638 Result |= SymbolRef::SF_Weak;
639
640 if ((MachOType & MachO::NlistMaskType) == MachO::NListTypeAbsolute)
641 Result |= SymbolRef::SF_Absolute;
642
643 return object_error::success;
644 }
645
646 error_code
getSymbolSection(DataRefImpl Symb,section_iterator & Res) const647 MachOObjectFile::getSymbolSection(DataRefImpl Symb,
648 section_iterator &Res) const {
649 SymbolTableEntryBase Entry = getSymbolTableEntryBase(this, Symb);
650 uint8_t index = Entry.SectionIndex;
651
652 if (index == 0) {
653 Res = end_sections();
654 } else {
655 DataRefImpl DRI;
656 DRI.d.a = index - 1;
657 Res = section_iterator(SectionRef(DRI, this));
658 }
659
660 return object_error::success;
661 }
662
getSymbolValue(DataRefImpl Symb,uint64_t & Val) const663 error_code MachOObjectFile::getSymbolValue(DataRefImpl Symb,
664 uint64_t &Val) const {
665 report_fatal_error("getSymbolValue unimplemented in MachOObjectFile");
666 }
667
getSectionNext(DataRefImpl Sec,SectionRef & Res) const668 error_code MachOObjectFile::getSectionNext(DataRefImpl Sec,
669 SectionRef &Res) const {
670 Sec.d.a++;
671 Res = SectionRef(Sec, this);
672 return object_error::success;
673 }
674
675 error_code
getSectionName(DataRefImpl Sec,StringRef & Result) const676 MachOObjectFile::getSectionName(DataRefImpl Sec, StringRef &Result) const {
677 ArrayRef<char> Raw = getSectionRawName(Sec);
678 Result = parseSegmentOrSectionName(Raw.data());
679 return object_error::success;
680 }
681
682 error_code
getSectionAddress(DataRefImpl Sec,uint64_t & Res) const683 MachOObjectFile::getSectionAddress(DataRefImpl Sec, uint64_t &Res) const {
684 if (is64Bit()) {
685 macho::Section64 Sect = getSection64(Sec);
686 Res = Sect.Address;
687 } else {
688 macho::Section Sect = getSection(Sec);
689 Res = Sect.Address;
690 }
691 return object_error::success;
692 }
693
694 error_code
getSectionSize(DataRefImpl Sec,uint64_t & Res) const695 MachOObjectFile::getSectionSize(DataRefImpl Sec, uint64_t &Res) const {
696 if (is64Bit()) {
697 macho::Section64 Sect = getSection64(Sec);
698 Res = Sect.Size;
699 } else {
700 macho::Section Sect = getSection(Sec);
701 Res = Sect.Size;
702 }
703
704 return object_error::success;
705 }
706
707 error_code
getSectionContents(DataRefImpl Sec,StringRef & Res) const708 MachOObjectFile::getSectionContents(DataRefImpl Sec, StringRef &Res) const {
709 uint32_t Offset;
710 uint64_t Size;
711
712 if (is64Bit()) {
713 macho::Section64 Sect = getSection64(Sec);
714 Offset = Sect.Offset;
715 Size = Sect.Size;
716 } else {
717 macho::Section Sect =getSection(Sec);
718 Offset = Sect.Offset;
719 Size = Sect.Size;
720 }
721
722 Res = this->getData().substr(Offset, Size);
723 return object_error::success;
724 }
725
726 error_code
getSectionAlignment(DataRefImpl Sec,uint64_t & Res) const727 MachOObjectFile::getSectionAlignment(DataRefImpl Sec, uint64_t &Res) const {
728 uint32_t Align;
729 if (is64Bit()) {
730 macho::Section64 Sect = getSection64(Sec);
731 Align = Sect.Align;
732 } else {
733 macho::Section Sect = getSection(Sec);
734 Align = Sect.Align;
735 }
736
737 Res = uint64_t(1) << Align;
738 return object_error::success;
739 }
740
741 error_code
isSectionText(DataRefImpl Sec,bool & Res) const742 MachOObjectFile::isSectionText(DataRefImpl Sec, bool &Res) const {
743 uint32_t Flags = getSectionFlags(this, Sec);
744 Res = Flags & macho::SF_PureInstructions;
745 return object_error::success;
746 }
747
isSectionData(DataRefImpl DRI,bool & Result) const748 error_code MachOObjectFile::isSectionData(DataRefImpl DRI, bool &Result) const {
749 // FIXME: Unimplemented.
750 Result = false;
751 return object_error::success;
752 }
753
isSectionBSS(DataRefImpl DRI,bool & Result) const754 error_code MachOObjectFile::isSectionBSS(DataRefImpl DRI, bool &Result) const {
755 // FIXME: Unimplemented.
756 Result = false;
757 return object_error::success;
758 }
759
760 error_code
isSectionRequiredForExecution(DataRefImpl Sec,bool & Result) const761 MachOObjectFile::isSectionRequiredForExecution(DataRefImpl Sec,
762 bool &Result) const {
763 // FIXME: Unimplemented.
764 Result = true;
765 return object_error::success;
766 }
767
isSectionVirtual(DataRefImpl Sec,bool & Result) const768 error_code MachOObjectFile::isSectionVirtual(DataRefImpl Sec,
769 bool &Result) const {
770 // FIXME: Unimplemented.
771 Result = false;
772 return object_error::success;
773 }
774
775 error_code
isSectionZeroInit(DataRefImpl Sec,bool & Res) const776 MachOObjectFile::isSectionZeroInit(DataRefImpl Sec, bool &Res) const {
777 uint32_t Flags = getSectionFlags(this, Sec);
778 unsigned SectionType = Flags & MachO::SectionFlagMaskSectionType;
779 Res = SectionType == MachO::SectionTypeZeroFill ||
780 SectionType == MachO::SectionTypeZeroFillLarge;
781 return object_error::success;
782 }
783
isSectionReadOnlyData(DataRefImpl Sec,bool & Result) const784 error_code MachOObjectFile::isSectionReadOnlyData(DataRefImpl Sec,
785 bool &Result) const {
786 // Consider using the code from isSectionText to look for __const sections.
787 // Alternately, emit S_ATTR_PURE_INSTRUCTIONS and/or S_ATTR_SOME_INSTRUCTIONS
788 // to use section attributes to distinguish code from data.
789
790 // FIXME: Unimplemented.
791 Result = false;
792 return object_error::success;
793 }
794
795 error_code
sectionContainsSymbol(DataRefImpl Sec,DataRefImpl Symb,bool & Result) const796 MachOObjectFile::sectionContainsSymbol(DataRefImpl Sec, DataRefImpl Symb,
797 bool &Result) const {
798 SymbolRef::Type ST;
799 this->getSymbolType(Symb, ST);
800 if (ST == SymbolRef::ST_Unknown) {
801 Result = false;
802 return object_error::success;
803 }
804
805 uint64_t SectBegin, SectEnd;
806 getSectionAddress(Sec, SectBegin);
807 getSectionSize(Sec, SectEnd);
808 SectEnd += SectBegin;
809
810 uint64_t SymAddr;
811 getSymbolAddress(Symb, SymAddr);
812 Result = (SymAddr >= SectBegin) && (SymAddr < SectEnd);
813
814 return object_error::success;
815 }
816
getSectionRelBegin(DataRefImpl Sec) const817 relocation_iterator MachOObjectFile::getSectionRelBegin(DataRefImpl Sec) const {
818 uint32_t Offset;
819 if (is64Bit()) {
820 macho::Section64 Sect = getSection64(Sec);
821 Offset = Sect.RelocationTableOffset;
822 } else {
823 macho::Section Sect = getSection(Sec);
824 Offset = Sect.RelocationTableOffset;
825 }
826
827 DataRefImpl Ret;
828 Ret.p = reinterpret_cast<uintptr_t>(getPtr(this, Offset));
829 return relocation_iterator(RelocationRef(Ret, this));
830 }
831
832 relocation_iterator
getSectionRelEnd(DataRefImpl Sec) const833 MachOObjectFile::getSectionRelEnd(DataRefImpl Sec) const {
834 uint32_t Offset;
835 uint32_t Num;
836 if (is64Bit()) {
837 macho::Section64 Sect = getSection64(Sec);
838 Offset = Sect.RelocationTableOffset;
839 Num = Sect.NumRelocationTableEntries;
840 } else {
841 macho::Section Sect = getSection(Sec);
842 Offset = Sect.RelocationTableOffset;
843 Num = Sect.NumRelocationTableEntries;
844 }
845
846 const macho::RelocationEntry *P =
847 reinterpret_cast<const macho::RelocationEntry*>(getPtr(this, Offset));
848
849 DataRefImpl Ret;
850 Ret.p = reinterpret_cast<uintptr_t>(P + Num);
851 return relocation_iterator(RelocationRef(Ret, this));
852 }
853
getRelocationNext(DataRefImpl Rel,RelocationRef & Res) const854 error_code MachOObjectFile::getRelocationNext(DataRefImpl Rel,
855 RelocationRef &Res) const {
856 const macho::RelocationEntry *P =
857 reinterpret_cast<const macho::RelocationEntry *>(Rel.p);
858 Rel.p = reinterpret_cast<uintptr_t>(P + 1);
859 Res = RelocationRef(Rel, this);
860 return object_error::success;
861 }
862
863 error_code
getRelocationAddress(DataRefImpl Rel,uint64_t & Res) const864 MachOObjectFile::getRelocationAddress(DataRefImpl Rel, uint64_t &Res) const {
865 report_fatal_error("getRelocationAddress not implemented in MachOObjectFile");
866 }
867
getRelocationOffset(DataRefImpl Rel,uint64_t & Res) const868 error_code MachOObjectFile::getRelocationOffset(DataRefImpl Rel,
869 uint64_t &Res) const {
870 macho::RelocationEntry RE = getRelocation(Rel);
871 Res = getAnyRelocationAddress(RE);
872 return object_error::success;
873 }
874
875 symbol_iterator
getRelocationSymbol(DataRefImpl Rel) const876 MachOObjectFile::getRelocationSymbol(DataRefImpl Rel) const {
877 macho::RelocationEntry RE = getRelocation(Rel);
878 uint32_t SymbolIdx = getPlainRelocationSymbolNum(RE);
879 bool isExtern = getPlainRelocationExternal(RE);
880 if (!isExtern)
881 return end_symbols();
882
883 macho::SymtabLoadCommand S = getSymtabLoadCommand();
884 unsigned SymbolTableEntrySize = is64Bit() ?
885 sizeof(macho::Symbol64TableEntry) :
886 sizeof(macho::SymbolTableEntry);
887 uint64_t Offset = S.SymbolTableOffset + SymbolIdx * SymbolTableEntrySize;
888 DataRefImpl Sym;
889 Sym.p = reinterpret_cast<uintptr_t>(getPtr(this, Offset));
890 return symbol_iterator(SymbolRef(Sym, this));
891 }
892
getRelocationType(DataRefImpl Rel,uint64_t & Res) const893 error_code MachOObjectFile::getRelocationType(DataRefImpl Rel,
894 uint64_t &Res) const {
895 macho::RelocationEntry RE = getRelocation(Rel);
896 Res = getAnyRelocationType(RE);
897 return object_error::success;
898 }
899
900 error_code
getRelocationTypeName(DataRefImpl Rel,SmallVectorImpl<char> & Result) const901 MachOObjectFile::getRelocationTypeName(DataRefImpl Rel,
902 SmallVectorImpl<char> &Result) const {
903 StringRef res;
904 uint64_t RType;
905 getRelocationType(Rel, RType);
906
907 unsigned Arch = this->getArch();
908
909 switch (Arch) {
910 case Triple::x86: {
911 static const char *const Table[] = {
912 "GENERIC_RELOC_VANILLA",
913 "GENERIC_RELOC_PAIR",
914 "GENERIC_RELOC_SECTDIFF",
915 "GENERIC_RELOC_PB_LA_PTR",
916 "GENERIC_RELOC_LOCAL_SECTDIFF",
917 "GENERIC_RELOC_TLV" };
918
919 if (RType > 6)
920 res = "Unknown";
921 else
922 res = Table[RType];
923 break;
924 }
925 case Triple::x86_64: {
926 static const char *const Table[] = {
927 "X86_64_RELOC_UNSIGNED",
928 "X86_64_RELOC_SIGNED",
929 "X86_64_RELOC_BRANCH",
930 "X86_64_RELOC_GOT_LOAD",
931 "X86_64_RELOC_GOT",
932 "X86_64_RELOC_SUBTRACTOR",
933 "X86_64_RELOC_SIGNED_1",
934 "X86_64_RELOC_SIGNED_2",
935 "X86_64_RELOC_SIGNED_4",
936 "X86_64_RELOC_TLV" };
937
938 if (RType > 9)
939 res = "Unknown";
940 else
941 res = Table[RType];
942 break;
943 }
944 case Triple::arm: {
945 static const char *const Table[] = {
946 "ARM_RELOC_VANILLA",
947 "ARM_RELOC_PAIR",
948 "ARM_RELOC_SECTDIFF",
949 "ARM_RELOC_LOCAL_SECTDIFF",
950 "ARM_RELOC_PB_LA_PTR",
951 "ARM_RELOC_BR24",
952 "ARM_THUMB_RELOC_BR22",
953 "ARM_THUMB_32BIT_BRANCH",
954 "ARM_RELOC_HALF",
955 "ARM_RELOC_HALF_SECTDIFF" };
956
957 if (RType > 9)
958 res = "Unknown";
959 else
960 res = Table[RType];
961 break;
962 }
963 case Triple::ppc: {
964 static const char *const Table[] = {
965 "PPC_RELOC_VANILLA",
966 "PPC_RELOC_PAIR",
967 "PPC_RELOC_BR14",
968 "PPC_RELOC_BR24",
969 "PPC_RELOC_HI16",
970 "PPC_RELOC_LO16",
971 "PPC_RELOC_HA16",
972 "PPC_RELOC_LO14",
973 "PPC_RELOC_SECTDIFF",
974 "PPC_RELOC_PB_LA_PTR",
975 "PPC_RELOC_HI16_SECTDIFF",
976 "PPC_RELOC_LO16_SECTDIFF",
977 "PPC_RELOC_HA16_SECTDIFF",
978 "PPC_RELOC_JBSR",
979 "PPC_RELOC_LO14_SECTDIFF",
980 "PPC_RELOC_LOCAL_SECTDIFF" };
981
982 res = Table[RType];
983 break;
984 }
985 case Triple::UnknownArch:
986 res = "Unknown";
987 break;
988 }
989 Result.append(res.begin(), res.end());
990 return object_error::success;
991 }
992
993 error_code
getRelocationValueString(DataRefImpl Rel,SmallVectorImpl<char> & Result) const994 MachOObjectFile::getRelocationValueString(DataRefImpl Rel,
995 SmallVectorImpl<char> &Result) const {
996 macho::RelocationEntry RE = getRelocation(Rel);
997
998 unsigned Arch = this->getArch();
999
1000 std::string fmtbuf;
1001 raw_string_ostream fmt(fmtbuf);
1002 unsigned Type = this->getAnyRelocationType(RE);
1003 bool IsPCRel = this->getAnyRelocationPCRel(RE);
1004
1005 // Determine any addends that should be displayed with the relocation.
1006 // These require decoding the relocation type, which is triple-specific.
1007
1008 // X86_64 has entirely custom relocation types.
1009 if (Arch == Triple::x86_64) {
1010 bool isPCRel = getAnyRelocationPCRel(RE);
1011
1012 switch (Type) {
1013 case macho::RIT_X86_64_GOTLoad: // X86_64_RELOC_GOT_LOAD
1014 case macho::RIT_X86_64_GOT: { // X86_64_RELOC_GOT
1015 printRelocationTargetName(this, RE, fmt);
1016 fmt << "@GOT";
1017 if (isPCRel) fmt << "PCREL";
1018 break;
1019 }
1020 case macho::RIT_X86_64_Subtractor: { // X86_64_RELOC_SUBTRACTOR
1021 DataRefImpl RelNext = Rel;
1022 RelNext.d.a++;
1023 macho::RelocationEntry RENext = getRelocation(RelNext);
1024
1025 // X86_64_SUBTRACTOR must be followed by a relocation of type
1026 // X86_64_RELOC_UNSIGNED.
1027 // NOTE: Scattered relocations don't exist on x86_64.
1028 unsigned RType = getAnyRelocationType(RENext);
1029 if (RType != 0)
1030 report_fatal_error("Expected X86_64_RELOC_UNSIGNED after "
1031 "X86_64_RELOC_SUBTRACTOR.");
1032
1033 // The X86_64_RELOC_UNSIGNED contains the minuend symbol,
1034 // X86_64_SUBTRACTOR contains to the subtrahend.
1035 printRelocationTargetName(this, RENext, fmt);
1036 fmt << "-";
1037 printRelocationTargetName(this, RE, fmt);
1038 break;
1039 }
1040 case macho::RIT_X86_64_TLV:
1041 printRelocationTargetName(this, RE, fmt);
1042 fmt << "@TLV";
1043 if (isPCRel) fmt << "P";
1044 break;
1045 case macho::RIT_X86_64_Signed1: // X86_64_RELOC_SIGNED1
1046 printRelocationTargetName(this, RE, fmt);
1047 fmt << "-1";
1048 break;
1049 case macho::RIT_X86_64_Signed2: // X86_64_RELOC_SIGNED2
1050 printRelocationTargetName(this, RE, fmt);
1051 fmt << "-2";
1052 break;
1053 case macho::RIT_X86_64_Signed4: // X86_64_RELOC_SIGNED4
1054 printRelocationTargetName(this, RE, fmt);
1055 fmt << "-4";
1056 break;
1057 default:
1058 printRelocationTargetName(this, RE, fmt);
1059 break;
1060 }
1061 // X86 and ARM share some relocation types in common.
1062 } else if (Arch == Triple::x86 || Arch == Triple::arm) {
1063 // Generic relocation types...
1064 switch (Type) {
1065 case macho::RIT_Pair: // GENERIC_RELOC_PAIR - prints no info
1066 return object_error::success;
1067 case macho::RIT_Difference: { // GENERIC_RELOC_SECTDIFF
1068 DataRefImpl RelNext = Rel;
1069 RelNext.d.a++;
1070 macho::RelocationEntry RENext = getRelocation(RelNext);
1071
1072 // X86 sect diff's must be followed by a relocation of type
1073 // GENERIC_RELOC_PAIR.
1074 unsigned RType = getAnyRelocationType(RENext);
1075
1076 if (RType != 1)
1077 report_fatal_error("Expected GENERIC_RELOC_PAIR after "
1078 "GENERIC_RELOC_SECTDIFF.");
1079
1080 printRelocationTargetName(this, RE, fmt);
1081 fmt << "-";
1082 printRelocationTargetName(this, RENext, fmt);
1083 break;
1084 }
1085 }
1086
1087 if (Arch == Triple::x86) {
1088 // All X86 relocations that need special printing were already
1089 // handled in the generic code.
1090 switch (Type) {
1091 case macho::RIT_Generic_LocalDifference:{// GENERIC_RELOC_LOCAL_SECTDIFF
1092 DataRefImpl RelNext = Rel;
1093 RelNext.d.a++;
1094 macho::RelocationEntry RENext = getRelocation(RelNext);
1095
1096 // X86 sect diff's must be followed by a relocation of type
1097 // GENERIC_RELOC_PAIR.
1098 unsigned RType = getAnyRelocationType(RENext);
1099 if (RType != 1)
1100 report_fatal_error("Expected GENERIC_RELOC_PAIR after "
1101 "GENERIC_RELOC_LOCAL_SECTDIFF.");
1102
1103 printRelocationTargetName(this, RE, fmt);
1104 fmt << "-";
1105 printRelocationTargetName(this, RENext, fmt);
1106 break;
1107 }
1108 case macho::RIT_Generic_TLV: {
1109 printRelocationTargetName(this, RE, fmt);
1110 fmt << "@TLV";
1111 if (IsPCRel) fmt << "P";
1112 break;
1113 }
1114 default:
1115 printRelocationTargetName(this, RE, fmt);
1116 }
1117 } else { // ARM-specific relocations
1118 switch (Type) {
1119 case macho::RIT_ARM_Half: // ARM_RELOC_HALF
1120 case macho::RIT_ARM_HalfDifference: { // ARM_RELOC_HALF_SECTDIFF
1121 // Half relocations steal a bit from the length field to encode
1122 // whether this is an upper16 or a lower16 relocation.
1123 bool isUpper = getAnyRelocationLength(RE) >> 1;
1124
1125 if (isUpper)
1126 fmt << ":upper16:(";
1127 else
1128 fmt << ":lower16:(";
1129 printRelocationTargetName(this, RE, fmt);
1130
1131 DataRefImpl RelNext = Rel;
1132 RelNext.d.a++;
1133 macho::RelocationEntry RENext = getRelocation(RelNext);
1134
1135 // ARM half relocs must be followed by a relocation of type
1136 // ARM_RELOC_PAIR.
1137 unsigned RType = getAnyRelocationType(RENext);
1138 if (RType != 1)
1139 report_fatal_error("Expected ARM_RELOC_PAIR after "
1140 "GENERIC_RELOC_HALF");
1141
1142 // NOTE: The half of the target virtual address is stashed in the
1143 // address field of the secondary relocation, but we can't reverse
1144 // engineer the constant offset from it without decoding the movw/movt
1145 // instruction to find the other half in its immediate field.
1146
1147 // ARM_RELOC_HALF_SECTDIFF encodes the second section in the
1148 // symbol/section pointer of the follow-on relocation.
1149 if (Type == macho::RIT_ARM_HalfDifference) {
1150 fmt << "-";
1151 printRelocationTargetName(this, RENext, fmt);
1152 }
1153
1154 fmt << ")";
1155 break;
1156 }
1157 default: {
1158 printRelocationTargetName(this, RE, fmt);
1159 }
1160 }
1161 }
1162 } else
1163 printRelocationTargetName(this, RE, fmt);
1164
1165 fmt.flush();
1166 Result.append(fmtbuf.begin(), fmtbuf.end());
1167 return object_error::success;
1168 }
1169
1170 error_code
getRelocationHidden(DataRefImpl Rel,bool & Result) const1171 MachOObjectFile::getRelocationHidden(DataRefImpl Rel, bool &Result) const {
1172 unsigned Arch = getArch();
1173 uint64_t Type;
1174 getRelocationType(Rel, Type);
1175
1176 Result = false;
1177
1178 // On arches that use the generic relocations, GENERIC_RELOC_PAIR
1179 // is always hidden.
1180 if (Arch == Triple::x86 || Arch == Triple::arm) {
1181 if (Type == macho::RIT_Pair) Result = true;
1182 } else if (Arch == Triple::x86_64) {
1183 // On x86_64, X86_64_RELOC_UNSIGNED is hidden only when it follows
1184 // an X86_64_RELOC_SUBTRACTOR.
1185 if (Type == macho::RIT_X86_64_Unsigned && Rel.d.a > 0) {
1186 DataRefImpl RelPrev = Rel;
1187 RelPrev.d.a--;
1188 uint64_t PrevType;
1189 getRelocationType(RelPrev, PrevType);
1190 if (PrevType == macho::RIT_X86_64_Subtractor)
1191 Result = true;
1192 }
1193 }
1194
1195 return object_error::success;
1196 }
1197
getLibraryNext(DataRefImpl LibData,LibraryRef & Res) const1198 error_code MachOObjectFile::getLibraryNext(DataRefImpl LibData,
1199 LibraryRef &Res) const {
1200 report_fatal_error("Needed libraries unimplemented in MachOObjectFile");
1201 }
1202
getLibraryPath(DataRefImpl LibData,StringRef & Res) const1203 error_code MachOObjectFile::getLibraryPath(DataRefImpl LibData,
1204 StringRef &Res) const {
1205 report_fatal_error("Needed libraries unimplemented in MachOObjectFile");
1206 }
1207
begin_symbols() const1208 symbol_iterator MachOObjectFile::begin_symbols() const {
1209 DataRefImpl DRI;
1210 if (!SymtabLoadCmd)
1211 return symbol_iterator(SymbolRef(DRI, this));
1212
1213 macho::SymtabLoadCommand Symtab = getSymtabLoadCommand();
1214 DRI.p = reinterpret_cast<uintptr_t>(getPtr(this, Symtab.SymbolTableOffset));
1215 return symbol_iterator(SymbolRef(DRI, this));
1216 }
1217
end_symbols() const1218 symbol_iterator MachOObjectFile::end_symbols() const {
1219 DataRefImpl DRI;
1220 if (!SymtabLoadCmd)
1221 return symbol_iterator(SymbolRef(DRI, this));
1222
1223 macho::SymtabLoadCommand Symtab = getSymtabLoadCommand();
1224 unsigned SymbolTableEntrySize = is64Bit() ?
1225 sizeof(macho::Symbol64TableEntry) :
1226 sizeof(macho::SymbolTableEntry);
1227 unsigned Offset = Symtab.SymbolTableOffset +
1228 Symtab.NumSymbolTableEntries * SymbolTableEntrySize;
1229 DRI.p = reinterpret_cast<uintptr_t>(getPtr(this, Offset));
1230 return symbol_iterator(SymbolRef(DRI, this));
1231 }
1232
begin_dynamic_symbols() const1233 symbol_iterator MachOObjectFile::begin_dynamic_symbols() const {
1234 // TODO: implement
1235 report_fatal_error("Dynamic symbols unimplemented in MachOObjectFile");
1236 }
1237
end_dynamic_symbols() const1238 symbol_iterator MachOObjectFile::end_dynamic_symbols() const {
1239 // TODO: implement
1240 report_fatal_error("Dynamic symbols unimplemented in MachOObjectFile");
1241 }
1242
begin_sections() const1243 section_iterator MachOObjectFile::begin_sections() const {
1244 DataRefImpl DRI;
1245 return section_iterator(SectionRef(DRI, this));
1246 }
1247
end_sections() const1248 section_iterator MachOObjectFile::end_sections() const {
1249 DataRefImpl DRI;
1250 DRI.d.a = Sections.size();
1251 return section_iterator(SectionRef(DRI, this));
1252 }
1253
begin_libraries_needed() const1254 library_iterator MachOObjectFile::begin_libraries_needed() const {
1255 // TODO: implement
1256 report_fatal_error("Needed libraries unimplemented in MachOObjectFile");
1257 }
1258
end_libraries_needed() const1259 library_iterator MachOObjectFile::end_libraries_needed() const {
1260 // TODO: implement
1261 report_fatal_error("Needed libraries unimplemented in MachOObjectFile");
1262 }
1263
getBytesInAddress() const1264 uint8_t MachOObjectFile::getBytesInAddress() const {
1265 return is64Bit() ? 8 : 4;
1266 }
1267
getFileFormatName() const1268 StringRef MachOObjectFile::getFileFormatName() const {
1269 unsigned CPUType = getCPUType(this);
1270 if (!is64Bit()) {
1271 switch (CPUType) {
1272 case llvm::MachO::CPUTypeI386:
1273 return "Mach-O 32-bit i386";
1274 case llvm::MachO::CPUTypeARM:
1275 return "Mach-O arm";
1276 case llvm::MachO::CPUTypePowerPC:
1277 return "Mach-O 32-bit ppc";
1278 default:
1279 assert((CPUType & llvm::MachO::CPUArchABI64) == 0 &&
1280 "64-bit object file when we're not 64-bit?");
1281 return "Mach-O 32-bit unknown";
1282 }
1283 }
1284
1285 // Make sure the cpu type has the correct mask.
1286 assert((CPUType & llvm::MachO::CPUArchABI64)
1287 == llvm::MachO::CPUArchABI64 &&
1288 "32-bit object file when we're 64-bit?");
1289
1290 switch (CPUType) {
1291 case llvm::MachO::CPUTypeX86_64:
1292 return "Mach-O 64-bit x86-64";
1293 case llvm::MachO::CPUTypePowerPC64:
1294 return "Mach-O 64-bit ppc64";
1295 default:
1296 return "Mach-O 64-bit unknown";
1297 }
1298 }
1299
getArch(uint32_t CPUType)1300 Triple::ArchType MachOObjectFile::getArch(uint32_t CPUType) {
1301 switch (CPUType) {
1302 case llvm::MachO::CPUTypeI386:
1303 return Triple::x86;
1304 case llvm::MachO::CPUTypeX86_64:
1305 return Triple::x86_64;
1306 case llvm::MachO::CPUTypeARM:
1307 return Triple::arm;
1308 case llvm::MachO::CPUTypePowerPC:
1309 return Triple::ppc;
1310 case llvm::MachO::CPUTypePowerPC64:
1311 return Triple::ppc64;
1312 default:
1313 return Triple::UnknownArch;
1314 }
1315 }
1316
getArch() const1317 unsigned MachOObjectFile::getArch() const {
1318 return getArch(getCPUType(this));
1319 }
1320
getLoadName() const1321 StringRef MachOObjectFile::getLoadName() const {
1322 // TODO: Implement
1323 report_fatal_error("get_load_name() unimplemented in MachOObjectFile");
1324 }
1325
getSectionRelBegin(unsigned Index) const1326 relocation_iterator MachOObjectFile::getSectionRelBegin(unsigned Index) const {
1327 DataRefImpl DRI;
1328 DRI.d.a = Index;
1329 return getSectionRelBegin(DRI);
1330 }
1331
getSectionRelEnd(unsigned Index) const1332 relocation_iterator MachOObjectFile::getSectionRelEnd(unsigned Index) const {
1333 DataRefImpl DRI;
1334 DRI.d.a = Index;
1335 return getSectionRelEnd(DRI);
1336 }
1337
begin_dices() const1338 dice_iterator MachOObjectFile::begin_dices() const {
1339 DataRefImpl DRI;
1340 if (!DataInCodeLoadCmd)
1341 return dice_iterator(DiceRef(DRI, this));
1342
1343 macho::LinkeditDataLoadCommand DicLC = getDataInCodeLoadCommand();
1344 DRI.p = reinterpret_cast<uintptr_t>(getPtr(this, DicLC.DataOffset));
1345 return dice_iterator(DiceRef(DRI, this));
1346 }
1347
end_dices() const1348 dice_iterator MachOObjectFile::end_dices() const {
1349 DataRefImpl DRI;
1350 if (!DataInCodeLoadCmd)
1351 return dice_iterator(DiceRef(DRI, this));
1352
1353 macho::LinkeditDataLoadCommand DicLC = getDataInCodeLoadCommand();
1354 unsigned Offset = DicLC.DataOffset + DicLC.DataSize;
1355 DRI.p = reinterpret_cast<uintptr_t>(getPtr(this, Offset));
1356 return dice_iterator(DiceRef(DRI, this));
1357 }
1358
1359 StringRef
getSectionFinalSegmentName(DataRefImpl Sec) const1360 MachOObjectFile::getSectionFinalSegmentName(DataRefImpl Sec) const {
1361 ArrayRef<char> Raw = getSectionRawFinalSegmentName(Sec);
1362 return parseSegmentOrSectionName(Raw.data());
1363 }
1364
1365 ArrayRef<char>
getSectionRawName(DataRefImpl Sec) const1366 MachOObjectFile::getSectionRawName(DataRefImpl Sec) const {
1367 const SectionBase *Base =
1368 reinterpret_cast<const SectionBase*>(Sections[Sec.d.a]);
1369 return ArrayRef<char>(Base->Name);
1370 }
1371
1372 ArrayRef<char>
getSectionRawFinalSegmentName(DataRefImpl Sec) const1373 MachOObjectFile::getSectionRawFinalSegmentName(DataRefImpl Sec) const {
1374 const SectionBase *Base =
1375 reinterpret_cast<const SectionBase*>(Sections[Sec.d.a]);
1376 return ArrayRef<char>(Base->SegmentName);
1377 }
1378
1379 bool
isRelocationScattered(const macho::RelocationEntry & RE) const1380 MachOObjectFile::isRelocationScattered(const macho::RelocationEntry &RE)
1381 const {
1382 if (getCPUType(this) == llvm::MachO::CPUTypeX86_64)
1383 return false;
1384 return getPlainRelocationAddress(RE) & macho::RF_Scattered;
1385 }
1386
getPlainRelocationSymbolNum(const macho::RelocationEntry & RE) const1387 unsigned MachOObjectFile::getPlainRelocationSymbolNum(
1388 const macho::RelocationEntry &RE) const {
1389 if (isLittleEndian())
1390 return RE.Word1 & 0xffffff;
1391 return RE.Word1 >> 8;
1392 }
1393
getPlainRelocationExternal(const macho::RelocationEntry & RE) const1394 bool MachOObjectFile::getPlainRelocationExternal(
1395 const macho::RelocationEntry &RE) const {
1396 if (isLittleEndian())
1397 return (RE.Word1 >> 27) & 1;
1398 return (RE.Word1 >> 4) & 1;
1399 }
1400
getScatteredRelocationScattered(const macho::RelocationEntry & RE) const1401 bool MachOObjectFile::getScatteredRelocationScattered(
1402 const macho::RelocationEntry &RE) const {
1403 return RE.Word0 >> 31;
1404 }
1405
getScatteredRelocationValue(const macho::RelocationEntry & RE) const1406 uint32_t MachOObjectFile::getScatteredRelocationValue(
1407 const macho::RelocationEntry &RE) const {
1408 return RE.Word1;
1409 }
1410
getAnyRelocationAddress(const macho::RelocationEntry & RE) const1411 unsigned MachOObjectFile::getAnyRelocationAddress(
1412 const macho::RelocationEntry &RE) const {
1413 if (isRelocationScattered(RE))
1414 return getScatteredRelocationAddress(RE);
1415 return getPlainRelocationAddress(RE);
1416 }
1417
1418 unsigned
getAnyRelocationPCRel(const macho::RelocationEntry & RE) const1419 MachOObjectFile::getAnyRelocationPCRel(const macho::RelocationEntry &RE) const {
1420 if (isRelocationScattered(RE))
1421 return getScatteredRelocationPCRel(this, RE);
1422 return getPlainRelocationPCRel(this, RE);
1423 }
1424
getAnyRelocationLength(const macho::RelocationEntry & RE) const1425 unsigned MachOObjectFile::getAnyRelocationLength(
1426 const macho::RelocationEntry &RE) const {
1427 if (isRelocationScattered(RE))
1428 return getScatteredRelocationLength(RE);
1429 return getPlainRelocationLength(this, RE);
1430 }
1431
1432 unsigned
getAnyRelocationType(const macho::RelocationEntry & RE) const1433 MachOObjectFile::getAnyRelocationType(const macho::RelocationEntry &RE) const {
1434 if (isRelocationScattered(RE))
1435 return getScatteredRelocationType(RE);
1436 return getPlainRelocationType(this, RE);
1437 }
1438
1439 SectionRef
getRelocationSection(const macho::RelocationEntry & RE) const1440 MachOObjectFile::getRelocationSection(const macho::RelocationEntry &RE) const {
1441 if (isRelocationScattered(RE) || getPlainRelocationExternal(RE))
1442 return *end_sections();
1443 unsigned SecNum = getPlainRelocationSymbolNum(RE) - 1;
1444 DataRefImpl DRI;
1445 DRI.d.a = SecNum;
1446 return SectionRef(DRI, this);
1447 }
1448
1449 MachOObjectFile::LoadCommandInfo
getFirstLoadCommandInfo() const1450 MachOObjectFile::getFirstLoadCommandInfo() const {
1451 MachOObjectFile::LoadCommandInfo Load;
1452
1453 unsigned HeaderSize = is64Bit() ? macho::Header64Size : macho::Header32Size;
1454 Load.Ptr = getPtr(this, HeaderSize);
1455 Load.C = getStruct<macho::LoadCommand>(this, Load.Ptr);
1456 return Load;
1457 }
1458
1459 MachOObjectFile::LoadCommandInfo
getNextLoadCommandInfo(const LoadCommandInfo & L) const1460 MachOObjectFile::getNextLoadCommandInfo(const LoadCommandInfo &L) const {
1461 MachOObjectFile::LoadCommandInfo Next;
1462 Next.Ptr = L.Ptr + L.C.Size;
1463 Next.C = getStruct<macho::LoadCommand>(this, Next.Ptr);
1464 return Next;
1465 }
1466
getSection(DataRefImpl DRI) const1467 macho::Section MachOObjectFile::getSection(DataRefImpl DRI) const {
1468 return getStruct<macho::Section>(this, Sections[DRI.d.a]);
1469 }
1470
getSection64(DataRefImpl DRI) const1471 macho::Section64 MachOObjectFile::getSection64(DataRefImpl DRI) const {
1472 return getStruct<macho::Section64>(this, Sections[DRI.d.a]);
1473 }
1474
getSection(const LoadCommandInfo & L,unsigned Index) const1475 macho::Section MachOObjectFile::getSection(const LoadCommandInfo &L,
1476 unsigned Index) const {
1477 const char *Sec = getSectionPtr(this, L, Index);
1478 return getStruct<macho::Section>(this, Sec);
1479 }
1480
getSection64(const LoadCommandInfo & L,unsigned Index) const1481 macho::Section64 MachOObjectFile::getSection64(const LoadCommandInfo &L,
1482 unsigned Index) const {
1483 const char *Sec = getSectionPtr(this, L, Index);
1484 return getStruct<macho::Section64>(this, Sec);
1485 }
1486
1487 macho::SymbolTableEntry
getSymbolTableEntry(DataRefImpl DRI) const1488 MachOObjectFile::getSymbolTableEntry(DataRefImpl DRI) const {
1489 const char *P = reinterpret_cast<const char *>(DRI.p);
1490 return getStruct<macho::SymbolTableEntry>(this, P);
1491 }
1492
1493 macho::Symbol64TableEntry
getSymbol64TableEntry(DataRefImpl DRI) const1494 MachOObjectFile::getSymbol64TableEntry(DataRefImpl DRI) const {
1495 const char *P = reinterpret_cast<const char *>(DRI.p);
1496 return getStruct<macho::Symbol64TableEntry>(this, P);
1497 }
1498
getLinkeditDataLoadCommand(const MachOObjectFile::LoadCommandInfo & L) const1499 macho::LinkeditDataLoadCommand MachOObjectFile::getLinkeditDataLoadCommand(
1500 const MachOObjectFile::LoadCommandInfo &L) const {
1501 return getStruct<macho::LinkeditDataLoadCommand>(this, L.Ptr);
1502 }
1503
1504 macho::SegmentLoadCommand
getSegmentLoadCommand(const LoadCommandInfo & L) const1505 MachOObjectFile::getSegmentLoadCommand(const LoadCommandInfo &L) const {
1506 return getStruct<macho::SegmentLoadCommand>(this, L.Ptr);
1507 }
1508
1509 macho::Segment64LoadCommand
getSegment64LoadCommand(const LoadCommandInfo & L) const1510 MachOObjectFile::getSegment64LoadCommand(const LoadCommandInfo &L) const {
1511 return getStruct<macho::Segment64LoadCommand>(this, L.Ptr);
1512 }
1513
1514 macho::LinkerOptionsLoadCommand
getLinkerOptionsLoadCommand(const LoadCommandInfo & L) const1515 MachOObjectFile::getLinkerOptionsLoadCommand(const LoadCommandInfo &L) const {
1516 return getStruct<macho::LinkerOptionsLoadCommand>(this, L.Ptr);
1517 }
1518
1519 macho::RelocationEntry
getRelocation(DataRefImpl Rel) const1520 MachOObjectFile::getRelocation(DataRefImpl Rel) const {
1521 const char *P = reinterpret_cast<const char *>(Rel.p);
1522 return getStruct<macho::RelocationEntry>(this, P);
1523 }
1524
1525 macho::DataInCodeTableEntry
getDice(DataRefImpl Rel) const1526 MachOObjectFile::getDice(DataRefImpl Rel) const {
1527 const char *P = reinterpret_cast<const char *>(Rel.p);
1528 return getStruct<macho::DataInCodeTableEntry>(this, P);
1529 }
1530
getHeader() const1531 macho::Header MachOObjectFile::getHeader() const {
1532 return getStruct<macho::Header>(this, getPtr(this, 0));
1533 }
1534
getHeader64Ext() const1535 macho::Header64Ext MachOObjectFile::getHeader64Ext() const {
1536 return
1537 getStruct<macho::Header64Ext>(this, getPtr(this, sizeof(macho::Header)));
1538 }
1539
// Decodes entry number Index of the indirect symbol table described by DLC.
macho::IndirectSymbolTableEntry MachOObjectFile::getIndirectSymbolTableEntry(
                                          const macho::DysymtabLoadCommand &DLC,
                                          unsigned Index) const {
  // Entries are laid out back to back starting at the table's file offset.
  uint64_t EntryOffset = DLC.IndirectSymbolTableOffset +
    Index * sizeof(macho::IndirectSymbolTableEntry);
  const char *EntryPtr = getPtr(this, EntryOffset);
  return getStruct<macho::IndirectSymbolTableEntry>(this, EntryPtr);
}
1547
1548 macho::DataInCodeTableEntry
getDataInCodeTableEntry(uint32_t DataOffset,unsigned Index) const1549 MachOObjectFile::getDataInCodeTableEntry(uint32_t DataOffset,
1550 unsigned Index) const {
1551 uint64_t Offset = DataOffset + Index * sizeof(macho::DataInCodeTableEntry);
1552 return getStruct<macho::DataInCodeTableEntry>(this, getPtr(this, Offset));
1553 }
1554
getSymtabLoadCommand() const1555 macho::SymtabLoadCommand MachOObjectFile::getSymtabLoadCommand() const {
1556 return getStruct<macho::SymtabLoadCommand>(this, SymtabLoadCmd);
1557 }
1558
getDysymtabLoadCommand() const1559 macho::DysymtabLoadCommand MachOObjectFile::getDysymtabLoadCommand() const {
1560 return getStruct<macho::DysymtabLoadCommand>(this, DysymtabLoadCmd);
1561 }
1562
1563 macho::LinkeditDataLoadCommand
getDataInCodeLoadCommand() const1564 MachOObjectFile::getDataInCodeLoadCommand() const {
1565 if (DataInCodeLoadCmd)
1566 return getStruct<macho::LinkeditDataLoadCommand>(this, DataInCodeLoadCmd);
1567
1568 // If there is no DataInCodeLoadCmd return a load command with zero'ed fields.
1569 macho::LinkeditDataLoadCommand Cmd;
1570 Cmd.Type = macho::LCT_DataInCode;
1571 Cmd.Size = macho::LinkeditLoadCommandSize;
1572 Cmd.DataOffset = 0;
1573 Cmd.DataSize = 0;
1574 return Cmd;
1575 }
1576
getStringTableData() const1577 StringRef MachOObjectFile::getStringTableData() const {
1578 macho::SymtabLoadCommand S = getSymtabLoadCommand();
1579 return getData().substr(S.StringTableOffset, S.StringTableSize);
1580 }
1581
is64Bit() const1582 bool MachOObjectFile::is64Bit() const {
1583 return getType() == getMachOType(false, true) ||
1584 getType() == getMachOType(true, true);
1585 }
1586
ReadULEB128s(uint64_t Index,SmallVectorImpl<uint64_t> & Out) const1587 void MachOObjectFile::ReadULEB128s(uint64_t Index,
1588 SmallVectorImpl<uint64_t> &Out) const {
1589 DataExtractor extractor(ObjectFile::getData(), true, 0);
1590
1591 uint32_t offset = Index;
1592 uint64_t data = 0;
1593 while (uint64_t delta = extractor.getULEB128(&offset)) {
1594 data += delta;
1595 Out.push_back(data);
1596 }
1597 }
1598
createMachOObjectFile(MemoryBuffer * Buffer)1599 ObjectFile *ObjectFile::createMachOObjectFile(MemoryBuffer *Buffer) {
1600 StringRef Magic = Buffer->getBuffer().slice(0, 4);
1601 error_code ec;
1602 OwningPtr<ObjectFile> Ret;
1603 if (Magic == "\xFE\xED\xFA\xCE")
1604 Ret.reset(new MachOObjectFile(Buffer, false, false, ec));
1605 else if (Magic == "\xCE\xFA\xED\xFE")
1606 Ret.reset(new MachOObjectFile(Buffer, true, false, ec));
1607 else if (Magic == "\xFE\xED\xFA\xCF")
1608 Ret.reset(new MachOObjectFile(Buffer, false, true, ec));
1609 else if (Magic == "\xCF\xFA\xED\xFE")
1610 Ret.reset(new MachOObjectFile(Buffer, true, true, ec));
1611 else {
1612 delete Buffer;
1613 return NULL;
1614 }
1615
1616 if (ec)
1617 return NULL;
1618 return Ret.take();
1619 }
1620
1621 } // end namespace object
1622 } // end namespace llvm
1623