1 //===-- macho-dump.cpp - Mach Object Dumping Tool -------------------------===//
2 //
3 // The LLVM Compiler Infrastructure
4 //
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
7 //
8 //===----------------------------------------------------------------------===//
9 //
10 // This is a testing tool for use with the MC/Mach-O LLVM components.
11 //
12 //===----------------------------------------------------------------------===//
13
14 #include "llvm/Object/MachO.h"
15 #include "llvm/ADT/StringExtras.h"
16 #include "llvm/ADT/Twine.h"
17 #include "llvm/Support/Casting.h"
18 #include "llvm/Support/CommandLine.h"
19 #include "llvm/Support/Format.h"
20 #include "llvm/Support/ManagedStatic.h"
21 #include "llvm/Support/MemoryBuffer.h"
22 #include "llvm/Support/raw_ostream.h"
23 #include <system_error>
24 using namespace llvm;
25 using namespace llvm::object;
26
// Positional command-line argument naming the input file; initialized to "-"
// when no argument is given.
static cl::opt<std::string>
InputFile(cl::Positional, cl::desc("<input file>"), cl::init("-"));

// -dump-section-data flag (off by default). When set, DumpSectionData also
// emits each section's bytes as a hex string.
static cl::opt<bool>
ShowSectionData("dump-section-data", cl::desc("Dump the contents of sections"),
                cl::init(false));
33
34 ///
35
// Prefix used by Message() for every diagnostic; main() sets it from argv[0].
static const char *ProgramName;
37
Message(const char * Type,const Twine & Msg)38 static void Message(const char *Type, const Twine &Msg) {
39 errs() << ProgramName << ": " << Type << ": " << Msg << "\n";
40 }
41
Error(const Twine & Msg)42 static int Error(const Twine &Msg) {
43 Message("error", Msg);
44 return 1;
45 }
46
Warning(const Twine & Msg)47 static void Warning(const Twine &Msg) {
48 Message("warning", Msg);
49 }
50
51 ///
52
DumpSegmentCommandData(StringRef Name,uint64_t VMAddr,uint64_t VMSize,uint64_t FileOffset,uint64_t FileSize,uint32_t MaxProt,uint32_t InitProt,uint32_t NumSections,uint32_t Flags)53 static void DumpSegmentCommandData(StringRef Name,
54 uint64_t VMAddr, uint64_t VMSize,
55 uint64_t FileOffset, uint64_t FileSize,
56 uint32_t MaxProt, uint32_t InitProt,
57 uint32_t NumSections, uint32_t Flags) {
58 outs() << " ('segment_name', '";
59 outs().write_escaped(Name, /*UseHexEscapes=*/true) << "')\n";
60 outs() << " ('vm_addr', " << VMAddr << ")\n";
61 outs() << " ('vm_size', " << VMSize << ")\n";
62 outs() << " ('file_offset', " << FileOffset << ")\n";
63 outs() << " ('file_size', " << FileSize << ")\n";
64 outs() << " ('maxprot', " << MaxProt << ")\n";
65 outs() << " ('initprot', " << InitProt << ")\n";
66 outs() << " ('num_sections', " << NumSections << ")\n";
67 outs() << " ('flags', " << Flags << ")\n";
68 }
69
DumpSectionData(const MachOObjectFile & Obj,unsigned Index,StringRef Name,StringRef SegmentName,uint64_t Address,uint64_t Size,uint32_t Offset,uint32_t Align,uint32_t RelocationTableOffset,uint32_t NumRelocationTableEntries,uint32_t Flags,uint32_t Reserved1,uint32_t Reserved2,uint64_t Reserved3=~0ULL)70 static int DumpSectionData(const MachOObjectFile &Obj, unsigned Index,
71 StringRef Name,
72 StringRef SegmentName, uint64_t Address,
73 uint64_t Size, uint32_t Offset,
74 uint32_t Align, uint32_t RelocationTableOffset,
75 uint32_t NumRelocationTableEntries,
76 uint32_t Flags, uint32_t Reserved1,
77 uint32_t Reserved2, uint64_t Reserved3 = ~0ULL) {
78 outs() << " # Section " << Index << "\n";
79 outs() << " (('section_name', '";
80 outs().write_escaped(Name, /*UseHexEscapes=*/true) << "')\n";
81 outs() << " ('segment_name', '";
82 outs().write_escaped(SegmentName, /*UseHexEscapes=*/true) << "')\n";
83 outs() << " ('address', " << Address << ")\n";
84 outs() << " ('size', " << Size << ")\n";
85 outs() << " ('offset', " << Offset << ")\n";
86 outs() << " ('alignment', " << Align << ")\n";
87 outs() << " ('reloc_offset', " << RelocationTableOffset << ")\n";
88 outs() << " ('num_reloc', " << NumRelocationTableEntries << ")\n";
89 outs() << " ('flags', " << format("0x%x", Flags) << ")\n";
90 outs() << " ('reserved1', " << Reserved1 << ")\n";
91 outs() << " ('reserved2', " << Reserved2 << ")\n";
92 if (Reserved3 != ~0ULL)
93 outs() << " ('reserved3', " << Reserved3 << ")\n";
94 outs() << " ),\n";
95
96 // Dump the relocation entries.
97 outs() << " ('_relocations', [\n";
98 unsigned RelNum = 0;
99 for (relocation_iterator I = Obj.section_rel_begin(Index),
100 E = Obj.section_rel_end(Index);
101 I != E; ++I, ++RelNum) {
102 MachO::any_relocation_info RE = Obj.getRelocation(I->getRawDataRefImpl());
103 outs() << " # Relocation " << RelNum << "\n";
104 outs() << " (('word-0', " << format("0x%x", RE.r_word0) << "),\n";
105 outs() << " ('word-1', " << format("0x%x", RE.r_word1) << ")),\n";
106 }
107 outs() << " ])\n";
108
109 // Dump the section data, if requested.
110 if (ShowSectionData) {
111 outs() << " ('_section_data', '";
112 StringRef Data = Obj.getData().substr(Offset, Size);
113 for (unsigned i = 0; i != Data.size(); ++i) {
114 if (i && (i % 4) == 0)
115 outs() << ' ';
116 outs() << hexdigit((Data[i] >> 4) & 0xF, /*LowerCase=*/true);
117 outs() << hexdigit((Data[i] >> 0) & 0xF, /*LowerCase=*/true);
118 }
119 outs() << "')\n";
120 }
121
122 return 0;
123 }
124
DumpSegmentCommand(const MachOObjectFile & Obj,const MachOObjectFile::LoadCommandInfo & LCI)125 static int DumpSegmentCommand(const MachOObjectFile &Obj,
126 const MachOObjectFile::LoadCommandInfo &LCI) {
127 MachO::segment_command SLC = Obj.getSegmentLoadCommand(LCI);
128
129 DumpSegmentCommandData(StringRef(SLC.segname, 16), SLC.vmaddr,
130 SLC.vmsize, SLC.fileoff, SLC.filesize,
131 SLC.maxprot, SLC.initprot, SLC.nsects, SLC.flags);
132
133 // Dump the sections.
134 outs() << " ('sections', [\n";
135 for (unsigned i = 0; i != SLC.nsects; ++i) {
136 MachO::section Sect = Obj.getSection(LCI, i);
137 DumpSectionData(Obj, i, StringRef(Sect.sectname, 16),
138 StringRef(Sect.segname, 16), Sect.addr,
139 Sect.size, Sect.offset, Sect.align,
140 Sect.reloff, Sect.nreloc, Sect.flags,
141 Sect.reserved1, Sect.reserved2);
142 }
143 outs() << " ])\n";
144
145 return 0;
146 }
147
DumpSegment64Command(const MachOObjectFile & Obj,const MachOObjectFile::LoadCommandInfo & LCI)148 static int DumpSegment64Command(const MachOObjectFile &Obj,
149 const MachOObjectFile::LoadCommandInfo &LCI) {
150 MachO::segment_command_64 SLC = Obj.getSegment64LoadCommand(LCI);
151 DumpSegmentCommandData(StringRef(SLC.segname, 16), SLC.vmaddr,
152 SLC.vmsize, SLC.fileoff, SLC.filesize,
153 SLC.maxprot, SLC.initprot, SLC.nsects, SLC.flags);
154
155 // Dump the sections.
156 outs() << " ('sections', [\n";
157 for (unsigned i = 0; i != SLC.nsects; ++i) {
158 MachO::section_64 Sect = Obj.getSection64(LCI, i);
159
160 DumpSectionData(Obj, i, StringRef(Sect.sectname, 16),
161 StringRef(Sect.segname, 16), Sect.addr,
162 Sect.size, Sect.offset, Sect.align,
163 Sect.reloff, Sect.nreloc, Sect.flags,
164 Sect.reserved1, Sect.reserved2,
165 Sect.reserved3);
166 }
167 outs() << " ])\n";
168
169 return 0;
170 }
171
DumpSymbolTableEntryData(const MachOObjectFile & Obj,unsigned Index,uint32_t StringIndex,uint8_t Type,uint8_t SectionIndex,uint16_t Flags,uint64_t Value,StringRef StringTable)172 static void DumpSymbolTableEntryData(const MachOObjectFile &Obj,
173 unsigned Index, uint32_t StringIndex,
174 uint8_t Type, uint8_t SectionIndex,
175 uint16_t Flags, uint64_t Value,
176 StringRef StringTable) {
177 const char *Name = &StringTable.data()[StringIndex];
178 outs() << " # Symbol " << Index << "\n";
179 outs() << " (('n_strx', " << StringIndex << ")\n";
180 outs() << " ('n_type', " << format("0x%x", Type) << ")\n";
181 outs() << " ('n_sect', " << uint32_t(SectionIndex) << ")\n";
182 outs() << " ('n_desc', " << Flags << ")\n";
183 outs() << " ('n_value', " << Value << ")\n";
184 outs() << " ('_string', '" << Name << "')\n";
185 outs() << " ),\n";
186 }
187
DumpSymtabCommand(const MachOObjectFile & Obj)188 static int DumpSymtabCommand(const MachOObjectFile &Obj) {
189 MachO::symtab_command SLC = Obj.getSymtabLoadCommand();
190
191 outs() << " ('symoff', " << SLC.symoff << ")\n";
192 outs() << " ('nsyms', " << SLC.nsyms << ")\n";
193 outs() << " ('stroff', " << SLC.stroff << ")\n";
194 outs() << " ('strsize', " << SLC.strsize << ")\n";
195
196 // Dump the string data.
197 outs() << " ('_string_data', '";
198 StringRef StringTable = Obj.getStringTableData();
199 outs().write_escaped(StringTable,
200 /*UseHexEscapes=*/true) << "')\n";
201
202 // Dump the symbol table.
203 outs() << " ('_symbols', [\n";
204 unsigned SymNum = 0;
205 for (const SymbolRef &Symbol : Obj.symbols()) {
206 DataRefImpl DRI = Symbol.getRawDataRefImpl();
207 if (Obj.is64Bit()) {
208 MachO::nlist_64 STE = Obj.getSymbol64TableEntry(DRI);
209 DumpSymbolTableEntryData(Obj, SymNum, STE.n_strx, STE.n_type,
210 STE.n_sect, STE.n_desc, STE.n_value,
211 StringTable);
212 } else {
213 MachO::nlist STE = Obj.getSymbolTableEntry(DRI);
214 DumpSymbolTableEntryData(Obj, SymNum, STE.n_strx, STE.n_type,
215 STE.n_sect, STE.n_desc, STE.n_value,
216 StringTable);
217 }
218 SymNum++;
219 }
220 outs() << " ])\n";
221
222 return 0;
223 }
224
DumpDysymtabCommand(const MachOObjectFile & Obj)225 static int DumpDysymtabCommand(const MachOObjectFile &Obj) {
226 MachO::dysymtab_command DLC = Obj.getDysymtabLoadCommand();
227
228 outs() << " ('ilocalsym', " << DLC.ilocalsym << ")\n";
229 outs() << " ('nlocalsym', " << DLC.nlocalsym << ")\n";
230 outs() << " ('iextdefsym', " << DLC.iextdefsym << ")\n";
231 outs() << " ('nextdefsym', " << DLC.nextdefsym << ")\n";
232 outs() << " ('iundefsym', " << DLC.iundefsym << ")\n";
233 outs() << " ('nundefsym', " << DLC.nundefsym << ")\n";
234 outs() << " ('tocoff', " << DLC.tocoff << ")\n";
235 outs() << " ('ntoc', " << DLC.ntoc << ")\n";
236 outs() << " ('modtaboff', " << DLC.modtaboff << ")\n";
237 outs() << " ('nmodtab', " << DLC.nmodtab << ")\n";
238 outs() << " ('extrefsymoff', " << DLC.extrefsymoff << ")\n";
239 outs() << " ('nextrefsyms', " << DLC.nextrefsyms << ")\n";
240 outs() << " ('indirectsymoff', " << DLC.indirectsymoff << ")\n";
241 outs() << " ('nindirectsyms', " << DLC.nindirectsyms << ")\n";
242 outs() << " ('extreloff', " << DLC.extreloff << ")\n";
243 outs() << " ('nextrel', " << DLC.nextrel << ")\n";
244 outs() << " ('locreloff', " << DLC.locreloff << ")\n";
245 outs() << " ('nlocrel', " << DLC.nlocrel << ")\n";
246
247 // Dump the indirect symbol table.
248 outs() << " ('_indirect_symbols', [\n";
249 for (unsigned i = 0; i != DLC.nindirectsyms; ++i) {
250 uint32_t ISTE = Obj.getIndirectSymbolTableEntry(DLC, i);
251 outs() << " # Indirect Symbol " << i << "\n";
252 outs() << " (('symbol_index', " << format("0x%x", ISTE) << "),),\n";
253 }
254 outs() << " ])\n";
255
256 return 0;
257 }
258
259 static int
DumpLinkeditDataCommand(const MachOObjectFile & Obj,const MachOObjectFile::LoadCommandInfo & LCI)260 DumpLinkeditDataCommand(const MachOObjectFile &Obj,
261 const MachOObjectFile::LoadCommandInfo &LCI) {
262 MachO::linkedit_data_command LLC = Obj.getLinkeditDataLoadCommand(LCI);
263 outs() << " ('dataoff', " << LLC.dataoff << ")\n"
264 << " ('datasize', " << LLC.datasize << ")\n"
265 << " ('_addresses', [\n";
266
267 SmallVector<uint64_t, 8> Addresses;
268 Obj.ReadULEB128s(LLC.dataoff, Addresses);
269 for (unsigned i = 0, e = Addresses.size(); i != e; ++i)
270 outs() << " # Address " << i << '\n'
271 << " ('address', " << format("0x%x", Addresses[i]) << "),\n";
272
273 outs() << " ])\n";
274
275 return 0;
276 }
277
278 static int
DumpDataInCodeDataCommand(const MachOObjectFile & Obj,const MachOObjectFile::LoadCommandInfo & LCI)279 DumpDataInCodeDataCommand(const MachOObjectFile &Obj,
280 const MachOObjectFile::LoadCommandInfo &LCI) {
281 MachO::linkedit_data_command LLC = Obj.getLinkeditDataLoadCommand(LCI);
282 outs() << " ('dataoff', " << LLC.dataoff << ")\n"
283 << " ('datasize', " << LLC.datasize << ")\n"
284 << " ('_data_regions', [\n";
285
286 unsigned NumRegions = LLC.datasize / sizeof(MachO::data_in_code_entry);
287 for (unsigned i = 0; i < NumRegions; ++i) {
288 MachO::data_in_code_entry DICE= Obj.getDataInCodeTableEntry(LLC.dataoff, i);
289 outs() << " # DICE " << i << "\n"
290 << " ('offset', " << DICE.offset << ")\n"
291 << " ('length', " << DICE.length << ")\n"
292 << " ('kind', " << DICE.kind << ")\n";
293 }
294
295 outs() <<" ])\n";
296
297 return 0;
298 }
299
300 static int
DumpLinkerOptionsCommand(const MachOObjectFile & Obj,const MachOObjectFile::LoadCommandInfo & LCI)301 DumpLinkerOptionsCommand(const MachOObjectFile &Obj,
302 const MachOObjectFile::LoadCommandInfo &LCI) {
303 MachO::linker_options_command LOLC = Obj.getLinkerOptionsLoadCommand(LCI);
304 outs() << " ('count', " << LOLC.count << ")\n"
305 << " ('_strings', [\n";
306
307 uint64_t DataSize = LOLC.cmdsize - sizeof(MachO::linker_options_command);
308 const char *P = LCI.Ptr + sizeof(MachO::linker_options_command);
309 StringRef Data(P, DataSize);
310 for (unsigned i = 0; i != LOLC.count; ++i) {
311 std::pair<StringRef,StringRef> Split = Data.split('\0');
312 outs() << "\t\"";
313 outs().write_escaped(Split.first);
314 outs() << "\",\n";
315 Data = Split.second;
316 }
317 outs() <<" ])\n";
318
319 return 0;
320 }
321
322 static int
DumpVersionMin(const MachOObjectFile & Obj,const MachOObjectFile::LoadCommandInfo & LCI)323 DumpVersionMin(const MachOObjectFile &Obj,
324 const MachOObjectFile::LoadCommandInfo &LCI) {
325 MachO::version_min_command VMLC = Obj.getVersionMinLoadCommand(LCI);
326 outs() << " ('version, " << VMLC.version << ")\n"
327 << " ('reserved, " << VMLC.reserved << ")\n";
328 return 0;
329 }
330
331 static int
DumpDylibID(const MachOObjectFile & Obj,const MachOObjectFile::LoadCommandInfo & LCI)332 DumpDylibID(const MachOObjectFile &Obj,
333 const MachOObjectFile::LoadCommandInfo &LCI) {
334 MachO::dylib_command DLLC = Obj.getDylibIDLoadCommand(LCI);
335 outs() << " ('install_name', '" << LCI.Ptr + DLLC.dylib.name << "')\n"
336 << " ('timestamp, " << DLLC.dylib.timestamp << ")\n"
337 << " ('cur_version, " << DLLC.dylib.current_version << ")\n"
338 << " ('compat_version, " << DLLC.dylib.compatibility_version << ")\n";
339 return 0;
340 }
341
DumpLoadCommand(const MachOObjectFile & Obj,MachOObjectFile::LoadCommandInfo & LCI)342 static int DumpLoadCommand(const MachOObjectFile &Obj,
343 MachOObjectFile::LoadCommandInfo &LCI) {
344 switch (LCI.C.cmd) {
345 case MachO::LC_SEGMENT:
346 return DumpSegmentCommand(Obj, LCI);
347 case MachO::LC_SEGMENT_64:
348 return DumpSegment64Command(Obj, LCI);
349 case MachO::LC_SYMTAB:
350 return DumpSymtabCommand(Obj);
351 case MachO::LC_DYSYMTAB:
352 return DumpDysymtabCommand(Obj);
353 case MachO::LC_CODE_SIGNATURE:
354 case MachO::LC_SEGMENT_SPLIT_INFO:
355 case MachO::LC_FUNCTION_STARTS:
356 return DumpLinkeditDataCommand(Obj, LCI);
357 case MachO::LC_DATA_IN_CODE:
358 return DumpDataInCodeDataCommand(Obj, LCI);
359 case MachO::LC_LINKER_OPTIONS:
360 return DumpLinkerOptionsCommand(Obj, LCI);
361 case MachO::LC_VERSION_MIN_IPHONEOS:
362 case MachO::LC_VERSION_MIN_MACOSX:
363 return DumpVersionMin(Obj, LCI);
364 case MachO::LC_ID_DYLIB:
365 return DumpDylibID(Obj, LCI);
366 default:
367 Warning("unknown load command: " + Twine(LCI.C.cmd));
368 return 0;
369 }
370 }
371
372
DumpLoadCommand(const MachOObjectFile & Obj,unsigned Index,MachOObjectFile::LoadCommandInfo & LCI)373 static int DumpLoadCommand(const MachOObjectFile &Obj, unsigned Index,
374 MachOObjectFile::LoadCommandInfo &LCI) {
375 outs() << " # Load Command " << Index << "\n"
376 << " (('command', " << LCI.C.cmd << ")\n"
377 << " ('size', " << LCI.C.cmdsize << ")\n";
378 int Res = DumpLoadCommand(Obj, LCI);
379 outs() << " ),\n";
380 return Res;
381 }
382
printHeader(const MachOObjectFile * Obj,const MachO::mach_header & Header)383 static void printHeader(const MachOObjectFile *Obj,
384 const MachO::mach_header &Header) {
385 outs() << "('cputype', " << Header.cputype << ")\n";
386 outs() << "('cpusubtype', " << Header.cpusubtype << ")\n";
387 outs() << "('filetype', " << Header.filetype << ")\n";
388 outs() << "('num_load_commands', " << Header.ncmds << ")\n";
389 outs() << "('load_commands_size', " << Header.sizeofcmds << ")\n";
390 outs() << "('flag', " << Header.flags << ")\n";
391
392 // Print extended header if 64-bit.
393 if (Obj->is64Bit()) {
394 const MachO::mach_header_64 *Header64 =
395 reinterpret_cast<const MachO::mach_header_64 *>(&Header);
396 outs() << "('reserved', " << Header64->reserved << ")\n";
397 }
398 }
399
main(int argc,char ** argv)400 int main(int argc, char **argv) {
401 ProgramName = argv[0];
402 llvm_shutdown_obj Y; // Call llvm_shutdown() on exit.
403
404 cl::ParseCommandLineOptions(argc, argv, "llvm Mach-O dumping tool\n");
405
406 ErrorOr<Binary *> BinaryOrErr = createBinary(InputFile);
407 if (std::error_code EC = BinaryOrErr.getError())
408 return Error("unable to read input: '" + EC.message() + "'");
409 std::unique_ptr<Binary> Binary(BinaryOrErr.get());
410
411 const MachOObjectFile *InputObject = dyn_cast<MachOObjectFile>(Binary.get());
412 if (!InputObject)
413 return Error("Not a MachO object");
414
415 // Print the header
416 MachO::mach_header_64 Header64;
417 MachO::mach_header *Header = reinterpret_cast<MachO::mach_header*>(&Header64);
418 if (InputObject->is64Bit())
419 Header64 = InputObject->getHeader64();
420 else
421 *Header = InputObject->getHeader();
422 printHeader(InputObject, *Header);
423
424 // Print the load commands.
425 int Res = 0;
426 MachOObjectFile::LoadCommandInfo Command =
427 InputObject->getFirstLoadCommandInfo();
428 outs() << "('load_commands', [\n";
429 for (unsigned i = 0; ; ++i) {
430 if (DumpLoadCommand(*InputObject, i, Command))
431 break;
432
433 if (i == Header->ncmds - 1)
434 break;
435 Command = InputObject->getNextLoadCommandInfo(Command);
436 }
437 outs() << "])\n";
438
439 return Res;
440 }
441