macho-dump.cpp revision 3ff9563c3e391954b2e224afcf8b2b0fcc3888aa
1//===-- macho-dump.cpp - Mach Object Dumping Tool -------------------------===//
2//
3//                     The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9//
10// This is a testing tool for use with the MC/Mach-O LLVM components.
11//
12//===----------------------------------------------------------------------===//
13
14#include "llvm/Object/MachOObject.h"
15#include "llvm/ADT/StringExtras.h"
16#include "llvm/ADT/Twine.h"
17#include "llvm/Support/CommandLine.h"
18#include "llvm/Support/Format.h"
19#include "llvm/Support/ManagedStatic.h"
20#include "llvm/Support/MemoryBuffer.h"
21#include "llvm/Support/raw_ostream.h"
22#include "llvm/Support/system_error.h"
23using namespace llvm;
24using namespace llvm::object;
25
26static cl::opt<std::string>
27InputFile(cl::Positional, cl::desc("<input file>"), cl::init("-"));
28
29static cl::opt<bool>
30ShowSectionData("dump-section-data", cl::desc("Dump the contents of sections"),
31                cl::init(false));
32
33///
34
35static const char *ProgramName;
36
37static void Message(const char *Type, const Twine &Msg) {
38  errs() << ProgramName << ": " << Type << ": " << Msg << "\n";
39}
40
41static int Error(const Twine &Msg) {
42  Message("error", Msg);
43  return 1;
44}
45
46static void Warning(const Twine &Msg) {
47  Message("warning", Msg);
48}
49
50///
51
52static int DumpHeader(MachOObject &Obj) {
53  // Read the header.
54  const macho::Header &Hdr = Obj.getHeader();
55  outs() << "('cputype', " << Hdr.CPUType << ")\n";
56  outs() << "('cpusubtype', " << Hdr.CPUSubtype << ")\n";
57  outs() << "('filetype', " << Hdr.FileType << ")\n";
58  outs() << "('num_load_commands', " << Hdr.NumLoadCommands << ")\n";
59  outs() << "('load_commands_size', " << Hdr.SizeOfLoadCommands << ")\n";
60  outs() << "('flag', " << Hdr.Flags << ")\n";
61
62  // Print extended header if 64-bit.
63  if (Obj.is64Bit()) {
64    const macho::Header64Ext &Hdr64 = Obj.getHeader64Ext();
65    outs() << "('reserved', " << Hdr64.Reserved << ")\n";
66  }
67
68  return 0;
69}
70
71static void DumpSegmentCommandData(StringRef Name,
72                                   uint64_t VMAddr, uint64_t VMSize,
73                                   uint64_t FileOffset, uint64_t FileSize,
74                                   uint32_t MaxProt, uint32_t InitProt,
75                                   uint32_t NumSections, uint32_t Flags) {
76  outs() << "  ('segment_name', '";
77  outs().write_escaped(Name, /*UseHexEscapes=*/true) << "')\n";
78  outs() << "  ('vm_addr', " << VMAddr << ")\n";
79  outs() << "  ('vm_size', " << VMSize << ")\n";
80  outs() << "  ('file_offset', " << FileOffset << ")\n";
81  outs() << "  ('file_size', " << FileSize << ")\n";
82  outs() << "  ('maxprot', " << MaxProt << ")\n";
83  outs() << "  ('initprot', " << InitProt << ")\n";
84  outs() << "  ('num_sections', " << NumSections << ")\n";
85  outs() << "  ('flags', " << Flags << ")\n";
86}
87
88static int DumpSectionData(MachOObject &Obj, unsigned Index, StringRef Name,
89                           StringRef SegmentName, uint64_t Address,
90                           uint64_t Size, uint32_t Offset,
91                           uint32_t Align, uint32_t RelocationTableOffset,
92                           uint32_t NumRelocationTableEntries,
93                           uint32_t Flags, uint32_t Reserved1,
94                           uint32_t Reserved2, uint64_t Reserved3 = ~0ULL) {
95  outs() << "    # Section " << Index << "\n";
96  outs() << "   (('section_name', '";
97  outs().write_escaped(Name, /*UseHexEscapes=*/true) << "')\n";
98  outs() << "    ('segment_name', '";
99  outs().write_escaped(SegmentName, /*UseHexEscapes=*/true) << "')\n";
100  outs() << "    ('address', " << Address << ")\n";
101  outs() << "    ('size', " << Size << ")\n";
102  outs() << "    ('offset', " << Offset << ")\n";
103  outs() << "    ('alignment', " << Align << ")\n";
104  outs() << "    ('reloc_offset', " << RelocationTableOffset << ")\n";
105  outs() << "    ('num_reloc', " << NumRelocationTableEntries << ")\n";
106  outs() << "    ('flags', " << format("0x%x", Flags) << ")\n";
107  outs() << "    ('reserved1', " << Reserved1 << ")\n";
108  outs() << "    ('reserved2', " << Reserved2 << ")\n";
109  if (Reserved3 != ~0ULL)
110    outs() << "    ('reserved3', " << Reserved3 << ")\n";
111  outs() << "   ),\n";
112
113  // Dump the relocation entries.
114  int Res = 0;
115  outs() << "  ('_relocations', [\n";
116  for (unsigned i = 0; i != NumRelocationTableEntries; ++i) {
117    InMemoryStruct<macho::RelocationEntry> RE;
118    Obj.ReadRelocationEntry(RelocationTableOffset, i, RE);
119    if (!RE) {
120      Res = Error("unable to read relocation table entry '" + Twine(i) + "'");
121      break;
122    }
123
124    outs() << "    # Relocation " << i << "\n";
125    outs() << "    (('word-0', " << format("0x%x", RE->Word0) << "),\n";
126    outs() << "     ('word-1', " << format("0x%x", RE->Word1) << ")),\n";
127  }
128  outs() << "  ])\n";
129
130  // Dump the section data, if requested.
131  if (ShowSectionData) {
132    outs() << "  ('_section_data', '";
133    StringRef Data = Obj.getData(Offset, Size);
134    for (unsigned i = 0; i != Data.size(); ++i) {
135      if (i && (i % 4) == 0)
136        outs() << ' ';
137      outs() << hexdigit((Data[i] >> 4) & 0xF, /*LowerCase=*/true);
138      outs() << hexdigit((Data[i] >> 0) & 0xF, /*LowerCase=*/true);
139    }
140    outs() << "')\n";
141  }
142
143  return Res;
144}
145
146static int DumpSegmentCommand(MachOObject &Obj,
147                               const MachOObject::LoadCommandInfo &LCI) {
148  InMemoryStruct<macho::SegmentLoadCommand> SLC;
149  Obj.ReadSegmentLoadCommand(LCI, SLC);
150  if (!SLC)
151    return Error("unable to read segment load command");
152
153  DumpSegmentCommandData(StringRef(SLC->Name, 16), SLC->VMAddress,
154                         SLC->VMSize, SLC->FileOffset, SLC->FileSize,
155                         SLC->MaxVMProtection, SLC->InitialVMProtection,
156                         SLC->NumSections, SLC->Flags);
157
158  // Dump the sections.
159  int Res = 0;
160  outs() << "  ('sections', [\n";
161  for (unsigned i = 0; i != SLC->NumSections; ++i) {
162    InMemoryStruct<macho::Section> Sect;
163    Obj.ReadSection(LCI, i, Sect);
164    if (!SLC) {
165      Res = Error("unable to read section '" + Twine(i) + "'");
166      break;
167    }
168
169    if ((Res = DumpSectionData(Obj, i, StringRef(Sect->Name, 16),
170                               StringRef(Sect->SegmentName, 16), Sect->Address,
171                               Sect->Size, Sect->Offset, Sect->Align,
172                               Sect->RelocationTableOffset,
173                               Sect->NumRelocationTableEntries, Sect->Flags,
174                               Sect->Reserved1, Sect->Reserved2)))
175      break;
176  }
177  outs() << "  ])\n";
178
179  return Res;
180}
181
182static int DumpSegment64Command(MachOObject &Obj,
183                               const MachOObject::LoadCommandInfo &LCI) {
184  InMemoryStruct<macho::Segment64LoadCommand> SLC;
185  Obj.ReadSegment64LoadCommand(LCI, SLC);
186  if (!SLC)
187    return Error("unable to read segment load command");
188
189  DumpSegmentCommandData(StringRef(SLC->Name, 16), SLC->VMAddress,
190                         SLC->VMSize, SLC->FileOffset, SLC->FileSize,
191                         SLC->MaxVMProtection, SLC->InitialVMProtection,
192                         SLC->NumSections, SLC->Flags);
193
194  // Dump the sections.
195  int Res = 0;
196  outs() << "  ('sections', [\n";
197  for (unsigned i = 0; i != SLC->NumSections; ++i) {
198    InMemoryStruct<macho::Section64> Sect;
199    Obj.ReadSection64(LCI, i, Sect);
200    if (!SLC) {
201      Res = Error("unable to read section '" + Twine(i) + "'");
202      break;
203    }
204
205    if ((Res = DumpSectionData(Obj, i, StringRef(Sect->Name, 16),
206                               StringRef(Sect->SegmentName, 16), Sect->Address,
207                               Sect->Size, Sect->Offset, Sect->Align,
208                               Sect->RelocationTableOffset,
209                               Sect->NumRelocationTableEntries, Sect->Flags,
210                               Sect->Reserved1, Sect->Reserved2,
211                               Sect->Reserved3)))
212      break;
213  }
214  outs() << "  ])\n";
215
216  return 0;
217}
218
219static void DumpSymbolTableEntryData(MachOObject &Obj,
220                                     unsigned Index, uint32_t StringIndex,
221                                     uint8_t Type, uint8_t SectionIndex,
222                                     uint16_t Flags, uint64_t Value) {
223  outs() << "    # Symbol " << Index << "\n";
224  outs() << "   (('n_strx', " << StringIndex << ")\n";
225  outs() << "    ('n_type', " << format("0x%x", Type) << ")\n";
226  outs() << "    ('n_sect', " << uint32_t(SectionIndex) << ")\n";
227  outs() << "    ('n_desc', " << Flags << ")\n";
228  outs() << "    ('n_value', " << Value << ")\n";
229  outs() << "    ('_string', '" << Obj.getStringAtIndex(StringIndex) << "')\n";
230  outs() << "   ),\n";
231}
232
233static int DumpSymtabCommand(MachOObject &Obj,
234                             const MachOObject::LoadCommandInfo &LCI) {
235  InMemoryStruct<macho::SymtabLoadCommand> SLC;
236  Obj.ReadSymtabLoadCommand(LCI, SLC);
237  if (!SLC)
238    return Error("unable to read segment load command");
239
240  outs() << "  ('symoff', " << SLC->SymbolTableOffset << ")\n";
241  outs() << "  ('nsyms', " << SLC->NumSymbolTableEntries << ")\n";
242  outs() << "  ('stroff', " << SLC->StringTableOffset << ")\n";
243  outs() << "  ('strsize', " << SLC->StringTableSize << ")\n";
244
245  // Cache the string table data.
246  Obj.RegisterStringTable(*SLC);
247
248  // Dump the string data.
249  outs() << "  ('_string_data', '";
250  outs().write_escaped(Obj.getStringTableData(),
251                       /*UseHexEscapes=*/true) << "')\n";
252
253  // Dump the symbol table.
254  int Res = 0;
255  outs() << "  ('_symbols', [\n";
256  for (unsigned i = 0; i != SLC->NumSymbolTableEntries; ++i) {
257    if (Obj.is64Bit()) {
258      InMemoryStruct<macho::Symbol64TableEntry> STE;
259      Obj.ReadSymbol64TableEntry(SLC->SymbolTableOffset, i, STE);
260      if (!STE) {
261        Res = Error("unable to read symbol: '" + Twine(i) + "'");
262        break;
263      }
264
265      DumpSymbolTableEntryData(Obj, i, STE->StringIndex, STE->Type,
266                               STE->SectionIndex, STE->Flags, STE->Value);
267    } else {
268      InMemoryStruct<macho::SymbolTableEntry> STE;
269      Obj.ReadSymbolTableEntry(SLC->SymbolTableOffset, i, STE);
270      if (!SLC) {
271        Res = Error("unable to read symbol: '" + Twine(i) + "'");
272        break;
273      }
274
275      DumpSymbolTableEntryData(Obj, i, STE->StringIndex, STE->Type,
276                               STE->SectionIndex, STE->Flags, STE->Value);
277    }
278  }
279  outs() << "  ])\n";
280
281  return Res;
282}
283
284static int DumpDysymtabCommand(MachOObject &Obj,
285                             const MachOObject::LoadCommandInfo &LCI) {
286  InMemoryStruct<macho::DysymtabLoadCommand> DLC;
287  Obj.ReadDysymtabLoadCommand(LCI, DLC);
288  if (!DLC)
289    return Error("unable to read segment load command");
290
291  outs() << "  ('ilocalsym', " << DLC->LocalSymbolsIndex << ")\n";
292  outs() << "  ('nlocalsym', " << DLC->NumLocalSymbols << ")\n";
293  outs() << "  ('iextdefsym', " << DLC->ExternalSymbolsIndex << ")\n";
294  outs() << "  ('nextdefsym', " << DLC->NumExternalSymbols << ")\n";
295  outs() << "  ('iundefsym', " << DLC->UndefinedSymbolsIndex << ")\n";
296  outs() << "  ('nundefsym', " << DLC->NumUndefinedSymbols << ")\n";
297  outs() << "  ('tocoff', " << DLC->TOCOffset << ")\n";
298  outs() << "  ('ntoc', " << DLC->NumTOCEntries << ")\n";
299  outs() << "  ('modtaboff', " << DLC->ModuleTableOffset << ")\n";
300  outs() << "  ('nmodtab', " << DLC->NumModuleTableEntries << ")\n";
301  outs() << "  ('extrefsymoff', " << DLC->ReferenceSymbolTableOffset << ")\n";
302  outs() << "  ('nextrefsyms', "
303         << DLC->NumReferencedSymbolTableEntries << ")\n";
304  outs() << "  ('indirectsymoff', " << DLC->IndirectSymbolTableOffset << ")\n";
305  outs() << "  ('nindirectsyms', "
306         << DLC->NumIndirectSymbolTableEntries << ")\n";
307  outs() << "  ('extreloff', " << DLC->ExternalRelocationTableOffset << ")\n";
308  outs() << "  ('nextrel', " << DLC->NumExternalRelocationTableEntries << ")\n";
309  outs() << "  ('locreloff', " << DLC->LocalRelocationTableOffset << ")\n";
310  outs() << "  ('nlocrel', " << DLC->NumLocalRelocationTableEntries << ")\n";
311
312  // Dump the indirect symbol table.
313  int Res = 0;
314  outs() << "  ('_indirect_symbols', [\n";
315  for (unsigned i = 0; i != DLC->NumIndirectSymbolTableEntries; ++i) {
316    InMemoryStruct<macho::IndirectSymbolTableEntry> ISTE;
317    Obj.ReadIndirectSymbolTableEntry(*DLC, i, ISTE);
318    if (!ISTE) {
319      Res = Error("unable to read segment load command");
320      break;
321    }
322
323    outs() << "    # Indirect Symbol " << i << "\n";
324    outs() << "    (('symbol_index', "
325           << format("0x%x", ISTE->Index) << "),),\n";
326  }
327  outs() << "  ])\n";
328
329  return Res;
330}
331
332static int DumpLoadCommand(MachOObject &Obj, unsigned Index) {
333  const MachOObject::LoadCommandInfo &LCI = Obj.getLoadCommandInfo(Index);
334  int Res = 0;
335
336  outs() << "  # Load Command " << Index << "\n"
337         << " (('command', " << LCI.Command.Type << ")\n"
338         << "  ('size', " << LCI.Command.Size << ")\n";
339  switch (LCI.Command.Type) {
340  case macho::LCT_Segment:
341    Res = DumpSegmentCommand(Obj, LCI);
342    break;
343  case macho::LCT_Segment64:
344    Res = DumpSegment64Command(Obj, LCI);
345    break;
346  case macho::LCT_Symtab:
347    Res = DumpSymtabCommand(Obj, LCI);
348    break;
349  case macho::LCT_Dysymtab:
350    Res = DumpDysymtabCommand(Obj, LCI);
351    break;
352  default:
353    Warning("unknown load command: " + Twine(LCI.Command.Type));
354    break;
355  }
356  outs() << " ),\n";
357
358  return Res;
359}
360
361int main(int argc, char **argv) {
362  ProgramName = argv[0];
363  llvm_shutdown_obj Y;  // Call llvm_shutdown() on exit.
364
365  cl::ParseCommandLineOptions(argc, argv, "llvm Mach-O dumping tool\n");
366
367  // Load the input file.
368  std::string ErrorStr;
369  OwningPtr<MemoryBuffer> InputBuffer;
370  if (error_code ec = MemoryBuffer::getFileOrSTDIN(InputFile, InputBuffer))
371    return Error("unable to read input: '" + ec.message() + "'");
372
373  // Construct the Mach-O wrapper object.
374  OwningPtr<MachOObject> InputObject(
375    MachOObject::LoadFromBuffer(InputBuffer.take(), &ErrorStr));
376  if (!InputObject)
377    return Error("unable to load object: '" + ErrorStr + "'");
378
379  if (int Res = DumpHeader(*InputObject))
380    return Res;
381
382  // Print the load commands.
383  int Res = 0;
384  outs() << "('load_commands', [\n";
385  for (unsigned i = 0; i != InputObject->getHeader().NumLoadCommands; ++i)
386    if ((Res = DumpLoadCommand(*InputObject, i)))
387      break;
388  outs() << "])\n";
389
390  return Res;
391}
392